Commit 50c3670f by xiaotong

Use the fan-in/fan-out (Xavier/Glorot uniform) method for weight initialization

parent b405b50e
...@@ -65,10 +65,13 @@ void T2TAttention::InitModel(int argc, const char ** argv, int myDevID, XMem * m ...@@ -65,10 +65,13 @@ void T2TAttention::InitModel(int argc, const char ** argv, int myDevID, XMem * m
InitTensor2D(&wk, d, dk, X_FLOAT, devID, mem); InitTensor2D(&wk, d, dk, X_FLOAT, devID, mem);
InitTensor2D(&wq, d, dk, X_FLOAT, devID, mem); InitTensor2D(&wq, d, dk, X_FLOAT, devID, mem);
InitTensor2D(&wv, d, dv, X_FLOAT, devID, mem); InitTensor2D(&wv, d, dv, X_FLOAT, devID, mem);
float finfoutk = sqrt(6/(d + dk));
float finfoutv = sqrt(6/(d + dv));
wk.SetDataRand(-minmax, minmax); wk.SetDataRand(-finfoutk, finfoutk);
wq.SetDataRand(-minmax, minmax); wq.SetDataRand(-finfoutk, finfoutk);
wv.SetDataRand(-minmax, minmax); wv.SetDataRand(-finfoutv, finfoutv);
} }
/* /*
......
Markdown 格式
0%
您添加了 0 人到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 登录 后发表评论