修复gradient accumulation

This commit is contained in:
Duzeyao
2019-11-20 10:52:50 +08:00
parent 2ed6a8d06e
commit 44d8bc66a2
3 changed files with 15 additions and 7 deletions

View File

@@ -0,0 +1,10 @@
{
"initializer_range": 0.02,
"layer_norm_epsilon": 1e-05,
"n_ctx": 64,
"n_embd": 128,
"n_head": 2,
"n_layer": 1,
"n_positions": 64,
"vocab_size": 13317
}