forked from atselousov/transformer_chatbot
-
Notifications
You must be signed in to change notification settings - Fork 0
/
parameters_names.json
1 lines (1 loc) · 5.13 KB
/
parameters_names.json
1
["model/layers0/attn/qkv_proj/weight:0", "model/layers0/attn/qkv_proj/bias:0", "model/layers0/attn/out_proj/weight:0", "model/layers0/attn/out_proj/bias:0", "model/layers0/attn_norm/weight:0", "model/layers0/attn_norm/bias:0", "model/layers0/ff/layer_1/weight:0", "model/layers0/ff/layer_1/bias:0", "model/layers0/ff/layer_2/weight:0", "model/layers0/ff/layer_2/bias:0", "model/layers0/ff_norm/weight:0", "model/layers0/ff_norm/bias:0", "model/layers1/attn/qkv_proj/weight:0", "model/layers1/attn/qkv_proj/bias:0", "model/layers1/attn/out_proj/weight:0", "model/layers1/attn/out_proj/bias:0", "model/layers1/attn_norm/weight:0", "model/layers1/attn_norm/bias:0", "model/layers1/ff/layer_1/weight:0", "model/layers1/ff/layer_1/bias:0", "model/layers1/ff/layer_2/weight:0", "model/layers1/ff/layer_2/bias:0", "model/layers1/ff_norm/weight:0", "model/layers1/ff_norm/bias:0", "model/layers2/attn/qkv_proj/weight:0", "model/layers2/attn/qkv_proj/bias:0", "model/layers2/attn/out_proj/weight:0", "model/layers2/attn/out_proj/bias:0", "model/layers2/attn_norm/weight:0", "model/layers2/attn_norm/bias:0", "model/layers2/ff/layer_1/weight:0", "model/layers2/ff/layer_1/bias:0", "model/layers2/ff/layer_2/weight:0", "model/layers2/ff/layer_2/bias:0", "model/layers2/ff_norm/weight:0", "model/layers2/ff_norm/bias:0", "model/layers3/attn/qkv_proj/weight:0", "model/layers3/attn/qkv_proj/bias:0", "model/layers3/attn/out_proj/weight:0", "model/layers3/attn/out_proj/bias:0", "model/layers3/attn_norm/weight:0", "model/layers3/attn_norm/bias:0", "model/layers3/ff/layer_1/weight:0", "model/layers3/ff/layer_1/bias:0", "model/layers3/ff/layer_2/weight:0", "model/layers3/ff/layer_2/bias:0", "model/layers3/ff_norm/weight:0", "model/layers3/ff_norm/bias:0", "model/layers4/attn/qkv_proj/weight:0", "model/layers4/attn/qkv_proj/bias:0", "model/layers4/attn/out_proj/weight:0", "model/layers4/attn/out_proj/bias:0", "model/layers4/attn_norm/weight:0", "model/layers4/attn_norm/bias:0", "model/layers4/ff/layer_1/weight:0", "model/layers4/ff/layer_1/bias:0", "model/layers4/ff/layer_2/weight:0", "model/layers4/ff/layer_2/bias:0", "model/layers4/ff_norm/weight:0", "model/layers4/ff_norm/bias:0", "model/layers5/attn/qkv_proj/weight:0", "model/layers5/attn/qkv_proj/bias:0", "model/layers5/attn/out_proj/weight:0", "model/layers5/attn/out_proj/bias:0", "model/layers5/attn_norm/weight:0", "model/layers5/attn_norm/bias:0", "model/layers5/ff/layer_1/weight:0", "model/layers5/ff/layer_1/bias:0", "model/layers5/ff/layer_2/weight:0", "model/layers5/ff/layer_2/bias:0", "model/layers5/ff_norm/weight:0", "model/layers5/ff_norm/bias:0", "model/layers6/attn/qkv_proj/weight:0", "model/layers6/attn/qkv_proj/bias:0", "model/layers6/attn/out_proj/weight:0", "model/layers6/attn/out_proj/bias:0", "model/layers6/attn_norm/weight:0", "model/layers6/attn_norm/bias:0", "model/layers6/ff/layer_1/weight:0", "model/layers6/ff/layer_1/bias:0", "model/layers6/ff/layer_2/weight:0", "model/layers6/ff/layer_2/bias:0", "model/layers6/ff_norm/weight:0", "model/layers6/ff_norm/bias:0", "model/layers7/attn/qkv_proj/weight:0", "model/layers7/attn/qkv_proj/bias:0", "model/layers7/attn/out_proj/weight:0", "model/layers7/attn/out_proj/bias:0", "model/layers7/attn_norm/weight:0", "model/layers7/attn_norm/bias:0", "model/layers7/ff/layer_1/weight:0", "model/layers7/ff/layer_1/bias:0", "model/layers7/ff/layer_2/weight:0", "model/layers7/ff/layer_2/bias:0", "model/layers7/ff_norm/weight:0", "model/layers7/ff_norm/bias:0", "model/layers8/attn/qkv_proj/weight:0", "model/layers8/attn/qkv_proj/bias:0", "model/layers8/attn/out_proj/weight:0", "model/layers8/attn/out_proj/bias:0", "model/layers8/attn_norm/weight:0", "model/layers8/attn_norm/bias:0", "model/layers8/ff/layer_1/weight:0", "model/layers8/ff/layer_1/bias:0", "model/layers8/ff/layer_2/weight:0", "model/layers8/ff/layer_2/bias:0", "model/layers8/ff_norm/weight:0", "model/layers8/ff_norm/bias:0", "model/layers9/attn/qkv_proj/weight:0", "model/layers9/attn/qkv_proj/bias:0", "model/layers9/attn/out_proj/weight:0", "model/layers9/attn/out_proj/bias:0", "model/layers9/attn_norm/weight:0", "model/layers9/attn_norm/bias:0", "model/layers9/ff/layer_1/weight:0", "model/layers9/ff/layer_1/bias:0", "model/layers9/ff/layer_2/weight:0", "model/layers9/ff/layer_2/bias:0", "model/layers9/ff_norm/weight:0", "model/layers9/ff_norm/bias:0", "model/layers10/attn/qkv_proj/weight:0", "model/layers10/attn/qkv_proj/bias:0", "model/layers10/attn/out_proj/weight:0", "model/layers10/attn/out_proj/bias:0", "model/layers10/attn_norm/weight:0", "model/layers10/attn_norm/bias:0", "model/layers10/ff/layer_1/weight:0", "model/layers10/ff/layer_1/bias:0", "model/layers10/ff/layer_2/weight:0", "model/layers10/ff/layer_2/bias:0", "model/layers10/ff_norm/weight:0", "model/layers10/ff_norm/bias:0", "model/layers11/attn/qkv_proj/weight:0", "model/layers11/attn/qkv_proj/bias:0", "model/layers11/attn/out_proj/weight:0", "model/layers11/attn/out_proj/bias:0", "model/layers11/attn_norm/weight:0", "model/layers11/attn_norm/bias:0", "model/layers11/ff/layer_1/weight:0", "model/layers11/ff/layer_1/bias:0", "model/layers11/ff/layer_2/weight:0", "model/layers11/ff/layer_2/bias:0", "model/layers11/ff_norm/weight:0", "model/layers11/ff_norm/bias:0"]