tiny-random-bert-sharded-subfolder / bert /flax_model.msgpack.index.json
patrickvonplaten's picture
up
f89cf10
raw
history blame
7.46 kB
{
"metadata": {
"total_size": 351716
},
"weight_map": {
"embeddings/LayerNorm/bias": "flax_model-00004-of-00011.msgpack",
"embeddings/LayerNorm/scale": "flax_model-00004-of-00011.msgpack",
"embeddings/position_embeddings/embedding": "flax_model-00003-of-00011.msgpack",
"embeddings/token_type_embeddings/embedding": "flax_model-00004-of-00011.msgpack",
"embeddings/word_embeddings/embedding": "flax_model-00002-of-00011.msgpack",
"encoder/layer/0/attention/output/LayerNorm/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/attention/output/LayerNorm/scale": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/attention/output/dense/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/attention/output/dense/kernel": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/attention/self/key/bias": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/attention/self/key/kernel": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/attention/self/query/bias": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/attention/self/query/kernel": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/attention/self/value/bias": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/attention/self/value/kernel": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/intermediate/dense/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/intermediate/dense/kernel": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/output/LayerNorm/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/output/LayerNorm/scale": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/output/dense/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/output/dense/kernel": "flax_model-00005-of-00011.msgpack",
"encoder/layer/1/attention/output/LayerNorm/bias": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/output/LayerNorm/scale": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/output/dense/bias": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/output/dense/kernel": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/self/key/bias": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/self/key/kernel": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/self/query/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/1/attention/self/query/kernel": "flax_model-00005-of-00011.msgpack",
"encoder/layer/1/attention/self/value/bias": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/self/value/kernel": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/intermediate/dense/bias": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/intermediate/dense/kernel": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/output/LayerNorm/bias": "flax_model-00007-of-00011.msgpack",
"encoder/layer/1/output/LayerNorm/scale": "flax_model-00007-of-00011.msgpack",
"encoder/layer/1/output/dense/bias": "flax_model-00007-of-00011.msgpack",
"encoder/layer/1/output/dense/kernel": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/output/LayerNorm/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/attention/output/LayerNorm/scale": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/attention/output/dense/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/attention/output/dense/kernel": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/attention/self/key/bias": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/self/key/kernel": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/self/query/bias": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/self/query/kernel": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/self/value/bias": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/self/value/kernel": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/intermediate/dense/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/intermediate/dense/kernel": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/output/LayerNorm/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/output/LayerNorm/scale": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/output/dense/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/output/dense/kernel": "flax_model-00008-of-00011.msgpack",
"encoder/layer/3/attention/output/LayerNorm/bias": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/output/LayerNorm/scale": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/output/dense/bias": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/output/dense/kernel": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/self/key/bias": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/self/key/kernel": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/self/query/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/3/attention/self/query/kernel": "flax_model-00008-of-00011.msgpack",
"encoder/layer/3/attention/self/value/bias": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/self/value/kernel": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/intermediate/dense/bias": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/intermediate/dense/kernel": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/output/LayerNorm/bias": "flax_model-00010-of-00011.msgpack",
"encoder/layer/3/output/LayerNorm/scale": "flax_model-00010-of-00011.msgpack",
"encoder/layer/3/output/dense/bias": "flax_model-00010-of-00011.msgpack",
"encoder/layer/3/output/dense/kernel": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/output/LayerNorm/bias": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/attention/output/LayerNorm/scale": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/attention/output/dense/bias": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/attention/output/dense/kernel": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/attention/self/key/bias": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/self/key/kernel": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/self/query/bias": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/self/query/kernel": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/self/value/bias": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/self/value/kernel": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/intermediate/dense/bias": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/intermediate/dense/kernel": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/output/LayerNorm/bias": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/output/LayerNorm/scale": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/output/dense/bias": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/output/dense/kernel": "flax_model-00011-of-00011.msgpack",
"pooler/dense/bias": "flax_model-00011-of-00011.msgpack",
"pooler/dense/kernel": "flax_model-00011-of-00011.msgpack"
}
}