File size: 7,461 Bytes
f89cf10 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 |
{
"metadata": {
"total_size": 351716
},
"weight_map": {
"embeddings/LayerNorm/bias": "flax_model-00004-of-00011.msgpack",
"embeddings/LayerNorm/scale": "flax_model-00004-of-00011.msgpack",
"embeddings/position_embeddings/embedding": "flax_model-00003-of-00011.msgpack",
"embeddings/token_type_embeddings/embedding": "flax_model-00004-of-00011.msgpack",
"embeddings/word_embeddings/embedding": "flax_model-00002-of-00011.msgpack",
"encoder/layer/0/attention/output/LayerNorm/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/attention/output/LayerNorm/scale": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/attention/output/dense/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/attention/output/dense/kernel": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/attention/self/key/bias": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/attention/self/key/kernel": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/attention/self/query/bias": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/attention/self/query/kernel": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/attention/self/value/bias": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/attention/self/value/kernel": "flax_model-00004-of-00011.msgpack",
"encoder/layer/0/intermediate/dense/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/intermediate/dense/kernel": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/output/LayerNorm/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/output/LayerNorm/scale": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/output/dense/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/0/output/dense/kernel": "flax_model-00005-of-00011.msgpack",
"encoder/layer/1/attention/output/LayerNorm/bias": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/output/LayerNorm/scale": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/output/dense/bias": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/output/dense/kernel": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/self/key/bias": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/self/key/kernel": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/self/query/bias": "flax_model-00005-of-00011.msgpack",
"encoder/layer/1/attention/self/query/kernel": "flax_model-00005-of-00011.msgpack",
"encoder/layer/1/attention/self/value/bias": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/attention/self/value/kernel": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/intermediate/dense/bias": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/intermediate/dense/kernel": "flax_model-00006-of-00011.msgpack",
"encoder/layer/1/output/LayerNorm/bias": "flax_model-00007-of-00011.msgpack",
"encoder/layer/1/output/LayerNorm/scale": "flax_model-00007-of-00011.msgpack",
"encoder/layer/1/output/dense/bias": "flax_model-00007-of-00011.msgpack",
"encoder/layer/1/output/dense/kernel": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/output/LayerNorm/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/attention/output/LayerNorm/scale": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/attention/output/dense/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/attention/output/dense/kernel": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/attention/self/key/bias": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/self/key/kernel": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/self/query/bias": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/self/query/kernel": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/self/value/bias": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/attention/self/value/kernel": "flax_model-00007-of-00011.msgpack",
"encoder/layer/2/intermediate/dense/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/intermediate/dense/kernel": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/output/LayerNorm/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/output/LayerNorm/scale": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/output/dense/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/2/output/dense/kernel": "flax_model-00008-of-00011.msgpack",
"encoder/layer/3/attention/output/LayerNorm/bias": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/output/LayerNorm/scale": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/output/dense/bias": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/output/dense/kernel": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/self/key/bias": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/self/key/kernel": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/self/query/bias": "flax_model-00008-of-00011.msgpack",
"encoder/layer/3/attention/self/query/kernel": "flax_model-00008-of-00011.msgpack",
"encoder/layer/3/attention/self/value/bias": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/attention/self/value/kernel": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/intermediate/dense/bias": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/intermediate/dense/kernel": "flax_model-00009-of-00011.msgpack",
"encoder/layer/3/output/LayerNorm/bias": "flax_model-00010-of-00011.msgpack",
"encoder/layer/3/output/LayerNorm/scale": "flax_model-00010-of-00011.msgpack",
"encoder/layer/3/output/dense/bias": "flax_model-00010-of-00011.msgpack",
"encoder/layer/3/output/dense/kernel": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/output/LayerNorm/bias": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/attention/output/LayerNorm/scale": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/attention/output/dense/bias": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/attention/output/dense/kernel": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/attention/self/key/bias": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/self/key/kernel": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/self/query/bias": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/self/query/kernel": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/self/value/bias": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/attention/self/value/kernel": "flax_model-00010-of-00011.msgpack",
"encoder/layer/4/intermediate/dense/bias": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/intermediate/dense/kernel": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/output/LayerNorm/bias": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/output/LayerNorm/scale": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/output/dense/bias": "flax_model-00011-of-00011.msgpack",
"encoder/layer/4/output/dense/kernel": "flax_model-00011-of-00011.msgpack",
"pooler/dense/bias": "flax_model-00011-of-00011.msgpack",
"pooler/dense/kernel": "flax_model-00011-of-00011.msgpack"
}
}
|