doxx9999 commited on
Commit
aadaea4
·
verified ·
1 Parent(s): 8a93932

Upload manifest.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. manifest.json +208 -208
manifest.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
  "encoder.embeddings.word_embeddings.weight": {
3
  "shape": [
4
- 32022,
5
  768
6
  ],
7
  "offset": 0,
8
- "size": 24592896
9
  },
10
  "encoder.embeddings.position_embeddings.weight": {
11
  "shape": [
12
  512,
13
  768
14
  ],
15
- "offset": 98371584,
16
  "size": 393216
17
  },
18
  "encoder.embeddings.token_type_embeddings.weight": {
@@ -20,21 +20,21 @@
20
  2,
21
  768
22
  ],
23
- "offset": 99944448,
24
  "size": 1536
25
  },
26
  "encoder.embeddings.LayerNorm.weight": {
27
  "shape": [
28
  768
29
  ],
30
- "offset": 99950592,
31
  "size": 768
32
  },
33
  "encoder.embeddings.LayerNorm.bias": {
34
  "shape": [
35
  768
36
  ],
37
- "offset": 99953664,
38
  "size": 768
39
  },
40
  "encoder.encoder.layer.0.attention.self.query.weight": {
@@ -42,14 +42,14 @@
42
  768,
43
  768
44
  ],
45
- "offset": 99956736,
46
  "size": 589824
47
  },
48
  "encoder.encoder.layer.0.attention.self.query.bias": {
49
  "shape": [
50
  768
51
  ],
52
- "offset": 102316032,
53
  "size": 768
54
  },
55
  "encoder.encoder.layer.0.attention.self.key.weight": {
@@ -57,14 +57,14 @@
57
  768,
58
  768
59
  ],
60
- "offset": 102319104,
61
  "size": 589824
62
  },
63
  "encoder.encoder.layer.0.attention.self.key.bias": {
64
  "shape": [
65
  768
66
  ],
67
- "offset": 104678400,
68
  "size": 768
69
  },
70
  "encoder.encoder.layer.0.attention.self.value.weight": {
@@ -72,14 +72,14 @@
72
  768,
73
  768
74
  ],
75
- "offset": 104681472,
76
  "size": 589824
77
  },
78
  "encoder.encoder.layer.0.attention.self.value.bias": {
79
  "shape": [
80
  768
81
  ],
82
- "offset": 107040768,
83
  "size": 768
84
  },
85
  "encoder.encoder.layer.0.attention.output.dense.weight": {
@@ -87,28 +87,28 @@
87
  768,
88
  768
89
  ],
90
- "offset": 107043840,
91
  "size": 589824
92
  },
93
  "encoder.encoder.layer.0.attention.output.dense.bias": {
94
  "shape": [
95
  768
96
  ],
97
- "offset": 109403136,
98
  "size": 768
99
  },
100
  "encoder.encoder.layer.0.attention.output.LayerNorm.weight": {
101
  "shape": [
102
  768
103
  ],
104
- "offset": 109406208,
105
  "size": 768
106
  },
107
  "encoder.encoder.layer.0.attention.output.LayerNorm.bias": {
108
  "shape": [
109
  768
110
  ],
111
- "offset": 109409280,
112
  "size": 768
113
  },
114
  "encoder.encoder.layer.0.intermediate.dense.weight": {
@@ -116,14 +116,14 @@
116
  3072,
117
  768
118
  ],
119
- "offset": 109412352,
120
  "size": 2359296
121
  },
122
  "encoder.encoder.layer.0.intermediate.dense.bias": {
123
  "shape": [
124
  3072
125
  ],
126
- "offset": 118849536,
127
  "size": 3072
128
  },
129
  "encoder.encoder.layer.0.output.dense.weight": {
@@ -131,28 +131,28 @@
131
  768,
132
  3072
133
  ],
134
- "offset": 118861824,
135
  "size": 2359296
136
  },
137
  "encoder.encoder.layer.0.output.dense.bias": {
138
  "shape": [
139
  768
140
  ],
141
- "offset": 128299008,
142
  "size": 768
143
  },
144
  "encoder.encoder.layer.0.output.LayerNorm.weight": {
145
  "shape": [
146
  768
147
  ],
148
- "offset": 128302080,
149
  "size": 768
150
  },
151
  "encoder.encoder.layer.0.output.LayerNorm.bias": {
152
  "shape": [
153
  768
154
  ],
155
- "offset": 128305152,
156
  "size": 768
157
  },
158
  "encoder.encoder.layer.1.attention.self.query.weight": {
@@ -160,14 +160,14 @@
160
  768,
161
  768
162
  ],
163
- "offset": 128308224,
164
  "size": 589824
165
  },
166
  "encoder.encoder.layer.1.attention.self.query.bias": {
167
  "shape": [
168
  768
169
  ],
170
- "offset": 130667520,
171
  "size": 768
172
  },
173
  "encoder.encoder.layer.1.attention.self.key.weight": {
@@ -175,14 +175,14 @@
175
  768,
176
  768
177
  ],
178
- "offset": 130670592,
179
  "size": 589824
180
  },
181
  "encoder.encoder.layer.1.attention.self.key.bias": {
182
  "shape": [
183
  768
184
  ],
185
- "offset": 133029888,
186
  "size": 768
187
  },
188
  "encoder.encoder.layer.1.attention.self.value.weight": {
@@ -190,14 +190,14 @@
190
  768,
191
  768
192
  ],
193
- "offset": 133032960,
194
  "size": 589824
195
  },
196
  "encoder.encoder.layer.1.attention.self.value.bias": {
197
  "shape": [
198
  768
199
  ],
200
- "offset": 135392256,
201
  "size": 768
202
  },
203
  "encoder.encoder.layer.1.attention.output.dense.weight": {
@@ -205,28 +205,28 @@
205
  768,
206
  768
207
  ],
208
- "offset": 135395328,
209
  "size": 589824
210
  },
211
  "encoder.encoder.layer.1.attention.output.dense.bias": {
212
  "shape": [
213
  768
214
  ],
215
- "offset": 137754624,
216
  "size": 768
217
  },
218
  "encoder.encoder.layer.1.attention.output.LayerNorm.weight": {
219
  "shape": [
220
  768
221
  ],
222
- "offset": 137757696,
223
  "size": 768
224
  },
225
  "encoder.encoder.layer.1.attention.output.LayerNorm.bias": {
226
  "shape": [
227
  768
228
  ],
229
- "offset": 137760768,
230
  "size": 768
231
  },
232
  "encoder.encoder.layer.1.intermediate.dense.weight": {
@@ -234,14 +234,14 @@
234
  3072,
235
  768
236
  ],
237
- "offset": 137763840,
238
  "size": 2359296
239
  },
240
  "encoder.encoder.layer.1.intermediate.dense.bias": {
241
  "shape": [
242
  3072
243
  ],
244
- "offset": 147201024,
245
  "size": 3072
246
  },
247
  "encoder.encoder.layer.1.output.dense.weight": {
@@ -249,28 +249,28 @@
249
  768,
250
  3072
251
  ],
252
- "offset": 147213312,
253
  "size": 2359296
254
  },
255
  "encoder.encoder.layer.1.output.dense.bias": {
256
  "shape": [
257
  768
258
  ],
259
- "offset": 156650496,
260
  "size": 768
261
  },
262
  "encoder.encoder.layer.1.output.LayerNorm.weight": {
263
  "shape": [
264
  768
265
  ],
266
- "offset": 156653568,
267
  "size": 768
268
  },
269
  "encoder.encoder.layer.1.output.LayerNorm.bias": {
270
  "shape": [
271
  768
272
  ],
273
- "offset": 156656640,
274
  "size": 768
275
  },
276
  "encoder.encoder.layer.2.attention.self.query.weight": {
@@ -278,14 +278,14 @@
278
  768,
279
  768
280
  ],
281
- "offset": 156659712,
282
  "size": 589824
283
  },
284
  "encoder.encoder.layer.2.attention.self.query.bias": {
285
  "shape": [
286
  768
287
  ],
288
- "offset": 159019008,
289
  "size": 768
290
  },
291
  "encoder.encoder.layer.2.attention.self.key.weight": {
@@ -293,14 +293,14 @@
293
  768,
294
  768
295
  ],
296
- "offset": 159022080,
297
  "size": 589824
298
  },
299
  "encoder.encoder.layer.2.attention.self.key.bias": {
300
  "shape": [
301
  768
302
  ],
303
- "offset": 161381376,
304
  "size": 768
305
  },
306
  "encoder.encoder.layer.2.attention.self.value.weight": {
@@ -308,14 +308,14 @@
308
  768,
309
  768
310
  ],
311
- "offset": 161384448,
312
  "size": 589824
313
  },
314
  "encoder.encoder.layer.2.attention.self.value.bias": {
315
  "shape": [
316
  768
317
  ],
318
- "offset": 163743744,
319
  "size": 768
320
  },
321
  "encoder.encoder.layer.2.attention.output.dense.weight": {
@@ -323,28 +323,28 @@
323
  768,
324
  768
325
  ],
326
- "offset": 163746816,
327
  "size": 589824
328
  },
329
  "encoder.encoder.layer.2.attention.output.dense.bias": {
330
  "shape": [
331
  768
332
  ],
333
- "offset": 166106112,
334
  "size": 768
335
  },
336
  "encoder.encoder.layer.2.attention.output.LayerNorm.weight": {
337
  "shape": [
338
  768
339
  ],
340
- "offset": 166109184,
341
  "size": 768
342
  },
343
  "encoder.encoder.layer.2.attention.output.LayerNorm.bias": {
344
  "shape": [
345
  768
346
  ],
347
- "offset": 166112256,
348
  "size": 768
349
  },
350
  "encoder.encoder.layer.2.intermediate.dense.weight": {
@@ -352,14 +352,14 @@
352
  3072,
353
  768
354
  ],
355
- "offset": 166115328,
356
  "size": 2359296
357
  },
358
  "encoder.encoder.layer.2.intermediate.dense.bias": {
359
  "shape": [
360
  3072
361
  ],
362
- "offset": 175552512,
363
  "size": 3072
364
  },
365
  "encoder.encoder.layer.2.output.dense.weight": {
@@ -367,28 +367,28 @@
367
  768,
368
  3072
369
  ],
370
- "offset": 175564800,
371
  "size": 2359296
372
  },
373
  "encoder.encoder.layer.2.output.dense.bias": {
374
  "shape": [
375
  768
376
  ],
377
- "offset": 185001984,
378
  "size": 768
379
  },
380
  "encoder.encoder.layer.2.output.LayerNorm.weight": {
381
  "shape": [
382
  768
383
  ],
384
- "offset": 185005056,
385
  "size": 768
386
  },
387
  "encoder.encoder.layer.2.output.LayerNorm.bias": {
388
  "shape": [
389
  768
390
  ],
391
- "offset": 185008128,
392
  "size": 768
393
  },
394
  "encoder.encoder.layer.3.attention.self.query.weight": {
@@ -396,14 +396,14 @@
396
  768,
397
  768
398
  ],
399
- "offset": 185011200,
400
  "size": 589824
401
  },
402
  "encoder.encoder.layer.3.attention.self.query.bias": {
403
  "shape": [
404
  768
405
  ],
406
- "offset": 187370496,
407
  "size": 768
408
  },
409
  "encoder.encoder.layer.3.attention.self.key.weight": {
@@ -411,14 +411,14 @@
411
  768,
412
  768
413
  ],
414
- "offset": 187373568,
415
  "size": 589824
416
  },
417
  "encoder.encoder.layer.3.attention.self.key.bias": {
418
  "shape": [
419
  768
420
  ],
421
- "offset": 189732864,
422
  "size": 768
423
  },
424
  "encoder.encoder.layer.3.attention.self.value.weight": {
@@ -426,14 +426,14 @@
426
  768,
427
  768
428
  ],
429
- "offset": 189735936,
430
  "size": 589824
431
  },
432
  "encoder.encoder.layer.3.attention.self.value.bias": {
433
  "shape": [
434
  768
435
  ],
436
- "offset": 192095232,
437
  "size": 768
438
  },
439
  "encoder.encoder.layer.3.attention.output.dense.weight": {
@@ -441,28 +441,28 @@
441
  768,
442
  768
443
  ],
444
- "offset": 192098304,
445
  "size": 589824
446
  },
447
  "encoder.encoder.layer.3.attention.output.dense.bias": {
448
  "shape": [
449
  768
450
  ],
451
- "offset": 194457600,
452
  "size": 768
453
  },
454
  "encoder.encoder.layer.3.attention.output.LayerNorm.weight": {
455
  "shape": [
456
  768
457
  ],
458
- "offset": 194460672,
459
  "size": 768
460
  },
461
  "encoder.encoder.layer.3.attention.output.LayerNorm.bias": {
462
  "shape": [
463
  768
464
  ],
465
- "offset": 194463744,
466
  "size": 768
467
  },
468
  "encoder.encoder.layer.3.intermediate.dense.weight": {
@@ -470,14 +470,14 @@
470
  3072,
471
  768
472
  ],
473
- "offset": 194466816,
474
  "size": 2359296
475
  },
476
  "encoder.encoder.layer.3.intermediate.dense.bias": {
477
  "shape": [
478
  3072
479
  ],
480
- "offset": 203904000,
481
  "size": 3072
482
  },
483
  "encoder.encoder.layer.3.output.dense.weight": {
@@ -485,28 +485,28 @@
485
  768,
486
  3072
487
  ],
488
- "offset": 203916288,
489
  "size": 2359296
490
  },
491
  "encoder.encoder.layer.3.output.dense.bias": {
492
  "shape": [
493
  768
494
  ],
495
- "offset": 213353472,
496
  "size": 768
497
  },
498
  "encoder.encoder.layer.3.output.LayerNorm.weight": {
499
  "shape": [
500
  768
501
  ],
502
- "offset": 213356544,
503
  "size": 768
504
  },
505
  "encoder.encoder.layer.3.output.LayerNorm.bias": {
506
  "shape": [
507
  768
508
  ],
509
- "offset": 213359616,
510
  "size": 768
511
  },
512
  "encoder.encoder.layer.4.attention.self.query.weight": {
@@ -514,14 +514,14 @@
514
  768,
515
  768
516
  ],
517
- "offset": 213362688,
518
  "size": 589824
519
  },
520
  "encoder.encoder.layer.4.attention.self.query.bias": {
521
  "shape": [
522
  768
523
  ],
524
- "offset": 215721984,
525
  "size": 768
526
  },
527
  "encoder.encoder.layer.4.attention.self.key.weight": {
@@ -529,14 +529,14 @@
529
  768,
530
  768
531
  ],
532
- "offset": 215725056,
533
  "size": 589824
534
  },
535
  "encoder.encoder.layer.4.attention.self.key.bias": {
536
  "shape": [
537
  768
538
  ],
539
- "offset": 218084352,
540
  "size": 768
541
  },
542
  "encoder.encoder.layer.4.attention.self.value.weight": {
@@ -544,14 +544,14 @@
544
  768,
545
  768
546
  ],
547
- "offset": 218087424,
548
  "size": 589824
549
  },
550
  "encoder.encoder.layer.4.attention.self.value.bias": {
551
  "shape": [
552
  768
553
  ],
554
- "offset": 220446720,
555
  "size": 768
556
  },
557
  "encoder.encoder.layer.4.attention.output.dense.weight": {
@@ -559,28 +559,28 @@
559
  768,
560
  768
561
  ],
562
- "offset": 220449792,
563
  "size": 589824
564
  },
565
  "encoder.encoder.layer.4.attention.output.dense.bias": {
566
  "shape": [
567
  768
568
  ],
569
- "offset": 222809088,
570
  "size": 768
571
  },
572
  "encoder.encoder.layer.4.attention.output.LayerNorm.weight": {
573
  "shape": [
574
  768
575
  ],
576
- "offset": 222812160,
577
  "size": 768
578
  },
579
  "encoder.encoder.layer.4.attention.output.LayerNorm.bias": {
580
  "shape": [
581
  768
582
  ],
583
- "offset": 222815232,
584
  "size": 768
585
  },
586
  "encoder.encoder.layer.4.intermediate.dense.weight": {
@@ -588,14 +588,14 @@
588
  3072,
589
  768
590
  ],
591
- "offset": 222818304,
592
  "size": 2359296
593
  },
594
  "encoder.encoder.layer.4.intermediate.dense.bias": {
595
  "shape": [
596
  3072
597
  ],
598
- "offset": 232255488,
599
  "size": 3072
600
  },
601
  "encoder.encoder.layer.4.output.dense.weight": {
@@ -603,28 +603,28 @@
603
  768,
604
  3072
605
  ],
606
- "offset": 232267776,
607
  "size": 2359296
608
  },
609
  "encoder.encoder.layer.4.output.dense.bias": {
610
  "shape": [
611
  768
612
  ],
613
- "offset": 241704960,
614
  "size": 768
615
  },
616
  "encoder.encoder.layer.4.output.LayerNorm.weight": {
617
  "shape": [
618
  768
619
  ],
620
- "offset": 241708032,
621
  "size": 768
622
  },
623
  "encoder.encoder.layer.4.output.LayerNorm.bias": {
624
  "shape": [
625
  768
626
  ],
627
- "offset": 241711104,
628
  "size": 768
629
  },
630
  "encoder.encoder.layer.5.attention.self.query.weight": {
@@ -632,14 +632,14 @@
632
  768,
633
  768
634
  ],
635
- "offset": 241714176,
636
  "size": 589824
637
  },
638
  "encoder.encoder.layer.5.attention.self.query.bias": {
639
  "shape": [
640
  768
641
  ],
642
- "offset": 244073472,
643
  "size": 768
644
  },
645
  "encoder.encoder.layer.5.attention.self.key.weight": {
@@ -647,14 +647,14 @@
647
  768,
648
  768
649
  ],
650
- "offset": 244076544,
651
  "size": 589824
652
  },
653
  "encoder.encoder.layer.5.attention.self.key.bias": {
654
  "shape": [
655
  768
656
  ],
657
- "offset": 246435840,
658
  "size": 768
659
  },
660
  "encoder.encoder.layer.5.attention.self.value.weight": {
@@ -662,14 +662,14 @@
662
  768,
663
  768
664
  ],
665
- "offset": 246438912,
666
  "size": 589824
667
  },
668
  "encoder.encoder.layer.5.attention.self.value.bias": {
669
  "shape": [
670
  768
671
  ],
672
- "offset": 248798208,
673
  "size": 768
674
  },
675
  "encoder.encoder.layer.5.attention.output.dense.weight": {
@@ -677,28 +677,28 @@
677
  768,
678
  768
679
  ],
680
- "offset": 248801280,
681
  "size": 589824
682
  },
683
  "encoder.encoder.layer.5.attention.output.dense.bias": {
684
  "shape": [
685
  768
686
  ],
687
- "offset": 251160576,
688
  "size": 768
689
  },
690
  "encoder.encoder.layer.5.attention.output.LayerNorm.weight": {
691
  "shape": [
692
  768
693
  ],
694
- "offset": 251163648,
695
  "size": 768
696
  },
697
  "encoder.encoder.layer.5.attention.output.LayerNorm.bias": {
698
  "shape": [
699
  768
700
  ],
701
- "offset": 251166720,
702
  "size": 768
703
  },
704
  "encoder.encoder.layer.5.intermediate.dense.weight": {
@@ -706,14 +706,14 @@
706
  3072,
707
  768
708
  ],
709
- "offset": 251169792,
710
  "size": 2359296
711
  },
712
  "encoder.encoder.layer.5.intermediate.dense.bias": {
713
  "shape": [
714
  3072
715
  ],
716
- "offset": 260606976,
717
  "size": 3072
718
  },
719
  "encoder.encoder.layer.5.output.dense.weight": {
@@ -721,28 +721,28 @@
721
  768,
722
  3072
723
  ],
724
- "offset": 260619264,
725
  "size": 2359296
726
  },
727
  "encoder.encoder.layer.5.output.dense.bias": {
728
  "shape": [
729
  768
730
  ],
731
- "offset": 270056448,
732
  "size": 768
733
  },
734
  "encoder.encoder.layer.5.output.LayerNorm.weight": {
735
  "shape": [
736
  768
737
  ],
738
- "offset": 270059520,
739
  "size": 768
740
  },
741
  "encoder.encoder.layer.5.output.LayerNorm.bias": {
742
  "shape": [
743
  768
744
  ],
745
- "offset": 270062592,
746
  "size": 768
747
  },
748
  "encoder.encoder.layer.6.attention.self.query.weight": {
@@ -750,14 +750,14 @@
750
  768,
751
  768
752
  ],
753
- "offset": 270065664,
754
  "size": 589824
755
  },
756
  "encoder.encoder.layer.6.attention.self.query.bias": {
757
  "shape": [
758
  768
759
  ],
760
- "offset": 272424960,
761
  "size": 768
762
  },
763
  "encoder.encoder.layer.6.attention.self.key.weight": {
@@ -765,14 +765,14 @@
765
  768,
766
  768
767
  ],
768
- "offset": 272428032,
769
  "size": 589824
770
  },
771
  "encoder.encoder.layer.6.attention.self.key.bias": {
772
  "shape": [
773
  768
774
  ],
775
- "offset": 274787328,
776
  "size": 768
777
  },
778
  "encoder.encoder.layer.6.attention.self.value.weight": {
@@ -780,14 +780,14 @@
780
  768,
781
  768
782
  ],
783
- "offset": 274790400,
784
  "size": 589824
785
  },
786
  "encoder.encoder.layer.6.attention.self.value.bias": {
787
  "shape": [
788
  768
789
  ],
790
- "offset": 277149696,
791
  "size": 768
792
  },
793
  "encoder.encoder.layer.6.attention.output.dense.weight": {
@@ -795,28 +795,28 @@
795
  768,
796
  768
797
  ],
798
- "offset": 277152768,
799
  "size": 589824
800
  },
801
  "encoder.encoder.layer.6.attention.output.dense.bias": {
802
  "shape": [
803
  768
804
  ],
805
- "offset": 279512064,
806
  "size": 768
807
  },
808
  "encoder.encoder.layer.6.attention.output.LayerNorm.weight": {
809
  "shape": [
810
  768
811
  ],
812
- "offset": 279515136,
813
  "size": 768
814
  },
815
  "encoder.encoder.layer.6.attention.output.LayerNorm.bias": {
816
  "shape": [
817
  768
818
  ],
819
- "offset": 279518208,
820
  "size": 768
821
  },
822
  "encoder.encoder.layer.6.intermediate.dense.weight": {
@@ -824,14 +824,14 @@
824
  3072,
825
  768
826
  ],
827
- "offset": 279521280,
828
  "size": 2359296
829
  },
830
  "encoder.encoder.layer.6.intermediate.dense.bias": {
831
  "shape": [
832
  3072
833
  ],
834
- "offset": 288958464,
835
  "size": 3072
836
  },
837
  "encoder.encoder.layer.6.output.dense.weight": {
@@ -839,28 +839,28 @@
839
  768,
840
  3072
841
  ],
842
- "offset": 288970752,
843
  "size": 2359296
844
  },
845
  "encoder.encoder.layer.6.output.dense.bias": {
846
  "shape": [
847
  768
848
  ],
849
- "offset": 298407936,
850
  "size": 768
851
  },
852
  "encoder.encoder.layer.6.output.LayerNorm.weight": {
853
  "shape": [
854
  768
855
  ],
856
- "offset": 298411008,
857
  "size": 768
858
  },
859
  "encoder.encoder.layer.6.output.LayerNorm.bias": {
860
  "shape": [
861
  768
862
  ],
863
- "offset": 298414080,
864
  "size": 768
865
  },
866
  "encoder.encoder.layer.7.attention.self.query.weight": {
@@ -868,14 +868,14 @@
868
  768,
869
  768
870
  ],
871
- "offset": 298417152,
872
  "size": 589824
873
  },
874
  "encoder.encoder.layer.7.attention.self.query.bias": {
875
  "shape": [
876
  768
877
  ],
878
- "offset": 300776448,
879
  "size": 768
880
  },
881
  "encoder.encoder.layer.7.attention.self.key.weight": {
@@ -883,14 +883,14 @@
883
  768,
884
  768
885
  ],
886
- "offset": 300779520,
887
  "size": 589824
888
  },
889
  "encoder.encoder.layer.7.attention.self.key.bias": {
890
  "shape": [
891
  768
892
  ],
893
- "offset": 303138816,
894
  "size": 768
895
  },
896
  "encoder.encoder.layer.7.attention.self.value.weight": {
@@ -898,14 +898,14 @@
898
  768,
899
  768
900
  ],
901
- "offset": 303141888,
902
  "size": 589824
903
  },
904
  "encoder.encoder.layer.7.attention.self.value.bias": {
905
  "shape": [
906
  768
907
  ],
908
- "offset": 305501184,
909
  "size": 768
910
  },
911
  "encoder.encoder.layer.7.attention.output.dense.weight": {
@@ -913,28 +913,28 @@
913
  768,
914
  768
915
  ],
916
- "offset": 305504256,
917
  "size": 589824
918
  },
919
  "encoder.encoder.layer.7.attention.output.dense.bias": {
920
  "shape": [
921
  768
922
  ],
923
- "offset": 307863552,
924
  "size": 768
925
  },
926
  "encoder.encoder.layer.7.attention.output.LayerNorm.weight": {
927
  "shape": [
928
  768
929
  ],
930
- "offset": 307866624,
931
  "size": 768
932
  },
933
  "encoder.encoder.layer.7.attention.output.LayerNorm.bias": {
934
  "shape": [
935
  768
936
  ],
937
- "offset": 307869696,
938
  "size": 768
939
  },
940
  "encoder.encoder.layer.7.intermediate.dense.weight": {
@@ -942,14 +942,14 @@
942
  3072,
943
  768
944
  ],
945
- "offset": 307872768,
946
  "size": 2359296
947
  },
948
  "encoder.encoder.layer.7.intermediate.dense.bias": {
949
  "shape": [
950
  3072
951
  ],
952
- "offset": 317309952,
953
  "size": 3072
954
  },
955
  "encoder.encoder.layer.7.output.dense.weight": {
@@ -957,28 +957,28 @@
957
  768,
958
  3072
959
  ],
960
- "offset": 317322240,
961
  "size": 2359296
962
  },
963
  "encoder.encoder.layer.7.output.dense.bias": {
964
  "shape": [
965
  768
966
  ],
967
- "offset": 326759424,
968
  "size": 768
969
  },
970
  "encoder.encoder.layer.7.output.LayerNorm.weight": {
971
  "shape": [
972
  768
973
  ],
974
- "offset": 326762496,
975
  "size": 768
976
  },
977
  "encoder.encoder.layer.7.output.LayerNorm.bias": {
978
  "shape": [
979
  768
980
  ],
981
- "offset": 326765568,
982
  "size": 768
983
  },
984
  "encoder.encoder.layer.8.attention.self.query.weight": {
@@ -986,14 +986,14 @@
986
  768,
987
  768
988
  ],
989
- "offset": 326768640,
990
  "size": 589824
991
  },
992
  "encoder.encoder.layer.8.attention.self.query.bias": {
993
  "shape": [
994
  768
995
  ],
996
- "offset": 329127936,
997
  "size": 768
998
  },
999
  "encoder.encoder.layer.8.attention.self.key.weight": {
@@ -1001,14 +1001,14 @@
1001
  768,
1002
  768
1003
  ],
1004
- "offset": 329131008,
1005
  "size": 589824
1006
  },
1007
  "encoder.encoder.layer.8.attention.self.key.bias": {
1008
  "shape": [
1009
  768
1010
  ],
1011
- "offset": 331490304,
1012
  "size": 768
1013
  },
1014
  "encoder.encoder.layer.8.attention.self.value.weight": {
@@ -1016,14 +1016,14 @@
1016
  768,
1017
  768
1018
  ],
1019
- "offset": 331493376,
1020
  "size": 589824
1021
  },
1022
  "encoder.encoder.layer.8.attention.self.value.bias": {
1023
  "shape": [
1024
  768
1025
  ],
1026
- "offset": 333852672,
1027
  "size": 768
1028
  },
1029
  "encoder.encoder.layer.8.attention.output.dense.weight": {
@@ -1031,28 +1031,28 @@
1031
  768,
1032
  768
1033
  ],
1034
- "offset": 333855744,
1035
  "size": 589824
1036
  },
1037
  "encoder.encoder.layer.8.attention.output.dense.bias": {
1038
  "shape": [
1039
  768
1040
  ],
1041
- "offset": 336215040,
1042
  "size": 768
1043
  },
1044
  "encoder.encoder.layer.8.attention.output.LayerNorm.weight": {
1045
  "shape": [
1046
  768
1047
  ],
1048
- "offset": 336218112,
1049
  "size": 768
1050
  },
1051
  "encoder.encoder.layer.8.attention.output.LayerNorm.bias": {
1052
  "shape": [
1053
  768
1054
  ],
1055
- "offset": 336221184,
1056
  "size": 768
1057
  },
1058
  "encoder.encoder.layer.8.intermediate.dense.weight": {
@@ -1060,14 +1060,14 @@
1060
  3072,
1061
  768
1062
  ],
1063
- "offset": 336224256,
1064
  "size": 2359296
1065
  },
1066
  "encoder.encoder.layer.8.intermediate.dense.bias": {
1067
  "shape": [
1068
  3072
1069
  ],
1070
- "offset": 345661440,
1071
  "size": 3072
1072
  },
1073
  "encoder.encoder.layer.8.output.dense.weight": {
@@ -1075,28 +1075,28 @@
1075
  768,
1076
  3072
1077
  ],
1078
- "offset": 345673728,
1079
  "size": 2359296
1080
  },
1081
  "encoder.encoder.layer.8.output.dense.bias": {
1082
  "shape": [
1083
  768
1084
  ],
1085
- "offset": 355110912,
1086
  "size": 768
1087
  },
1088
  "encoder.encoder.layer.8.output.LayerNorm.weight": {
1089
  "shape": [
1090
  768
1091
  ],
1092
- "offset": 355113984,
1093
  "size": 768
1094
  },
1095
  "encoder.encoder.layer.8.output.LayerNorm.bias": {
1096
  "shape": [
1097
  768
1098
  ],
1099
- "offset": 355117056,
1100
  "size": 768
1101
  },
1102
  "encoder.encoder.layer.9.attention.self.query.weight": {
@@ -1104,14 +1104,14 @@
1104
  768,
1105
  768
1106
  ],
1107
- "offset": 355120128,
1108
  "size": 589824
1109
  },
1110
  "encoder.encoder.layer.9.attention.self.query.bias": {
1111
  "shape": [
1112
  768
1113
  ],
1114
- "offset": 357479424,
1115
  "size": 768
1116
  },
1117
  "encoder.encoder.layer.9.attention.self.key.weight": {
@@ -1119,14 +1119,14 @@
1119
  768,
1120
  768
1121
  ],
1122
- "offset": 357482496,
1123
  "size": 589824
1124
  },
1125
  "encoder.encoder.layer.9.attention.self.key.bias": {
1126
  "shape": [
1127
  768
1128
  ],
1129
- "offset": 359841792,
1130
  "size": 768
1131
  },
1132
  "encoder.encoder.layer.9.attention.self.value.weight": {
@@ -1134,14 +1134,14 @@
1134
  768,
1135
  768
1136
  ],
1137
- "offset": 359844864,
1138
  "size": 589824
1139
  },
1140
  "encoder.encoder.layer.9.attention.self.value.bias": {
1141
  "shape": [
1142
  768
1143
  ],
1144
- "offset": 362204160,
1145
  "size": 768
1146
  },
1147
  "encoder.encoder.layer.9.attention.output.dense.weight": {
@@ -1149,28 +1149,28 @@
1149
  768,
1150
  768
1151
  ],
1152
- "offset": 362207232,
1153
  "size": 589824
1154
  },
1155
  "encoder.encoder.layer.9.attention.output.dense.bias": {
1156
  "shape": [
1157
  768
1158
  ],
1159
- "offset": 364566528,
1160
  "size": 768
1161
  },
1162
  "encoder.encoder.layer.9.attention.output.LayerNorm.weight": {
1163
  "shape": [
1164
  768
1165
  ],
1166
- "offset": 364569600,
1167
  "size": 768
1168
  },
1169
  "encoder.encoder.layer.9.attention.output.LayerNorm.bias": {
1170
  "shape": [
1171
  768
1172
  ],
1173
- "offset": 364572672,
1174
  "size": 768
1175
  },
1176
  "encoder.encoder.layer.9.intermediate.dense.weight": {
@@ -1178,14 +1178,14 @@
1178
  3072,
1179
  768
1180
  ],
1181
- "offset": 364575744,
1182
  "size": 2359296
1183
  },
1184
  "encoder.encoder.layer.9.intermediate.dense.bias": {
1185
  "shape": [
1186
  3072
1187
  ],
1188
- "offset": 374012928,
1189
  "size": 3072
1190
  },
1191
  "encoder.encoder.layer.9.output.dense.weight": {
@@ -1193,28 +1193,28 @@
1193
  768,
1194
  3072
1195
  ],
1196
- "offset": 374025216,
1197
  "size": 2359296
1198
  },
1199
  "encoder.encoder.layer.9.output.dense.bias": {
1200
  "shape": [
1201
  768
1202
  ],
1203
- "offset": 383462400,
1204
  "size": 768
1205
  },
1206
  "encoder.encoder.layer.9.output.LayerNorm.weight": {
1207
  "shape": [
1208
  768
1209
  ],
1210
- "offset": 383465472,
1211
  "size": 768
1212
  },
1213
  "encoder.encoder.layer.9.output.LayerNorm.bias": {
1214
  "shape": [
1215
  768
1216
  ],
1217
- "offset": 383468544,
1218
  "size": 768
1219
  },
1220
  "encoder.encoder.layer.10.attention.self.query.weight": {
@@ -1222,14 +1222,14 @@
1222
  768,
1223
  768
1224
  ],
1225
- "offset": 383471616,
1226
  "size": 589824
1227
  },
1228
  "encoder.encoder.layer.10.attention.self.query.bias": {
1229
  "shape": [
1230
  768
1231
  ],
1232
- "offset": 385830912,
1233
  "size": 768
1234
  },
1235
  "encoder.encoder.layer.10.attention.self.key.weight": {
@@ -1237,14 +1237,14 @@
1237
  768,
1238
  768
1239
  ],
1240
- "offset": 385833984,
1241
  "size": 589824
1242
  },
1243
  "encoder.encoder.layer.10.attention.self.key.bias": {
1244
  "shape": [
1245
  768
1246
  ],
1247
- "offset": 388193280,
1248
  "size": 768
1249
  },
1250
  "encoder.encoder.layer.10.attention.self.value.weight": {
@@ -1252,14 +1252,14 @@
1252
  768,
1253
  768
1254
  ],
1255
- "offset": 388196352,
1256
  "size": 589824
1257
  },
1258
  "encoder.encoder.layer.10.attention.self.value.bias": {
1259
  "shape": [
1260
  768
1261
  ],
1262
- "offset": 390555648,
1263
  "size": 768
1264
  },
1265
  "encoder.encoder.layer.10.attention.output.dense.weight": {
@@ -1267,28 +1267,28 @@
1267
  768,
1268
  768
1269
  ],
1270
- "offset": 390558720,
1271
  "size": 589824
1272
  },
1273
  "encoder.encoder.layer.10.attention.output.dense.bias": {
1274
  "shape": [
1275
  768
1276
  ],
1277
- "offset": 392918016,
1278
  "size": 768
1279
  },
1280
  "encoder.encoder.layer.10.attention.output.LayerNorm.weight": {
1281
  "shape": [
1282
  768
1283
  ],
1284
- "offset": 392921088,
1285
  "size": 768
1286
  },
1287
  "encoder.encoder.layer.10.attention.output.LayerNorm.bias": {
1288
  "shape": [
1289
  768
1290
  ],
1291
- "offset": 392924160,
1292
  "size": 768
1293
  },
1294
  "encoder.encoder.layer.10.intermediate.dense.weight": {
@@ -1296,14 +1296,14 @@
1296
  3072,
1297
  768
1298
  ],
1299
- "offset": 392927232,
1300
  "size": 2359296
1301
  },
1302
  "encoder.encoder.layer.10.intermediate.dense.bias": {
1303
  "shape": [
1304
  3072
1305
  ],
1306
- "offset": 402364416,
1307
  "size": 3072
1308
  },
1309
  "encoder.encoder.layer.10.output.dense.weight": {
@@ -1311,28 +1311,28 @@
1311
  768,
1312
  3072
1313
  ],
1314
- "offset": 402376704,
1315
  "size": 2359296
1316
  },
1317
  "encoder.encoder.layer.10.output.dense.bias": {
1318
  "shape": [
1319
  768
1320
  ],
1321
- "offset": 411813888,
1322
  "size": 768
1323
  },
1324
  "encoder.encoder.layer.10.output.LayerNorm.weight": {
1325
  "shape": [
1326
  768
1327
  ],
1328
- "offset": 411816960,
1329
  "size": 768
1330
  },
1331
  "encoder.encoder.layer.10.output.LayerNorm.bias": {
1332
  "shape": [
1333
  768
1334
  ],
1335
- "offset": 411820032,
1336
  "size": 768
1337
  },
1338
  "encoder.encoder.layer.11.attention.self.query.weight": {
@@ -1340,14 +1340,14 @@
1340
  768,
1341
  768
1342
  ],
1343
- "offset": 411823104,
1344
  "size": 589824
1345
  },
1346
  "encoder.encoder.layer.11.attention.self.query.bias": {
1347
  "shape": [
1348
  768
1349
  ],
1350
- "offset": 414182400,
1351
  "size": 768
1352
  },
1353
  "encoder.encoder.layer.11.attention.self.key.weight": {
@@ -1355,14 +1355,14 @@
1355
  768,
1356
  768
1357
  ],
1358
- "offset": 414185472,
1359
  "size": 589824
1360
  },
1361
  "encoder.encoder.layer.11.attention.self.key.bias": {
1362
  "shape": [
1363
  768
1364
  ],
1365
- "offset": 416544768,
1366
  "size": 768
1367
  },
1368
  "encoder.encoder.layer.11.attention.self.value.weight": {
@@ -1370,14 +1370,14 @@
1370
  768,
1371
  768
1372
  ],
1373
- "offset": 416547840,
1374
  "size": 589824
1375
  },
1376
  "encoder.encoder.layer.11.attention.self.value.bias": {
1377
  "shape": [
1378
  768
1379
  ],
1380
- "offset": 418907136,
1381
  "size": 768
1382
  },
1383
  "encoder.encoder.layer.11.attention.output.dense.weight": {
@@ -1385,28 +1385,28 @@
1385
  768,
1386
  768
1387
  ],
1388
- "offset": 418910208,
1389
  "size": 589824
1390
  },
1391
  "encoder.encoder.layer.11.attention.output.dense.bias": {
1392
  "shape": [
1393
  768
1394
  ],
1395
- "offset": 421269504,
1396
  "size": 768
1397
  },
1398
  "encoder.encoder.layer.11.attention.output.LayerNorm.weight": {
1399
  "shape": [
1400
  768
1401
  ],
1402
- "offset": 421272576,
1403
  "size": 768
1404
  },
1405
  "encoder.encoder.layer.11.attention.output.LayerNorm.bias": {
1406
  "shape": [
1407
  768
1408
  ],
1409
- "offset": 421275648,
1410
  "size": 768
1411
  },
1412
  "encoder.encoder.layer.11.intermediate.dense.weight": {
@@ -1414,14 +1414,14 @@
1414
  3072,
1415
  768
1416
  ],
1417
- "offset": 421278720,
1418
  "size": 2359296
1419
  },
1420
  "encoder.encoder.layer.11.intermediate.dense.bias": {
1421
  "shape": [
1422
  3072
1423
  ],
1424
- "offset": 430715904,
1425
  "size": 3072
1426
  },
1427
  "encoder.encoder.layer.11.output.dense.weight": {
@@ -1429,28 +1429,28 @@
1429
  768,
1430
  3072
1431
  ],
1432
- "offset": 430728192,
1433
  "size": 2359296
1434
  },
1435
  "encoder.encoder.layer.11.output.dense.bias": {
1436
  "shape": [
1437
  768
1438
  ],
1439
- "offset": 440165376,
1440
  "size": 768
1441
  },
1442
  "encoder.encoder.layer.11.output.LayerNorm.weight": {
1443
  "shape": [
1444
  768
1445
  ],
1446
- "offset": 440168448,
1447
  "size": 768
1448
  },
1449
  "encoder.encoder.layer.11.output.LayerNorm.bias": {
1450
  "shape": [
1451
  768
1452
  ],
1453
- "offset": 440171520,
1454
  "size": 768
1455
  },
1456
  "encoder.pooler.dense.weight": {
@@ -1458,14 +1458,14 @@
1458
  768,
1459
  768
1460
  ],
1461
- "offset": 440174592,
1462
  "size": 589824
1463
  },
1464
  "encoder.pooler.dense.bias": {
1465
  "shape": [
1466
  768
1467
  ],
1468
- "offset": 442533888,
1469
  "size": 768
1470
  },
1471
  "classifier.1.weight": {
@@ -1473,29 +1473,29 @@
1473
  256,
1474
  768
1475
  ],
1476
- "offset": 442536960,
1477
  "size": 196608
1478
  },
1479
  "classifier.1.bias": {
1480
  "shape": [
1481
  256
1482
  ],
1483
- "offset": 443323392,
1484
  "size": 256
1485
  },
1486
  "classifier.4.weight": {
1487
  "shape": [
1488
- 15,
1489
  256
1490
  ],
1491
- "offset": 443324416,
1492
- "size": 3840
1493
  },
1494
  "classifier.4.bias": {
1495
  "shape": [
1496
- 15
1497
  ],
1498
- "offset": 443339776,
1499
- "size": 15
1500
  }
1501
  }
 
1
  {
2
  "encoder.embeddings.word_embeddings.weight": {
3
  "shape": [
4
+ 32035,
5
  768
6
  ],
7
  "offset": 0,
8
+ "size": 24602880
9
  },
10
  "encoder.embeddings.position_embeddings.weight": {
11
  "shape": [
12
  512,
13
  768
14
  ],
15
+ "offset": 98411520,
16
  "size": 393216
17
  },
18
  "encoder.embeddings.token_type_embeddings.weight": {
 
20
  2,
21
  768
22
  ],
23
+ "offset": 99984384,
24
  "size": 1536
25
  },
26
  "encoder.embeddings.LayerNorm.weight": {
27
  "shape": [
28
  768
29
  ],
30
+ "offset": 99990528,
31
  "size": 768
32
  },
33
  "encoder.embeddings.LayerNorm.bias": {
34
  "shape": [
35
  768
36
  ],
37
+ "offset": 99993600,
38
  "size": 768
39
  },
40
  "encoder.encoder.layer.0.attention.self.query.weight": {
 
42
  768,
43
  768
44
  ],
45
+ "offset": 99996672,
46
  "size": 589824
47
  },
48
  "encoder.encoder.layer.0.attention.self.query.bias": {
49
  "shape": [
50
  768
51
  ],
52
+ "offset": 102355968,
53
  "size": 768
54
  },
55
  "encoder.encoder.layer.0.attention.self.key.weight": {
 
57
  768,
58
  768
59
  ],
60
+ "offset": 102359040,
61
  "size": 589824
62
  },
63
  "encoder.encoder.layer.0.attention.self.key.bias": {
64
  "shape": [
65
  768
66
  ],
67
+ "offset": 104718336,
68
  "size": 768
69
  },
70
  "encoder.encoder.layer.0.attention.self.value.weight": {
 
72
  768,
73
  768
74
  ],
75
+ "offset": 104721408,
76
  "size": 589824
77
  },
78
  "encoder.encoder.layer.0.attention.self.value.bias": {
79
  "shape": [
80
  768
81
  ],
82
+ "offset": 107080704,
83
  "size": 768
84
  },
85
  "encoder.encoder.layer.0.attention.output.dense.weight": {
 
87
  768,
88
  768
89
  ],
90
+ "offset": 107083776,
91
  "size": 589824
92
  },
93
  "encoder.encoder.layer.0.attention.output.dense.bias": {
94
  "shape": [
95
  768
96
  ],
97
+ "offset": 109443072,
98
  "size": 768
99
  },
100
  "encoder.encoder.layer.0.attention.output.LayerNorm.weight": {
101
  "shape": [
102
  768
103
  ],
104
+ "offset": 109446144,
105
  "size": 768
106
  },
107
  "encoder.encoder.layer.0.attention.output.LayerNorm.bias": {
108
  "shape": [
109
  768
110
  ],
111
+ "offset": 109449216,
112
  "size": 768
113
  },
114
  "encoder.encoder.layer.0.intermediate.dense.weight": {
 
116
  3072,
117
  768
118
  ],
119
+ "offset": 109452288,
120
  "size": 2359296
121
  },
122
  "encoder.encoder.layer.0.intermediate.dense.bias": {
123
  "shape": [
124
  3072
125
  ],
126
+ "offset": 118889472,
127
  "size": 3072
128
  },
129
  "encoder.encoder.layer.0.output.dense.weight": {
 
131
  768,
132
  3072
133
  ],
134
+ "offset": 118901760,
135
  "size": 2359296
136
  },
137
  "encoder.encoder.layer.0.output.dense.bias": {
138
  "shape": [
139
  768
140
  ],
141
+ "offset": 128338944,
142
  "size": 768
143
  },
144
  "encoder.encoder.layer.0.output.LayerNorm.weight": {
145
  "shape": [
146
  768
147
  ],
148
+ "offset": 128342016,
149
  "size": 768
150
  },
151
  "encoder.encoder.layer.0.output.LayerNorm.bias": {
152
  "shape": [
153
  768
154
  ],
155
+ "offset": 128345088,
156
  "size": 768
157
  },
158
  "encoder.encoder.layer.1.attention.self.query.weight": {
 
160
  768,
161
  768
162
  ],
163
+ "offset": 128348160,
164
  "size": 589824
165
  },
166
  "encoder.encoder.layer.1.attention.self.query.bias": {
167
  "shape": [
168
  768
169
  ],
170
+ "offset": 130707456,
171
  "size": 768
172
  },
173
  "encoder.encoder.layer.1.attention.self.key.weight": {
 
175
  768,
176
  768
177
  ],
178
+ "offset": 130710528,
179
  "size": 589824
180
  },
181
  "encoder.encoder.layer.1.attention.self.key.bias": {
182
  "shape": [
183
  768
184
  ],
185
+ "offset": 133069824,
186
  "size": 768
187
  },
188
  "encoder.encoder.layer.1.attention.self.value.weight": {
 
190
  768,
191
  768
192
  ],
193
+ "offset": 133072896,
194
  "size": 589824
195
  },
196
  "encoder.encoder.layer.1.attention.self.value.bias": {
197
  "shape": [
198
  768
199
  ],
200
+ "offset": 135432192,
201
  "size": 768
202
  },
203
  "encoder.encoder.layer.1.attention.output.dense.weight": {
 
205
  768,
206
  768
207
  ],
208
+ "offset": 135435264,
209
  "size": 589824
210
  },
211
  "encoder.encoder.layer.1.attention.output.dense.bias": {
212
  "shape": [
213
  768
214
  ],
215
+ "offset": 137794560,
216
  "size": 768
217
  },
218
  "encoder.encoder.layer.1.attention.output.LayerNorm.weight": {
219
  "shape": [
220
  768
221
  ],
222
+ "offset": 137797632,
223
  "size": 768
224
  },
225
  "encoder.encoder.layer.1.attention.output.LayerNorm.bias": {
226
  "shape": [
227
  768
228
  ],
229
+ "offset": 137800704,
230
  "size": 768
231
  },
232
  "encoder.encoder.layer.1.intermediate.dense.weight": {
 
234
  3072,
235
  768
236
  ],
237
+ "offset": 137803776,
238
  "size": 2359296
239
  },
240
  "encoder.encoder.layer.1.intermediate.dense.bias": {
241
  "shape": [
242
  3072
243
  ],
244
+ "offset": 147240960,
245
  "size": 3072
246
  },
247
  "encoder.encoder.layer.1.output.dense.weight": {
 
249
  768,
250
  3072
251
  ],
252
+ "offset": 147253248,
253
  "size": 2359296
254
  },
255
  "encoder.encoder.layer.1.output.dense.bias": {
256
  "shape": [
257
  768
258
  ],
259
+ "offset": 156690432,
260
  "size": 768
261
  },
262
  "encoder.encoder.layer.1.output.LayerNorm.weight": {
263
  "shape": [
264
  768
265
  ],
266
+ "offset": 156693504,
267
  "size": 768
268
  },
269
  "encoder.encoder.layer.1.output.LayerNorm.bias": {
270
  "shape": [
271
  768
272
  ],
273
+ "offset": 156696576,
274
  "size": 768
275
  },
276
  "encoder.encoder.layer.2.attention.self.query.weight": {
 
278
  768,
279
  768
280
  ],
281
+ "offset": 156699648,
282
  "size": 589824
283
  },
284
  "encoder.encoder.layer.2.attention.self.query.bias": {
285
  "shape": [
286
  768
287
  ],
288
+ "offset": 159058944,
289
  "size": 768
290
  },
291
  "encoder.encoder.layer.2.attention.self.key.weight": {
 
293
  768,
294
  768
295
  ],
296
+ "offset": 159062016,
297
  "size": 589824
298
  },
299
  "encoder.encoder.layer.2.attention.self.key.bias": {
300
  "shape": [
301
  768
302
  ],
303
+ "offset": 161421312,
304
  "size": 768
305
  },
306
  "encoder.encoder.layer.2.attention.self.value.weight": {
 
308
  768,
309
  768
310
  ],
311
+ "offset": 161424384,
312
  "size": 589824
313
  },
314
  "encoder.encoder.layer.2.attention.self.value.bias": {
315
  "shape": [
316
  768
317
  ],
318
+ "offset": 163783680,
319
  "size": 768
320
  },
321
  "encoder.encoder.layer.2.attention.output.dense.weight": {
 
323
  768,
324
  768
325
  ],
326
+ "offset": 163786752,
327
  "size": 589824
328
  },
329
  "encoder.encoder.layer.2.attention.output.dense.bias": {
330
  "shape": [
331
  768
332
  ],
333
+ "offset": 166146048,
334
  "size": 768
335
  },
336
  "encoder.encoder.layer.2.attention.output.LayerNorm.weight": {
337
  "shape": [
338
  768
339
  ],
340
+ "offset": 166149120,
341
  "size": 768
342
  },
343
  "encoder.encoder.layer.2.attention.output.LayerNorm.bias": {
344
  "shape": [
345
  768
346
  ],
347
+ "offset": 166152192,
348
  "size": 768
349
  },
350
  "encoder.encoder.layer.2.intermediate.dense.weight": {
 
352
  3072,
353
  768
354
  ],
355
+ "offset": 166155264,
356
  "size": 2359296
357
  },
358
  "encoder.encoder.layer.2.intermediate.dense.bias": {
359
  "shape": [
360
  3072
361
  ],
362
+ "offset": 175592448,
363
  "size": 3072
364
  },
365
  "encoder.encoder.layer.2.output.dense.weight": {
 
367
  768,
368
  3072
369
  ],
370
+ "offset": 175604736,
371
  "size": 2359296
372
  },
373
  "encoder.encoder.layer.2.output.dense.bias": {
374
  "shape": [
375
  768
376
  ],
377
+ "offset": 185041920,
378
  "size": 768
379
  },
380
  "encoder.encoder.layer.2.output.LayerNorm.weight": {
381
  "shape": [
382
  768
383
  ],
384
+ "offset": 185044992,
385
  "size": 768
386
  },
387
  "encoder.encoder.layer.2.output.LayerNorm.bias": {
388
  "shape": [
389
  768
390
  ],
391
+ "offset": 185048064,
392
  "size": 768
393
  },
394
  "encoder.encoder.layer.3.attention.self.query.weight": {
 
396
  768,
397
  768
398
  ],
399
+ "offset": 185051136,
400
  "size": 589824
401
  },
402
  "encoder.encoder.layer.3.attention.self.query.bias": {
403
  "shape": [
404
  768
405
  ],
406
+ "offset": 187410432,
407
  "size": 768
408
  },
409
  "encoder.encoder.layer.3.attention.self.key.weight": {
 
411
  768,
412
  768
413
  ],
414
+ "offset": 187413504,
415
  "size": 589824
416
  },
417
  "encoder.encoder.layer.3.attention.self.key.bias": {
418
  "shape": [
419
  768
420
  ],
421
+ "offset": 189772800,
422
  "size": 768
423
  },
424
  "encoder.encoder.layer.3.attention.self.value.weight": {
 
426
  768,
427
  768
428
  ],
429
+ "offset": 189775872,
430
  "size": 589824
431
  },
432
  "encoder.encoder.layer.3.attention.self.value.bias": {
433
  "shape": [
434
  768
435
  ],
436
+ "offset": 192135168,
437
  "size": 768
438
  },
439
  "encoder.encoder.layer.3.attention.output.dense.weight": {
 
441
  768,
442
  768
443
  ],
444
+ "offset": 192138240,
445
  "size": 589824
446
  },
447
  "encoder.encoder.layer.3.attention.output.dense.bias": {
448
  "shape": [
449
  768
450
  ],
451
+ "offset": 194497536,
452
  "size": 768
453
  },
454
  "encoder.encoder.layer.3.attention.output.LayerNorm.weight": {
455
  "shape": [
456
  768
457
  ],
458
+ "offset": 194500608,
459
  "size": 768
460
  },
461
  "encoder.encoder.layer.3.attention.output.LayerNorm.bias": {
462
  "shape": [
463
  768
464
  ],
465
+ "offset": 194503680,
466
  "size": 768
467
  },
468
  "encoder.encoder.layer.3.intermediate.dense.weight": {
 
470
  3072,
471
  768
472
  ],
473
+ "offset": 194506752,
474
  "size": 2359296
475
  },
476
  "encoder.encoder.layer.3.intermediate.dense.bias": {
477
  "shape": [
478
  3072
479
  ],
480
+ "offset": 203943936,
481
  "size": 3072
482
  },
483
  "encoder.encoder.layer.3.output.dense.weight": {
 
485
  768,
486
  3072
487
  ],
488
+ "offset": 203956224,
489
  "size": 2359296
490
  },
491
  "encoder.encoder.layer.3.output.dense.bias": {
492
  "shape": [
493
  768
494
  ],
495
+ "offset": 213393408,
496
  "size": 768
497
  },
498
  "encoder.encoder.layer.3.output.LayerNorm.weight": {
499
  "shape": [
500
  768
501
  ],
502
+ "offset": 213396480,
503
  "size": 768
504
  },
505
  "encoder.encoder.layer.3.output.LayerNorm.bias": {
506
  "shape": [
507
  768
508
  ],
509
+ "offset": 213399552,
510
  "size": 768
511
  },
512
  "encoder.encoder.layer.4.attention.self.query.weight": {
 
514
  768,
515
  768
516
  ],
517
+ "offset": 213402624,
518
  "size": 589824
519
  },
520
  "encoder.encoder.layer.4.attention.self.query.bias": {
521
  "shape": [
522
  768
523
  ],
524
+ "offset": 215761920,
525
  "size": 768
526
  },
527
  "encoder.encoder.layer.4.attention.self.key.weight": {
 
529
  768,
530
  768
531
  ],
532
+ "offset": 215764992,
533
  "size": 589824
534
  },
535
  "encoder.encoder.layer.4.attention.self.key.bias": {
536
  "shape": [
537
  768
538
  ],
539
+ "offset": 218124288,
540
  "size": 768
541
  },
542
  "encoder.encoder.layer.4.attention.self.value.weight": {
 
544
  768,
545
  768
546
  ],
547
+ "offset": 218127360,
548
  "size": 589824
549
  },
550
  "encoder.encoder.layer.4.attention.self.value.bias": {
551
  "shape": [
552
  768
553
  ],
554
+ "offset": 220486656,
555
  "size": 768
556
  },
557
  "encoder.encoder.layer.4.attention.output.dense.weight": {
 
559
  768,
560
  768
561
  ],
562
+ "offset": 220489728,
563
  "size": 589824
564
  },
565
  "encoder.encoder.layer.4.attention.output.dense.bias": {
566
  "shape": [
567
  768
568
  ],
569
+ "offset": 222849024,
570
  "size": 768
571
  },
572
  "encoder.encoder.layer.4.attention.output.LayerNorm.weight": {
573
  "shape": [
574
  768
575
  ],
576
+ "offset": 222852096,
577
  "size": 768
578
  },
579
  "encoder.encoder.layer.4.attention.output.LayerNorm.bias": {
580
  "shape": [
581
  768
582
  ],
583
+ "offset": 222855168,
584
  "size": 768
585
  },
586
  "encoder.encoder.layer.4.intermediate.dense.weight": {
 
588
  3072,
589
  768
590
  ],
591
+ "offset": 222858240,
592
  "size": 2359296
593
  },
594
  "encoder.encoder.layer.4.intermediate.dense.bias": {
595
  "shape": [
596
  3072
597
  ],
598
+ "offset": 232295424,
599
  "size": 3072
600
  },
601
  "encoder.encoder.layer.4.output.dense.weight": {
 
603
  768,
604
  3072
605
  ],
606
+ "offset": 232307712,
607
  "size": 2359296
608
  },
609
  "encoder.encoder.layer.4.output.dense.bias": {
610
  "shape": [
611
  768
612
  ],
613
+ "offset": 241744896,
614
  "size": 768
615
  },
616
  "encoder.encoder.layer.4.output.LayerNorm.weight": {
617
  "shape": [
618
  768
619
  ],
620
+ "offset": 241747968,
621
  "size": 768
622
  },
623
  "encoder.encoder.layer.4.output.LayerNorm.bias": {
624
  "shape": [
625
  768
626
  ],
627
+ "offset": 241751040,
628
  "size": 768
629
  },
630
  "encoder.encoder.layer.5.attention.self.query.weight": {
 
632
  768,
633
  768
634
  ],
635
+ "offset": 241754112,
636
  "size": 589824
637
  },
638
  "encoder.encoder.layer.5.attention.self.query.bias": {
639
  "shape": [
640
  768
641
  ],
642
+ "offset": 244113408,
643
  "size": 768
644
  },
645
  "encoder.encoder.layer.5.attention.self.key.weight": {
 
647
  768,
648
  768
649
  ],
650
+ "offset": 244116480,
651
  "size": 589824
652
  },
653
  "encoder.encoder.layer.5.attention.self.key.bias": {
654
  "shape": [
655
  768
656
  ],
657
+ "offset": 246475776,
658
  "size": 768
659
  },
660
  "encoder.encoder.layer.5.attention.self.value.weight": {
 
662
  768,
663
  768
664
  ],
665
+ "offset": 246478848,
666
  "size": 589824
667
  },
668
  "encoder.encoder.layer.5.attention.self.value.bias": {
669
  "shape": [
670
  768
671
  ],
672
+ "offset": 248838144,
673
  "size": 768
674
  },
675
  "encoder.encoder.layer.5.attention.output.dense.weight": {
 
677
  768,
678
  768
679
  ],
680
+ "offset": 248841216,
681
  "size": 589824
682
  },
683
  "encoder.encoder.layer.5.attention.output.dense.bias": {
684
  "shape": [
685
  768
686
  ],
687
+ "offset": 251200512,
688
  "size": 768
689
  },
690
  "encoder.encoder.layer.5.attention.output.LayerNorm.weight": {
691
  "shape": [
692
  768
693
  ],
694
+ "offset": 251203584,
695
  "size": 768
696
  },
697
  "encoder.encoder.layer.5.attention.output.LayerNorm.bias": {
698
  "shape": [
699
  768
700
  ],
701
+ "offset": 251206656,
702
  "size": 768
703
  },
704
  "encoder.encoder.layer.5.intermediate.dense.weight": {
 
706
  3072,
707
  768
708
  ],
709
+ "offset": 251209728,
710
  "size": 2359296
711
  },
712
  "encoder.encoder.layer.5.intermediate.dense.bias": {
713
  "shape": [
714
  3072
715
  ],
716
+ "offset": 260646912,
717
  "size": 3072
718
  },
719
  "encoder.encoder.layer.5.output.dense.weight": {
 
721
  768,
722
  3072
723
  ],
724
+ "offset": 260659200,
725
  "size": 2359296
726
  },
727
  "encoder.encoder.layer.5.output.dense.bias": {
728
  "shape": [
729
  768
730
  ],
731
+ "offset": 270096384,
732
  "size": 768
733
  },
734
  "encoder.encoder.layer.5.output.LayerNorm.weight": {
735
  "shape": [
736
  768
737
  ],
738
+ "offset": 270099456,
739
  "size": 768
740
  },
741
  "encoder.encoder.layer.5.output.LayerNorm.bias": {
742
  "shape": [
743
  768
744
  ],
745
+ "offset": 270102528,
746
  "size": 768
747
  },
748
  "encoder.encoder.layer.6.attention.self.query.weight": {
 
750
  768,
751
  768
752
  ],
753
+ "offset": 270105600,
754
  "size": 589824
755
  },
756
  "encoder.encoder.layer.6.attention.self.query.bias": {
757
  "shape": [
758
  768
759
  ],
760
+ "offset": 272464896,
761
  "size": 768
762
  },
763
  "encoder.encoder.layer.6.attention.self.key.weight": {
 
765
  768,
766
  768
767
  ],
768
+ "offset": 272467968,
769
  "size": 589824
770
  },
771
  "encoder.encoder.layer.6.attention.self.key.bias": {
772
  "shape": [
773
  768
774
  ],
775
+ "offset": 274827264,
776
  "size": 768
777
  },
778
  "encoder.encoder.layer.6.attention.self.value.weight": {
 
780
  768,
781
  768
782
  ],
783
+ "offset": 274830336,
784
  "size": 589824
785
  },
786
  "encoder.encoder.layer.6.attention.self.value.bias": {
787
  "shape": [
788
  768
789
  ],
790
+ "offset": 277189632,
791
  "size": 768
792
  },
793
  "encoder.encoder.layer.6.attention.output.dense.weight": {
 
795
  768,
796
  768
797
  ],
798
+ "offset": 277192704,
799
  "size": 589824
800
  },
801
  "encoder.encoder.layer.6.attention.output.dense.bias": {
802
  "shape": [
803
  768
804
  ],
805
+ "offset": 279552000,
806
  "size": 768
807
  },
808
  "encoder.encoder.layer.6.attention.output.LayerNorm.weight": {
809
  "shape": [
810
  768
811
  ],
812
+ "offset": 279555072,
813
  "size": 768
814
  },
815
  "encoder.encoder.layer.6.attention.output.LayerNorm.bias": {
816
  "shape": [
817
  768
818
  ],
819
+ "offset": 279558144,
820
  "size": 768
821
  },
822
  "encoder.encoder.layer.6.intermediate.dense.weight": {
 
824
  3072,
825
  768
826
  ],
827
+ "offset": 279561216,
828
  "size": 2359296
829
  },
830
  "encoder.encoder.layer.6.intermediate.dense.bias": {
831
  "shape": [
832
  3072
833
  ],
834
+ "offset": 288998400,
835
  "size": 3072
836
  },
837
  "encoder.encoder.layer.6.output.dense.weight": {
 
839
  768,
840
  3072
841
  ],
842
+ "offset": 289010688,
843
  "size": 2359296
844
  },
845
  "encoder.encoder.layer.6.output.dense.bias": {
846
  "shape": [
847
  768
848
  ],
849
+ "offset": 298447872,
850
  "size": 768
851
  },
852
  "encoder.encoder.layer.6.output.LayerNorm.weight": {
853
  "shape": [
854
  768
855
  ],
856
+ "offset": 298450944,
857
  "size": 768
858
  },
859
  "encoder.encoder.layer.6.output.LayerNorm.bias": {
860
  "shape": [
861
  768
862
  ],
863
+ "offset": 298454016,
864
  "size": 768
865
  },
866
  "encoder.encoder.layer.7.attention.self.query.weight": {
 
868
  768,
869
  768
870
  ],
871
+ "offset": 298457088,
872
  "size": 589824
873
  },
874
  "encoder.encoder.layer.7.attention.self.query.bias": {
875
  "shape": [
876
  768
877
  ],
878
+ "offset": 300816384,
879
  "size": 768
880
  },
881
  "encoder.encoder.layer.7.attention.self.key.weight": {
 
883
  768,
884
  768
885
  ],
886
+ "offset": 300819456,
887
  "size": 589824
888
  },
889
  "encoder.encoder.layer.7.attention.self.key.bias": {
890
  "shape": [
891
  768
892
  ],
893
+ "offset": 303178752,
894
  "size": 768
895
  },
896
  "encoder.encoder.layer.7.attention.self.value.weight": {
 
898
  768,
899
  768
900
  ],
901
+ "offset": 303181824,
902
  "size": 589824
903
  },
904
  "encoder.encoder.layer.7.attention.self.value.bias": {
905
  "shape": [
906
  768
907
  ],
908
+ "offset": 305541120,
909
  "size": 768
910
  },
911
  "encoder.encoder.layer.7.attention.output.dense.weight": {
 
913
  768,
914
  768
915
  ],
916
+ "offset": 305544192,
917
  "size": 589824
918
  },
919
  "encoder.encoder.layer.7.attention.output.dense.bias": {
920
  "shape": [
921
  768
922
  ],
923
+ "offset": 307903488,
924
  "size": 768
925
  },
926
  "encoder.encoder.layer.7.attention.output.LayerNorm.weight": {
927
  "shape": [
928
  768
929
  ],
930
+ "offset": 307906560,
931
  "size": 768
932
  },
933
  "encoder.encoder.layer.7.attention.output.LayerNorm.bias": {
934
  "shape": [
935
  768
936
  ],
937
+ "offset": 307909632,
938
  "size": 768
939
  },
940
  "encoder.encoder.layer.7.intermediate.dense.weight": {
 
942
  3072,
943
  768
944
  ],
945
+ "offset": 307912704,
946
  "size": 2359296
947
  },
948
  "encoder.encoder.layer.7.intermediate.dense.bias": {
949
  "shape": [
950
  3072
951
  ],
952
+ "offset": 317349888,
953
  "size": 3072
954
  },
955
  "encoder.encoder.layer.7.output.dense.weight": {
 
957
  768,
958
  3072
959
  ],
960
+ "offset": 317362176,
961
  "size": 2359296
962
  },
963
  "encoder.encoder.layer.7.output.dense.bias": {
964
  "shape": [
965
  768
966
  ],
967
+ "offset": 326799360,
968
  "size": 768
969
  },
970
  "encoder.encoder.layer.7.output.LayerNorm.weight": {
971
  "shape": [
972
  768
973
  ],
974
+ "offset": 326802432,
975
  "size": 768
976
  },
977
  "encoder.encoder.layer.7.output.LayerNorm.bias": {
978
  "shape": [
979
  768
980
  ],
981
+ "offset": 326805504,
982
  "size": 768
983
  },
984
  "encoder.encoder.layer.8.attention.self.query.weight": {
 
986
  768,
987
  768
988
  ],
989
+ "offset": 326808576,
990
  "size": 589824
991
  },
992
  "encoder.encoder.layer.8.attention.self.query.bias": {
993
  "shape": [
994
  768
995
  ],
996
+ "offset": 329167872,
997
  "size": 768
998
  },
999
  "encoder.encoder.layer.8.attention.self.key.weight": {
 
1001
  768,
1002
  768
1003
  ],
1004
+ "offset": 329170944,
1005
  "size": 589824
1006
  },
1007
  "encoder.encoder.layer.8.attention.self.key.bias": {
1008
  "shape": [
1009
  768
1010
  ],
1011
+ "offset": 331530240,
1012
  "size": 768
1013
  },
1014
  "encoder.encoder.layer.8.attention.self.value.weight": {
 
1016
  768,
1017
  768
1018
  ],
1019
+ "offset": 331533312,
1020
  "size": 589824
1021
  },
1022
  "encoder.encoder.layer.8.attention.self.value.bias": {
1023
  "shape": [
1024
  768
1025
  ],
1026
+ "offset": 333892608,
1027
  "size": 768
1028
  },
1029
  "encoder.encoder.layer.8.attention.output.dense.weight": {
 
1031
  768,
1032
  768
1033
  ],
1034
+ "offset": 333895680,
1035
  "size": 589824
1036
  },
1037
  "encoder.encoder.layer.8.attention.output.dense.bias": {
1038
  "shape": [
1039
  768
1040
  ],
1041
+ "offset": 336254976,
1042
  "size": 768
1043
  },
1044
  "encoder.encoder.layer.8.attention.output.LayerNorm.weight": {
1045
  "shape": [
1046
  768
1047
  ],
1048
+ "offset": 336258048,
1049
  "size": 768
1050
  },
1051
  "encoder.encoder.layer.8.attention.output.LayerNorm.bias": {
1052
  "shape": [
1053
  768
1054
  ],
1055
+ "offset": 336261120,
1056
  "size": 768
1057
  },
1058
  "encoder.encoder.layer.8.intermediate.dense.weight": {
 
1060
  3072,
1061
  768
1062
  ],
1063
+ "offset": 336264192,
1064
  "size": 2359296
1065
  },
1066
  "encoder.encoder.layer.8.intermediate.dense.bias": {
1067
  "shape": [
1068
  3072
1069
  ],
1070
+ "offset": 345701376,
1071
  "size": 3072
1072
  },
1073
  "encoder.encoder.layer.8.output.dense.weight": {
 
1075
  768,
1076
  3072
1077
  ],
1078
+ "offset": 345713664,
1079
  "size": 2359296
1080
  },
1081
  "encoder.encoder.layer.8.output.dense.bias": {
1082
  "shape": [
1083
  768
1084
  ],
1085
+ "offset": 355150848,
1086
  "size": 768
1087
  },
1088
  "encoder.encoder.layer.8.output.LayerNorm.weight": {
1089
  "shape": [
1090
  768
1091
  ],
1092
+ "offset": 355153920,
1093
  "size": 768
1094
  },
1095
  "encoder.encoder.layer.8.output.LayerNorm.bias": {
1096
  "shape": [
1097
  768
1098
  ],
1099
+ "offset": 355156992,
1100
  "size": 768
1101
  },
1102
  "encoder.encoder.layer.9.attention.self.query.weight": {
 
1104
  768,
1105
  768
1106
  ],
1107
+ "offset": 355160064,
1108
  "size": 589824
1109
  },
1110
  "encoder.encoder.layer.9.attention.self.query.bias": {
1111
  "shape": [
1112
  768
1113
  ],
1114
+ "offset": 357519360,
1115
  "size": 768
1116
  },
1117
  "encoder.encoder.layer.9.attention.self.key.weight": {
 
1119
  768,
1120
  768
1121
  ],
1122
+ "offset": 357522432,
1123
  "size": 589824
1124
  },
1125
  "encoder.encoder.layer.9.attention.self.key.bias": {
1126
  "shape": [
1127
  768
1128
  ],
1129
+ "offset": 359881728,
1130
  "size": 768
1131
  },
1132
  "encoder.encoder.layer.9.attention.self.value.weight": {
 
1134
  768,
1135
  768
1136
  ],
1137
+ "offset": 359884800,
1138
  "size": 589824
1139
  },
1140
  "encoder.encoder.layer.9.attention.self.value.bias": {
1141
  "shape": [
1142
  768
1143
  ],
1144
+ "offset": 362244096,
1145
  "size": 768
1146
  },
1147
  "encoder.encoder.layer.9.attention.output.dense.weight": {
 
1149
  768,
1150
  768
1151
  ],
1152
+ "offset": 362247168,
1153
  "size": 589824
1154
  },
1155
  "encoder.encoder.layer.9.attention.output.dense.bias": {
1156
  "shape": [
1157
  768
1158
  ],
1159
+ "offset": 364606464,
1160
  "size": 768
1161
  },
1162
  "encoder.encoder.layer.9.attention.output.LayerNorm.weight": {
1163
  "shape": [
1164
  768
1165
  ],
1166
+ "offset": 364609536,
1167
  "size": 768
1168
  },
1169
  "encoder.encoder.layer.9.attention.output.LayerNorm.bias": {
1170
  "shape": [
1171
  768
1172
  ],
1173
+ "offset": 364612608,
1174
  "size": 768
1175
  },
1176
  "encoder.encoder.layer.9.intermediate.dense.weight": {
 
1178
  3072,
1179
  768
1180
  ],
1181
+ "offset": 364615680,
1182
  "size": 2359296
1183
  },
1184
  "encoder.encoder.layer.9.intermediate.dense.bias": {
1185
  "shape": [
1186
  3072
1187
  ],
1188
+ "offset": 374052864,
1189
  "size": 3072
1190
  },
1191
  "encoder.encoder.layer.9.output.dense.weight": {
 
1193
  768,
1194
  3072
1195
  ],
1196
+ "offset": 374065152,
1197
  "size": 2359296
1198
  },
1199
  "encoder.encoder.layer.9.output.dense.bias": {
1200
  "shape": [
1201
  768
1202
  ],
1203
+ "offset": 383502336,
1204
  "size": 768
1205
  },
1206
  "encoder.encoder.layer.9.output.LayerNorm.weight": {
1207
  "shape": [
1208
  768
1209
  ],
1210
+ "offset": 383505408,
1211
  "size": 768
1212
  },
1213
  "encoder.encoder.layer.9.output.LayerNorm.bias": {
1214
  "shape": [
1215
  768
1216
  ],
1217
+ "offset": 383508480,
1218
  "size": 768
1219
  },
1220
  "encoder.encoder.layer.10.attention.self.query.weight": {
 
1222
  768,
1223
  768
1224
  ],
1225
+ "offset": 383511552,
1226
  "size": 589824
1227
  },
1228
  "encoder.encoder.layer.10.attention.self.query.bias": {
1229
  "shape": [
1230
  768
1231
  ],
1232
+ "offset": 385870848,
1233
  "size": 768
1234
  },
1235
  "encoder.encoder.layer.10.attention.self.key.weight": {
 
1237
  768,
1238
  768
1239
  ],
1240
+ "offset": 385873920,
1241
  "size": 589824
1242
  },
1243
  "encoder.encoder.layer.10.attention.self.key.bias": {
1244
  "shape": [
1245
  768
1246
  ],
1247
+ "offset": 388233216,
1248
  "size": 768
1249
  },
1250
  "encoder.encoder.layer.10.attention.self.value.weight": {
 
1252
  768,
1253
  768
1254
  ],
1255
+ "offset": 388236288,
1256
  "size": 589824
1257
  },
1258
  "encoder.encoder.layer.10.attention.self.value.bias": {
1259
  "shape": [
1260
  768
1261
  ],
1262
+ "offset": 390595584,
1263
  "size": 768
1264
  },
1265
  "encoder.encoder.layer.10.attention.output.dense.weight": {
 
1267
  768,
1268
  768
1269
  ],
1270
+ "offset": 390598656,
1271
  "size": 589824
1272
  },
1273
  "encoder.encoder.layer.10.attention.output.dense.bias": {
1274
  "shape": [
1275
  768
1276
  ],
1277
+ "offset": 392957952,
1278
  "size": 768
1279
  },
1280
  "encoder.encoder.layer.10.attention.output.LayerNorm.weight": {
1281
  "shape": [
1282
  768
1283
  ],
1284
+ "offset": 392961024,
1285
  "size": 768
1286
  },
1287
  "encoder.encoder.layer.10.attention.output.LayerNorm.bias": {
1288
  "shape": [
1289
  768
1290
  ],
1291
+ "offset": 392964096,
1292
  "size": 768
1293
  },
1294
  "encoder.encoder.layer.10.intermediate.dense.weight": {
 
1296
  3072,
1297
  768
1298
  ],
1299
+ "offset": 392967168,
1300
  "size": 2359296
1301
  },
1302
  "encoder.encoder.layer.10.intermediate.dense.bias": {
1303
  "shape": [
1304
  3072
1305
  ],
1306
+ "offset": 402404352,
1307
  "size": 3072
1308
  },
1309
  "encoder.encoder.layer.10.output.dense.weight": {
 
1311
  768,
1312
  3072
1313
  ],
1314
+ "offset": 402416640,
1315
  "size": 2359296
1316
  },
1317
  "encoder.encoder.layer.10.output.dense.bias": {
1318
  "shape": [
1319
  768
1320
  ],
1321
+ "offset": 411853824,
1322
  "size": 768
1323
  },
1324
  "encoder.encoder.layer.10.output.LayerNorm.weight": {
1325
  "shape": [
1326
  768
1327
  ],
1328
+ "offset": 411856896,
1329
  "size": 768
1330
  },
1331
  "encoder.encoder.layer.10.output.LayerNorm.bias": {
1332
  "shape": [
1333
  768
1334
  ],
1335
+ "offset": 411859968,
1336
  "size": 768
1337
  },
1338
  "encoder.encoder.layer.11.attention.self.query.weight": {
 
1340
  768,
1341
  768
1342
  ],
1343
+ "offset": 411863040,
1344
  "size": 589824
1345
  },
1346
  "encoder.encoder.layer.11.attention.self.query.bias": {
1347
  "shape": [
1348
  768
1349
  ],
1350
+ "offset": 414222336,
1351
  "size": 768
1352
  },
1353
  "encoder.encoder.layer.11.attention.self.key.weight": {
 
1355
  768,
1356
  768
1357
  ],
1358
+ "offset": 414225408,
1359
  "size": 589824
1360
  },
1361
  "encoder.encoder.layer.11.attention.self.key.bias": {
1362
  "shape": [
1363
  768
1364
  ],
1365
+ "offset": 416584704,
1366
  "size": 768
1367
  },
1368
  "encoder.encoder.layer.11.attention.self.value.weight": {
 
1370
  768,
1371
  768
1372
  ],
1373
+ "offset": 416587776,
1374
  "size": 589824
1375
  },
1376
  "encoder.encoder.layer.11.attention.self.value.bias": {
1377
  "shape": [
1378
  768
1379
  ],
1380
+ "offset": 418947072,
1381
  "size": 768
1382
  },
1383
  "encoder.encoder.layer.11.attention.output.dense.weight": {
 
1385
  768,
1386
  768
1387
  ],
1388
+ "offset": 418950144,
1389
  "size": 589824
1390
  },
1391
  "encoder.encoder.layer.11.attention.output.dense.bias": {
1392
  "shape": [
1393
  768
1394
  ],
1395
+ "offset": 421309440,
1396
  "size": 768
1397
  },
1398
  "encoder.encoder.layer.11.attention.output.LayerNorm.weight": {
1399
  "shape": [
1400
  768
1401
  ],
1402
+ "offset": 421312512,
1403
  "size": 768
1404
  },
1405
  "encoder.encoder.layer.11.attention.output.LayerNorm.bias": {
1406
  "shape": [
1407
  768
1408
  ],
1409
+ "offset": 421315584,
1410
  "size": 768
1411
  },
1412
  "encoder.encoder.layer.11.intermediate.dense.weight": {
 
1414
  3072,
1415
  768
1416
  ],
1417
+ "offset": 421318656,
1418
  "size": 2359296
1419
  },
1420
  "encoder.encoder.layer.11.intermediate.dense.bias": {
1421
  "shape": [
1422
  3072
1423
  ],
1424
+ "offset": 430755840,
1425
  "size": 3072
1426
  },
1427
  "encoder.encoder.layer.11.output.dense.weight": {
 
1429
  768,
1430
  3072
1431
  ],
1432
+ "offset": 430768128,
1433
  "size": 2359296
1434
  },
1435
  "encoder.encoder.layer.11.output.dense.bias": {
1436
  "shape": [
1437
  768
1438
  ],
1439
+ "offset": 440205312,
1440
  "size": 768
1441
  },
1442
  "encoder.encoder.layer.11.output.LayerNorm.weight": {
1443
  "shape": [
1444
  768
1445
  ],
1446
+ "offset": 440208384,
1447
  "size": 768
1448
  },
1449
  "encoder.encoder.layer.11.output.LayerNorm.bias": {
1450
  "shape": [
1451
  768
1452
  ],
1453
+ "offset": 440211456,
1454
  "size": 768
1455
  },
1456
  "encoder.pooler.dense.weight": {
 
1458
  768,
1459
  768
1460
  ],
1461
+ "offset": 440214528,
1462
  "size": 589824
1463
  },
1464
  "encoder.pooler.dense.bias": {
1465
  "shape": [
1466
  768
1467
  ],
1468
+ "offset": 442573824,
1469
  "size": 768
1470
  },
1471
  "classifier.1.weight": {
 
1473
  256,
1474
  768
1475
  ],
1476
+ "offset": 442576896,
1477
  "size": 196608
1478
  },
1479
  "classifier.1.bias": {
1480
  "shape": [
1481
  256
1482
  ],
1483
+ "offset": 443363328,
1484
  "size": 256
1485
  },
1486
  "classifier.4.weight": {
1487
  "shape": [
1488
+ 11,
1489
  256
1490
  ],
1491
+ "offset": 443364352,
1492
+ "size": 2816
1493
  },
1494
  "classifier.4.bias": {
1495
  "shape": [
1496
+ 11
1497
  ],
1498
+ "offset": 443375616,
1499
+ "size": 11
1500
  }
1501
  }