mkshing commited on
Commit
42faf3f
·
verified ·
1 Parent(s): cf4821f

Add files using upload-large-folder tool

Browse files
mlc-chat-config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "version": "0.1.0",
3
  "model_type": "qwen2",
4
- "quantization": "q4f16_1",
5
  "model_config": {
6
  "hidden_act": "silu",
7
  "hidden_size": 1536,
@@ -27,11 +27,11 @@
27
  "attention_sink_size": -1,
28
  "tensor_parallel_shards": 1,
29
  "pipeline_parallel_stages": 1,
30
- "temperature": 0.7,
31
  "presence_penalty": 0.0,
32
  "frequency_penalty": 0.0,
33
  "repetition_penalty": 1.1,
34
- "top_p": 0.8,
35
  "tokenizer_files": [
36
  "tokenizer.json",
37
  "vocab.json",
@@ -47,7 +47,7 @@
47
  "conv_template": {
48
  "name": "qwen2",
49
  "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
50
- "system_message": "あなたは誠実で優秀な日本人のアシスタントです。",
51
  "system_prefix_token_ids": null,
52
  "add_role_after_system_message": true,
53
  "roles": {
 
1
  {
2
  "version": "0.1.0",
3
  "model_type": "qwen2",
4
+ "quantization": "q4f32_1",
5
  "model_config": {
6
  "hidden_act": "silu",
7
  "hidden_size": 1536,
 
27
  "attention_sink_size": -1,
28
  "tensor_parallel_shards": 1,
29
  "pipeline_parallel_stages": 1,
30
+ "temperature": 0.8,
31
  "presence_penalty": 0.0,
32
  "frequency_penalty": 0.0,
33
  "repetition_penalty": 1.1,
34
+ "top_p": 0.95,
35
  "tokenizer_files": [
36
  "tokenizer.json",
37
  "vocab.json",
 
47
  "conv_template": {
48
  "name": "qwen2",
49
  "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
50
+ "system_message": "あなたは、Sakana AI株式会社が開発したTinySwallowです。小型ながら、誠実で優秀なアシスタントです。",
51
  "system_prefix_token_ids": null,
52
  "add_role_after_system_message": true,
53
  "roles": {
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "metadata": {
3
  "ParamSize": 311,
4
- "ParamBytes": 868547584.0,
5
- "BitsPerParam": 4.501079412165634
6
  },
7
  "records": [
8
  {
@@ -22,7 +22,7 @@
22
  "byteOffset": 0
23
  }
24
  ],
25
- "md5sum": "450bb8d4d126170e2f4f6b3fd5ac19c8"
26
  },
27
  {
28
  "dataPath": "params_shard_1.bin",
@@ -35,7 +35,7 @@
35
  151936,
36
  48
37
  ],
38
- "dtype": "float16",
39
  "format": "f32-to-bf16",
40
  "nbytes": 14585856,
41
  "byteOffset": 0
@@ -45,7 +45,7 @@
45
  "shape": [
46
  1536
47
  ],
48
- "dtype": "float16",
49
  "format": "f32-to-bf16",
50
  "nbytes": 3072,
51
  "byteOffset": 14585856
@@ -67,13 +67,13 @@
67
  1536,
68
  280
69
  ],
70
- "dtype": "float16",
71
  "format": "f32-to-bf16",
72
  "nbytes": 860160,
73
  "byteOffset": 21470208
74
  }
75
  ],
76
- "md5sum": "8e981e4915b04c93adb4e1b322b2b113"
77
  },
78
  {
79
  "dataPath": "params_shard_2.bin",
@@ -97,7 +97,7 @@
97
  17920,
98
  48
99
  ],
100
- "dtype": "float16",
101
  "format": "f32-to-bf16",
102
  "nbytes": 1720320,
103
  "byteOffset": 13762560
@@ -107,7 +107,7 @@
107
  "shape": [
108
  1536
109
  ],
110
- "dtype": "float16",
111
  "format": "f32-to-bf16",
112
  "nbytes": 3072,
113
  "byteOffset": 15482880
@@ -117,7 +117,7 @@
117
  "shape": [
118
  2048
119
  ],
120
- "dtype": "float16",
121
  "format": "f32-to-bf16",
122
  "nbytes": 4096,
123
  "byteOffset": 15485952
@@ -139,7 +139,7 @@
139
  2048,
140
  48
141
  ],
142
- "dtype": "float16",
143
  "format": "f32-to-bf16",
144
  "nbytes": 196608,
145
  "byteOffset": 17062912
@@ -161,7 +161,7 @@
161
  1536,
162
  48
163
  ],
164
- "dtype": "float16",
165
  "format": "f32-to-bf16",
166
  "nbytes": 147456,
167
  "byteOffset": 18439168
@@ -171,7 +171,7 @@
171
  "shape": [
172
  1536
173
  ],
174
- "dtype": "float16",
175
  "format": "f32-to-bf16",
176
  "nbytes": 3072,
177
  "byteOffset": 18586624
@@ -193,13 +193,13 @@
193
  1536,
194
  280
195
  ],
196
- "dtype": "float16",
197
  "format": "f32-to-bf16",
198
  "nbytes": 860160,
199
  "byteOffset": 25470976
200
  }
201
  ],
202
- "md5sum": "9ecab38a4c03476d22715fcc2f2eaadc"
203
  },
204
  {
205
  "dataPath": "params_shard_3.bin",
@@ -223,7 +223,7 @@
223
  17920,
224
  48
225
  ],
226
- "dtype": "float16",
227
  "format": "f32-to-bf16",
228
  "nbytes": 1720320,
229
  "byteOffset": 13762560
@@ -233,7 +233,7 @@
233
  "shape": [
234
  1536
235
  ],
236
- "dtype": "float16",
237
  "format": "f32-to-bf16",
238
  "nbytes": 3072,
239
  "byteOffset": 15482880
@@ -243,7 +243,7 @@
243
  "shape": [
244
  2048
245
  ],
246
- "dtype": "float16",
247
  "format": "f32-to-bf16",
248
  "nbytes": 4096,
249
  "byteOffset": 15485952
@@ -265,7 +265,7 @@
265
  2048,
266
  48
267
  ],
268
- "dtype": "float16",
269
  "format": "f32-to-bf16",
270
  "nbytes": 196608,
271
  "byteOffset": 17062912
@@ -287,7 +287,7 @@
287
  1536,
288
  48
289
  ],
290
- "dtype": "float16",
291
  "format": "f32-to-bf16",
292
  "nbytes": 147456,
293
  "byteOffset": 18439168
@@ -297,7 +297,7 @@
297
  "shape": [
298
  1536
299
  ],
300
- "dtype": "float16",
301
  "format": "f32-to-bf16",
302
  "nbytes": 3072,
303
  "byteOffset": 18586624
@@ -319,13 +319,13 @@
319
  1536,
320
  280
321
  ],
322
- "dtype": "float16",
323
  "format": "f32-to-bf16",
324
  "nbytes": 860160,
325
  "byteOffset": 25470976
326
  }
327
  ],
328
- "md5sum": "12811d3c4ef3f98c78a960387c3b951c"
329
  },
330
  {
331
  "dataPath": "params_shard_4.bin",
@@ -349,7 +349,7 @@
349
  17920,
350
  48
351
  ],
352
- "dtype": "float16",
353
  "format": "f32-to-bf16",
354
  "nbytes": 1720320,
355
  "byteOffset": 13762560
@@ -359,7 +359,7 @@
359
  "shape": [
360
  1536
361
  ],
362
- "dtype": "float16",
363
  "format": "f32-to-bf16",
364
  "nbytes": 3072,
365
  "byteOffset": 15482880
@@ -369,7 +369,7 @@
369
  "shape": [
370
  2048
371
  ],
372
- "dtype": "float16",
373
  "format": "f32-to-bf16",
374
  "nbytes": 4096,
375
  "byteOffset": 15485952
@@ -391,7 +391,7 @@
391
  2048,
392
  48
393
  ],
394
- "dtype": "float16",
395
  "format": "f32-to-bf16",
396
  "nbytes": 196608,
397
  "byteOffset": 17062912
@@ -413,7 +413,7 @@
413
  1536,
414
  48
415
  ],
416
- "dtype": "float16",
417
  "format": "f32-to-bf16",
418
  "nbytes": 147456,
419
  "byteOffset": 18439168
@@ -423,7 +423,7 @@
423
  "shape": [
424
  1536
425
  ],
426
- "dtype": "float16",
427
  "format": "f32-to-bf16",
428
  "nbytes": 3072,
429
  "byteOffset": 18586624
@@ -445,13 +445,13 @@
445
  1536,
446
  280
447
  ],
448
- "dtype": "float16",
449
  "format": "f32-to-bf16",
450
  "nbytes": 860160,
451
  "byteOffset": 25470976
452
  }
453
  ],
454
- "md5sum": "617e2ff92e25bda277d85c40dcb78ec9"
455
  },
456
  {
457
  "dataPath": "params_shard_5.bin",
@@ -475,7 +475,7 @@
475
  17920,
476
  48
477
  ],
478
- "dtype": "float16",
479
  "format": "f32-to-bf16",
480
  "nbytes": 1720320,
481
  "byteOffset": 13762560
@@ -485,7 +485,7 @@
485
  "shape": [
486
  1536
487
  ],
488
- "dtype": "float16",
489
  "format": "f32-to-bf16",
490
  "nbytes": 3072,
491
  "byteOffset": 15482880
@@ -495,7 +495,7 @@
495
  "shape": [
496
  2048
497
  ],
498
- "dtype": "float16",
499
  "format": "f32-to-bf16",
500
  "nbytes": 4096,
501
  "byteOffset": 15485952
@@ -517,7 +517,7 @@
517
  2048,
518
  48
519
  ],
520
- "dtype": "float16",
521
  "format": "f32-to-bf16",
522
  "nbytes": 196608,
523
  "byteOffset": 17062912
@@ -539,7 +539,7 @@
539
  1536,
540
  48
541
  ],
542
- "dtype": "float16",
543
  "format": "f32-to-bf16",
544
  "nbytes": 147456,
545
  "byteOffset": 18439168
@@ -549,7 +549,7 @@
549
  "shape": [
550
  1536
551
  ],
552
- "dtype": "float16",
553
  "format": "f32-to-bf16",
554
  "nbytes": 3072,
555
  "byteOffset": 18586624
@@ -571,13 +571,13 @@
571
  1536,
572
  280
573
  ],
574
- "dtype": "float16",
575
  "format": "f32-to-bf16",
576
  "nbytes": 860160,
577
  "byteOffset": 25470976
578
  }
579
  ],
580
- "md5sum": "4c19884f208520dff3f58ca4b46b2c2e"
581
  },
582
  {
583
  "dataPath": "params_shard_6.bin",
@@ -601,7 +601,7 @@
601
  17920,
602
  48
603
  ],
604
- "dtype": "float16",
605
  "format": "f32-to-bf16",
606
  "nbytes": 1720320,
607
  "byteOffset": 13762560
@@ -611,7 +611,7 @@
611
  "shape": [
612
  1536
613
  ],
614
- "dtype": "float16",
615
  "format": "f32-to-bf16",
616
  "nbytes": 3072,
617
  "byteOffset": 15482880
@@ -621,7 +621,7 @@
621
  "shape": [
622
  2048
623
  ],
624
- "dtype": "float16",
625
  "format": "f32-to-bf16",
626
  "nbytes": 4096,
627
  "byteOffset": 15485952
@@ -643,7 +643,7 @@
643
  2048,
644
  48
645
  ],
646
- "dtype": "float16",
647
  "format": "f32-to-bf16",
648
  "nbytes": 196608,
649
  "byteOffset": 17062912
@@ -665,7 +665,7 @@
665
  1536,
666
  48
667
  ],
668
- "dtype": "float16",
669
  "format": "f32-to-bf16",
670
  "nbytes": 147456,
671
  "byteOffset": 18439168
@@ -675,7 +675,7 @@
675
  "shape": [
676
  1536
677
  ],
678
- "dtype": "float16",
679
  "format": "f32-to-bf16",
680
  "nbytes": 3072,
681
  "byteOffset": 18586624
@@ -697,13 +697,13 @@
697
  1536,
698
  280
699
  ],
700
- "dtype": "float16",
701
  "format": "f32-to-bf16",
702
  "nbytes": 860160,
703
  "byteOffset": 25470976
704
  }
705
  ],
706
- "md5sum": "a1405f132ddf28625e0eff82d567726a"
707
  },
708
  {
709
  "dataPath": "params_shard_7.bin",
@@ -727,7 +727,7 @@
727
  17920,
728
  48
729
  ],
730
- "dtype": "float16",
731
  "format": "f32-to-bf16",
732
  "nbytes": 1720320,
733
  "byteOffset": 13762560
@@ -737,7 +737,7 @@
737
  "shape": [
738
  1536
739
  ],
740
- "dtype": "float16",
741
  "format": "f32-to-bf16",
742
  "nbytes": 3072,
743
  "byteOffset": 15482880
@@ -747,7 +747,7 @@
747
  "shape": [
748
  2048
749
  ],
750
- "dtype": "float16",
751
  "format": "f32-to-bf16",
752
  "nbytes": 4096,
753
  "byteOffset": 15485952
@@ -769,7 +769,7 @@
769
  2048,
770
  48
771
  ],
772
- "dtype": "float16",
773
  "format": "f32-to-bf16",
774
  "nbytes": 196608,
775
  "byteOffset": 17062912
@@ -791,7 +791,7 @@
791
  1536,
792
  48
793
  ],
794
- "dtype": "float16",
795
  "format": "f32-to-bf16",
796
  "nbytes": 147456,
797
  "byteOffset": 18439168
@@ -801,7 +801,7 @@
801
  "shape": [
802
  1536
803
  ],
804
- "dtype": "float16",
805
  "format": "f32-to-bf16",
806
  "nbytes": 3072,
807
  "byteOffset": 18586624
@@ -823,13 +823,13 @@
823
  1536,
824
  280
825
  ],
826
- "dtype": "float16",
827
  "format": "f32-to-bf16",
828
  "nbytes": 860160,
829
  "byteOffset": 25470976
830
  }
831
  ],
832
- "md5sum": "e3699419202e19145b9c7f5310810bb6"
833
  },
834
  {
835
  "dataPath": "params_shard_8.bin",
@@ -853,7 +853,7 @@
853
  17920,
854
  48
855
  ],
856
- "dtype": "float16",
857
  "format": "f32-to-bf16",
858
  "nbytes": 1720320,
859
  "byteOffset": 13762560
@@ -863,7 +863,7 @@
863
  "shape": [
864
  1536
865
  ],
866
- "dtype": "float16",
867
  "format": "f32-to-bf16",
868
  "nbytes": 3072,
869
  "byteOffset": 15482880
@@ -873,7 +873,7 @@
873
  "shape": [
874
  2048
875
  ],
876
- "dtype": "float16",
877
  "format": "f32-to-bf16",
878
  "nbytes": 4096,
879
  "byteOffset": 15485952
@@ -895,7 +895,7 @@
895
  2048,
896
  48
897
  ],
898
- "dtype": "float16",
899
  "format": "f32-to-bf16",
900
  "nbytes": 196608,
901
  "byteOffset": 17062912
@@ -917,7 +917,7 @@
917
  1536,
918
  48
919
  ],
920
- "dtype": "float16",
921
  "format": "f32-to-bf16",
922
  "nbytes": 147456,
923
  "byteOffset": 18439168
@@ -927,7 +927,7 @@
927
  "shape": [
928
  1536
929
  ],
930
- "dtype": "float16",
931
  "format": "f32-to-bf16",
932
  "nbytes": 3072,
933
  "byteOffset": 18586624
@@ -949,13 +949,13 @@
949
  1536,
950
  280
951
  ],
952
- "dtype": "float16",
953
  "format": "f32-to-bf16",
954
  "nbytes": 860160,
955
  "byteOffset": 25470976
956
  }
957
  ],
958
- "md5sum": "d9f34e0a589eab04ddc1357ce2e6d8c2"
959
  },
960
  {
961
  "dataPath": "params_shard_9.bin",
@@ -979,7 +979,7 @@
979
  17920,
980
  48
981
  ],
982
- "dtype": "float16",
983
  "format": "f32-to-bf16",
984
  "nbytes": 1720320,
985
  "byteOffset": 13762560
@@ -989,7 +989,7 @@
989
  "shape": [
990
  1536
991
  ],
992
- "dtype": "float16",
993
  "format": "f32-to-bf16",
994
  "nbytes": 3072,
995
  "byteOffset": 15482880
@@ -999,7 +999,7 @@
999
  "shape": [
1000
  2048
1001
  ],
1002
- "dtype": "float16",
1003
  "format": "f32-to-bf16",
1004
  "nbytes": 4096,
1005
  "byteOffset": 15485952
@@ -1021,7 +1021,7 @@
1021
  2048,
1022
  48
1023
  ],
1024
- "dtype": "float16",
1025
  "format": "f32-to-bf16",
1026
  "nbytes": 196608,
1027
  "byteOffset": 17062912
@@ -1043,7 +1043,7 @@
1043
  1536,
1044
  48
1045
  ],
1046
- "dtype": "float16",
1047
  "format": "f32-to-bf16",
1048
  "nbytes": 147456,
1049
  "byteOffset": 18439168
@@ -1053,7 +1053,7 @@
1053
  "shape": [
1054
  1536
1055
  ],
1056
- "dtype": "float16",
1057
  "format": "f32-to-bf16",
1058
  "nbytes": 3072,
1059
  "byteOffset": 18586624
@@ -1075,13 +1075,13 @@
1075
  1536,
1076
  280
1077
  ],
1078
- "dtype": "float16",
1079
  "format": "f32-to-bf16",
1080
  "nbytes": 860160,
1081
  "byteOffset": 25470976
1082
  }
1083
  ],
1084
- "md5sum": "3096e37cb41d061dfe06cd3fec3f7ad9"
1085
  },
1086
  {
1087
  "dataPath": "params_shard_10.bin",
@@ -1105,7 +1105,7 @@
1105
  17920,
1106
  48
1107
  ],
1108
- "dtype": "float16",
1109
  "format": "f32-to-bf16",
1110
  "nbytes": 1720320,
1111
  "byteOffset": 13762560
@@ -1115,7 +1115,7 @@
1115
  "shape": [
1116
  1536
1117
  ],
1118
- "dtype": "float16",
1119
  "format": "f32-to-bf16",
1120
  "nbytes": 3072,
1121
  "byteOffset": 15482880
@@ -1125,7 +1125,7 @@
1125
  "shape": [
1126
  2048
1127
  ],
1128
- "dtype": "float16",
1129
  "format": "f32-to-bf16",
1130
  "nbytes": 4096,
1131
  "byteOffset": 15485952
@@ -1147,7 +1147,7 @@
1147
  2048,
1148
  48
1149
  ],
1150
- "dtype": "float16",
1151
  "format": "f32-to-bf16",
1152
  "nbytes": 196608,
1153
  "byteOffset": 17062912
@@ -1169,7 +1169,7 @@
1169
  1536,
1170
  48
1171
  ],
1172
- "dtype": "float16",
1173
  "format": "f32-to-bf16",
1174
  "nbytes": 147456,
1175
  "byteOffset": 18439168
@@ -1179,7 +1179,7 @@
1179
  "shape": [
1180
  1536
1181
  ],
1182
- "dtype": "float16",
1183
  "format": "f32-to-bf16",
1184
  "nbytes": 3072,
1185
  "byteOffset": 18586624
@@ -1201,13 +1201,13 @@
1201
  1536,
1202
  280
1203
  ],
1204
- "dtype": "float16",
1205
  "format": "f32-to-bf16",
1206
  "nbytes": 860160,
1207
  "byteOffset": 25470976
1208
  }
1209
  ],
1210
- "md5sum": "0a809a750f7fa18dc74c7f711c4540dd"
1211
  },
1212
  {
1213
  "dataPath": "params_shard_11.bin",
@@ -1231,7 +1231,7 @@
1231
  17920,
1232
  48
1233
  ],
1234
- "dtype": "float16",
1235
  "format": "f32-to-bf16",
1236
  "nbytes": 1720320,
1237
  "byteOffset": 13762560
@@ -1241,7 +1241,7 @@
1241
  "shape": [
1242
  1536
1243
  ],
1244
- "dtype": "float16",
1245
  "format": "f32-to-bf16",
1246
  "nbytes": 3072,
1247
  "byteOffset": 15482880
@@ -1251,7 +1251,7 @@
1251
  "shape": [
1252
  2048
1253
  ],
1254
- "dtype": "float16",
1255
  "format": "f32-to-bf16",
1256
  "nbytes": 4096,
1257
  "byteOffset": 15485952
@@ -1273,7 +1273,7 @@
1273
  2048,
1274
  48
1275
  ],
1276
- "dtype": "float16",
1277
  "format": "f32-to-bf16",
1278
  "nbytes": 196608,
1279
  "byteOffset": 17062912
@@ -1295,7 +1295,7 @@
1295
  1536,
1296
  48
1297
  ],
1298
- "dtype": "float16",
1299
  "format": "f32-to-bf16",
1300
  "nbytes": 147456,
1301
  "byteOffset": 18439168
@@ -1305,7 +1305,7 @@
1305
  "shape": [
1306
  1536
1307
  ],
1308
- "dtype": "float16",
1309
  "format": "f32-to-bf16",
1310
  "nbytes": 3072,
1311
  "byteOffset": 18586624
@@ -1327,13 +1327,13 @@
1327
  1536,
1328
  280
1329
  ],
1330
- "dtype": "float16",
1331
  "format": "f32-to-bf16",
1332
  "nbytes": 860160,
1333
  "byteOffset": 25470976
1334
  }
1335
  ],
1336
- "md5sum": "096c7401ddcb44074251a93087eb194f"
1337
  },
1338
  {
1339
  "dataPath": "params_shard_12.bin",
@@ -1357,7 +1357,7 @@
1357
  17920,
1358
  48
1359
  ],
1360
- "dtype": "float16",
1361
  "format": "f32-to-bf16",
1362
  "nbytes": 1720320,
1363
  "byteOffset": 13762560
@@ -1367,7 +1367,7 @@
1367
  "shape": [
1368
  1536
1369
  ],
1370
- "dtype": "float16",
1371
  "format": "f32-to-bf16",
1372
  "nbytes": 3072,
1373
  "byteOffset": 15482880
@@ -1377,7 +1377,7 @@
1377
  "shape": [
1378
  2048
1379
  ],
1380
- "dtype": "float16",
1381
  "format": "f32-to-bf16",
1382
  "nbytes": 4096,
1383
  "byteOffset": 15485952
@@ -1399,7 +1399,7 @@
1399
  2048,
1400
  48
1401
  ],
1402
- "dtype": "float16",
1403
  "format": "f32-to-bf16",
1404
  "nbytes": 196608,
1405
  "byteOffset": 17062912
@@ -1421,7 +1421,7 @@
1421
  1536,
1422
  48
1423
  ],
1424
- "dtype": "float16",
1425
  "format": "f32-to-bf16",
1426
  "nbytes": 147456,
1427
  "byteOffset": 18439168
@@ -1431,7 +1431,7 @@
1431
  "shape": [
1432
  1536
1433
  ],
1434
- "dtype": "float16",
1435
  "format": "f32-to-bf16",
1436
  "nbytes": 3072,
1437
  "byteOffset": 18586624
@@ -1453,13 +1453,13 @@
1453
  1536,
1454
  280
1455
  ],
1456
- "dtype": "float16",
1457
  "format": "f32-to-bf16",
1458
  "nbytes": 860160,
1459
  "byteOffset": 25470976
1460
  }
1461
  ],
1462
- "md5sum": "7c97e40e182bc106208e2560a0b1dfdb"
1463
  },
1464
  {
1465
  "dataPath": "params_shard_13.bin",
@@ -1483,7 +1483,7 @@
1483
  17920,
1484
  48
1485
  ],
1486
- "dtype": "float16",
1487
  "format": "f32-to-bf16",
1488
  "nbytes": 1720320,
1489
  "byteOffset": 13762560
@@ -1493,7 +1493,7 @@
1493
  "shape": [
1494
  1536
1495
  ],
1496
- "dtype": "float16",
1497
  "format": "f32-to-bf16",
1498
  "nbytes": 3072,
1499
  "byteOffset": 15482880
@@ -1503,7 +1503,7 @@
1503
  "shape": [
1504
  2048
1505
  ],
1506
- "dtype": "float16",
1507
  "format": "f32-to-bf16",
1508
  "nbytes": 4096,
1509
  "byteOffset": 15485952
@@ -1525,7 +1525,7 @@
1525
  2048,
1526
  48
1527
  ],
1528
- "dtype": "float16",
1529
  "format": "f32-to-bf16",
1530
  "nbytes": 196608,
1531
  "byteOffset": 17062912
@@ -1547,7 +1547,7 @@
1547
  1536,
1548
  48
1549
  ],
1550
- "dtype": "float16",
1551
  "format": "f32-to-bf16",
1552
  "nbytes": 147456,
1553
  "byteOffset": 18439168
@@ -1557,7 +1557,7 @@
1557
  "shape": [
1558
  1536
1559
  ],
1560
- "dtype": "float16",
1561
  "format": "f32-to-bf16",
1562
  "nbytes": 3072,
1563
  "byteOffset": 18586624
@@ -1579,13 +1579,13 @@
1579
  1536,
1580
  280
1581
  ],
1582
- "dtype": "float16",
1583
  "format": "f32-to-bf16",
1584
  "nbytes": 860160,
1585
  "byteOffset": 25470976
1586
  }
1587
  ],
1588
- "md5sum": "f054e51f4b823b1e69051495ab37ae21"
1589
  },
1590
  {
1591
  "dataPath": "params_shard_14.bin",
@@ -1609,7 +1609,7 @@
1609
  17920,
1610
  48
1611
  ],
1612
- "dtype": "float16",
1613
  "format": "f32-to-bf16",
1614
  "nbytes": 1720320,
1615
  "byteOffset": 13762560
@@ -1619,7 +1619,7 @@
1619
  "shape": [
1620
  1536
1621
  ],
1622
- "dtype": "float16",
1623
  "format": "f32-to-bf16",
1624
  "nbytes": 3072,
1625
  "byteOffset": 15482880
@@ -1629,7 +1629,7 @@
1629
  "shape": [
1630
  2048
1631
  ],
1632
- "dtype": "float16",
1633
  "format": "f32-to-bf16",
1634
  "nbytes": 4096,
1635
  "byteOffset": 15485952
@@ -1651,7 +1651,7 @@
1651
  2048,
1652
  48
1653
  ],
1654
- "dtype": "float16",
1655
  "format": "f32-to-bf16",
1656
  "nbytes": 196608,
1657
  "byteOffset": 17062912
@@ -1673,7 +1673,7 @@
1673
  1536,
1674
  48
1675
  ],
1676
- "dtype": "float16",
1677
  "format": "f32-to-bf16",
1678
  "nbytes": 147456,
1679
  "byteOffset": 18439168
@@ -1683,7 +1683,7 @@
1683
  "shape": [
1684
  1536
1685
  ],
1686
- "dtype": "float16",
1687
  "format": "f32-to-bf16",
1688
  "nbytes": 3072,
1689
  "byteOffset": 18586624
@@ -1705,13 +1705,13 @@
1705
  1536,
1706
  280
1707
  ],
1708
- "dtype": "float16",
1709
  "format": "f32-to-bf16",
1710
  "nbytes": 860160,
1711
  "byteOffset": 25470976
1712
  }
1713
  ],
1714
- "md5sum": "2d83f486ffcbd8bc26aae206f1ec92ab"
1715
  },
1716
  {
1717
  "dataPath": "params_shard_15.bin",
@@ -1735,7 +1735,7 @@
1735
  17920,
1736
  48
1737
  ],
1738
- "dtype": "float16",
1739
  "format": "f32-to-bf16",
1740
  "nbytes": 1720320,
1741
  "byteOffset": 13762560
@@ -1745,7 +1745,7 @@
1745
  "shape": [
1746
  1536
1747
  ],
1748
- "dtype": "float16",
1749
  "format": "f32-to-bf16",
1750
  "nbytes": 3072,
1751
  "byteOffset": 15482880
@@ -1755,7 +1755,7 @@
1755
  "shape": [
1756
  2048
1757
  ],
1758
- "dtype": "float16",
1759
  "format": "f32-to-bf16",
1760
  "nbytes": 4096,
1761
  "byteOffset": 15485952
@@ -1777,7 +1777,7 @@
1777
  2048,
1778
  48
1779
  ],
1780
- "dtype": "float16",
1781
  "format": "f32-to-bf16",
1782
  "nbytes": 196608,
1783
  "byteOffset": 17062912
@@ -1799,7 +1799,7 @@
1799
  1536,
1800
  48
1801
  ],
1802
- "dtype": "float16",
1803
  "format": "f32-to-bf16",
1804
  "nbytes": 147456,
1805
  "byteOffset": 18439168
@@ -1809,7 +1809,7 @@
1809
  "shape": [
1810
  1536
1811
  ],
1812
- "dtype": "float16",
1813
  "format": "f32-to-bf16",
1814
  "nbytes": 3072,
1815
  "byteOffset": 18586624
@@ -1831,13 +1831,13 @@
1831
  1536,
1832
  280
1833
  ],
1834
- "dtype": "float16",
1835
  "format": "f32-to-bf16",
1836
  "nbytes": 860160,
1837
  "byteOffset": 25470976
1838
  }
1839
  ],
1840
- "md5sum": "38b3b988ccd76505411541303820a8dd"
1841
  },
1842
  {
1843
  "dataPath": "params_shard_16.bin",
@@ -1861,7 +1861,7 @@
1861
  17920,
1862
  48
1863
  ],
1864
- "dtype": "float16",
1865
  "format": "f32-to-bf16",
1866
  "nbytes": 1720320,
1867
  "byteOffset": 13762560
@@ -1871,7 +1871,7 @@
1871
  "shape": [
1872
  1536
1873
  ],
1874
- "dtype": "float16",
1875
  "format": "f32-to-bf16",
1876
  "nbytes": 3072,
1877
  "byteOffset": 15482880
@@ -1881,7 +1881,7 @@
1881
  "shape": [
1882
  2048
1883
  ],
1884
- "dtype": "float16",
1885
  "format": "f32-to-bf16",
1886
  "nbytes": 4096,
1887
  "byteOffset": 15485952
@@ -1903,7 +1903,7 @@
1903
  2048,
1904
  48
1905
  ],
1906
- "dtype": "float16",
1907
  "format": "f32-to-bf16",
1908
  "nbytes": 196608,
1909
  "byteOffset": 17062912
@@ -1925,7 +1925,7 @@
1925
  1536,
1926
  48
1927
  ],
1928
- "dtype": "float16",
1929
  "format": "f32-to-bf16",
1930
  "nbytes": 147456,
1931
  "byteOffset": 18439168
@@ -1935,7 +1935,7 @@
1935
  "shape": [
1936
  1536
1937
  ],
1938
- "dtype": "float16",
1939
  "format": "f32-to-bf16",
1940
  "nbytes": 3072,
1941
  "byteOffset": 18586624
@@ -1957,13 +1957,13 @@
1957
  1536,
1958
  280
1959
  ],
1960
- "dtype": "float16",
1961
  "format": "f32-to-bf16",
1962
  "nbytes": 860160,
1963
  "byteOffset": 25470976
1964
  }
1965
  ],
1966
- "md5sum": "1f6c30324d81ac27220768eaaafcc20a"
1967
  },
1968
  {
1969
  "dataPath": "params_shard_17.bin",
@@ -1987,7 +1987,7 @@
1987
  17920,
1988
  48
1989
  ],
1990
- "dtype": "float16",
1991
  "format": "f32-to-bf16",
1992
  "nbytes": 1720320,
1993
  "byteOffset": 13762560
@@ -1997,7 +1997,7 @@
1997
  "shape": [
1998
  1536
1999
  ],
2000
- "dtype": "float16",
2001
  "format": "f32-to-bf16",
2002
  "nbytes": 3072,
2003
  "byteOffset": 15482880
@@ -2007,7 +2007,7 @@
2007
  "shape": [
2008
  2048
2009
  ],
2010
- "dtype": "float16",
2011
  "format": "f32-to-bf16",
2012
  "nbytes": 4096,
2013
  "byteOffset": 15485952
@@ -2029,7 +2029,7 @@
2029
  2048,
2030
  48
2031
  ],
2032
- "dtype": "float16",
2033
  "format": "f32-to-bf16",
2034
  "nbytes": 196608,
2035
  "byteOffset": 17062912
@@ -2051,7 +2051,7 @@
2051
  1536,
2052
  48
2053
  ],
2054
- "dtype": "float16",
2055
  "format": "f32-to-bf16",
2056
  "nbytes": 147456,
2057
  "byteOffset": 18439168
@@ -2061,7 +2061,7 @@
2061
  "shape": [
2062
  1536
2063
  ],
2064
- "dtype": "float16",
2065
  "format": "f32-to-bf16",
2066
  "nbytes": 3072,
2067
  "byteOffset": 18586624
@@ -2083,13 +2083,13 @@
2083
  1536,
2084
  280
2085
  ],
2086
- "dtype": "float16",
2087
  "format": "f32-to-bf16",
2088
  "nbytes": 860160,
2089
  "byteOffset": 25470976
2090
  }
2091
  ],
2092
- "md5sum": "fd9d1e826dd2d63cd9ceaaefcdf22ab0"
2093
  },
2094
  {
2095
  "dataPath": "params_shard_18.bin",
@@ -2113,7 +2113,7 @@
2113
  17920,
2114
  48
2115
  ],
2116
- "dtype": "float16",
2117
  "format": "f32-to-bf16",
2118
  "nbytes": 1720320,
2119
  "byteOffset": 13762560
@@ -2123,7 +2123,7 @@
2123
  "shape": [
2124
  1536
2125
  ],
2126
- "dtype": "float16",
2127
  "format": "f32-to-bf16",
2128
  "nbytes": 3072,
2129
  "byteOffset": 15482880
@@ -2133,7 +2133,7 @@
2133
  "shape": [
2134
  2048
2135
  ],
2136
- "dtype": "float16",
2137
  "format": "f32-to-bf16",
2138
  "nbytes": 4096,
2139
  "byteOffset": 15485952
@@ -2155,7 +2155,7 @@
2155
  2048,
2156
  48
2157
  ],
2158
- "dtype": "float16",
2159
  "format": "f32-to-bf16",
2160
  "nbytes": 196608,
2161
  "byteOffset": 17062912
@@ -2177,7 +2177,7 @@
2177
  1536,
2178
  48
2179
  ],
2180
- "dtype": "float16",
2181
  "format": "f32-to-bf16",
2182
  "nbytes": 147456,
2183
  "byteOffset": 18439168
@@ -2187,7 +2187,7 @@
2187
  "shape": [
2188
  1536
2189
  ],
2190
- "dtype": "float16",
2191
  "format": "f32-to-bf16",
2192
  "nbytes": 3072,
2193
  "byteOffset": 18586624
@@ -2209,13 +2209,13 @@
2209
  1536,
2210
  280
2211
  ],
2212
- "dtype": "float16",
2213
  "format": "f32-to-bf16",
2214
  "nbytes": 860160,
2215
  "byteOffset": 25470976
2216
  }
2217
  ],
2218
- "md5sum": "bafab13f62a6f951ad3d8be51ca0e490"
2219
  },
2220
  {
2221
  "dataPath": "params_shard_19.bin",
@@ -2239,7 +2239,7 @@
2239
  17920,
2240
  48
2241
  ],
2242
- "dtype": "float16",
2243
  "format": "f32-to-bf16",
2244
  "nbytes": 1720320,
2245
  "byteOffset": 13762560
@@ -2249,7 +2249,7 @@
2249
  "shape": [
2250
  1536
2251
  ],
2252
- "dtype": "float16",
2253
  "format": "f32-to-bf16",
2254
  "nbytes": 3072,
2255
  "byteOffset": 15482880
@@ -2259,7 +2259,7 @@
2259
  "shape": [
2260
  2048
2261
  ],
2262
- "dtype": "float16",
2263
  "format": "f32-to-bf16",
2264
  "nbytes": 4096,
2265
  "byteOffset": 15485952
@@ -2281,7 +2281,7 @@
2281
  2048,
2282
  48
2283
  ],
2284
- "dtype": "float16",
2285
  "format": "f32-to-bf16",
2286
  "nbytes": 196608,
2287
  "byteOffset": 17062912
@@ -2303,7 +2303,7 @@
2303
  1536,
2304
  48
2305
  ],
2306
- "dtype": "float16",
2307
  "format": "f32-to-bf16",
2308
  "nbytes": 147456,
2309
  "byteOffset": 18439168
@@ -2313,7 +2313,7 @@
2313
  "shape": [
2314
  1536
2315
  ],
2316
- "dtype": "float16",
2317
  "format": "f32-to-bf16",
2318
  "nbytes": 3072,
2319
  "byteOffset": 18586624
@@ -2335,13 +2335,13 @@
2335
  1536,
2336
  280
2337
  ],
2338
- "dtype": "float16",
2339
  "format": "f32-to-bf16",
2340
  "nbytes": 860160,
2341
  "byteOffset": 25470976
2342
  }
2343
  ],
2344
- "md5sum": "bab51688f2303b8c1cf82e4d78a6706d"
2345
  },
2346
  {
2347
  "dataPath": "params_shard_20.bin",
@@ -2365,7 +2365,7 @@
2365
  17920,
2366
  48
2367
  ],
2368
- "dtype": "float16",
2369
  "format": "f32-to-bf16",
2370
  "nbytes": 1720320,
2371
  "byteOffset": 13762560
@@ -2375,7 +2375,7 @@
2375
  "shape": [
2376
  1536
2377
  ],
2378
- "dtype": "float16",
2379
  "format": "f32-to-bf16",
2380
  "nbytes": 3072,
2381
  "byteOffset": 15482880
@@ -2385,7 +2385,7 @@
2385
  "shape": [
2386
  2048
2387
  ],
2388
- "dtype": "float16",
2389
  "format": "f32-to-bf16",
2390
  "nbytes": 4096,
2391
  "byteOffset": 15485952
@@ -2407,7 +2407,7 @@
2407
  2048,
2408
  48
2409
  ],
2410
- "dtype": "float16",
2411
  "format": "f32-to-bf16",
2412
  "nbytes": 196608,
2413
  "byteOffset": 17062912
@@ -2429,7 +2429,7 @@
2429
  1536,
2430
  48
2431
  ],
2432
- "dtype": "float16",
2433
  "format": "f32-to-bf16",
2434
  "nbytes": 147456,
2435
  "byteOffset": 18439168
@@ -2439,7 +2439,7 @@
2439
  "shape": [
2440
  1536
2441
  ],
2442
- "dtype": "float16",
2443
  "format": "f32-to-bf16",
2444
  "nbytes": 3072,
2445
  "byteOffset": 18586624
@@ -2461,13 +2461,13 @@
2461
  1536,
2462
  280
2463
  ],
2464
- "dtype": "float16",
2465
  "format": "f32-to-bf16",
2466
  "nbytes": 860160,
2467
  "byteOffset": 25470976
2468
  }
2469
  ],
2470
- "md5sum": "90d61b33069538ba7fab57c993858c5b"
2471
  },
2472
  {
2473
  "dataPath": "params_shard_21.bin",
@@ -2491,7 +2491,7 @@
2491
  17920,
2492
  48
2493
  ],
2494
- "dtype": "float16",
2495
  "format": "f32-to-bf16",
2496
  "nbytes": 1720320,
2497
  "byteOffset": 13762560
@@ -2501,7 +2501,7 @@
2501
  "shape": [
2502
  1536
2503
  ],
2504
- "dtype": "float16",
2505
  "format": "f32-to-bf16",
2506
  "nbytes": 3072,
2507
  "byteOffset": 15482880
@@ -2511,7 +2511,7 @@
2511
  "shape": [
2512
  2048
2513
  ],
2514
- "dtype": "float16",
2515
  "format": "f32-to-bf16",
2516
  "nbytes": 4096,
2517
  "byteOffset": 15485952
@@ -2533,7 +2533,7 @@
2533
  2048,
2534
  48
2535
  ],
2536
- "dtype": "float16",
2537
  "format": "f32-to-bf16",
2538
  "nbytes": 196608,
2539
  "byteOffset": 17062912
@@ -2555,7 +2555,7 @@
2555
  1536,
2556
  48
2557
  ],
2558
- "dtype": "float16",
2559
  "format": "f32-to-bf16",
2560
  "nbytes": 147456,
2561
  "byteOffset": 18439168
@@ -2565,7 +2565,7 @@
2565
  "shape": [
2566
  1536
2567
  ],
2568
- "dtype": "float16",
2569
  "format": "f32-to-bf16",
2570
  "nbytes": 3072,
2571
  "byteOffset": 18586624
@@ -2587,13 +2587,13 @@
2587
  1536,
2588
  280
2589
  ],
2590
- "dtype": "float16",
2591
  "format": "f32-to-bf16",
2592
  "nbytes": 860160,
2593
  "byteOffset": 25470976
2594
  }
2595
  ],
2596
- "md5sum": "918bd8c7a9a2929a11bd3f56162d286a"
2597
  },
2598
  {
2599
  "dataPath": "params_shard_22.bin",
@@ -2617,7 +2617,7 @@
2617
  17920,
2618
  48
2619
  ],
2620
- "dtype": "float16",
2621
  "format": "f32-to-bf16",
2622
  "nbytes": 1720320,
2623
  "byteOffset": 13762560
@@ -2627,7 +2627,7 @@
2627
  "shape": [
2628
  1536
2629
  ],
2630
- "dtype": "float16",
2631
  "format": "f32-to-bf16",
2632
  "nbytes": 3072,
2633
  "byteOffset": 15482880
@@ -2637,7 +2637,7 @@
2637
  "shape": [
2638
  2048
2639
  ],
2640
- "dtype": "float16",
2641
  "format": "f32-to-bf16",
2642
  "nbytes": 4096,
2643
  "byteOffset": 15485952
@@ -2659,7 +2659,7 @@
2659
  2048,
2660
  48
2661
  ],
2662
- "dtype": "float16",
2663
  "format": "f32-to-bf16",
2664
  "nbytes": 196608,
2665
  "byteOffset": 17062912
@@ -2681,7 +2681,7 @@
2681
  1536,
2682
  48
2683
  ],
2684
- "dtype": "float16",
2685
  "format": "f32-to-bf16",
2686
  "nbytes": 147456,
2687
  "byteOffset": 18439168
@@ -2691,7 +2691,7 @@
2691
  "shape": [
2692
  1536
2693
  ],
2694
- "dtype": "float16",
2695
  "format": "f32-to-bf16",
2696
  "nbytes": 3072,
2697
  "byteOffset": 18586624
@@ -2713,13 +2713,13 @@
2713
  1536,
2714
  280
2715
  ],
2716
- "dtype": "float16",
2717
  "format": "f32-to-bf16",
2718
  "nbytes": 860160,
2719
  "byteOffset": 25470976
2720
  }
2721
  ],
2722
- "md5sum": "2683ae2968156de5dbe0f64c6ee35c8a"
2723
  },
2724
  {
2725
  "dataPath": "params_shard_23.bin",
@@ -2743,7 +2743,7 @@
2743
  17920,
2744
  48
2745
  ],
2746
- "dtype": "float16",
2747
  "format": "f32-to-bf16",
2748
  "nbytes": 1720320,
2749
  "byteOffset": 13762560
@@ -2753,7 +2753,7 @@
2753
  "shape": [
2754
  1536
2755
  ],
2756
- "dtype": "float16",
2757
  "format": "f32-to-bf16",
2758
  "nbytes": 3072,
2759
  "byteOffset": 15482880
@@ -2763,7 +2763,7 @@
2763
  "shape": [
2764
  2048
2765
  ],
2766
- "dtype": "float16",
2767
  "format": "f32-to-bf16",
2768
  "nbytes": 4096,
2769
  "byteOffset": 15485952
@@ -2785,7 +2785,7 @@
2785
  2048,
2786
  48
2787
  ],
2788
- "dtype": "float16",
2789
  "format": "f32-to-bf16",
2790
  "nbytes": 196608,
2791
  "byteOffset": 17062912
@@ -2807,7 +2807,7 @@
2807
  1536,
2808
  48
2809
  ],
2810
- "dtype": "float16",
2811
  "format": "f32-to-bf16",
2812
  "nbytes": 147456,
2813
  "byteOffset": 18439168
@@ -2817,7 +2817,7 @@
2817
  "shape": [
2818
  1536
2819
  ],
2820
- "dtype": "float16",
2821
  "format": "f32-to-bf16",
2822
  "nbytes": 3072,
2823
  "byteOffset": 18586624
@@ -2839,13 +2839,13 @@
2839
  1536,
2840
  280
2841
  ],
2842
- "dtype": "float16",
2843
  "format": "f32-to-bf16",
2844
  "nbytes": 860160,
2845
  "byteOffset": 25470976
2846
  }
2847
  ],
2848
- "md5sum": "5995b02e3e4c9ca1df23321165cfa94a"
2849
  },
2850
  {
2851
  "dataPath": "params_shard_24.bin",
@@ -2869,7 +2869,7 @@
2869
  17920,
2870
  48
2871
  ],
2872
- "dtype": "float16",
2873
  "format": "f32-to-bf16",
2874
  "nbytes": 1720320,
2875
  "byteOffset": 13762560
@@ -2879,7 +2879,7 @@
2879
  "shape": [
2880
  1536
2881
  ],
2882
- "dtype": "float16",
2883
  "format": "f32-to-bf16",
2884
  "nbytes": 3072,
2885
  "byteOffset": 15482880
@@ -2889,7 +2889,7 @@
2889
  "shape": [
2890
  2048
2891
  ],
2892
- "dtype": "float16",
2893
  "format": "f32-to-bf16",
2894
  "nbytes": 4096,
2895
  "byteOffset": 15485952
@@ -2911,7 +2911,7 @@
2911
  2048,
2912
  48
2913
  ],
2914
- "dtype": "float16",
2915
  "format": "f32-to-bf16",
2916
  "nbytes": 196608,
2917
  "byteOffset": 17062912
@@ -2933,7 +2933,7 @@
2933
  1536,
2934
  48
2935
  ],
2936
- "dtype": "float16",
2937
  "format": "f32-to-bf16",
2938
  "nbytes": 147456,
2939
  "byteOffset": 18439168
@@ -2943,7 +2943,7 @@
2943
  "shape": [
2944
  1536
2945
  ],
2946
- "dtype": "float16",
2947
  "format": "f32-to-bf16",
2948
  "nbytes": 3072,
2949
  "byteOffset": 18586624
@@ -2965,13 +2965,13 @@
2965
  1536,
2966
  280
2967
  ],
2968
- "dtype": "float16",
2969
  "format": "f32-to-bf16",
2970
  "nbytes": 860160,
2971
  "byteOffset": 25470976
2972
  }
2973
  ],
2974
- "md5sum": "6d48ea82720cc53d766d23e3f043a14c"
2975
  },
2976
  {
2977
  "dataPath": "params_shard_25.bin",
@@ -2995,7 +2995,7 @@
2995
  17920,
2996
  48
2997
  ],
2998
- "dtype": "float16",
2999
  "format": "f32-to-bf16",
3000
  "nbytes": 1720320,
3001
  "byteOffset": 13762560
@@ -3005,7 +3005,7 @@
3005
  "shape": [
3006
  1536
3007
  ],
3008
- "dtype": "float16",
3009
  "format": "f32-to-bf16",
3010
  "nbytes": 3072,
3011
  "byteOffset": 15482880
@@ -3015,7 +3015,7 @@
3015
  "shape": [
3016
  2048
3017
  ],
3018
- "dtype": "float16",
3019
  "format": "f32-to-bf16",
3020
  "nbytes": 4096,
3021
  "byteOffset": 15485952
@@ -3037,7 +3037,7 @@
3037
  2048,
3038
  48
3039
  ],
3040
- "dtype": "float16",
3041
  "format": "f32-to-bf16",
3042
  "nbytes": 196608,
3043
  "byteOffset": 17062912
@@ -3059,7 +3059,7 @@
3059
  1536,
3060
  48
3061
  ],
3062
- "dtype": "float16",
3063
  "format": "f32-to-bf16",
3064
  "nbytes": 147456,
3065
  "byteOffset": 18439168
@@ -3069,7 +3069,7 @@
3069
  "shape": [
3070
  1536
3071
  ],
3072
- "dtype": "float16",
3073
  "format": "f32-to-bf16",
3074
  "nbytes": 3072,
3075
  "byteOffset": 18586624
@@ -3091,13 +3091,13 @@
3091
  1536,
3092
  280
3093
  ],
3094
- "dtype": "float16",
3095
  "format": "f32-to-bf16",
3096
  "nbytes": 860160,
3097
  "byteOffset": 25470976
3098
  }
3099
  ],
3100
- "md5sum": "d7561fd6ce999ff110f534a8a59ce60e"
3101
  },
3102
  {
3103
  "dataPath": "params_shard_26.bin",
@@ -3121,7 +3121,7 @@
3121
  17920,
3122
  48
3123
  ],
3124
- "dtype": "float16",
3125
  "format": "f32-to-bf16",
3126
  "nbytes": 1720320,
3127
  "byteOffset": 13762560
@@ -3131,7 +3131,7 @@
3131
  "shape": [
3132
  1536
3133
  ],
3134
- "dtype": "float16",
3135
  "format": "f32-to-bf16",
3136
  "nbytes": 3072,
3137
  "byteOffset": 15482880
@@ -3141,7 +3141,7 @@
3141
  "shape": [
3142
  2048
3143
  ],
3144
- "dtype": "float16",
3145
  "format": "f32-to-bf16",
3146
  "nbytes": 4096,
3147
  "byteOffset": 15485952
@@ -3163,7 +3163,7 @@
3163
  2048,
3164
  48
3165
  ],
3166
- "dtype": "float16",
3167
  "format": "f32-to-bf16",
3168
  "nbytes": 196608,
3169
  "byteOffset": 17062912
@@ -3185,7 +3185,7 @@
3185
  1536,
3186
  48
3187
  ],
3188
- "dtype": "float16",
3189
  "format": "f32-to-bf16",
3190
  "nbytes": 147456,
3191
  "byteOffset": 18439168
@@ -3195,7 +3195,7 @@
3195
  "shape": [
3196
  1536
3197
  ],
3198
- "dtype": "float16",
3199
  "format": "f32-to-bf16",
3200
  "nbytes": 3072,
3201
  "byteOffset": 18586624
@@ -3217,13 +3217,13 @@
3217
  1536,
3218
  280
3219
  ],
3220
- "dtype": "float16",
3221
  "format": "f32-to-bf16",
3222
  "nbytes": 860160,
3223
  "byteOffset": 25470976
3224
  }
3225
  ],
3226
- "md5sum": "6a36a2a3fcb758f1d75337d201b19881"
3227
  },
3228
  {
3229
  "dataPath": "params_shard_27.bin",
@@ -3247,7 +3247,7 @@
3247
  17920,
3248
  48
3249
  ],
3250
- "dtype": "float16",
3251
  "format": "f32-to-bf16",
3252
  "nbytes": 1720320,
3253
  "byteOffset": 13762560
@@ -3257,7 +3257,7 @@
3257
  "shape": [
3258
  1536
3259
  ],
3260
- "dtype": "float16",
3261
  "format": "f32-to-bf16",
3262
  "nbytes": 3072,
3263
  "byteOffset": 15482880
@@ -3267,7 +3267,7 @@
3267
  "shape": [
3268
  2048
3269
  ],
3270
- "dtype": "float16",
3271
  "format": "f32-to-bf16",
3272
  "nbytes": 4096,
3273
  "byteOffset": 15485952
@@ -3289,7 +3289,7 @@
3289
  2048,
3290
  48
3291
  ],
3292
- "dtype": "float16",
3293
  "format": "f32-to-bf16",
3294
  "nbytes": 196608,
3295
  "byteOffset": 17062912
@@ -3311,7 +3311,7 @@
3311
  1536,
3312
  48
3313
  ],
3314
- "dtype": "float16",
3315
  "format": "f32-to-bf16",
3316
  "nbytes": 147456,
3317
  "byteOffset": 18439168
@@ -3321,7 +3321,7 @@
3321
  "shape": [
3322
  1536
3323
  ],
3324
- "dtype": "float16",
3325
  "format": "f32-to-bf16",
3326
  "nbytes": 3072,
3327
  "byteOffset": 18586624
@@ -3343,13 +3343,13 @@
3343
  1536,
3344
  280
3345
  ],
3346
- "dtype": "float16",
3347
  "format": "f32-to-bf16",
3348
  "nbytes": 860160,
3349
  "byteOffset": 25470976
3350
  }
3351
  ],
3352
- "md5sum": "e912b5b70fd9dae95dfd25a9cdf386db"
3353
  },
3354
  {
3355
  "dataPath": "params_shard_28.bin",
@@ -3373,7 +3373,7 @@
3373
  17920,
3374
  48
3375
  ],
3376
- "dtype": "float16",
3377
  "format": "f32-to-bf16",
3378
  "nbytes": 1720320,
3379
  "byteOffset": 13762560
@@ -3383,7 +3383,7 @@
3383
  "shape": [
3384
  1536
3385
  ],
3386
- "dtype": "float16",
3387
  "format": "f32-to-bf16",
3388
  "nbytes": 3072,
3389
  "byteOffset": 15482880
@@ -3393,7 +3393,7 @@
3393
  "shape": [
3394
  2048
3395
  ],
3396
- "dtype": "float16",
3397
  "format": "f32-to-bf16",
3398
  "nbytes": 4096,
3399
  "byteOffset": 15485952
@@ -3415,7 +3415,7 @@
3415
  2048,
3416
  48
3417
  ],
3418
- "dtype": "float16",
3419
  "format": "f32-to-bf16",
3420
  "nbytes": 196608,
3421
  "byteOffset": 17062912
@@ -3437,7 +3437,7 @@
3437
  1536,
3438
  48
3439
  ],
3440
- "dtype": "float16",
3441
  "format": "f32-to-bf16",
3442
  "nbytes": 147456,
3443
  "byteOffset": 18439168
@@ -3447,7 +3447,7 @@
3447
  "shape": [
3448
  1536
3449
  ],
3450
- "dtype": "float16",
3451
  "format": "f32-to-bf16",
3452
  "nbytes": 3072,
3453
  "byteOffset": 18586624
@@ -3469,13 +3469,13 @@
3469
  1536,
3470
  280
3471
  ],
3472
- "dtype": "float16",
3473
  "format": "f32-to-bf16",
3474
  "nbytes": 860160,
3475
  "byteOffset": 25470976
3476
  }
3477
  ],
3478
- "md5sum": "70177ad0862c8cd72c3162829f947657"
3479
  },
3480
  {
3481
  "dataPath": "params_shard_29.bin",
@@ -3499,7 +3499,7 @@
3499
  17920,
3500
  48
3501
  ],
3502
- "dtype": "float16",
3503
  "format": "f32-to-bf16",
3504
  "nbytes": 1720320,
3505
  "byteOffset": 13762560
@@ -3509,7 +3509,7 @@
3509
  "shape": [
3510
  1536
3511
  ],
3512
- "dtype": "float16",
3513
  "format": "f32-to-bf16",
3514
  "nbytes": 3072,
3515
  "byteOffset": 15482880
@@ -3519,7 +3519,7 @@
3519
  "shape": [
3520
  2048
3521
  ],
3522
- "dtype": "float16",
3523
  "format": "f32-to-bf16",
3524
  "nbytes": 4096,
3525
  "byteOffset": 15485952
@@ -3541,7 +3541,7 @@
3541
  2048,
3542
  48
3543
  ],
3544
- "dtype": "float16",
3545
  "format": "f32-to-bf16",
3546
  "nbytes": 196608,
3547
  "byteOffset": 17062912
@@ -3563,7 +3563,7 @@
3563
  1536,
3564
  48
3565
  ],
3566
- "dtype": "float16",
3567
  "format": "f32-to-bf16",
3568
  "nbytes": 147456,
3569
  "byteOffset": 18439168
@@ -3573,13 +3573,13 @@
3573
  "shape": [
3574
  1536
3575
  ],
3576
- "dtype": "float16",
3577
  "format": "f32-to-bf16",
3578
  "nbytes": 3072,
3579
  "byteOffset": 18586624
3580
  }
3581
  ],
3582
- "md5sum": "1ac4189703b9ace01f2d80cae1354a6d"
3583
  }
3584
  ]
3585
  }
 
1
  {
2
  "metadata": {
3
  "ParamSize": 311,
4
+ "ParamBytes": 965310464.0,
5
+ "BitsPerParam": 5.002534272041053
6
  },
7
  "records": [
8
  {
 
22
  "byteOffset": 0
23
  }
24
  ],
25
+ "md5sum": "d6a4315ea780a0261dec50ea468198b0"
26
  },
27
  {
28
  "dataPath": "params_shard_1.bin",
 
35
  151936,
36
  48
37
  ],
38
+ "dtype": "float32",
39
  "format": "f32-to-bf16",
40
  "nbytes": 14585856,
41
  "byteOffset": 0
 
45
  "shape": [
46
  1536
47
  ],
48
+ "dtype": "float32",
49
  "format": "f32-to-bf16",
50
  "nbytes": 3072,
51
  "byteOffset": 14585856
 
67
  1536,
68
  280
69
  ],
70
+ "dtype": "float32",
71
  "format": "f32-to-bf16",
72
  "nbytes": 860160,
73
  "byteOffset": 21470208
74
  }
75
  ],
76
+ "md5sum": "5afc5cfe3edcdaec786f9c72d6d7df44"
77
  },
78
  {
79
  "dataPath": "params_shard_2.bin",
 
97
  17920,
98
  48
99
  ],
100
+ "dtype": "float32",
101
  "format": "f32-to-bf16",
102
  "nbytes": 1720320,
103
  "byteOffset": 13762560
 
107
  "shape": [
108
  1536
109
  ],
110
+ "dtype": "float32",
111
  "format": "f32-to-bf16",
112
  "nbytes": 3072,
113
  "byteOffset": 15482880
 
117
  "shape": [
118
  2048
119
  ],
120
+ "dtype": "float32",
121
  "format": "f32-to-bf16",
122
  "nbytes": 4096,
123
  "byteOffset": 15485952
 
139
  2048,
140
  48
141
  ],
142
+ "dtype": "float32",
143
  "format": "f32-to-bf16",
144
  "nbytes": 196608,
145
  "byteOffset": 17062912
 
161
  1536,
162
  48
163
  ],
164
+ "dtype": "float32",
165
  "format": "f32-to-bf16",
166
  "nbytes": 147456,
167
  "byteOffset": 18439168
 
171
  "shape": [
172
  1536
173
  ],
174
+ "dtype": "float32",
175
  "format": "f32-to-bf16",
176
  "nbytes": 3072,
177
  "byteOffset": 18586624
 
193
  1536,
194
  280
195
  ],
196
+ "dtype": "float32",
197
  "format": "f32-to-bf16",
198
  "nbytes": 860160,
199
  "byteOffset": 25470976
200
  }
201
  ],
202
+ "md5sum": "3e1d2846eee65e6801082649712a4242"
203
  },
204
  {
205
  "dataPath": "params_shard_3.bin",
 
223
  17920,
224
  48
225
  ],
226
+ "dtype": "float32",
227
  "format": "f32-to-bf16",
228
  "nbytes": 1720320,
229
  "byteOffset": 13762560
 
233
  "shape": [
234
  1536
235
  ],
236
+ "dtype": "float32",
237
  "format": "f32-to-bf16",
238
  "nbytes": 3072,
239
  "byteOffset": 15482880
 
243
  "shape": [
244
  2048
245
  ],
246
+ "dtype": "float32",
247
  "format": "f32-to-bf16",
248
  "nbytes": 4096,
249
  "byteOffset": 15485952
 
265
  2048,
266
  48
267
  ],
268
+ "dtype": "float32",
269
  "format": "f32-to-bf16",
270
  "nbytes": 196608,
271
  "byteOffset": 17062912
 
287
  1536,
288
  48
289
  ],
290
+ "dtype": "float32",
291
  "format": "f32-to-bf16",
292
  "nbytes": 147456,
293
  "byteOffset": 18439168
 
297
  "shape": [
298
  1536
299
  ],
300
+ "dtype": "float32",
301
  "format": "f32-to-bf16",
302
  "nbytes": 3072,
303
  "byteOffset": 18586624
 
319
  1536,
320
  280
321
  ],
322
+ "dtype": "float32",
323
  "format": "f32-to-bf16",
324
  "nbytes": 860160,
325
  "byteOffset": 25470976
326
  }
327
  ],
328
+ "md5sum": "360ec089131fe9c3dcf59d41ec15922f"
329
  },
330
  {
331
  "dataPath": "params_shard_4.bin",
 
349
  17920,
350
  48
351
  ],
352
+ "dtype": "float32",
353
  "format": "f32-to-bf16",
354
  "nbytes": 1720320,
355
  "byteOffset": 13762560
 
359
  "shape": [
360
  1536
361
  ],
362
+ "dtype": "float32",
363
  "format": "f32-to-bf16",
364
  "nbytes": 3072,
365
  "byteOffset": 15482880
 
369
  "shape": [
370
  2048
371
  ],
372
+ "dtype": "float32",
373
  "format": "f32-to-bf16",
374
  "nbytes": 4096,
375
  "byteOffset": 15485952
 
391
  2048,
392
  48
393
  ],
394
+ "dtype": "float32",
395
  "format": "f32-to-bf16",
396
  "nbytes": 196608,
397
  "byteOffset": 17062912
 
413
  1536,
414
  48
415
  ],
416
+ "dtype": "float32",
417
  "format": "f32-to-bf16",
418
  "nbytes": 147456,
419
  "byteOffset": 18439168
 
423
  "shape": [
424
  1536
425
  ],
426
+ "dtype": "float32",
427
  "format": "f32-to-bf16",
428
  "nbytes": 3072,
429
  "byteOffset": 18586624
 
445
  1536,
446
  280
447
  ],
448
+ "dtype": "float32",
449
  "format": "f32-to-bf16",
450
  "nbytes": 860160,
451
  "byteOffset": 25470976
452
  }
453
  ],
454
+ "md5sum": "a84a347f273cd0f6acd25df405d34894"
455
  },
456
  {
457
  "dataPath": "params_shard_5.bin",
 
475
  17920,
476
  48
477
  ],
478
+ "dtype": "float32",
479
  "format": "f32-to-bf16",
480
  "nbytes": 1720320,
481
  "byteOffset": 13762560
 
485
  "shape": [
486
  1536
487
  ],
488
+ "dtype": "float32",
489
  "format": "f32-to-bf16",
490
  "nbytes": 3072,
491
  "byteOffset": 15482880
 
495
  "shape": [
496
  2048
497
  ],
498
+ "dtype": "float32",
499
  "format": "f32-to-bf16",
500
  "nbytes": 4096,
501
  "byteOffset": 15485952
 
517
  2048,
518
  48
519
  ],
520
+ "dtype": "float32",
521
  "format": "f32-to-bf16",
522
  "nbytes": 196608,
523
  "byteOffset": 17062912
 
539
  1536,
540
  48
541
  ],
542
+ "dtype": "float32",
543
  "format": "f32-to-bf16",
544
  "nbytes": 147456,
545
  "byteOffset": 18439168
 
549
  "shape": [
550
  1536
551
  ],
552
+ "dtype": "float32",
553
  "format": "f32-to-bf16",
554
  "nbytes": 3072,
555
  "byteOffset": 18586624
 
571
  1536,
572
  280
573
  ],
574
+ "dtype": "float32",
575
  "format": "f32-to-bf16",
576
  "nbytes": 860160,
577
  "byteOffset": 25470976
578
  }
579
  ],
580
+ "md5sum": "fedf0dec9f82f4f238e05953bcf96f72"
581
  },
582
  {
583
  "dataPath": "params_shard_6.bin",
 
601
  17920,
602
  48
603
  ],
604
+ "dtype": "float32",
605
  "format": "f32-to-bf16",
606
  "nbytes": 1720320,
607
  "byteOffset": 13762560
 
611
  "shape": [
612
  1536
613
  ],
614
+ "dtype": "float32",
615
  "format": "f32-to-bf16",
616
  "nbytes": 3072,
617
  "byteOffset": 15482880
 
621
  "shape": [
622
  2048
623
  ],
624
+ "dtype": "float32",
625
  "format": "f32-to-bf16",
626
  "nbytes": 4096,
627
  "byteOffset": 15485952
 
643
  2048,
644
  48
645
  ],
646
+ "dtype": "float32",
647
  "format": "f32-to-bf16",
648
  "nbytes": 196608,
649
  "byteOffset": 17062912
 
665
  1536,
666
  48
667
  ],
668
+ "dtype": "float32",
669
  "format": "f32-to-bf16",
670
  "nbytes": 147456,
671
  "byteOffset": 18439168
 
675
  "shape": [
676
  1536
677
  ],
678
+ "dtype": "float32",
679
  "format": "f32-to-bf16",
680
  "nbytes": 3072,
681
  "byteOffset": 18586624
 
697
  1536,
698
  280
699
  ],
700
+ "dtype": "float32",
701
  "format": "f32-to-bf16",
702
  "nbytes": 860160,
703
  "byteOffset": 25470976
704
  }
705
  ],
706
+ "md5sum": "03e0a7377e6fa3fb6fa1098781a5e550"
707
  },
708
  {
709
  "dataPath": "params_shard_7.bin",
 
727
  17920,
728
  48
729
  ],
730
+ "dtype": "float32",
731
  "format": "f32-to-bf16",
732
  "nbytes": 1720320,
733
  "byteOffset": 13762560
 
737
  "shape": [
738
  1536
739
  ],
740
+ "dtype": "float32",
741
  "format": "f32-to-bf16",
742
  "nbytes": 3072,
743
  "byteOffset": 15482880
 
747
  "shape": [
748
  2048
749
  ],
750
+ "dtype": "float32",
751
  "format": "f32-to-bf16",
752
  "nbytes": 4096,
753
  "byteOffset": 15485952
 
769
  2048,
770
  48
771
  ],
772
+ "dtype": "float32",
773
  "format": "f32-to-bf16",
774
  "nbytes": 196608,
775
  "byteOffset": 17062912
 
791
  1536,
792
  48
793
  ],
794
+ "dtype": "float32",
795
  "format": "f32-to-bf16",
796
  "nbytes": 147456,
797
  "byteOffset": 18439168
 
801
  "shape": [
802
  1536
803
  ],
804
+ "dtype": "float32",
805
  "format": "f32-to-bf16",
806
  "nbytes": 3072,
807
  "byteOffset": 18586624
 
823
  1536,
824
  280
825
  ],
826
+ "dtype": "float32",
827
  "format": "f32-to-bf16",
828
  "nbytes": 860160,
829
  "byteOffset": 25470976
830
  }
831
  ],
832
+ "md5sum": "16eeefe8737676249814f2cbc7b3f035"
833
  },
834
  {
835
  "dataPath": "params_shard_8.bin",
 
853
  17920,
854
  48
855
  ],
856
+ "dtype": "float32",
857
  "format": "f32-to-bf16",
858
  "nbytes": 1720320,
859
  "byteOffset": 13762560
 
863
  "shape": [
864
  1536
865
  ],
866
+ "dtype": "float32",
867
  "format": "f32-to-bf16",
868
  "nbytes": 3072,
869
  "byteOffset": 15482880
 
873
  "shape": [
874
  2048
875
  ],
876
+ "dtype": "float32",
877
  "format": "f32-to-bf16",
878
  "nbytes": 4096,
879
  "byteOffset": 15485952
 
895
  2048,
896
  48
897
  ],
898
+ "dtype": "float32",
899
  "format": "f32-to-bf16",
900
  "nbytes": 196608,
901
  "byteOffset": 17062912
 
917
  1536,
918
  48
919
  ],
920
+ "dtype": "float32",
921
  "format": "f32-to-bf16",
922
  "nbytes": 147456,
923
  "byteOffset": 18439168
 
927
  "shape": [
928
  1536
929
  ],
930
+ "dtype": "float32",
931
  "format": "f32-to-bf16",
932
  "nbytes": 3072,
933
  "byteOffset": 18586624
 
949
  1536,
950
  280
951
  ],
952
+ "dtype": "float32",
953
  "format": "f32-to-bf16",
954
  "nbytes": 860160,
955
  "byteOffset": 25470976
956
  }
957
  ],
958
+ "md5sum": "518d75cd78b4259b9b30be02990531fe"
959
  },
960
  {
961
  "dataPath": "params_shard_9.bin",
 
979
  17920,
980
  48
981
  ],
982
+ "dtype": "float32",
983
  "format": "f32-to-bf16",
984
  "nbytes": 1720320,
985
  "byteOffset": 13762560
 
989
  "shape": [
990
  1536
991
  ],
992
+ "dtype": "float32",
993
  "format": "f32-to-bf16",
994
  "nbytes": 3072,
995
  "byteOffset": 15482880
 
999
  "shape": [
1000
  2048
1001
  ],
1002
+ "dtype": "float32",
1003
  "format": "f32-to-bf16",
1004
  "nbytes": 4096,
1005
  "byteOffset": 15485952
 
1021
  2048,
1022
  48
1023
  ],
1024
+ "dtype": "float32",
1025
  "format": "f32-to-bf16",
1026
  "nbytes": 196608,
1027
  "byteOffset": 17062912
 
1043
  1536,
1044
  48
1045
  ],
1046
+ "dtype": "float32",
1047
  "format": "f32-to-bf16",
1048
  "nbytes": 147456,
1049
  "byteOffset": 18439168
 
1053
  "shape": [
1054
  1536
1055
  ],
1056
+ "dtype": "float32",
1057
  "format": "f32-to-bf16",
1058
  "nbytes": 3072,
1059
  "byteOffset": 18586624
 
1075
  1536,
1076
  280
1077
  ],
1078
+ "dtype": "float32",
1079
  "format": "f32-to-bf16",
1080
  "nbytes": 860160,
1081
  "byteOffset": 25470976
1082
  }
1083
  ],
1084
+ "md5sum": "3679d6d95783f1097d92fefd0f223d74"
1085
  },
1086
  {
1087
  "dataPath": "params_shard_10.bin",
 
1105
  17920,
1106
  48
1107
  ],
1108
+ "dtype": "float32",
1109
  "format": "f32-to-bf16",
1110
  "nbytes": 1720320,
1111
  "byteOffset": 13762560
 
1115
  "shape": [
1116
  1536
1117
  ],
1118
+ "dtype": "float32",
1119
  "format": "f32-to-bf16",
1120
  "nbytes": 3072,
1121
  "byteOffset": 15482880
 
1125
  "shape": [
1126
  2048
1127
  ],
1128
+ "dtype": "float32",
1129
  "format": "f32-to-bf16",
1130
  "nbytes": 4096,
1131
  "byteOffset": 15485952
 
1147
  2048,
1148
  48
1149
  ],
1150
+ "dtype": "float32",
1151
  "format": "f32-to-bf16",
1152
  "nbytes": 196608,
1153
  "byteOffset": 17062912
 
1169
  1536,
1170
  48
1171
  ],
1172
+ "dtype": "float32",
1173
  "format": "f32-to-bf16",
1174
  "nbytes": 147456,
1175
  "byteOffset": 18439168
 
1179
  "shape": [
1180
  1536
1181
  ],
1182
+ "dtype": "float32",
1183
  "format": "f32-to-bf16",
1184
  "nbytes": 3072,
1185
  "byteOffset": 18586624
 
1201
  1536,
1202
  280
1203
  ],
1204
+ "dtype": "float32",
1205
  "format": "f32-to-bf16",
1206
  "nbytes": 860160,
1207
  "byteOffset": 25470976
1208
  }
1209
  ],
1210
+ "md5sum": "89404e7477ef55d7cdab22767bf857c3"
1211
  },
1212
  {
1213
  "dataPath": "params_shard_11.bin",
 
1231
  17920,
1232
  48
1233
  ],
1234
+ "dtype": "float32",
1235
  "format": "f32-to-bf16",
1236
  "nbytes": 1720320,
1237
  "byteOffset": 13762560
 
1241
  "shape": [
1242
  1536
1243
  ],
1244
+ "dtype": "float32",
1245
  "format": "f32-to-bf16",
1246
  "nbytes": 3072,
1247
  "byteOffset": 15482880
 
1251
  "shape": [
1252
  2048
1253
  ],
1254
+ "dtype": "float32",
1255
  "format": "f32-to-bf16",
1256
  "nbytes": 4096,
1257
  "byteOffset": 15485952
 
1273
  2048,
1274
  48
1275
  ],
1276
+ "dtype": "float32",
1277
  "format": "f32-to-bf16",
1278
  "nbytes": 196608,
1279
  "byteOffset": 17062912
 
1295
  1536,
1296
  48
1297
  ],
1298
+ "dtype": "float32",
1299
  "format": "f32-to-bf16",
1300
  "nbytes": 147456,
1301
  "byteOffset": 18439168
 
1305
  "shape": [
1306
  1536
1307
  ],
1308
+ "dtype": "float32",
1309
  "format": "f32-to-bf16",
1310
  "nbytes": 3072,
1311
  "byteOffset": 18586624
 
1327
  1536,
1328
  280
1329
  ],
1330
+ "dtype": "float32",
1331
  "format": "f32-to-bf16",
1332
  "nbytes": 860160,
1333
  "byteOffset": 25470976
1334
  }
1335
  ],
1336
+ "md5sum": "c6fe02261e76dd1cf10162671314bb7d"
1337
  },
1338
  {
1339
  "dataPath": "params_shard_12.bin",
 
1357
  17920,
1358
  48
1359
  ],
1360
+ "dtype": "float32",
1361
  "format": "f32-to-bf16",
1362
  "nbytes": 1720320,
1363
  "byteOffset": 13762560
 
1367
  "shape": [
1368
  1536
1369
  ],
1370
+ "dtype": "float32",
1371
  "format": "f32-to-bf16",
1372
  "nbytes": 3072,
1373
  "byteOffset": 15482880
 
1377
  "shape": [
1378
  2048
1379
  ],
1380
+ "dtype": "float32",
1381
  "format": "f32-to-bf16",
1382
  "nbytes": 4096,
1383
  "byteOffset": 15485952
 
1399
  2048,
1400
  48
1401
  ],
1402
+ "dtype": "float32",
1403
  "format": "f32-to-bf16",
1404
  "nbytes": 196608,
1405
  "byteOffset": 17062912
 
1421
  1536,
1422
  48
1423
  ],
1424
+ "dtype": "float32",
1425
  "format": "f32-to-bf16",
1426
  "nbytes": 147456,
1427
  "byteOffset": 18439168
 
1431
  "shape": [
1432
  1536
1433
  ],
1434
+ "dtype": "float32",
1435
  "format": "f32-to-bf16",
1436
  "nbytes": 3072,
1437
  "byteOffset": 18586624
 
1453
  1536,
1454
  280
1455
  ],
1456
+ "dtype": "float32",
1457
  "format": "f32-to-bf16",
1458
  "nbytes": 860160,
1459
  "byteOffset": 25470976
1460
  }
1461
  ],
1462
+ "md5sum": "fb079556f9ef1836e8b30262f565b1ef"
1463
  },
1464
  {
1465
  "dataPath": "params_shard_13.bin",
 
1483
  17920,
1484
  48
1485
  ],
1486
+ "dtype": "float32",
1487
  "format": "f32-to-bf16",
1488
  "nbytes": 1720320,
1489
  "byteOffset": 13762560
 
1493
  "shape": [
1494
  1536
1495
  ],
1496
+ "dtype": "float32",
1497
  "format": "f32-to-bf16",
1498
  "nbytes": 3072,
1499
  "byteOffset": 15482880
 
1503
  "shape": [
1504
  2048
1505
  ],
1506
+ "dtype": "float32",
1507
  "format": "f32-to-bf16",
1508
  "nbytes": 4096,
1509
  "byteOffset": 15485952
 
1525
  2048,
1526
  48
1527
  ],
1528
+ "dtype": "float32",
1529
  "format": "f32-to-bf16",
1530
  "nbytes": 196608,
1531
  "byteOffset": 17062912
 
1547
  1536,
1548
  48
1549
  ],
1550
+ "dtype": "float32",
1551
  "format": "f32-to-bf16",
1552
  "nbytes": 147456,
1553
  "byteOffset": 18439168
 
1557
  "shape": [
1558
  1536
1559
  ],
1560
+ "dtype": "float32",
1561
  "format": "f32-to-bf16",
1562
  "nbytes": 3072,
1563
  "byteOffset": 18586624
 
1579
  1536,
1580
  280
1581
  ],
1582
+ "dtype": "float32",
1583
  "format": "f32-to-bf16",
1584
  "nbytes": 860160,
1585
  "byteOffset": 25470976
1586
  }
1587
  ],
1588
+ "md5sum": "dce38a13ec6b0abf1b1035f7ee847e63"
1589
  },
1590
  {
1591
  "dataPath": "params_shard_14.bin",
 
1609
  17920,
1610
  48
1611
  ],
1612
+ "dtype": "float32",
1613
  "format": "f32-to-bf16",
1614
  "nbytes": 1720320,
1615
  "byteOffset": 13762560
 
1619
  "shape": [
1620
  1536
1621
  ],
1622
+ "dtype": "float32",
1623
  "format": "f32-to-bf16",
1624
  "nbytes": 3072,
1625
  "byteOffset": 15482880
 
1629
  "shape": [
1630
  2048
1631
  ],
1632
+ "dtype": "float32",
1633
  "format": "f32-to-bf16",
1634
  "nbytes": 4096,
1635
  "byteOffset": 15485952
 
1651
  2048,
1652
  48
1653
  ],
1654
+ "dtype": "float32",
1655
  "format": "f32-to-bf16",
1656
  "nbytes": 196608,
1657
  "byteOffset": 17062912
 
1673
  1536,
1674
  48
1675
  ],
1676
+ "dtype": "float32",
1677
  "format": "f32-to-bf16",
1678
  "nbytes": 147456,
1679
  "byteOffset": 18439168
 
1683
  "shape": [
1684
  1536
1685
  ],
1686
+ "dtype": "float32",
1687
  "format": "f32-to-bf16",
1688
  "nbytes": 3072,
1689
  "byteOffset": 18586624
 
1705
  1536,
1706
  280
1707
  ],
1708
+ "dtype": "float32",
1709
  "format": "f32-to-bf16",
1710
  "nbytes": 860160,
1711
  "byteOffset": 25470976
1712
  }
1713
  ],
1714
+ "md5sum": "1feca36b4a8200b5faeffae2a8eb8032"
1715
  },
1716
  {
1717
  "dataPath": "params_shard_15.bin",
 
1735
  17920,
1736
  48
1737
  ],
1738
+ "dtype": "float32",
1739
  "format": "f32-to-bf16",
1740
  "nbytes": 1720320,
1741
  "byteOffset": 13762560
 
1745
  "shape": [
1746
  1536
1747
  ],
1748
+ "dtype": "float32",
1749
  "format": "f32-to-bf16",
1750
  "nbytes": 3072,
1751
  "byteOffset": 15482880
 
1755
  "shape": [
1756
  2048
1757
  ],
1758
+ "dtype": "float32",
1759
  "format": "f32-to-bf16",
1760
  "nbytes": 4096,
1761
  "byteOffset": 15485952
 
1777
  2048,
1778
  48
1779
  ],
1780
+ "dtype": "float32",
1781
  "format": "f32-to-bf16",
1782
  "nbytes": 196608,
1783
  "byteOffset": 17062912
 
1799
  1536,
1800
  48
1801
  ],
1802
+ "dtype": "float32",
1803
  "format": "f32-to-bf16",
1804
  "nbytes": 147456,
1805
  "byteOffset": 18439168
 
1809
  "shape": [
1810
  1536
1811
  ],
1812
+ "dtype": "float32",
1813
  "format": "f32-to-bf16",
1814
  "nbytes": 3072,
1815
  "byteOffset": 18586624
 
1831
  1536,
1832
  280
1833
  ],
1834
+ "dtype": "float32",
1835
  "format": "f32-to-bf16",
1836
  "nbytes": 860160,
1837
  "byteOffset": 25470976
1838
  }
1839
  ],
1840
+ "md5sum": "132a1fdb1327aa026d1af2628a33a0e8"
1841
  },
1842
  {
1843
  "dataPath": "params_shard_16.bin",
 
1861
  17920,
1862
  48
1863
  ],
1864
+ "dtype": "float32",
1865
  "format": "f32-to-bf16",
1866
  "nbytes": 1720320,
1867
  "byteOffset": 13762560
 
1871
  "shape": [
1872
  1536
1873
  ],
1874
+ "dtype": "float32",
1875
  "format": "f32-to-bf16",
1876
  "nbytes": 3072,
1877
  "byteOffset": 15482880
 
1881
  "shape": [
1882
  2048
1883
  ],
1884
+ "dtype": "float32",
1885
  "format": "f32-to-bf16",
1886
  "nbytes": 4096,
1887
  "byteOffset": 15485952
 
1903
  2048,
1904
  48
1905
  ],
1906
+ "dtype": "float32",
1907
  "format": "f32-to-bf16",
1908
  "nbytes": 196608,
1909
  "byteOffset": 17062912
 
1925
  1536,
1926
  48
1927
  ],
1928
+ "dtype": "float32",
1929
  "format": "f32-to-bf16",
1930
  "nbytes": 147456,
1931
  "byteOffset": 18439168
 
1935
  "shape": [
1936
  1536
1937
  ],
1938
+ "dtype": "float32",
1939
  "format": "f32-to-bf16",
1940
  "nbytes": 3072,
1941
  "byteOffset": 18586624
 
1957
  1536,
1958
  280
1959
  ],
1960
+ "dtype": "float32",
1961
  "format": "f32-to-bf16",
1962
  "nbytes": 860160,
1963
  "byteOffset": 25470976
1964
  }
1965
  ],
1966
+ "md5sum": "70442273d229fd032a6921673e3807cb"
1967
  },
1968
  {
1969
  "dataPath": "params_shard_17.bin",
 
1987
  17920,
1988
  48
1989
  ],
1990
+ "dtype": "float32",
1991
  "format": "f32-to-bf16",
1992
  "nbytes": 1720320,
1993
  "byteOffset": 13762560
 
1997
  "shape": [
1998
  1536
1999
  ],
2000
+ "dtype": "float32",
2001
  "format": "f32-to-bf16",
2002
  "nbytes": 3072,
2003
  "byteOffset": 15482880
 
2007
  "shape": [
2008
  2048
2009
  ],
2010
+ "dtype": "float32",
2011
  "format": "f32-to-bf16",
2012
  "nbytes": 4096,
2013
  "byteOffset": 15485952
 
2029
  2048,
2030
  48
2031
  ],
2032
+ "dtype": "float32",
2033
  "format": "f32-to-bf16",
2034
  "nbytes": 196608,
2035
  "byteOffset": 17062912
 
2051
  1536,
2052
  48
2053
  ],
2054
+ "dtype": "float32",
2055
  "format": "f32-to-bf16",
2056
  "nbytes": 147456,
2057
  "byteOffset": 18439168
 
2061
  "shape": [
2062
  1536
2063
  ],
2064
+ "dtype": "float32",
2065
  "format": "f32-to-bf16",
2066
  "nbytes": 3072,
2067
  "byteOffset": 18586624
 
2083
  1536,
2084
  280
2085
  ],
2086
+ "dtype": "float32",
2087
  "format": "f32-to-bf16",
2088
  "nbytes": 860160,
2089
  "byteOffset": 25470976
2090
  }
2091
  ],
2092
+ "md5sum": "218f11c64c4f7f1ba2d740c1406c9708"
2093
  },
2094
  {
2095
  "dataPath": "params_shard_18.bin",
 
2113
  17920,
2114
  48
2115
  ],
2116
+ "dtype": "float32",
2117
  "format": "f32-to-bf16",
2118
  "nbytes": 1720320,
2119
  "byteOffset": 13762560
 
2123
  "shape": [
2124
  1536
2125
  ],
2126
+ "dtype": "float32",
2127
  "format": "f32-to-bf16",
2128
  "nbytes": 3072,
2129
  "byteOffset": 15482880
 
2133
  "shape": [
2134
  2048
2135
  ],
2136
+ "dtype": "float32",
2137
  "format": "f32-to-bf16",
2138
  "nbytes": 4096,
2139
  "byteOffset": 15485952
 
2155
  2048,
2156
  48
2157
  ],
2158
+ "dtype": "float32",
2159
  "format": "f32-to-bf16",
2160
  "nbytes": 196608,
2161
  "byteOffset": 17062912
 
2177
  1536,
2178
  48
2179
  ],
2180
+ "dtype": "float32",
2181
  "format": "f32-to-bf16",
2182
  "nbytes": 147456,
2183
  "byteOffset": 18439168
 
2187
  "shape": [
2188
  1536
2189
  ],
2190
+ "dtype": "float32",
2191
  "format": "f32-to-bf16",
2192
  "nbytes": 3072,
2193
  "byteOffset": 18586624
 
2209
  1536,
2210
  280
2211
  ],
2212
+ "dtype": "float32",
2213
  "format": "f32-to-bf16",
2214
  "nbytes": 860160,
2215
  "byteOffset": 25470976
2216
  }
2217
  ],
2218
+ "md5sum": "9ca77e9ef072cc5ec5cf457776f5be1c"
2219
  },
2220
  {
2221
  "dataPath": "params_shard_19.bin",
 
2239
  17920,
2240
  48
2241
  ],
2242
+ "dtype": "float32",
2243
  "format": "f32-to-bf16",
2244
  "nbytes": 1720320,
2245
  "byteOffset": 13762560
 
2249
  "shape": [
2250
  1536
2251
  ],
2252
+ "dtype": "float32",
2253
  "format": "f32-to-bf16",
2254
  "nbytes": 3072,
2255
  "byteOffset": 15482880
 
2259
  "shape": [
2260
  2048
2261
  ],
2262
+ "dtype": "float32",
2263
  "format": "f32-to-bf16",
2264
  "nbytes": 4096,
2265
  "byteOffset": 15485952
 
2281
  2048,
2282
  48
2283
  ],
2284
+ "dtype": "float32",
2285
  "format": "f32-to-bf16",
2286
  "nbytes": 196608,
2287
  "byteOffset": 17062912
 
2303
  1536,
2304
  48
2305
  ],
2306
+ "dtype": "float32",
2307
  "format": "f32-to-bf16",
2308
  "nbytes": 147456,
2309
  "byteOffset": 18439168
 
2313
  "shape": [
2314
  1536
2315
  ],
2316
+ "dtype": "float32",
2317
  "format": "f32-to-bf16",
2318
  "nbytes": 3072,
2319
  "byteOffset": 18586624
 
2335
  1536,
2336
  280
2337
  ],
2338
+ "dtype": "float32",
2339
  "format": "f32-to-bf16",
2340
  "nbytes": 860160,
2341
  "byteOffset": 25470976
2342
  }
2343
  ],
2344
+ "md5sum": "80f21af8e8f1a65695d036dee877751c"
2345
  },
2346
  {
2347
  "dataPath": "params_shard_20.bin",
 
2365
  17920,
2366
  48
2367
  ],
2368
+ "dtype": "float32",
2369
  "format": "f32-to-bf16",
2370
  "nbytes": 1720320,
2371
  "byteOffset": 13762560
 
2375
  "shape": [
2376
  1536
2377
  ],
2378
+ "dtype": "float32",
2379
  "format": "f32-to-bf16",
2380
  "nbytes": 3072,
2381
  "byteOffset": 15482880
 
2385
  "shape": [
2386
  2048
2387
  ],
2388
+ "dtype": "float32",
2389
  "format": "f32-to-bf16",
2390
  "nbytes": 4096,
2391
  "byteOffset": 15485952
 
2407
  2048,
2408
  48
2409
  ],
2410
+ "dtype": "float32",
2411
  "format": "f32-to-bf16",
2412
  "nbytes": 196608,
2413
  "byteOffset": 17062912
 
2429
  1536,
2430
  48
2431
  ],
2432
+ "dtype": "float32",
2433
  "format": "f32-to-bf16",
2434
  "nbytes": 147456,
2435
  "byteOffset": 18439168
 
2439
  "shape": [
2440
  1536
2441
  ],
2442
+ "dtype": "float32",
2443
  "format": "f32-to-bf16",
2444
  "nbytes": 3072,
2445
  "byteOffset": 18586624
 
2461
  1536,
2462
  280
2463
  ],
2464
+ "dtype": "float32",
2465
  "format": "f32-to-bf16",
2466
  "nbytes": 860160,
2467
  "byteOffset": 25470976
2468
  }
2469
  ],
2470
+ "md5sum": "d1327a1c17a3cf5c16589c2aedebc114"
2471
  },
2472
  {
2473
  "dataPath": "params_shard_21.bin",
 
2491
  17920,
2492
  48
2493
  ],
2494
+ "dtype": "float32",
2495
  "format": "f32-to-bf16",
2496
  "nbytes": 1720320,
2497
  "byteOffset": 13762560
 
2501
  "shape": [
2502
  1536
2503
  ],
2504
+ "dtype": "float32",
2505
  "format": "f32-to-bf16",
2506
  "nbytes": 3072,
2507
  "byteOffset": 15482880
 
2511
  "shape": [
2512
  2048
2513
  ],
2514
+ "dtype": "float32",
2515
  "format": "f32-to-bf16",
2516
  "nbytes": 4096,
2517
  "byteOffset": 15485952
 
2533
  2048,
2534
  48
2535
  ],
2536
+ "dtype": "float32",
2537
  "format": "f32-to-bf16",
2538
  "nbytes": 196608,
2539
  "byteOffset": 17062912
 
2555
  1536,
2556
  48
2557
  ],
2558
+ "dtype": "float32",
2559
  "format": "f32-to-bf16",
2560
  "nbytes": 147456,
2561
  "byteOffset": 18439168
 
2565
  "shape": [
2566
  1536
2567
  ],
2568
+ "dtype": "float32",
2569
  "format": "f32-to-bf16",
2570
  "nbytes": 3072,
2571
  "byteOffset": 18586624
 
2587
  1536,
2588
  280
2589
  ],
2590
+ "dtype": "float32",
2591
  "format": "f32-to-bf16",
2592
  "nbytes": 860160,
2593
  "byteOffset": 25470976
2594
  }
2595
  ],
2596
+ "md5sum": "a5509f03d3bee1e339859ce3740a6d32"
2597
  },
2598
  {
2599
  "dataPath": "params_shard_22.bin",
 
2617
  17920,
2618
  48
2619
  ],
2620
+ "dtype": "float32",
2621
  "format": "f32-to-bf16",
2622
  "nbytes": 1720320,
2623
  "byteOffset": 13762560
 
2627
  "shape": [
2628
  1536
2629
  ],
2630
+ "dtype": "float32",
2631
  "format": "f32-to-bf16",
2632
  "nbytes": 3072,
2633
  "byteOffset": 15482880
 
2637
  "shape": [
2638
  2048
2639
  ],
2640
+ "dtype": "float32",
2641
  "format": "f32-to-bf16",
2642
  "nbytes": 4096,
2643
  "byteOffset": 15485952
 
2659
  2048,
2660
  48
2661
  ],
2662
+ "dtype": "float32",
2663
  "format": "f32-to-bf16",
2664
  "nbytes": 196608,
2665
  "byteOffset": 17062912
 
2681
  1536,
2682
  48
2683
  ],
2684
+ "dtype": "float32",
2685
  "format": "f32-to-bf16",
2686
  "nbytes": 147456,
2687
  "byteOffset": 18439168
 
2691
  "shape": [
2692
  1536
2693
  ],
2694
+ "dtype": "float32",
2695
  "format": "f32-to-bf16",
2696
  "nbytes": 3072,
2697
  "byteOffset": 18586624
 
2713
  1536,
2714
  280
2715
  ],
2716
+ "dtype": "float32",
2717
  "format": "f32-to-bf16",
2718
  "nbytes": 860160,
2719
  "byteOffset": 25470976
2720
  }
2721
  ],
2722
+ "md5sum": "393d77942fe94fff95167fb1300be8e1"
2723
  },
2724
  {
2725
  "dataPath": "params_shard_23.bin",
 
2743
  17920,
2744
  48
2745
  ],
2746
+ "dtype": "float32",
2747
  "format": "f32-to-bf16",
2748
  "nbytes": 1720320,
2749
  "byteOffset": 13762560
 
2753
  "shape": [
2754
  1536
2755
  ],
2756
+ "dtype": "float32",
2757
  "format": "f32-to-bf16",
2758
  "nbytes": 3072,
2759
  "byteOffset": 15482880
 
2763
  "shape": [
2764
  2048
2765
  ],
2766
+ "dtype": "float32",
2767
  "format": "f32-to-bf16",
2768
  "nbytes": 4096,
2769
  "byteOffset": 15485952
 
2785
  2048,
2786
  48
2787
  ],
2788
+ "dtype": "float32",
2789
  "format": "f32-to-bf16",
2790
  "nbytes": 196608,
2791
  "byteOffset": 17062912
 
2807
  1536,
2808
  48
2809
  ],
2810
+ "dtype": "float32",
2811
  "format": "f32-to-bf16",
2812
  "nbytes": 147456,
2813
  "byteOffset": 18439168
 
2817
  "shape": [
2818
  1536
2819
  ],
2820
+ "dtype": "float32",
2821
  "format": "f32-to-bf16",
2822
  "nbytes": 3072,
2823
  "byteOffset": 18586624
 
2839
  1536,
2840
  280
2841
  ],
2842
+ "dtype": "float32",
2843
  "format": "f32-to-bf16",
2844
  "nbytes": 860160,
2845
  "byteOffset": 25470976
2846
  }
2847
  ],
2848
+ "md5sum": "5ad909776281d0a989a5da08fd1c4a9e"
2849
  },
2850
  {
2851
  "dataPath": "params_shard_24.bin",
 
2869
  17920,
2870
  48
2871
  ],
2872
+ "dtype": "float32",
2873
  "format": "f32-to-bf16",
2874
  "nbytes": 1720320,
2875
  "byteOffset": 13762560
 
2879
  "shape": [
2880
  1536
2881
  ],
2882
+ "dtype": "float32",
2883
  "format": "f32-to-bf16",
2884
  "nbytes": 3072,
2885
  "byteOffset": 15482880
 
2889
  "shape": [
2890
  2048
2891
  ],
2892
+ "dtype": "float32",
2893
  "format": "f32-to-bf16",
2894
  "nbytes": 4096,
2895
  "byteOffset": 15485952
 
2911
  2048,
2912
  48
2913
  ],
2914
+ "dtype": "float32",
2915
  "format": "f32-to-bf16",
2916
  "nbytes": 196608,
2917
  "byteOffset": 17062912
 
2933
  1536,
2934
  48
2935
  ],
2936
+ "dtype": "float32",
2937
  "format": "f32-to-bf16",
2938
  "nbytes": 147456,
2939
  "byteOffset": 18439168
 
2943
  "shape": [
2944
  1536
2945
  ],
2946
+ "dtype": "float32",
2947
  "format": "f32-to-bf16",
2948
  "nbytes": 3072,
2949
  "byteOffset": 18586624
 
2965
  1536,
2966
  280
2967
  ],
2968
+ "dtype": "float32",
2969
  "format": "f32-to-bf16",
2970
  "nbytes": 860160,
2971
  "byteOffset": 25470976
2972
  }
2973
  ],
2974
+ "md5sum": "e5cf1a456d806749b56d7b9fc90ff4a0"
2975
  },
2976
  {
2977
  "dataPath": "params_shard_25.bin",
 
2995
  17920,
2996
  48
2997
  ],
2998
+ "dtype": "float32",
2999
  "format": "f32-to-bf16",
3000
  "nbytes": 1720320,
3001
  "byteOffset": 13762560
 
3005
  "shape": [
3006
  1536
3007
  ],
3008
+ "dtype": "float32",
3009
  "format": "f32-to-bf16",
3010
  "nbytes": 3072,
3011
  "byteOffset": 15482880
 
3015
  "shape": [
3016
  2048
3017
  ],
3018
+ "dtype": "float32",
3019
  "format": "f32-to-bf16",
3020
  "nbytes": 4096,
3021
  "byteOffset": 15485952
 
3037
  2048,
3038
  48
3039
  ],
3040
+ "dtype": "float32",
3041
  "format": "f32-to-bf16",
3042
  "nbytes": 196608,
3043
  "byteOffset": 17062912
 
3059
  1536,
3060
  48
3061
  ],
3062
+ "dtype": "float32",
3063
  "format": "f32-to-bf16",
3064
  "nbytes": 147456,
3065
  "byteOffset": 18439168
 
3069
  "shape": [
3070
  1536
3071
  ],
3072
+ "dtype": "float32",
3073
  "format": "f32-to-bf16",
3074
  "nbytes": 3072,
3075
  "byteOffset": 18586624
 
3091
  1536,
3092
  280
3093
  ],
3094
+ "dtype": "float32",
3095
  "format": "f32-to-bf16",
3096
  "nbytes": 860160,
3097
  "byteOffset": 25470976
3098
  }
3099
  ],
3100
+ "md5sum": "bfd877824ebbe030186527b24a682291"
3101
  },
3102
  {
3103
  "dataPath": "params_shard_26.bin",
 
3121
  17920,
3122
  48
3123
  ],
3124
+ "dtype": "float32",
3125
  "format": "f32-to-bf16",
3126
  "nbytes": 1720320,
3127
  "byteOffset": 13762560
 
3131
  "shape": [
3132
  1536
3133
  ],
3134
+ "dtype": "float32",
3135
  "format": "f32-to-bf16",
3136
  "nbytes": 3072,
3137
  "byteOffset": 15482880
 
3141
  "shape": [
3142
  2048
3143
  ],
3144
+ "dtype": "float32",
3145
  "format": "f32-to-bf16",
3146
  "nbytes": 4096,
3147
  "byteOffset": 15485952
 
3163
  2048,
3164
  48
3165
  ],
3166
+ "dtype": "float32",
3167
  "format": "f32-to-bf16",
3168
  "nbytes": 196608,
3169
  "byteOffset": 17062912
 
3185
  1536,
3186
  48
3187
  ],
3188
+ "dtype": "float32",
3189
  "format": "f32-to-bf16",
3190
  "nbytes": 147456,
3191
  "byteOffset": 18439168
 
3195
  "shape": [
3196
  1536
3197
  ],
3198
+ "dtype": "float32",
3199
  "format": "f32-to-bf16",
3200
  "nbytes": 3072,
3201
  "byteOffset": 18586624
 
3217
  1536,
3218
  280
3219
  ],
3220
+ "dtype": "float32",
3221
  "format": "f32-to-bf16",
3222
  "nbytes": 860160,
3223
  "byteOffset": 25470976
3224
  }
3225
  ],
3226
+ "md5sum": "5190cc309d33d1d245ecf4dfb3561277"
3227
  },
3228
  {
3229
  "dataPath": "params_shard_27.bin",
 
3247
  17920,
3248
  48
3249
  ],
3250
+ "dtype": "float32",
3251
  "format": "f32-to-bf16",
3252
  "nbytes": 1720320,
3253
  "byteOffset": 13762560
 
3257
  "shape": [
3258
  1536
3259
  ],
3260
+ "dtype": "float32",
3261
  "format": "f32-to-bf16",
3262
  "nbytes": 3072,
3263
  "byteOffset": 15482880
 
3267
  "shape": [
3268
  2048
3269
  ],
3270
+ "dtype": "float32",
3271
  "format": "f32-to-bf16",
3272
  "nbytes": 4096,
3273
  "byteOffset": 15485952
 
3289
  2048,
3290
  48
3291
  ],
3292
+ "dtype": "float32",
3293
  "format": "f32-to-bf16",
3294
  "nbytes": 196608,
3295
  "byteOffset": 17062912
 
3311
  1536,
3312
  48
3313
  ],
3314
+ "dtype": "float32",
3315
  "format": "f32-to-bf16",
3316
  "nbytes": 147456,
3317
  "byteOffset": 18439168
 
3321
  "shape": [
3322
  1536
3323
  ],
3324
+ "dtype": "float32",
3325
  "format": "f32-to-bf16",
3326
  "nbytes": 3072,
3327
  "byteOffset": 18586624
 
3343
  1536,
3344
  280
3345
  ],
3346
+ "dtype": "float32",
3347
  "format": "f32-to-bf16",
3348
  "nbytes": 860160,
3349
  "byteOffset": 25470976
3350
  }
3351
  ],
3352
+ "md5sum": "a41c433a5f3b5464204c771aee8e46cd"
3353
  },
3354
  {
3355
  "dataPath": "params_shard_28.bin",
 
3373
  17920,
3374
  48
3375
  ],
3376
+ "dtype": "float32",
3377
  "format": "f32-to-bf16",
3378
  "nbytes": 1720320,
3379
  "byteOffset": 13762560
 
3383
  "shape": [
3384
  1536
3385
  ],
3386
+ "dtype": "float32",
3387
  "format": "f32-to-bf16",
3388
  "nbytes": 3072,
3389
  "byteOffset": 15482880
 
3393
  "shape": [
3394
  2048
3395
  ],
3396
+ "dtype": "float32",
3397
  "format": "f32-to-bf16",
3398
  "nbytes": 4096,
3399
  "byteOffset": 15485952
 
3415
  2048,
3416
  48
3417
  ],
3418
+ "dtype": "float32",
3419
  "format": "f32-to-bf16",
3420
  "nbytes": 196608,
3421
  "byteOffset": 17062912
 
3437
  1536,
3438
  48
3439
  ],
3440
+ "dtype": "float32",
3441
  "format": "f32-to-bf16",
3442
  "nbytes": 147456,
3443
  "byteOffset": 18439168
 
3447
  "shape": [
3448
  1536
3449
  ],
3450
+ "dtype": "float32",
3451
  "format": "f32-to-bf16",
3452
  "nbytes": 3072,
3453
  "byteOffset": 18586624
 
3469
  1536,
3470
  280
3471
  ],
3472
+ "dtype": "float32",
3473
  "format": "f32-to-bf16",
3474
  "nbytes": 860160,
3475
  "byteOffset": 25470976
3476
  }
3477
  ],
3478
+ "md5sum": "3f0295c5456a9e6d8081874334efc174"
3479
  },
3480
  {
3481
  "dataPath": "params_shard_29.bin",
 
3499
  17920,
3500
  48
3501
  ],
3502
+ "dtype": "float32",
3503
  "format": "f32-to-bf16",
3504
  "nbytes": 1720320,
3505
  "byteOffset": 13762560
 
3509
  "shape": [
3510
  1536
3511
  ],
3512
+ "dtype": "float32",
3513
  "format": "f32-to-bf16",
3514
  "nbytes": 3072,
3515
  "byteOffset": 15482880
 
3519
  "shape": [
3520
  2048
3521
  ],
3522
+ "dtype": "float32",
3523
  "format": "f32-to-bf16",
3524
  "nbytes": 4096,
3525
  "byteOffset": 15485952
 
3541
  2048,
3542
  48
3543
  ],
3544
+ "dtype": "float32",
3545
  "format": "f32-to-bf16",
3546
  "nbytes": 196608,
3547
  "byteOffset": 17062912
 
3563
  1536,
3564
  48
3565
  ],
3566
+ "dtype": "float32",
3567
  "format": "f32-to-bf16",
3568
  "nbytes": 147456,
3569
  "byteOffset": 18439168
 
3573
  "shape": [
3574
  1536
3575
  ],
3576
+ "dtype": "float32",
3577
  "format": "f32-to-bf16",
3578
  "nbytes": 3072,
3579
  "byteOffset": 18586624
3580
  }
3581
  ],
3582
+ "md5sum": "fb0092056dc95f77bf851781c4dd259f"
3583
  }
3584
  ]
3585
  }
params_shard_0.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26be12b60ee723962248754e7914f97aa2ca4c0147a43f6be9a3031c41059f05
3
  size 116686848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a17ee8573c3ac6cf90d090d7b72d52ef6124e5ad52ddea9745a5fa9a9358fd01
3
  size 116686848
params_shard_1.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8d092f60318332b4831a385ffd05356d44d63c2d59597d83477091a04986d85
3
  size 22330368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45a38f2269e407cc3e1719a6a50ad468c460a32746073be8df47b5804e510538
3
  size 22330368
params_shard_10.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:62b9350f9e0b718352be0254cb4b6811d5892cf198029c9b62a055660fdfed5c
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f32049d0b4717a3b2481e390fcb7bfd44202eafd4da01e9a79ec76dc57642390
3
  size 26331136
params_shard_11.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4208ad50a01a8c4be7b97645d55238fc78477a32bed78d0578d34f0f94270f80
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2e5b93660083e81599077a124e5f943eb16f462f61e1614cbfbfd24ae27c123
3
  size 26331136
params_shard_12.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de6af8f1a1b01517833f6aae22c038be057919b97bc07a88dc356d5997d39183
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9779a002ed8fc5364d92da63663f2e1c8cd61547785f934d3f4b55776ebf9d14
3
  size 26331136
params_shard_13.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b78aa6b099c7ed207700937df325bea208e22194116fb50b4e39bdde9a96e386
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5a8704525f5bcf916a310022303a7140bb449f9a8bd4f770d40210d9b8daa89
3
  size 26331136
params_shard_14.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8763d5cc7ac41dd2f1078c19c9ccbfd5b80b288098e2d2b90b71353347541b40
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aadb43c2f703d7b39b5eb36dcfe360c5d1b17fe7827962d7ad52549697fa2670
3
  size 26331136
params_shard_15.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb5972f53178c99b9f9f9d16b2110227d7e1ac3a2ecb87cb86895c73b68c53e3
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a037dd0812d6e4259ce64da7dc680c6dc260979012684979780e5a4f4c0d6a3
3
  size 26331136
params_shard_16.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54c0807e5656fc0dd2dd9d0c437617c29b84de450f02a0720633d8d047d4aeee
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d11f0ce0448d17e9660941954d815e079dbf5a1a3110069352197f0ad16e9ab
3
  size 26331136
params_shard_17.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2db91699923981ab99f785c1cd391cc73546a28f355f8b7138cb60838638fcb4
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4499713ef3150f72a2b6ab11c8916a0c1b220e0903de97ac10864968ab73428
3
  size 26331136
params_shard_18.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed4e884e5313b50f6f704f47f2d03bdff5d946a7d6a7d9748ceb2d04dafb0f42
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44fd670a3adf0e21b4a4fbdfe82b62fc96d81a5c2ff2e9f52d001a44fca7bc95
3
  size 26331136
params_shard_19.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff1c0923a3cda87856f7ba2314d02cc6907098317099f2f76895849e4bc983ff
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70e7f36a30f55bcda9459cd7df1ef3695e0bf935cdc4a6c4aea5e6e5216ee58a
3
  size 26331136
params_shard_2.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:726ee471ddd4218f5c41529d9e64790d9cf21602070d6450bb65689e40668e81
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:983e40552dd56f1f4a8c3c0b8e1e1fddc9ca927022cf20b7040a4dd6d22c153e
3
  size 26331136
params_shard_20.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a395755ea6d87332fc7a3fd83cfba76d709c0d5309c6aa3e8dbf45c75cdeb2d4
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d339781e82d267dd6484a0365588f9b261460b4b3cc0b8720d84e845e5a91d5
3
  size 26331136
params_shard_21.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:799bcced27564b193e8ea03797cbfb84c8b1a2c4faeb4989b96fd0ef2ad493dd
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba7b707a0605ada5a1afb1b1bab10fae237ab97fd620c89a335c9240df30c3f1
3
  size 26331136
params_shard_22.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a74937e920b2d62e789eda1ac10e485a531a79be3a111f2d974638d4413cc0f
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c21e1dc09a75c2ccfdb8faf61467c53a89f1527eca79a000f7fb9607bb03d19
3
  size 26331136
params_shard_23.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12c2fa93d94ff0eee00a964d85bd5d6c880d62bb3f464a75c337236dd6357e5d
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1388a64f2f7770c8a020d220253d3cfa007d1b4447fcc48ad75cd8bce6e04c4a
3
  size 26331136
params_shard_24.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:661b3adce899d203e4dc3ac1423d345487868835e0b6a67220bdeae58c97675d
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f25dfd62889d6922d54d6c9577290cdba68143948e7d3665b861d9b2f7e59dbc
3
  size 26331136
params_shard_25.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2030958aff2e036a9b47845b02a71a17d6441c0a5d6e9a7b120231492131047f
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71eaa4bbde84d4f47dbbdb391169aec734c962d1632e41325cae4786bf28b77f
3
  size 26331136
params_shard_26.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edceeaaf1f44d0c214298460fd508b8e025a09ccfb550d04be64e997b067bc8a
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:572ac3661a42654bcf3d0dc84e33efdf020b765e6921bf514da54244a1eed76d
3
  size 26331136
params_shard_27.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1caeed995bf6401545f9273d38e3e95c86ed8acc697d32f9ac5e0a73cbf5e38a
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd228917a0d4e4223ade1c92a5317870a78ee529fa5bf4da4b5e52e2dca46be8
3
  size 26331136
params_shard_28.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6efdfb6f7d564697b75b5205eee11485da1c9ac52308731004a8aade930741c2
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1684f8d027a27911c64335e3b819a887d021572e784df28b4a5bb25816cb86b0
3
  size 26331136
params_shard_29.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae5936416b598d07976e5446fcc7a2ddc82299a3e7647214d0a8251da8668b78
3
  size 18589696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4071fb8813c91e16018c774632f775b88dc234b293e724f2720dfa8fd54a0ced
3
  size 18589696
params_shard_3.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e577c75f188c646bd5034df17373b96ed44bc7a68151e02a415726e74be70d0f
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59730b028a8101aaf15fddbcd12e4e8b1f40f5c330f55304bbf0e563d63fb9d6
3
  size 26331136
params_shard_4.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2ff77c2018f75d4fb1b66603544bc31982864d16d4ffe733691670df5ddd1d8
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2f09b93f68881e147b858bc734dfbf9636903cc1a91cd7f4003bb3c1cb970da
3
  size 26331136
params_shard_5.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e296ab479be35658235ea14ce61f30468312f0ebf7d59abdc90fa25eaa0c67f4
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34962320fa414ade384ea75843bd7df2d45360e579e294e8d8e3657aa8aa5f3c
3
  size 26331136
params_shard_6.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95c7d3fb7e495be364be1b18ec4ce03c3ba69278e05bab2553fd533b5bc9069b
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92454d901ea686762344b8934e9bfa7f9fe4a5d12b343bd2b828b5dea27e4d2d
3
  size 26331136
params_shard_7.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce468b379b9a165d6b9d9985d4691c6e817af06059d7ad167fd4c25ab7a037ed
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4d84d0871ac93862252e801a69259612d8ae6bb36126bf390b7e476fdc079d7
3
  size 26331136
params_shard_8.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4fb5e2c93370f302460692d83c77f6aac64d48b9ff3d24fd0b99dcf61ecbb66
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd5b798b1f7101d8b35fdf4eb34c949f489accffca112a1c8dd63c506ff8ea86
3
  size 26331136
params_shard_9.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97c9e13b0c783b160ea86fa863344c969fe4bc26b9a1525016cc06000e1c9753
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:722e71f6aca4fe7f543dbd00510309c8b7b8ec4edc467616c71efac1d8763c75
3
  size 26331136