File tree
13 files changed
+537
-39
lines changed- recipes
- configs/llama4
- torchtune
- models/llama4
- modules
- moe
- training
- utils
13 files changed
+537
-39
lines changedLines changed: 19 additions & 6 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
18 | 18 |
| |
19 | 19 |
| |
20 | 20 |
| |
21 |
| - | |
| 21 | + | |
22 | 22 |
| |
23 | 23 |
| |
24 | 24 |
| |
| |||
74 | 74 |
| |
75 | 75 |
| |
76 | 76 |
| |
77 |
| - | |
78 |
| - | |
79 |
| - | |
80 |
| - | |
| 77 | + | |
| 78 | + | |
| 79 | + | |
| 80 | + | |
81 | 81 |
| |
82 | 82 |
| |
83 | 83 |
| |
| |||
93 | 93 |
| |
94 | 94 |
| |
95 | 95 |
| |
96 |
| - | |
| 96 | + | |
| 97 | + | |
| 98 | + | |
| 99 | + | |
| 100 | + | |
| 101 | + | |
| 102 | + | |
| 103 | + | |
| 104 | + | |
| 105 | + | |
| 106 | + | |
| 107 | + | |
| 108 | + | |
| 109 | + |
Lines changed: 40 additions & 3 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
16 | 16 |
| |
17 | 17 |
| |
18 | 18 |
| |
| 19 | + | |
19 | 20 |
| |
20 | 21 |
| |
21 | 22 |
| |
| |||
147 | 148 |
| |
148 | 149 |
| |
149 | 150 |
| |
| 151 | + | |
| 152 | + | |
| 153 | + | |
| 154 | + | |
150 | 155 |
| |
151 | 156 |
| |
152 | 157 |
| |
| |||
328 | 333 |
| |
329 | 334 |
| |
330 | 335 |
| |
| 336 | + | |
| 337 | + | |
| 338 | + | |
331 | 339 |
| |
332 | 340 |
| |
333 | 341 |
| |
| |||
343 | 351 |
| |
344 | 352 |
| |
345 | 353 |
| |
346 |
| - | |
| 354 | + | |
347 | 355 |
| |
348 | 356 |
| |
349 | 357 |
| |
| |||
380 | 388 |
| |
381 | 389 |
| |
382 | 390 |
| |
| 391 | + | |
383 | 392 |
| |
384 | 393 |
| |
385 | 394 |
| |
| |||
413 | 422 |
| |
414 | 423 |
| |
415 | 424 |
| |
416 |
| - | |
| 425 | + | |
417 | 426 |
| |
418 | 427 |
| |
419 | 428 |
| |
| |||
586 | 595 |
| |
587 | 596 |
| |
588 | 597 |
| |
589 |
| - | |
| 598 | + | |
590 | 599 |
| |
591 | 600 |
| |
592 | 601 |
| |
| |||
810 | 819 |
| |
811 | 820 |
| |
812 | 821 |
| |
| 822 | + | |
813 | 823 |
| |
814 | 824 |
| |
815 | 825 |
| |
| |||
820 | 830 |
| |
821 | 831 |
| |
822 | 832 |
| |
| 833 | + | |
823 | 834 |
| |
824 | 835 |
| |
825 | 836 |
| |
| |||
895 | 906 |
| |
896 | 907 |
| |
897 | 908 |
| |
| 909 | + | |
| 910 | + | |
| 911 | + | |
898 | 912 |
| |
899 | 913 |
| |
900 | 914 |
| |
| |||
916 | 930 |
| |
917 | 931 |
| |
918 | 932 |
| |
| 933 | + | |
919 | 934 |
| |
| 935 | + | |
920 | 936 |
| |
921 | 937 |
| |
922 | 938 |
| |
| |||
1068 | 1084 |
| |
1069 | 1085 |
| |
1070 | 1086 |
| |
| 1087 | + | |
| 1088 | + | |
| 1089 | + | |
| 1090 | + | |
| 1091 | + | |
| 1092 | + | |
| 1093 | + | |
| 1094 | + | |
| 1095 | + | |
| 1096 | + | |
| 1097 | + | |
| 1098 | + | |
| 1099 | + | |
| 1100 | + | |
| 1101 | + | |
| 1102 | + | |
| 1103 | + | |
| 1104 | + | |
| 1105 | + | |
| 1106 | + | |
1071 | 1107 |
| |
1072 | 1108 |
| |
1073 | 1109 |
| |
| |||
1081 | 1117 |
| |
1082 | 1118 |
| |
1083 | 1119 |
| |
| 1120 | + | |
1084 | 1121 |
| |
1085 | 1122 |
| |
1086 | 1123 |
| |
|
Lines changed: 10 additions & 2 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
38 | 38 |
| |
39 | 39 |
| |
40 | 40 |
| |
| 41 | + | |
41 | 42 |
| |
42 | 43 |
| |
43 | 44 |
| |
| |||
180 | 181 |
| |
181 | 182 |
| |
182 | 183 |
| |
| 184 | + | |
183 | 185 |
| |
184 | 186 |
| |
185 | 187 |
| |
| |||
244 | 246 |
| |
245 | 247 |
| |
246 | 248 |
| |
| 249 | + | |
| 250 | + | |
| 251 | + | |
| 252 | + | |
| 253 | + | |
247 | 254 |
| |
248 | 255 |
| |
249 | 256 |
| |
| |||
263 | 270 |
| |
264 | 271 |
| |
265 | 272 |
| |
266 |
| - | |
267 | 273 |
| |
268 | 274 |
| |
269 | 275 |
| |
| |||
300 | 306 |
| |
301 | 307 |
| |
302 | 308 |
| |
| 309 | + | |
303 | 310 |
| |
304 | 311 |
| |
305 | 312 |
| |
| |||
355 | 362 |
| |
356 | 363 |
| |
357 | 364 |
| |
| 365 | + | |
358 | 366 |
| |
359 | 367 |
| |
360 | 368 |
| |
| |||
631 | 639 |
| |
632 | 640 |
| |
633 | 641 |
| |
| 642 | + | |
634 | 643 |
| |
635 | 644 |
| |
636 | 645 |
| |
| |||
649 | 658 |
| |
650 | 659 |
| |
651 | 660 |
| |
652 |
| - | |
653 | 661 |
| |
654 | 662 |
| |
655 | 663 |
| |
|
Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
47 | 47 |
| |
48 | 48 |
| |
49 | 49 |
| |
50 |
| - | |
| 50 | + | |
51 | 51 |
| |
52 | 52 |
| |
53 | 53 |
| |
|
Lines changed: 60 additions & 20 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
13 | 13 |
| |
14 | 14 |
| |
15 | 15 |
| |
| 16 | + | |
| 17 | + | |
| 18 | + | |
| 19 | + | |
| 20 | + | |
16 | 21 |
| |
17 | 22 |
| |
18 | 23 |
| |
| |||
31 | 36 |
| |
32 | 37 |
| |
33 | 38 |
| |
| 39 | + | |
34 | 40 |
| |
35 | 41 |
| |
36 | 42 |
| |
| |||
39 | 45 |
| |
40 | 46 |
| |
41 | 47 |
| |
| 48 | + | |
| 49 | + | |
42 | 50 |
| |
43 | 51 |
| |
44 | 52 |
| |
| |||
50 | 58 |
| |
51 | 59 |
| |
52 | 60 |
| |
| 61 | + | |
53 | 62 |
| |
54 | 63 |
| |
55 | 64 |
| |
| |||
64 | 73 |
| |
65 | 74 |
| |
66 | 75 |
| |
67 |
| - | |
68 |
| - | |
69 |
| - | |
70 |
| - | |
71 |
| - | |
72 |
| - | |
73 |
| - | |
74 |
| - | |
75 |
| - | |
76 |
| - | |
77 |
| - | |
78 |
| - | |
79 |
| - | |
80 |
| - | |
| 76 | + | |
| 77 | + | |
| 78 | + | |
| 79 | + | |
| 80 | + | |
| 81 | + | |
| 82 | + | |
| 83 | + | |
| 84 | + | |
| 85 | + | |
| 86 | + | |
81 | 87 |
| |
82 |
| - | |
83 |
| - | |
84 |
| - | |
85 |
| - | |
86 |
| - | |
87 |
| - | |
| 88 | + | |
| 89 | + | |
| 90 | + | |
| 91 | + | |
| 92 | + | |
| 93 | + | |
| 94 | + | |
| 95 | + | |
| 96 | + | |
| 97 | + | |
| 98 | + | |
| 99 | + | |
| 100 | + | |
| 101 | + | |
| 102 | + | |
88 | 103 |
| |
| 104 | + | |
| 105 | + | |
| 106 | + | |
| 107 | + | |
| 108 | + | |
| 109 | + | |
| 110 | + | |
| 111 | + | |
| 112 | + | |
| 113 | + | |
| 114 | + | |
| 115 | + | |
| 116 | + | |
| 117 | + | |
| 118 | + | |
| 119 | + | |
| 120 | + | |
| 121 | + | |
| 122 | + | |
| 123 | + | |
| 124 | + | |
| 125 | + | |
| 126 | + | |
| 127 | + | |
| 128 | + | |
89 | 129 |
| |
90 | 130 |
| |
91 | 131 |
| |
|
0 commit comments