zaydzuhri committed on
Commit
b81ca23
·
verified ·
1 Parent(s): 7aa3a52

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because the commit contains too many changes. See the raw diff.
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. model.safetensors +3 -0
  3. profile_trace/iteration_10752/rank0_trace.json +0 -0
  4. profile_trace/iteration_10752/rank4_trace.json +0 -0
  5. profile_trace/iteration_11776/rank1_trace.json +0 -0
  6. profile_trace/iteration_12288/rank0_trace.json +0 -0
  7. profile_trace/iteration_12288/rank2_trace.json +0 -0
  8. profile_trace/iteration_12288/rank4_trace.json +0 -0
  9. profile_trace/iteration_12288/rank6_trace.json +0 -0
  10. profile_trace/iteration_12288/rank7_trace.json +0 -0
  11. profile_trace/iteration_16384/rank3_trace.json +0 -0
  12. profile_trace/iteration_16384/rank4_trace.json +0 -0
  13. profile_trace/iteration_16384/rank7_trace.json +0 -0
  14. profile_trace/iteration_19968/rank5_trace.json +0 -0
  15. profile_trace/iteration_19968/rank7_trace.json +0 -0
  16. profile_trace/iteration_21504/rank0_trace.json +0 -0
  17. profile_trace/iteration_22016/rank1_trace.json +0 -0
  18. profile_trace/iteration_22016/rank2_trace.json +0 -0
  19. profile_trace/iteration_22016/rank3_trace.json +0 -0
  20. profile_trace/iteration_22016/rank4_trace.json +0 -0
  21. profile_trace/iteration_22016/rank6_trace.json +0 -0
  22. profile_trace/iteration_22016/rank7_trace.json +0 -0
  23. profile_trace/iteration_22528/rank0_trace.json +0 -0
  24. profile_trace/iteration_22528/rank1_trace.json +0 -0
  25. profile_trace/iteration_22528/rank3_trace.json +0 -0
  26. profile_trace/iteration_22528/rank4_trace.json +0 -0
  27. profile_trace/iteration_22528/rank6_trace.json +0 -0
  28. profile_trace/iteration_22528/rank7_trace.json +0 -0
  29. profile_trace/iteration_25088/rank6_trace.json +0 -0
  30. profile_trace/iteration_26112/rank2_trace.json +0 -0
  31. profile_trace/iteration_26112/rank3_trace.json +0 -0
  32. profile_trace/iteration_26112/rank4_trace.json +0 -0
  33. profile_trace/iteration_26112/rank6_trace.json +0 -0
  34. profile_trace/iteration_26112/rank7_trace.json +0 -0
  35. profile_trace/iteration_32768/rank0_trace.json +0 -0
  36. profile_trace/iteration_32768/rank1_trace.json +0 -0
  37. profile_trace/iteration_32768/rank2_trace.json +0 -0
  38. profile_trace/iteration_32768/rank3_trace.json +0 -0
  39. profile_trace/iteration_32768/rank4_trace.json +0 -0
  40. profile_trace/iteration_32768/rank5_trace.json +0 -0
  41. profile_trace/iteration_32768/rank6_trace.json +0 -0
  42. profile_trace/iteration_32768/rank7_trace.json +0 -0
  43. profile_trace/iteration_37376/rank0_trace.json +0 -0
  44. profile_trace/iteration_37376/rank2_trace.json +0 -0
  45. profile_trace/iteration_37376/rank3_trace.json +0 -0
  46. profile_trace/iteration_37376/rank5_trace.json +0 -0
  47. profile_trace/iteration_37376/rank7_trace.json +0 -0
  48. profile_trace/iteration_39936/rank0_trace.json +0 -0
  49. profile_trace/iteration_39936/rank1_trace.json +0 -0
  50. profile_trace/iteration_39936/rank2_trace.json +0 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tb/20250709-1334/wandb/run-20250709_133455-mtp_transformer-mtp.340M.batch16.seqlen4096.context4096.warmup1000.update1.steps100000.lr3e-4.cosine-202507091329/run-mtp_transformer-mtp.340M.batch16.seqlen4096.context4096.warmup1000.update1.steps100000.lr3e-4.cosine-202507091329.wandb filter=lfs diff=lfs merge=lfs -text
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81133403ae76d33217d5cc2540ac62bcc532fd211c948ae25740372a2c21c593
3
+ size 1495494112
profile_trace/iteration_10752/rank0_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_10752/rank4_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_11776/rank1_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_12288/rank0_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_12288/rank2_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_12288/rank4_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_12288/rank6_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_12288/rank7_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_16384/rank3_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_16384/rank4_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_16384/rank7_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_19968/rank5_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_19968/rank7_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_21504/rank0_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22016/rank1_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22016/rank2_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22016/rank3_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22016/rank4_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22016/rank6_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22016/rank7_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22528/rank0_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22528/rank1_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22528/rank3_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22528/rank4_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22528/rank6_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_22528/rank7_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_25088/rank6_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_26112/rank2_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_26112/rank3_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_26112/rank4_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_26112/rank6_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_26112/rank7_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_32768/rank0_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_32768/rank1_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_32768/rank2_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_32768/rank3_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_32768/rank4_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_32768/rank5_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_32768/rank6_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_32768/rank7_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_37376/rank0_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_37376/rank2_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_37376/rank3_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_37376/rank5_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_37376/rank7_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_39936/rank0_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_39936/rank1_trace.json ADDED
The diff for this file is too large to render. See raw diff
 
profile_trace/iteration_39936/rank2_trace.json ADDED
The diff for this file is too large to render. See raw diff