dacorvo HF Staff committed on
Commit
675ddb6
·
verified ·
1 Parent(s): f611e3d

Synchronizing local compiler cache.

Browse files
This view is limited to 50 files because the commit contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +19 -0
  2. neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/compile_flags.json +1 -0
  3. neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.done +0 -0
  4. neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.hlo_module.pb +3 -0
  5. neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.neff +3 -0
  6. neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/compile_flags.json +1 -0
  7. neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.done +0 -0
  8. neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.hlo_module.pb +3 -0
  9. neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.neff +3 -0
  10. neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/compile_flags.json +1 -0
  11. neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.done +0 -0
  12. neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.hlo_module.pb +3 -0
  13. neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.neff +3 -0
  14. neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/compile_flags.json +1 -0
  15. neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.done +0 -0
  16. neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.hlo_module.pb +3 -0
  17. neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.neff +3 -0
  18. neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/wrapped_neff.hlo +3 -0
  19. neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/compile_flags.json +1 -0
  20. neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.done +0 -0
  21. neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.hlo_module.pb +3 -0
  22. neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.neff +3 -0
  23. neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/compile_flags.json +1 -0
  24. neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.done +0 -0
  25. neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.hlo_module.pb +3 -0
  26. neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.neff +3 -0
  27. neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/compile_flags.json +1 -0
  28. neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.done +0 -0
  29. neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.hlo_module.pb +3 -0
  30. neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.neff +3 -0
  31. neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/compile_flags.json +1 -0
  32. neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.done +0 -0
  33. neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.hlo_module.pb +3 -0
  34. neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.neff +3 -0
  35. neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/wrapped_neff.hlo +3 -0
  36. neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/compile_flags.json +1 -0
  37. neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.done +0 -0
  38. neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.hlo_module.pb +3 -0
  39. neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.neff +3 -0
  40. neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/compile_flags.json +1 -0
  41. neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.done +0 -0
  42. neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.hlo_module.pb +3 -0
  43. neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.neff +3 -0
  44. neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/wrapped_neff.hlo +3 -0
  45. neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/compile_flags.json +1 -0
  46. neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.done +0 -0
  47. neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.hlo_module.pb +3 -0
  48. neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.neff +3 -0
  49. neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/wrapped_neff.hlo +3 -0
  50. neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev2/llama/meta-llama/Llama-3.1-8B-Instruct/3f2788536ce52a84f6c0.json +62 -0
.gitattributes CHANGED
@@ -5687,3 +5687,22 @@ neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/model.neff
5687
  neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
5688
  neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
5689
  neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5687
  neuronxcc-2.21.33363.0+82129205/MODULE_e54f2eec2036cfaa2527+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
5688
  neuronxcc-2.21.33363.0+82129205/MODULE_ebda959e0a7e1b1b3d41+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
5689
  neuronxcc-2.21.33363.0+82129205/MODULE_ed0ddf13430a2a717168+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
5690
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text
5691
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text
5692
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text
5693
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text
5694
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
5695
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text
5696
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text
5697
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text
5698
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text
5699
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
5700
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text
5701
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text
5702
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
5703
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text
5704
+ neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
5705
+ neuronxcc-2.21.33363.0+82129205/MODULE_818bc30ba0942fe4c3d6+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
5706
+ neuronxcc-2.21.33363.0+82129205/MODULE_adf2c812522e586cea39+24129607/model.neff filter=lfs diff=lfs merge=lfs -text
5707
+ neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text
5708
+ neuronxcc-2.21.33363.0+82129205/MODULE_ccc2d4abbb67d5b7286f+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17c096a64f827fc570914bd877c33bb2b6d4b1afd2313a82e249d70da338f146
3
+ size 936785
neuronxcc-2.21.18209.0+043b1bf7/MODULE_0654da519a1110a6aad4+ad9e832d/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c15732a812350a3a27aeace7738a30c6027911be1dc5e6a5d896ff890d7c00e
3
+ size 11561984
neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05c5f09f68c1912103423eeb9d56a58404f0c6fdddbe1816e7c33073e659a2cb
3
+ size 726384
neuronxcc-2.21.18209.0+043b1bf7/MODULE_06e58c7a469128c652b5+ad9e832d/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d68ad0966b1e9e7ea97f6212f6275741342159f8b013adca888b4ed2564a7a4c
3
+ size 492544
neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb5bd8e78159ccce3eae8b4e36beb1bc30d66f673c8c4d01b80e818f0e5483cf
3
+ size 678558
neuronxcc-2.21.18209.0+043b1bf7/MODULE_3cb9043f67e6b5a9acbf+ad9e832d/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93a4c486f03a6855de565b9571babfa47a4f214c4242a94445cc972c72dfedf5
3
+ size 1659904
neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76aa5bdd9171b91554e3461102196b55b4a8f7453a965cdc9e9c89b9746deda7
3
+ size 747576
neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:405817d784b623c7bc20cb7ce54f7d65ed8a737226de9755f081bf73b10c95e0
3
+ size 3113984
neuronxcc-2.21.18209.0+043b1bf7/MODULE_4262eabf33a3b2c61448+617f6939/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95fb219447af7158351ee48861dbcfbffd673c4fb243778edef7c658333a80f0
3
+ size 3299472
neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7889bc62e8dcef2a8de07ab0712acd532c2d6f207defd057f42dc19a58a0dc7
3
+ size 983272
neuronxcc-2.21.18209.0+043b1bf7/MODULE_57d02543ed097317eb38+ad9e832d/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fee37fa3f3fd8eb8db0f8f866970dfdccc1d45a71c42a03a5da62f6ff16ea6a2
3
+ size 11981824
neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97fb1218b3b85f5e1750c92b0b95e18b2f0fff0dbe607f1c8307ff625175c782
3
+ size 598800
neuronxcc-2.21.18209.0+043b1bf7/MODULE_6df16d281c8d34e7b8c8+ad9e832d/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:789d0cd4da08ab7421274e55250c231edd04c5dab1294fedc165ce26e13ef622
3
+ size 297984
neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e7683c211dc0af38826ebf6230b77d074a161cee9ec7cb1479cbed80886141d
3
+ size 879322
neuronxcc-2.21.18209.0+043b1bf7/MODULE_7776165b0d0d23f46d32+ad9e832d/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:359e60c0c6954b4b1e41353841731e1af857fcdfae77175beede8434fa5b0b4f
3
+ size 11664384
neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5071a7599bf37c6e189b6187158a0179ccca7462c9dffd2a1c7bd8018789229d
3
+ size 764473
neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:314b069eebb2613c82e93cdce1a0e1e98cc3f8b83d87c475b1be547e9b715902
3
+ size 8397824
neuronxcc-2.21.18209.0+043b1bf7/MODULE_8d519e024abae9bbf305+617f6939/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc685dbef59db678dce409552323ab8686c2f8181be35c3a56d908b079d65c6b
3
+ size 8583322
neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67a1aedb62ddf41c80dc68cc5012e85a308184096cc91161a0b8c3722ed7e519
3
+ size 667112
neuronxcc-2.21.18209.0+043b1bf7/MODULE_da7e97c0c4b45f3b3821+ad9e832d/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c8b0200b2ad3b8eab8b71726ba5c3f59f83e8e5fb23c82e56699848db128fce
3
+ size 451584
neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:005f593253160ac83985c31e41ad06d4e8ef8abb217eabd8f83f8616b96d0fcc
3
+ size 623022
neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c9ddd19d822c930094daf4f23fe71ba2ef0752147d8d2f02c968f84b64b932a
3
+ size 1537024
neuronxcc-2.21.18209.0+043b1bf7/MODULE_de35c230ea0abd3360a7+617f6939/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:777da8f3b00fbf3c274133ae4405c17c52d5d2942b92d8423bc02639d1b597f5
3
+ size 1720482
neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"]
neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.done ADDED
File without changes
neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7707b4ae5ae2b0aafdac9c76d4726c1969cbe176743da0ce7d7ad494ae57b7f
3
+ size 743609
neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1816edc19a32a1152161f05f69ee58a6289d6a4bef3c10b547245abd13e8333
3
+ size 2970624
neuronxcc-2.21.18209.0+043b1bf7/MODULE_fede9e304a150a635925+617f6939/wrapped_neff.hlo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41cca0b61d997d19bcb4eb7bf9d5d2b64b1e0ed7c572644b2097d98b1b2c918b
3
+ size 3155208
neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.3.dev2/llama/meta-llama/Llama-3.1-8B-Instruct/3f2788536ce52a84f6c0.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_entry_class": "SingleModelCacheEntry",
3
+ "_model_id": "meta-llama/Llama-3.1-8B-Instruct",
4
+ "_task": "text-generation",
5
+ "architectures": [
6
+ "LlamaForCausalLM"
7
+ ],
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "bfloat16",
11
+ "head_dim": 128,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 4096,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 14336,
16
+ "max_position_embeddings": 131072,
17
+ "mlp_bias": false,
18
+ "model_type": "llama",
19
+ "neuron": {
20
+ "_serialized_key": "NxDNeuronConfig",
21
+ "batch_size": 1,
22
+ "capacity_factor": null,
23
+ "checkpoint_id": "meta-llama/Llama-3.1-8B-Instruct",
24
+ "checkpoint_revision": "0e9e39f249a16976918f6564b8830bc894c89659",
25
+ "continuous_batching": false,
26
+ "ep_degree": 1,
27
+ "fused_qkv": true,
28
+ "glu_mlp": true,
29
+ "local_ranks_size": 8,
30
+ "max_batch_size": 1,
31
+ "max_context_length": 16384,
32
+ "max_topk": 256,
33
+ "n_active_tokens": 16384,
34
+ "neuronxcc_version": "2.21.33363.0+82129205",
35
+ "on_device_sampling": true,
36
+ "optimum_neuron_version": "0.4.3.dev2",
37
+ "output_logits": false,
38
+ "pp_degree": 1,
39
+ "sequence_length": 16384,
40
+ "speculation_length": 0,
41
+ "start_rank_id": 0,
42
+ "target": "trn1",
43
+ "torch_dtype": "bfloat16",
44
+ "tp_degree": 8
45
+ },
46
+ "num_attention_heads": 32,
47
+ "num_hidden_layers": 32,
48
+ "num_key_value_heads": 8,
49
+ "pretraining_tp": 1,
50
+ "rms_norm_eps": 1e-05,
51
+ "rope_scaling": {
52
+ "factor": 8.0,
53
+ "high_freq_factor": 4.0,
54
+ "low_freq_factor": 1.0,
55
+ "original_max_position_embeddings": 8192,
56
+ "rope_type": "llama3"
57
+ },
58
+ "rope_theta": 500000.0,
59
+ "tie_word_embeddings": false,
60
+ "use_cache": true,
61
+ "vocab_size": 128256
62
+ }