hyunsikc commited on
Commit
f274dbe
·
verified ·
1 Parent(s): 23cfbe0

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +36 -0
  2. 1129bce53d3d1ee5a8f977a0806f1f46.edf +3 -0
  3. 137d10656805f6f8bc18c24d6f91d9c5.edf +3 -0
  4. 14c1a2095eb9c3a506e9626f128a66cf.edf +3 -0
  5. 1e2ed7604bb259726ca13f29add32333.edf +3 -0
  6. 1ed55b4780a08696d73ce7879b62802d.edf +3 -0
  7. 25abc103ddf44d724373ff2f36432ec7.edf +3 -0
  8. 25d8f41fa7286a7890ecab1bfe3c2773.edf +3 -0
  9. 2d1ff096fac5f7369d4fe0df06ea9350.edf +3 -0
  10. 35e702f367369ea52eaa1340e9468777.edf +3 -0
  11. 3720b13705fc725d18a2226a5aa53054.edf +3 -0
  12. 48a2cfb22464b00526ea1aa027af6c0c.edf +3 -0
  13. 4bdbfe24d81eb397adad8bf7a1914f4d.edf +3 -0
  14. 58d3a49ca251bd09d8a562ee46b36db4.edf +3 -0
  15. 5b138d280525401763559084fb14da81.edf +3 -0
  16. 610270bc5c975f554829183d913e5bc7.edf +3 -0
  17. 6b29f1caa7f2cd692f042a87256a36e0.edf +3 -0
  18. 6b908b290b8ca1a76889bc4b178b9856.edf +3 -0
  19. 6f21938bfb4069ed906a1da74dd57178.edf +3 -0
  20. 7109f6f7354167d3d4b1891a6214f639.edf +3 -0
  21. 7448d72a5fda7547fe9ad2b6f3ad97c7.edf +3 -0
  22. 8410ae84799fc187448af43b3dc6a8d6.edf +3 -0
  23. 8c154ca0f99ba80642cd90f0287ef820.edf +3 -0
  24. 8ea114c1cd9f77b4d76203fa38968343.edf +3 -0
  25. 90098b75e19f46042ea7d3d8b4674c0b.edf +3 -0
  26. 963ad0449b698838213ebd9cacee4ac0.edf +3 -0
  27. 9d656d7523cb06049b60978fcfda0ce6.edf +3 -0
  28. LICENSE +202 -0
  29. README.md +65 -0
  30. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1024-0.safetensors +3 -0
  31. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1152-0.safetensors +3 -0
  32. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1280-0.safetensors +3 -0
  33. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1408-0.safetensors +3 -0
  34. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1536-0.safetensors +3 -0
  35. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1664-0.safetensors +3 -0
  36. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1920-0.safetensors +3 -0
  37. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn512-0.safetensors +3 -0
  38. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn768-0.safetensors +3 -0
  39. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn896-0.safetensors +3 -0
  40. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv2047-b128-attn2048-0.safetensors +3 -0
  41. add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv2047-b64-attn2048-0.safetensors +3 -0
  42. added_tokens.json +146 -0
  43. artifact.json +0 -0
  44. bd08125c4282ab1fe0c8772d973554a8.edf +3 -0
  45. c43b1888e8cf33792e1d6887c3df03bd.edf +3 -0
  46. c7f564baab300a5c527cd066d6e4c425.edf +3 -0
  47. ce58ee1c4d1f21799982509932512df0.edf +3 -0
  48. ce6abc136515c0a87e2214d4b762465c.edf +3 -0
  49. config.json +42 -0
  50. de2b0ec73c43d254f53398576cde487e.edf +3 -0
.gitattributes CHANGED
@@ -33,3 +33,39 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ c43b1888e8cf33792e1d6887c3df03bd.edf filter=lfs diff=lfs merge=lfs -text
37
+ ce58ee1c4d1f21799982509932512df0.edf filter=lfs diff=lfs merge=lfs -text
38
+ 7109f6f7354167d3d4b1891a6214f639.edf filter=lfs diff=lfs merge=lfs -text
39
+ bd08125c4282ab1fe0c8772d973554a8.edf filter=lfs diff=lfs merge=lfs -text
40
+ 1e2ed7604bb259726ca13f29add32333.edf filter=lfs diff=lfs merge=lfs -text
41
+ 2d1ff096fac5f7369d4fe0df06ea9350.edf filter=lfs diff=lfs merge=lfs -text
42
+ ff1369bcc7b47669dfd8a1baad2f11d5.edf filter=lfs diff=lfs merge=lfs -text
43
+ 48a2cfb22464b00526ea1aa027af6c0c.edf filter=lfs diff=lfs merge=lfs -text
44
+ c7f564baab300a5c527cd066d6e4c425.edf filter=lfs diff=lfs merge=lfs -text
45
+ 610270bc5c975f554829183d913e5bc7.edf filter=lfs diff=lfs merge=lfs -text
46
+ 14c1a2095eb9c3a506e9626f128a66cf.edf filter=lfs diff=lfs merge=lfs -text
47
+ 963ad0449b698838213ebd9cacee4ac0.edf filter=lfs diff=lfs merge=lfs -text
48
+ 6b29f1caa7f2cd692f042a87256a36e0.edf filter=lfs diff=lfs merge=lfs -text
49
+ 8410ae84799fc187448af43b3dc6a8d6.edf filter=lfs diff=lfs merge=lfs -text
50
+ 8c154ca0f99ba80642cd90f0287ef820.edf filter=lfs diff=lfs merge=lfs -text
51
+ 6f21938bfb4069ed906a1da74dd57178.edf filter=lfs diff=lfs merge=lfs -text
52
+ 25abc103ddf44d724373ff2f36432ec7.edf filter=lfs diff=lfs merge=lfs -text
53
+ 35e702f367369ea52eaa1340e9468777.edf filter=lfs diff=lfs merge=lfs -text
54
+ 5b138d280525401763559084fb14da81.edf filter=lfs diff=lfs merge=lfs -text
55
+ 137d10656805f6f8bc18c24d6f91d9c5.edf filter=lfs diff=lfs merge=lfs -text
56
+ 9d656d7523cb06049b60978fcfda0ce6.edf filter=lfs diff=lfs merge=lfs -text
57
+ 58d3a49ca251bd09d8a562ee46b36db4.edf filter=lfs diff=lfs merge=lfs -text
58
+ 4bdbfe24d81eb397adad8bf7a1914f4d.edf filter=lfs diff=lfs merge=lfs -text
59
+ 3720b13705fc725d18a2226a5aa53054.edf filter=lfs diff=lfs merge=lfs -text
60
+ f3644e9896baca7db2dd9c9a3b41b527.edf filter=lfs diff=lfs merge=lfs -text
61
+ fd9ffdee553b8d6e7fec5bbdead5da26.edf filter=lfs diff=lfs merge=lfs -text
62
+ 7448d72a5fda7547fe9ad2b6f3ad97c7.edf filter=lfs diff=lfs merge=lfs -text
63
+ 8ea114c1cd9f77b4d76203fa38968343.edf filter=lfs diff=lfs merge=lfs -text
64
+ 6b908b290b8ca1a76889bc4b178b9856.edf filter=lfs diff=lfs merge=lfs -text
65
+ 1129bce53d3d1ee5a8f977a0806f1f46.edf filter=lfs diff=lfs merge=lfs -text
66
+ 90098b75e19f46042ea7d3d8b4674c0b.edf filter=lfs diff=lfs merge=lfs -text
67
+ 25d8f41fa7286a7890ecab1bfe3c2773.edf filter=lfs diff=lfs merge=lfs -text
68
+ 1ed55b4780a08696d73ce7879b62802d.edf filter=lfs diff=lfs merge=lfs -text
69
+ f919d50f5fa4992d3ccbc407db54ec0b.edf filter=lfs diff=lfs merge=lfs -text
70
+ ce6abc136515c0a87e2214d4b762465c.edf filter=lfs diff=lfs merge=lfs -text
71
+ de2b0ec73c43d254f53398576cde487e.edf filter=lfs diff=lfs merge=lfs -text
1129bce53d3d1ee5a8f977a0806f1f46.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02ecfc0b2936d10c289ccb44f4b67f6377e773eb78a8aa31a430fff3f2f3ea74
3
+ size 1068267
137d10656805f6f8bc18c24d6f91d9c5.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05a4ee59abd97b9018fa64f33972ac8e22c1d8f0b5abfd40f655989049b31a58
3
+ size 1624630
14c1a2095eb9c3a506e9626f128a66cf.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b67736a43be84026ae7ec2972e8e3e0c444b1b8e2f5c5fb040154be1f8e214f
3
+ size 955320
1e2ed7604bb259726ca13f29add32333.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a662f61df1bda111f77112955335e8ca0fa24e9527914145a31108fd5d40ffb7
3
+ size 1389965
1ed55b4780a08696d73ce7879b62802d.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33f6f49ce31d61f7c95b1baf7afde0ccb755133b7964a36eac61ad925680f9e0
3
+ size 2074119
25abc103ddf44d724373ff2f36432ec7.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:738751bf906f45cac23a4daea7d1c6aca6b53c907854f77cb961ce6fe75be7d6
3
+ size 967877
25d8f41fa7286a7890ecab1bfe3c2773.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eb2ef6485d825f6c6d0e14d133044ea5ff3f9ae1239be8cb71d8f99813a0d7c
3
+ size 3176056
2d1ff096fac5f7369d4fe0df06ea9350.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcdcf223d7db96b11a726c9ef05bb76495971fa8bb2cab54225d4b4afbd3a876
3
+ size 1419750
35e702f367369ea52eaa1340e9468777.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5444031f8b27327bdc14e28bc2df8b6bec58580020c20729d2e2ba1754752bc
3
+ size 1484768
3720b13705fc725d18a2226a5aa53054.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0347dd4e2ef5d5a5bd8447f1e43fe52b6e9d400aec9ea68e484453774bc90cc
3
+ size 931650
48a2cfb22464b00526ea1aa027af6c0c.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b7ee0a839ce3f6f8516354646ccfc83e85768a68adf8eefd85c341839e4c5ee
3
+ size 1108370
4bdbfe24d81eb397adad8bf7a1914f4d.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7b5f040629ed0eaae685aec610fc70fa7d25214f5690bcbb3a88258d5cfbe54
3
+ size 1752034
58d3a49ca251bd09d8a562ee46b36db4.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:046ffb1fa53c15b5e870d5369d8a09982bee67f27d42d5a019634c5a4b05cde6
3
+ size 1221167
5b138d280525401763559084fb14da81.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83be8fcc0a2821477dfe5f7fe059df8b4385f7b7f2a6fb0da0d4df55092b5d1c
3
+ size 1293126
610270bc5c975f554829183d913e5bc7.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6b8a7bd6aa308dc02155bbc49018e5e88575c33bfc114831b17018f6fb044d2
3
+ size 996175
6b29f1caa7f2cd692f042a87256a36e0.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:022b6b7892396b060fa6abb2b355b59984d2bffbcd8e455ef89b0396994bac75
3
+ size 1101339
6b908b290b8ca1a76889bc4b178b9856.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2bdd19e9ae2e22c0b33f49ff0a78cfe8674f31af25bfd61563ad65b1e2a4d00
3
+ size 998138
6f21938bfb4069ed906a1da74dd57178.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecd079bdd281ba20809c0aa057a1a99b7b737c0bf9ff537d1395bb341fd153e1
3
+ size 779415
7109f6f7354167d3d4b1891a6214f639.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e049d652f0f857a4e4f74fefd99d234dc21811a47deb7d5ac90f048e47498eb9
3
+ size 1275391
7448d72a5fda7547fe9ad2b6f3ad97c7.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:636a3ef07a04f2d7921c1519a43b46281307ba246495173c2e95706209adbc14
3
+ size 895088
8410ae84799fc187448af43b3dc6a8d6.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2f1f863b2b5bdf8f05f85e4b6f2140809dd59cd3e9586097cb5775589b6fc01
3
+ size 1467387
8c154ca0f99ba80642cd90f0287ef820.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a49b53e843a205ec357da17108e9b073235b48f387dfdb9f1204137e47df0277
3
+ size 1774692
8ea114c1cd9f77b4d76203fa38968343.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:718008b1faba674dfd6e9fa24055f494e082957221e036ad9eb96295fb894c03
3
+ size 3496662
90098b75e19f46042ea7d3d8b4674c0b.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64106a58fc6ca2f8bb4ed9fe773857ec7cc7c8401d9209c429c2b24c5d9479d7
3
+ size 2309055
963ad0449b698838213ebd9cacee4ac0.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61eca1b1e14da9b5fc9f92ac113812b77a019bef6927bf43cd2eb497211e4c60
3
+ size 1020681
9d656d7523cb06049b60978fcfda0ce6.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dff00ec542fa7a6a4f38e789111103428cb3a231e0716ccc397b3fffe3d4ae9c
3
+ size 1058499
LICENSE ADDED
@@ -0,0 +1,202 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ Apache License
3
+ Version 2.0, January 2004
4
+ http://www.apache.org/licenses/
5
+
6
+ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
7
+
8
+ 1. Definitions.
9
+
10
+ "License" shall mean the terms and conditions for use, reproduction,
11
+ and distribution as defined by Sections 1 through 9 of this document.
12
+
13
+ "Licensor" shall mean the copyright owner or entity authorized by
14
+ the copyright owner that is granting the License.
15
+
16
+ "Legal Entity" shall mean the union of the acting entity and all
17
+ other entities that control, are controlled by, or are under common
18
+ control with that entity. For the purposes of this definition,
19
+ "control" means (i) the power, direct or indirect, to cause the
20
+ direction or management of such entity, whether by contract or
21
+ otherwise, or (ii) ownership of fifty percent (50%) or more of the
22
+ outstanding shares, or (iii) beneficial ownership of such entity.
23
+
24
+ "You" (or "Your") shall mean an individual or Legal Entity
25
+ exercising permissions granted by this License.
26
+
27
+ "Source" form shall mean the preferred form for making modifications,
28
+ including but not limited to software source code, documentation
29
+ source, and configuration files.
30
+
31
+ "Object" form shall mean any form resulting from mechanical
32
+ transformation or translation of a Source form, including but
33
+ not limited to compiled object code, generated documentation,
34
+ and conversions to other media types.
35
+
36
+ "Work" shall mean the work of authorship, whether in Source or
37
+ Object form, made available under the License, as indicated by a
38
+ copyright notice that is included in or attached to the work
39
+ (an example is provided in the Appendix below).
40
+
41
+ "Derivative Works" shall mean any work, whether in Source or Object
42
+ form, that is based on (or derived from) the Work and for which the
43
+ editorial revisions, annotations, elaborations, or other modifications
44
+ represent, as a whole, an original work of authorship. For the purposes
45
+ of this License, Derivative Works shall not include works that remain
46
+ separable from, or merely link (or bind by name) to the interfaces of,
47
+ the Work and Derivative Works thereof.
48
+
49
+ "Contribution" shall mean any work of authorship, including
50
+ the original version of the Work and any modifications or additions
51
+ to that Work or Derivative Works thereof, that is intentionally
52
+ submitted to Licensor for inclusion in the Work by the copyright owner
53
+ or by an individual or Legal Entity authorized to submit on behalf of
54
+ the copyright owner. For the purposes of this definition, "submitted"
55
+ means any form of electronic, verbal, or written communication sent
56
+ to the Licensor or its representatives, including but not limited to
57
+ communication on electronic mailing lists, source code control systems,
58
+ and issue tracking systems that are managed by, or on behalf of, the
59
+ Licensor for the purpose of discussing and improving the Work, but
60
+ excluding communication that is conspicuously marked or otherwise
61
+ designated in writing by the copyright owner as "Not a Contribution."
62
+
63
+ "Contributor" shall mean Licensor and any individual or Legal Entity
64
+ on behalf of whom a Contribution has been received by Licensor and
65
+ subsequently incorporated within the Work.
66
+
67
+ 2. Grant of Copyright License. Subject to the terms and conditions of
68
+ this License, each Contributor hereby grants to You a perpetual,
69
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
70
+ copyright license to reproduce, prepare Derivative Works of,
71
+ publicly display, publicly perform, sublicense, and distribute the
72
+ Work and such Derivative Works in Source or Object form.
73
+
74
+ 3. Grant of Patent License. Subject to the terms and conditions of
75
+ this License, each Contributor hereby grants to You a perpetual,
76
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
77
+ (except as stated in this section) patent license to make, have made,
78
+ use, offer to sell, sell, import, and otherwise transfer the Work,
79
+ where such license applies only to those patent claims licensable
80
+ by such Contributor that are necessarily infringed by their
81
+ Contribution(s) alone or by combination of their Contribution(s)
82
+ with the Work to which such Contribution(s) was submitted. If You
83
+ institute patent litigation against any entity (including a
84
+ cross-claim or counterclaim in a lawsuit) alleging that the Work
85
+ or a Contribution incorporated within the Work constitutes direct
86
+ or contributory patent infringement, then any patent licenses
87
+ granted to You under this License for that Work shall terminate
88
+ as of the date such litigation is filed.
89
+
90
+ 4. Redistribution. You may reproduce and distribute copies of the
91
+ Work or Derivative Works thereof in any medium, with or without
92
+ modifications, and in Source or Object form, provided that You
93
+ meet the following conditions:
94
+
95
+ (a) You must give any other recipients of the Work or
96
+ Derivative Works a copy of this License; and
97
+
98
+ (b) You must cause any modified files to carry prominent notices
99
+ stating that You changed the files; and
100
+
101
+ (c) You must retain, in the Source form of any Derivative Works
102
+ that You distribute, all copyright, patent, trademark, and
103
+ attribution notices from the Source form of the Work,
104
+ excluding those notices that do not pertain to any part of
105
+ the Derivative Works; and
106
+
107
+ (d) If the Work includes a "NOTICE" text file as part of its
108
+ distribution, then any Derivative Works that You distribute must
109
+ include a readable copy of the attribution notices contained
110
+ within such NOTICE file, excluding those notices that do not
111
+ pertain to any part of the Derivative Works, in at least one
112
+ of the following places: within a NOTICE text file distributed
113
+ as part of the Derivative Works; within the Source form or
114
+ documentation, if provided along with the Derivative Works; or,
115
+ within a display generated by the Derivative Works, if and
116
+ wherever such third-party notices normally appear. The contents
117
+ of the NOTICE file are for informational purposes only and
118
+ do not modify the License. You may add Your own attribution
119
+ notices within Derivative Works that You distribute, alongside
120
+ or as an addendum to the NOTICE text from the Work, provided
121
+ that such additional attribution notices cannot be construed
122
+ as modifying the License.
123
+
124
+ You may add Your own copyright statement to Your modifications and
125
+ may provide additional or different license terms and conditions
126
+ for use, reproduction, or distribution of Your modifications, or
127
+ for any such Derivative Works as a whole, provided Your use,
128
+ reproduction, and distribution of the Work otherwise complies with
129
+ the conditions stated in this License.
130
+
131
+ 5. Submission of Contributions. Unless You explicitly state otherwise,
132
+ any Contribution intentionally submitted for inclusion in the Work
133
+ by You to the Licensor shall be under the terms and conditions of
134
+ this License, without any additional terms or conditions.
135
+ Notwithstanding the above, nothing herein shall supersede or modify
136
+ the terms of any separate license agreement you may have executed
137
+ with Licensor regarding such Contributions.
138
+
139
+ 6. Trademarks. This License does not grant permission to use the trade
140
+ names, trademarks, service marks, or product names of the Licensor,
141
+ except as required for reasonable and customary use in describing the
142
+ origin of the Work and reproducing the content of the NOTICE file.
143
+
144
+ 7. Disclaimer of Warranty. Unless required by applicable law or
145
+ agreed to in writing, Licensor provides the Work (and each
146
+ Contributor provides its Contributions) on an "AS IS" BASIS,
147
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
148
+ implied, including, without limitation, any warranties or conditions
149
+ of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
150
+ PARTICULAR PURPOSE. You are solely responsible for determining the
151
+ appropriateness of using or redistributing the Work and assume any
152
+ risks associated with Your exercise of permissions under this License.
153
+
154
+ 8. Limitation of Liability. In no event and under no legal theory,
155
+ whether in tort (including negligence), contract, or otherwise,
156
+ unless required by applicable law (such as deliberate and grossly
157
+ negligent acts) or agreed to in writing, shall any Contributor be
158
+ liable to You for damages, including any direct, indirect, special,
159
+ incidental, or consequential damages of any character arising as a
160
+ result of this License or out of the use or inability to use the
161
+ Work (including but not limited to damages for loss of goodwill,
162
+ work stoppage, computer failure or malfunction, or any and all
163
+ other commercial damages or losses), even if such Contributor
164
+ has been advised of the possibility of such damages.
165
+
166
+ 9. Accepting Warranty or Additional Liability. While redistributing
167
+ the Work or Derivative Works thereof, You may choose to offer,
168
+ and charge a fee for, acceptance of support, warranty, indemnity,
169
+ or other liability obligations and/or rights consistent with this
170
+ License. However, in accepting such obligations, You may act only
171
+ on Your own behalf and on Your sole responsibility, not on behalf
172
+ of any other Contributor, and only if You agree to indemnify,
173
+ defend, and hold each Contributor harmless for any liability
174
+ incurred by, or claims asserted against, such Contributor by reason
175
+ of your accepting any such warranty or additional liability.
176
+
177
+ END OF TERMS AND CONDITIONS
178
+
179
+ APPENDIX: How to apply the Apache License to your work.
180
+
181
+ To apply the Apache License to your work, attach the following
182
+ boilerplate notice, with the fields enclosed by brackets "[]"
183
+ replaced with your own identifying information. (Don't include
184
+ the brackets!) The text should be enclosed in the appropriate
185
+ comment syntax for the file format. We also recommend that a
186
+ file or class name and description of purpose be included on the
187
+ same "printed page" as the copyright notice for easier
188
+ identification within third-party archives.
189
+
190
+ Copyright [yyyy] [name of copyright owner]
191
+
192
+ Licensed under the Apache License, Version 2.0 (the "License");
193
+ you may not use this file except in compliance with the License.
194
+ You may obtain a copy of the License at
195
+
196
+ http://www.apache.org/licenses/LICENSE-2.0
197
+
198
+ Unless required by applicable law or agreed to in writing, software
199
+ distributed under the License is distributed on an "AS IS" BASIS,
200
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
201
+ See the License for the specific language governing permissions and
202
+ limitations under the License.
README.md ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: EleutherAI/gpt-j-6b
3
+ language:
4
+ - en
5
+ license: apache-2.0
6
+ pipeline_tag: text-generation
7
+ library_name: furiosa-llm
8
+ tags:
9
+ - furiosa-ai
10
+ ---
11
+ # Model Overview
12
+ - **Model Architecture:** GPT-J
13
+ - **Input:** Text
14
+ - **Output:** Text
15
+ - **Model Optimizations:**
16
+ - Beam search optimization (beam=4) for MLPerf (this model cannot be run with greedy search, top-k, or top-p sampling)
17
+ - **Maximum Context Length:** 2k tokens
18
+ - Maximum Prompt Length: 1920 tokens
19
+ - Maximum Generation Length: 2048 tokens
20
+ - **Intended Use Cases:** Intended for commercial and non-commercial use. Same as [EleutherAI/gpt-j-6b](https://huggingface.co/EleutherAI/gpt-j-6b), this model is intended for text summarization.
21
+ - **Release Date:** 04/12/2025
22
+ - **Version:** v2025.2
23
+ - **License(s):** [Apache License 2.0](https://huggingface.co/datasets/choosealicense/licenses/blob/main/markdown/apache-2.0.md)
24
+ - **Supported Inference Engine(s):** Furiosa LLM
25
+ - **Supported Hardware Compatibility:** FuriosaAI RNGD
26
+ - **Preferred Operating System(s):** Linux
27
+ - **Fine-tunes:** This model is fine-tuned for text summarization. More details can be found at [Datasets & Models at mlcommons/inference/gpt-j/README.md](https://github.com/mlcommons/inference/blob/7bf59976b5f4eb7c5b8f30a88af832e028028446/language/gpt-j/README.md#datasets--models)
28
+ - **Quantization:**
29
+ - Tool: Furiosa Model Compressor v0.6.2, included in Furiosa SDK 2025.2
30
+ - Weight: float8, Activation: float8, KV cache: float8
31
+ - Calibration: [cnn_dailymail](https://huggingface.co/datasets/cnn_dailymail) ([instruction](https://github.com/mlcommons/inference/blob/7bf59976b5f4eb7c5b8f30a88af832e028028446/language/gpt-j/README.md#download--process-dataset))
32
+
33
+
34
+ ## Description:
35
+ This is a pre-compiled model of a fine-tuned and quantized version of [EleutherAI/gpt-j-6b](https://huggingface.co/EleutherAI/gpt-j-6b). [cnn_dailymail](https://huggingface.co/datasets/cnn_dailymail) is used for calibration, and the model is fine-tuned for text summarization. Details about how this model was fine-tuned and calibrated can be found in [mlcommons/inference/gpt-j/README.md](https://github.com/mlcommons/inference/blob/7bf59976b5f4eb7c5b8f30a88af832e028028446/language/gpt-j/README.md).
36
+
37
+ As mentioned above, this model is fine-tuned for the text summarization task.
38
+ Please use the following prompt when using this model and replace the {INPUTS} part accordingly:
39
+ ```
40
+ Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request.
41
+
42
+ ### Instruction:
43
+ Summarize the following news article:
44
+
45
+ ### Input:
46
+ {INPUTS}
47
+
48
+ ### Response:
49
+ ```
50
+
51
+ ## Usage
52
+
53
+ ### Furiosa-LLM
54
+ Follow the example command below after [installing Furiosa-LLM and its prerequisites](https://developer.furiosa.ai/latest/en/getting_started/furiosa_llm.html#installing-furiosa-llm).
55
+
56
+ ```sh
57
+ furiosa-llm serve furiosa-ai/gpt-j-6b-FP8-MLPerf
58
+ ```
59
+
60
+ ### MLPerf Benchmark using RNGD
61
+ Follow the example command below after [installing furiosa-mlperf and its prerequisites](https://developer.furiosa.ai/latest/en/getting_started/furiosa_mlperf.html).
62
+
63
+ ```sh
64
+ furiosa-mlperf gpt-j-offline furiosa-ai/gpt-j-6b-FP8-MLPerf ./mlperf-result
65
+ ```
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1024-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b2ea5d6db9d6e59e12e42ca7005d6ddd152a22987c52cdd3cb042ae921e481
3
+ size 7155636
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1152-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b2ea5d6db9d6e59e12e42ca7005d6ddd152a22987c52cdd3cb042ae921e481
3
+ size 7155636
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1280-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b2ea5d6db9d6e59e12e42ca7005d6ddd152a22987c52cdd3cb042ae921e481
3
+ size 7155636
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1408-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b2ea5d6db9d6e59e12e42ca7005d6ddd152a22987c52cdd3cb042ae921e481
3
+ size 7155636
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1536-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b2ea5d6db9d6e59e12e42ca7005d6ddd152a22987c52cdd3cb042ae921e481
3
+ size 7155636
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1664-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b2ea5d6db9d6e59e12e42ca7005d6ddd152a22987c52cdd3cb042ae921e481
3
+ size 7155636
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn1920-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b2ea5d6db9d6e59e12e42ca7005d6ddd152a22987c52cdd3cb042ae921e481
3
+ size 7155636
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn512-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b2ea5d6db9d6e59e12e42ca7005d6ddd152a22987c52cdd3cb042ae921e481
3
+ size 7155636
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn768-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b2ea5d6db9d6e59e12e42ca7005d6ddd152a22987c52cdd3cb042ae921e481
3
+ size 7155636
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv0-b1-attn896-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b2ea5d6db9d6e59e12e42ca7005d6ddd152a22987c52cdd3cb042ae921e481
3
+ size 7155636
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv2047-b128-attn2048-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abdd7e7a97908a45e52675eb8ac33b7409fa72e04235287b032ab1f93e0cd2ba
3
+ size 7154916
add_const_file-Quantized_furiosa_llm_models.gptj.symbolic.mlperf_submission.GPTJForCausalLM-kv2047-b64-attn2048-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abdd7e7a97908a45e52675eb8ac33b7409fa72e04235287b032ab1f93e0cd2ba
3
+ size 7154916
added_tokens.json ADDED
@@ -0,0 +1,146 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<|extratoken_100|>": 50356,
3
+ "<|extratoken_101|>": 50357,
4
+ "<|extratoken_102|>": 50358,
5
+ "<|extratoken_103|>": 50359,
6
+ "<|extratoken_104|>": 50360,
7
+ "<|extratoken_105|>": 50361,
8
+ "<|extratoken_106|>": 50362,
9
+ "<|extratoken_107|>": 50363,
10
+ "<|extratoken_108|>": 50364,
11
+ "<|extratoken_109|>": 50365,
12
+ "<|extratoken_10|>": 50266,
13
+ "<|extratoken_110|>": 50366,
14
+ "<|extratoken_111|>": 50367,
15
+ "<|extratoken_112|>": 50368,
16
+ "<|extratoken_113|>": 50369,
17
+ "<|extratoken_114|>": 50370,
18
+ "<|extratoken_115|>": 50371,
19
+ "<|extratoken_116|>": 50372,
20
+ "<|extratoken_117|>": 50373,
21
+ "<|extratoken_118|>": 50374,
22
+ "<|extratoken_119|>": 50375,
23
+ "<|extratoken_11|>": 50267,
24
+ "<|extratoken_120|>": 50376,
25
+ "<|extratoken_121|>": 50377,
26
+ "<|extratoken_122|>": 50378,
27
+ "<|extratoken_123|>": 50379,
28
+ "<|extratoken_124|>": 50380,
29
+ "<|extratoken_125|>": 50381,
30
+ "<|extratoken_126|>": 50382,
31
+ "<|extratoken_127|>": 50383,
32
+ "<|extratoken_128|>": 50384,
33
+ "<|extratoken_129|>": 50385,
34
+ "<|extratoken_12|>": 50268,
35
+ "<|extratoken_130|>": 50386,
36
+ "<|extratoken_131|>": 50387,
37
+ "<|extratoken_132|>": 50388,
38
+ "<|extratoken_133|>": 50389,
39
+ "<|extratoken_134|>": 50390,
40
+ "<|extratoken_135|>": 50391,
41
+ "<|extratoken_136|>": 50392,
42
+ "<|extratoken_137|>": 50393,
43
+ "<|extratoken_138|>": 50394,
44
+ "<|extratoken_139|>": 50395,
45
+ "<|extratoken_13|>": 50269,
46
+ "<|extratoken_140|>": 50396,
47
+ "<|extratoken_141|>": 50397,
48
+ "<|extratoken_142|>": 50398,
49
+ "<|extratoken_143|>": 50399,
50
+ "<|extratoken_14|>": 50270,
51
+ "<|extratoken_15|>": 50271,
52
+ "<|extratoken_16|>": 50272,
53
+ "<|extratoken_17|>": 50273,
54
+ "<|extratoken_18|>": 50274,
55
+ "<|extratoken_19|>": 50275,
56
+ "<|extratoken_1|>": 50257,
57
+ "<|extratoken_20|>": 50276,
58
+ "<|extratoken_21|>": 50277,
59
+ "<|extratoken_22|>": 50278,
60
+ "<|extratoken_23|>": 50279,
61
+ "<|extratoken_24|>": 50280,
62
+ "<|extratoken_25|>": 50281,
63
+ "<|extratoken_26|>": 50282,
64
+ "<|extratoken_27|>": 50283,
65
+ "<|extratoken_28|>": 50284,
66
+ "<|extratoken_29|>": 50285,
67
+ "<|extratoken_2|>": 50258,
68
+ "<|extratoken_30|>": 50286,
69
+ "<|extratoken_31|>": 50287,
70
+ "<|extratoken_32|>": 50288,
71
+ "<|extratoken_33|>": 50289,
72
+ "<|extratoken_34|>": 50290,
73
+ "<|extratoken_35|>": 50291,
74
+ "<|extratoken_36|>": 50292,
75
+ "<|extratoken_37|>": 50293,
76
+ "<|extratoken_38|>": 50294,
77
+ "<|extratoken_39|>": 50295,
78
+ "<|extratoken_3|>": 50259,
79
+ "<|extratoken_40|>": 50296,
80
+ "<|extratoken_41|>": 50297,
81
+ "<|extratoken_42|>": 50298,
82
+ "<|extratoken_43|>": 50299,
83
+ "<|extratoken_44|>": 50300,
84
+ "<|extratoken_45|>": 50301,
85
+ "<|extratoken_46|>": 50302,
86
+ "<|extratoken_47|>": 50303,
87
+ "<|extratoken_48|>": 50304,
88
+ "<|extratoken_49|>": 50305,
89
+ "<|extratoken_4|>": 50260,
90
+ "<|extratoken_50|>": 50306,
91
+ "<|extratoken_51|>": 50307,
92
+ "<|extratoken_52|>": 50308,
93
+ "<|extratoken_53|>": 50309,
94
+ "<|extratoken_54|>": 50310,
95
+ "<|extratoken_55|>": 50311,
96
+ "<|extratoken_56|>": 50312,
97
+ "<|extratoken_57|>": 50313,
98
+ "<|extratoken_58|>": 50314,
99
+ "<|extratoken_59|>": 50315,
100
+ "<|extratoken_5|>": 50261,
101
+ "<|extratoken_60|>": 50316,
102
+ "<|extratoken_61|>": 50317,
103
+ "<|extratoken_62|>": 50318,
104
+ "<|extratoken_63|>": 50319,
105
+ "<|extratoken_64|>": 50320,
106
+ "<|extratoken_65|>": 50321,
107
+ "<|extratoken_66|>": 50322,
108
+ "<|extratoken_67|>": 50323,
109
+ "<|extratoken_68|>": 50324,
110
+ "<|extratoken_69|>": 50325,
111
+ "<|extratoken_6|>": 50262,
112
+ "<|extratoken_70|>": 50326,
113
+ "<|extratoken_71|>": 50327,
114
+ "<|extratoken_72|>": 50328,
115
+ "<|extratoken_73|>": 50329,
116
+ "<|extratoken_74|>": 50330,
117
+ "<|extratoken_75|>": 50331,
118
+ "<|extratoken_76|>": 50332,
119
+ "<|extratoken_77|>": 50333,
120
+ "<|extratoken_78|>": 50334,
121
+ "<|extratoken_79|>": 50335,
122
+ "<|extratoken_7|>": 50263,
123
+ "<|extratoken_80|>": 50336,
124
+ "<|extratoken_81|>": 50337,
125
+ "<|extratoken_82|>": 50338,
126
+ "<|extratoken_83|>": 50339,
127
+ "<|extratoken_84|>": 50340,
128
+ "<|extratoken_85|>": 50341,
129
+ "<|extratoken_86|>": 50342,
130
+ "<|extratoken_87|>": 50343,
131
+ "<|extratoken_88|>": 50344,
132
+ "<|extratoken_89|>": 50345,
133
+ "<|extratoken_8|>": 50264,
134
+ "<|extratoken_90|>": 50346,
135
+ "<|extratoken_91|>": 50347,
136
+ "<|extratoken_92|>": 50348,
137
+ "<|extratoken_93|>": 50349,
138
+ "<|extratoken_94|>": 50350,
139
+ "<|extratoken_95|>": 50351,
140
+ "<|extratoken_96|>": 50352,
141
+ "<|extratoken_97|>": 50353,
142
+ "<|extratoken_98|>": 50354,
143
+ "<|extratoken_99|>": 50355,
144
+ "<|extratoken_9|>": 50265,
145
+ "[PAD]": 50400
146
+ }
artifact.json ADDED
The diff for this file is too large to render. See raw diff
 
bd08125c4282ab1fe0c8772d973554a8.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:883969c3d3f633343f765111968287bdfb9b6536e742a2f9c09d45b83f4e8958
3
+ size 1009992
c43b1888e8cf33792e1d6887c3df03bd.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6995a9fa42deb43ae74028a7305ec058426d5c8c4506f1367ee689500b5e24a
3
+ size 966559
c7f564baab300a5c527cd066d6e4c425.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c19b9d859665a36e89d1a1db811187556b009869b9a14efdc9fb6c7dd1c93d3
3
+ size 1710008
ce58ee1c4d1f21799982509932512df0.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a31b49f94759f68b2edd8facda8d9b921a49b21d1b248bb4ec78b94ebc0d3dd
3
+ size 3218585
ce6abc136515c0a87e2214d4b762465c.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cababa6f49ff84aa53650447fb1481bbccb2ba3f8deed04440c70c67137ea3a
3
+ size 1966897
config.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "furiosa-ai/mlperf-gpt-j-6b",
3
+ "activation_function": "gelu_new",
4
+ "architectures": [
5
+ "GPTJForCausalLM"
6
+ ],
7
+ "attn_pdrop": 0.0,
8
+ "bos_token_id": 50256,
9
+ "embd_pdrop": 0.0,
10
+ "eos_token_id": 50256,
11
+ "gradient_checkpointing": false,
12
+ "initializer_range": 0.02,
13
+ "layer_norm_epsilon": 1e-05,
14
+ "model_type": "gptj",
15
+ "n_embd": 4096,
16
+ "n_head": 16,
17
+ "n_inner": null,
18
+ "n_layer": 28,
19
+ "n_positions": 2048,
20
+ "resid_pdrop": 0.0,
21
+ "rotary": true,
22
+ "rotary_dim": 64,
23
+ "scale_attn_weights": true,
24
+ "summary_activation": null,
25
+ "summary_first_dropout": 0.1,
26
+ "summary_proj_to_labels": true,
27
+ "summary_type": "cls_index",
28
+ "summary_use_proj": true,
29
+ "task_specific_params": {
30
+ "text-generation": {
31
+ "do_sample": true,
32
+ "max_length": 50,
33
+ "temperature": 1.0
34
+ }
35
+ },
36
+ "tie_word_embeddings": false,
37
+ "tokenizer_class": "GPT2Tokenizer",
38
+ "torch_dtype": "float32",
39
+ "transformers_version": "4.48.1",
40
+ "use_cache": true,
41
+ "vocab_size": 50401
42
+ }
de2b0ec73c43d254f53398576cde487e.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15665a63be4d1f523d83561f206e8143cb1498b5619be9aa9c41f44d45051a41
3
+ size 1122932