hyunsikc committed on
Commit
bc683c8
·
verified ·
1 Parent(s): fb4f729

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +7 -0
  2. 00852babc64b23ad2a0cee69cd01b44f.edf +3 -0
  3. 0459eb8508fa7278f3397c636fb38f37.edf +3 -0
  4. 0e51734f4fd6bdc2a37670010bbe161e.edf +3 -0
  5. 0fb796c440d1193727495cd5131464fc.edf +3 -0
  6. 1013a7281f9b82e099f30fc6c7b7ee6a.edf +3 -0
  7. 1905b3bde56415edd508d9bf943a571f.edf +3 -0
  8. 19fc01089689025e7fd06eae4355507d.edf +3 -0
  9. 230c5c612a258fa4664a9b0c7991219d.edf +3 -0
  10. 253322114d04d3fe619d211da70154a7.edf +3 -0
  11. 265360903451f7dedb717b7b9b72461e.edf +3 -0
  12. 3f969183b14039dad7ebf54ae6af97ca.edf +3 -0
  13. 435a6b2dc26692d83db8a638de4470c5.edf +3 -0
  14. 444902f20f5011550ed11180c7782bfa.edf +3 -0
  15. 47122db966459854cab6e913177206d7.edf +3 -0
  16. 55ca2cec49402aeb399c90a0488b46ab.edf +3 -0
  17. 599ebf67ab06553d8e2eac2b218ce2b1.edf +3 -0
  18. 674a22b64d0fac8be1dc1a402daa0126.edf +3 -0
  19. 6a52705628ee03d2f2142d9d2aeb4e75.edf +3 -0
  20. 6ffe692071814fe20782bfeb93ed7500.edf +3 -0
  21. 71c090fbea34420bb7d543bbd8ca0afb.edf +3 -0
  22. 7be2f7b337826bb7aa6759e059bca330.edf +3 -0
  23. 80c7ea681548402ea828303776e8ae65.edf +3 -0
  24. 9539f966acbc53e10b456267925123b5.edf +3 -0
  25. 96b29272fb158c073e0688c7eabc25c2.edf +3 -0
  26. 9b03bfbe480a8f08895c480d5f27ac1e.edf +3 -0
  27. 9e5396080f97fe6a301ebc83f98b99db.edf +3 -0
  28. LICENSE +21 -0
  29. README.md +36 -0
  30. b7dfdc6a0adbb5c49cd22d7bf4d9e3ad.edf +3 -0
  31. bce17aca74c04d95e0f97b7690751257.edf +3 -0
  32. bed798118b103c5e3adbdd3b53134ade.edf +3 -0
  33. c1780f91b2117f234e1b266fde202c96.edf +3 -0
  34. c2002116d6922d70217f6fce6ed5bb10.edf +3 -0
  35. c36a0cf94961335dd45464ccc7741873.edf +3 -0
  36. c694752a40ba26ae630abc2ca947fe22.edf +3 -0
  37. c957c6744fe2374d152a48eb7d769f64.edf +3 -0
  38. config.json +41 -0
  39. d33f69ccba0e6862bc39698e4515ffd0.edf +3 -0
  40. e8673bbd23f98c234d46131ebbcb0440.edf +3 -0
  41. ea6cc401d5a2d6ba2adffdaa7188cdc0.edf +3 -0
  42. f05457e46dbf735daf839c9d05ce977d.edf +3 -0
  43. f193f4bf4443b5b3a841edb7593ff2bd.edf +3 -0
  44. f1e5c26a5a48f68501f1ab424ec7b0c1.edf +3 -0
  45. f45aebdf48dd270d96d2b4bfb704f5e2.edf +3 -0
  46. f844b65bd62eb3e3865a7883276620c0.edf +3 -0
  47. f9a330e5d73ac3cf6ed0d0579c14f5e5.edf +3 -0
  48. furiosa_config.json +58 -0
  49. params-DeepSeek-R1-Distill-Llama-70B-aramco_specdec-80L-W16A16KV16-allow_bfloat16_cast_with_mcp-shard_size=5000000000-4d741bdc3970366668c076b824e5e349f6c9e492c6da3e4fec20bbfa6f0eb7fc.safetensors/model-00032-of-00032.safetensors +3 -0
  50. special_tokens_map.json +17 -0
.gitattributes CHANGED
@@ -146,3 +146,10 @@ f5f4eb0a371dd559f47e8067ce36bb52.edf filter=lfs diff=lfs merge=lfs -text
146
  9539f966acbc53e10b456267925123b5.edf filter=lfs diff=lfs merge=lfs -text
147
  c884bb0e814b3d51cd8d2dd59851bcb0.edf filter=lfs diff=lfs merge=lfs -text
148
  9de95e06ccea08279ea551c4df760813.edf filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
146
  9539f966acbc53e10b456267925123b5.edf filter=lfs diff=lfs merge=lfs -text
147
  c884bb0e814b3d51cd8d2dd59851bcb0.edf filter=lfs diff=lfs merge=lfs -text
148
  9de95e06ccea08279ea551c4df760813.edf filter=lfs diff=lfs merge=lfs -text
149
+ ea6cc401d5a2d6ba2adffdaa7188cdc0.edf filter=lfs diff=lfs merge=lfs -text
150
+ f05457e46dbf735daf839c9d05ce977d.edf filter=lfs diff=lfs merge=lfs -text
151
+ 253322114d04d3fe619d211da70154a7.edf filter=lfs diff=lfs merge=lfs -text
152
+ 599ebf67ab06553d8e2eac2b218ce2b1.edf filter=lfs diff=lfs merge=lfs -text
153
+ c1780f91b2117f234e1b266fde202c96.edf filter=lfs diff=lfs merge=lfs -text
154
+ 0fb796c440d1193727495cd5131464fc.edf filter=lfs diff=lfs merge=lfs -text
155
+ 47122db966459854cab6e913177206d7.edf filter=lfs diff=lfs merge=lfs -text
00852babc64b23ad2a0cee69cd01b44f.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fb62bf2ba651e04a7f03e6180974cc46737f4d9c3b71ba72d46c6e2010ae3d6
3
+ size 4797965
0459eb8508fa7278f3397c636fb38f37.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:603b5127eacdec02f9df8b597e1cabba76293ad9a18f214397f22a449938a841
3
+ size 35929788
0e51734f4fd6bdc2a37670010bbe161e.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82251ff730684d13b7b9ef3d86e9e14f53ae4cd3677b135dca81ae3427c52cd3
3
+ size 5716404
0fb796c440d1193727495cd5131464fc.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4dfe03db2cab92271b9a1971486495f50345e29bd0e9d7feecafe72ea77f1ee
3
+ size 56511229
1013a7281f9b82e099f30fc6c7b7ee6a.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67de7fdc4db78253037d74b941ec25643918c16cee18f6aae3a29162be02688a
3
+ size 18875261
1905b3bde56415edd508d9bf943a571f.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16f800decdbdb103861227f60f15edfd6178f3b0e8418760f3aaaaaa85c09b5c
3
+ size 34297575
19fc01089689025e7fd06eae4355507d.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9321d46df0e0e056dab3c70d63d7cefefdb074f9604259bf12a453d57b3a635d
3
+ size 30163116
230c5c612a258fa4664a9b0c7991219d.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4d6cef7f39f0af55211d7e72d20b36019d25fcf9c2e197b981b6a5e203388a3
3
+ size 4036364
253322114d04d3fe619d211da70154a7.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1de23a68d37822a88eccbc11cf1c99b051dce46cd403c1710d1c27c2be93a833
3
+ size 30377687
265360903451f7dedb717b7b9b72461e.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:476f9cded5e6ede17be04070ed6c08cad333ce860c4b1a49983f5d4efffeb122
3
+ size 33124100
3f969183b14039dad7ebf54ae6af97ca.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d5cd31d14465d9f70b1dc70e850771aa084797595e8cd074f2f0a8a61498273
3
+ size 30600772
435a6b2dc26692d83db8a638de4470c5.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:052ae93cecd8efce21a2dfa13c3f16b02e8b7af8df171e981d23b28435428314
3
+ size 18851011
444902f20f5011550ed11180c7782bfa.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca1bacc7c71e7f8d24f8058c1a8b96528b4889cc4d2c2023fd02d0cf2553b8c1
3
+ size 3951853
47122db966459854cab6e913177206d7.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe376db21936c01fd2d1b40ec1d2526bfd73a1b87c374202a45ab4fd455fea8a
3
+ size 57078164
55ca2cec49402aeb399c90a0488b46ab.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46ae60a1983554b4523b53b37b5e6ceaff3162f0a57bfa993480422fca4e8ecb
3
+ size 30596818
599ebf67ab06553d8e2eac2b218ce2b1.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a53cca3c46ae403e7d9b4c5fead612207b2b6bcf66a826597c5469038fc54f8
3
+ size 30941839
674a22b64d0fac8be1dc1a402daa0126.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c08f0c54a202b1a4768004f6fadf8ae76f8ad59b24ac7142356a64aa654fd89d
3
+ size 4924546
6a52705628ee03d2f2142d9d2aeb4e75.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c5597a331fe6fd11f0497ef67bd79ad989aa0f6fa3047537a55e8ed85b70d18
3
+ size 5068798
6ffe692071814fe20782bfeb93ed7500.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73b9774d575df5ce5b4a94e8f1d0165a140aad631b50d6732b945f4fcdf0ec72
3
+ size 17711989
71c090fbea34420bb7d543bbd8ca0afb.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6a7983c6a29d2244f5f47ccf547bb62954bf148c7a1383cda0336ffd1fcffce
3
+ size 5004740
7be2f7b337826bb7aa6759e059bca330.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a0cfc05f395b98f165a1990fefa9bc4ac566c2abfc29df605c49b49582c1798
3
+ size 4769261
80c7ea681548402ea828303776e8ae65.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abf67dc8931a050f68fd09cd89c92ffcaf175a65e5cb7c6893954c2680b7a645
3
+ size 30247421
9539f966acbc53e10b456267925123b5.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c59ab500ee3ba1da291abab7ac896238a0109db6897fe79c13fc626992fafb2b
3
+ size 17306945
96b29272fb158c073e0688c7eabc25c2.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4d60300c95c3e5f7c31a3bd57daee283e8a3e4f10b4ec62ff3ea1d82fd83191
3
+ size 19403203
9b03bfbe480a8f08895c480d5f27ac1e.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3ed5d494c73fb62b61674ccf7878915cc945aa32e204caefdbeb03c0aef7ef8
3
+ size 4714752
9e5396080f97fe6a301ebc83f98b99db.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c7d591a4f961fdc86f1bd95a4fbe0fb6a419dc491e98bf100d68584c112bde3
3
+ size 3472839
LICENSE ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ MIT License
2
+
3
+ Copyright (c) 2023 DeepSeek
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
README.md ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: deepseek-ai/DeepSeek-R1-Distill-Llama-70B
3
+ license: mit
4
+ pipeline_tag: text-generation
5
+ library_name: furiosa-llm
6
+ tags:
7
+ - furiosa-ai
8
+ ---
9
+ # Model Overview
10
+ - **Model Architecture:** Meta-Llama-3
11
+ - **Input:** Text
12
+ - **Output:** Text
13
+ - **Model Optimizations:**
14
+ - **Context Length:** 32k tokens
15
+ - Maximum Prompt Length: 32768 tokens
16
+ - Maximum Generation Length: 32768 tokens
17
+ - **Intended Use Cases:** Intended for commercial and non-commercial use. Like [DeepSeek-R1-Distill-Llama-70B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Llama-70B), this model is intended for assistant-like chat.
18
+ - **Release Date:** 07/28/2025
19
+ - **Version:** v2025.3
20
+ - **License(s):** [MIT License](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Llama-70B/blob/main/LICENSE)
21
+ - **Supported Inference Engine(s):** Furiosa LLM
22
+ - **Supported Hardware Compatibility:** FuriosaAI RNGD
23
+ - **Preferred Operating System(s):** Linux
24
+ - **Quantization:** No
25
+
26
+ ## Description:
27
+ This model is a pre-compiled version of [DeepSeek-R1-Distill-Llama-70B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Llama-70B), which is an auto-regressive language model that uses an optimized transformer architecture.
28
+
29
+ ## Usage
30
+
31
+ To run this model with [Furiosa-LLM](https://developer.furiosa.ai/latest/en/furiosa_llm/intro.html), follow the example command below after [installing Furiosa-LLM and its prerequisites](https://developer.furiosa.ai/latest/en/getting_started/furiosa_llm.html#installing-furiosa-llm).
32
+
33
+ ```sh
34
+ furiosa-llm serve furiosa-ai/DeepSeek-R1-Distill-Llama-70B \
35
+ --enable-reasoning --reasoning-parser deepseek_r1
36
+ ```
b7dfdc6a0adbb5c49cd22d7bf4d9e3ad.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77157789b1e8a7d413ec304ab3469ead9b18452308a9bda2a649748b8eaee1ff
3
+ size 3451274
bce17aca74c04d95e0f97b7690751257.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c329a199da2b5505cda6eea07e2b837766111f75aae94ec0634e11cca55f2de1
3
+ size 18929574
bed798118b103c5e3adbdd3b53134ade.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b150bf14435e31c212617943ba30eb294f3fc4aab5c2688f081f302a9198109
3
+ size 4499479
c1780f91b2117f234e1b266fde202c96.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb0dd55da6e0ca287aaea03992337f59d60c394e9ab49496553973a67398d4cc
3
+ size 56579945
c2002116d6922d70217f6fce6ed5bb10.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c202a3d9b79707e318ce9704ea37091c47cfafcab32bd7399af46a3e00076fe0
3
+ size 34880297
c36a0cf94961335dd45464ccc7741873.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:984371e7f76092a471546e499d468e7a983d8a9e13cdd6a0cf9e8bfd68914825
3
+ size 17363289
c694752a40ba26ae630abc2ca947fe22.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c763c2b4a28c12f6f446478e78259fea8e900976a5e9f0597f7c60c20b2d30c3
3
+ size 7550233
c957c6744fe2374d152a48eb7d769f64.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fc45ecbbf1663399ab8bd146620d0b783dafc1e9db3d8fc9e225ac44366533b
3
+ size 31085735
config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": [
10
+ 128001,
11
+ 128008,
12
+ 128009
13
+ ],
14
+ "head_dim": 128,
15
+ "hidden_act": "silu",
16
+ "hidden_size": 8192,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 28672,
19
+ "inv_freq_config": {
20
+ "factor": 8.0,
21
+ "high_freq_factor": 4.0,
22
+ "low_freq_factor": 1.0,
23
+ "original_max_position_embeddings": 8192,
24
+ "rope_type": "llama3"
25
+ },
26
+ "max_position_embeddings": 131072,
27
+ "mlp_bias": false,
28
+ "model_type": "llama",
29
+ "num_attention_heads": 64,
30
+ "num_hidden_layers": 80,
31
+ "num_key_value_heads": 8,
32
+ "pretraining_tp": 1,
33
+ "rms_norm_eps": 1e-05,
34
+ "rope_scaling": null,
35
+ "rope_theta": 500000.0,
36
+ "tie_word_embeddings": false,
37
+ "torch_dtype": "bfloat16",
38
+ "transformers_version": "4.48.1",
39
+ "use_cache": true,
40
+ "vocab_size": 128256
41
+ }
d33f69ccba0e6862bc39698e4515ffd0.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19958b09cd1f260114fd877b87442845d655af8e676c95819a34691c77a7a082
3
+ size 21762241
e8673bbd23f98c234d46131ebbcb0440.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:219ed9a8bb383d1cc2fb0636c05162b7d4553540e6d650597bedda49af31ac44
3
+ size 5229866
ea6cc401d5a2d6ba2adffdaa7188cdc0.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c88548d84bbf58117ebe1a1c50b688c432265d4ef9aded4bafe313e5a8e84b6
3
+ size 31057901
f05457e46dbf735daf839c9d05ce977d.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:740c0c0506b6f2cf4bb32d04d25e999c05e4a359c5a4b4538b1540d5f198780a
3
+ size 30768543
f193f4bf4443b5b3a841edb7593ff2bd.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a675b90d5574a22d5bf8e3d87455844556d83128e7a4f46863dcadc15da2224f
3
+ size 23668557
f1e5c26a5a48f68501f1ab424ec7b0c1.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ccdf68150b43032089712088f824ce96c15406f43580cb93e58abb54b902a2e
3
+ size 4690840
f45aebdf48dd270d96d2b4bfb704f5e2.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5815d7e69a669b3c01d6e30142883ac13bacfe9fe11a3c01d5a3ea95d24e5053
3
+ size 16960679
f844b65bd62eb3e3865a7883276620c0.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09b4fa635037abbf30c1355b00118ae8f1d0bee89a99396d0c1c7a13e5178e1f
3
+ size 5293200
f9a330e5d73ac3cf6ed0d0579c14f5e5.edf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:433210280d817d6bb9d25348904fa0748e743edb0e36de1d4a479fd1615b3b91
3
+ size 4545294
furiosa_config.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config_version": "1.0.0",
3
+ "model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
4
+ "model_kinds": [
5
+ "ARTIFACT"
6
+ ],
7
+ "model_class": {
8
+ "module": "furiosa_llm_models.llama3.symbolic.aramco_specdec",
9
+ "name": "LlamaForCausalLM"
10
+ },
11
+ "llm_config": {
12
+ "optimization_config": {
13
+ "attention_type": "PAGED_ATTENTION",
14
+ "optimize_rope": true,
15
+ "optimize_packed": true,
16
+ "decompose_layernorm": false,
17
+ "optimize_furiosa": false,
18
+ "use_unsplit_packed": false,
19
+ "compact_causal_mask": false,
20
+ "use_rngd_gelu": false,
21
+ "causal_mask_free_decoding": true,
22
+ "kv_cache_sharing_across_beams": false,
23
+ "inbound_beamsearch_softmax": false,
24
+ "calculate_logit_only_for_last_token": false,
25
+ "optimized_for_speculative_decoding": true,
26
+ "use_2d_masks": false,
27
+ "merged_kv_indices": false
28
+ },
29
+ "quantization_config": {
30
+ "weight": "bf16",
31
+ "activation": "bf16",
32
+ "kv_cache": "bf16",
33
+ "use_mcp": true
34
+ }
35
+ },
36
+ "components_versions": {
37
+ "furiosa_llm": {
38
+ "version": "0.1.0-dev",
39
+ "git_hash": "f8deb1c",
40
+ "build_time": null
41
+ },
42
+ "furiosa_ir": {
43
+ "version": "0.11.0-dev",
44
+ "git_hash": "8c5160b804",
45
+ "build_time": "2025-07-30T04:23:32Z"
46
+ },
47
+ "furiosa_runtime": {
48
+ "version": "2025.3.0",
49
+ "git_hash": "834ab6188",
50
+ "build_time": "2025-07-30T04:27:48Z"
51
+ },
52
+ "furiosa_model_compressor": {
53
+ "version": "2025.3.0 (rev: 4cd9804)",
54
+ "git_hash": null,
55
+ "build_time": null
56
+ }
57
+ }
58
+ }
params-DeepSeek-R1-Distill-Llama-70B-aramco_specdec-80L-W16A16KV16-allow_bfloat16_cast_with_mcp-shard_size=5000000000-4d741bdc3970366668c076b824e5e349f6c9e492c6da3e4fec20bbfa6f0eb7fc.safetensors/model-00032-of-00032.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b963d599436fc2a583f43872389a5e804f5c5af7111609437d8334492df8955
3
+ size 2571660128
special_tokens_map.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|begin▁of▁sentence|>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|end▁of▁sentence|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<|end▁of▁sentence|>"
17
+ }