Add files using upload-large-folder tool
Browse files. This view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +7 -0
- 00852babc64b23ad2a0cee69cd01b44f.edf +3 -0
- 0459eb8508fa7278f3397c636fb38f37.edf +3 -0
- 0e51734f4fd6bdc2a37670010bbe161e.edf +3 -0
- 0fb796c440d1193727495cd5131464fc.edf +3 -0
- 1013a7281f9b82e099f30fc6c7b7ee6a.edf +3 -0
- 1905b3bde56415edd508d9bf943a571f.edf +3 -0
- 19fc01089689025e7fd06eae4355507d.edf +3 -0
- 230c5c612a258fa4664a9b0c7991219d.edf +3 -0
- 253322114d04d3fe619d211da70154a7.edf +3 -0
- 265360903451f7dedb717b7b9b72461e.edf +3 -0
- 3f969183b14039dad7ebf54ae6af97ca.edf +3 -0
- 435a6b2dc26692d83db8a638de4470c5.edf +3 -0
- 444902f20f5011550ed11180c7782bfa.edf +3 -0
- 47122db966459854cab6e913177206d7.edf +3 -0
- 55ca2cec49402aeb399c90a0488b46ab.edf +3 -0
- 599ebf67ab06553d8e2eac2b218ce2b1.edf +3 -0
- 674a22b64d0fac8be1dc1a402daa0126.edf +3 -0
- 6a52705628ee03d2f2142d9d2aeb4e75.edf +3 -0
- 6ffe692071814fe20782bfeb93ed7500.edf +3 -0
- 71c090fbea34420bb7d543bbd8ca0afb.edf +3 -0
- 7be2f7b337826bb7aa6759e059bca330.edf +3 -0
- 80c7ea681548402ea828303776e8ae65.edf +3 -0
- 9539f966acbc53e10b456267925123b5.edf +3 -0
- 96b29272fb158c073e0688c7eabc25c2.edf +3 -0
- 9b03bfbe480a8f08895c480d5f27ac1e.edf +3 -0
- 9e5396080f97fe6a301ebc83f98b99db.edf +3 -0
- LICENSE +21 -0
- README.md +36 -0
- b7dfdc6a0adbb5c49cd22d7bf4d9e3ad.edf +3 -0
- bce17aca74c04d95e0f97b7690751257.edf +3 -0
- bed798118b103c5e3adbdd3b53134ade.edf +3 -0
- c1780f91b2117f234e1b266fde202c96.edf +3 -0
- c2002116d6922d70217f6fce6ed5bb10.edf +3 -0
- c36a0cf94961335dd45464ccc7741873.edf +3 -0
- c694752a40ba26ae630abc2ca947fe22.edf +3 -0
- c957c6744fe2374d152a48eb7d769f64.edf +3 -0
- config.json +41 -0
- d33f69ccba0e6862bc39698e4515ffd0.edf +3 -0
- e8673bbd23f98c234d46131ebbcb0440.edf +3 -0
- ea6cc401d5a2d6ba2adffdaa7188cdc0.edf +3 -0
- f05457e46dbf735daf839c9d05ce977d.edf +3 -0
- f193f4bf4443b5b3a841edb7593ff2bd.edf +3 -0
- f1e5c26a5a48f68501f1ab424ec7b0c1.edf +3 -0
- f45aebdf48dd270d96d2b4bfb704f5e2.edf +3 -0
- f844b65bd62eb3e3865a7883276620c0.edf +3 -0
- f9a330e5d73ac3cf6ed0d0579c14f5e5.edf +3 -0
- furiosa_config.json +58 -0
- params-DeepSeek-R1-Distill-Llama-70B-aramco_specdec-80L-W16A16KV16-allow_bfloat16_cast_with_mcp-shard_size=5000000000-4d741bdc3970366668c076b824e5e349f6c9e492c6da3e4fec20bbfa6f0eb7fc.safetensors/model-00032-of-00032.safetensors +3 -0
- special_tokens_map.json +17 -0
.gitattributes
CHANGED
|
@@ -146,3 +146,10 @@ f5f4eb0a371dd559f47e8067ce36bb52.edf filter=lfs diff=lfs merge=lfs -text
|
|
| 146 |
9539f966acbc53e10b456267925123b5.edf filter=lfs diff=lfs merge=lfs -text
|
| 147 |
c884bb0e814b3d51cd8d2dd59851bcb0.edf filter=lfs diff=lfs merge=lfs -text
|
| 148 |
9de95e06ccea08279ea551c4df760813.edf filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 146 |
9539f966acbc53e10b456267925123b5.edf filter=lfs diff=lfs merge=lfs -text
|
| 147 |
c884bb0e814b3d51cd8d2dd59851bcb0.edf filter=lfs diff=lfs merge=lfs -text
|
| 148 |
9de95e06ccea08279ea551c4df760813.edf filter=lfs diff=lfs merge=lfs -text
|
| 149 |
+
ea6cc401d5a2d6ba2adffdaa7188cdc0.edf filter=lfs diff=lfs merge=lfs -text
|
| 150 |
+
f05457e46dbf735daf839c9d05ce977d.edf filter=lfs diff=lfs merge=lfs -text
|
| 151 |
+
253322114d04d3fe619d211da70154a7.edf filter=lfs diff=lfs merge=lfs -text
|
| 152 |
+
599ebf67ab06553d8e2eac2b218ce2b1.edf filter=lfs diff=lfs merge=lfs -text
|
| 153 |
+
c1780f91b2117f234e1b266fde202c96.edf filter=lfs diff=lfs merge=lfs -text
|
| 154 |
+
0fb796c440d1193727495cd5131464fc.edf filter=lfs diff=lfs merge=lfs -text
|
| 155 |
+
47122db966459854cab6e913177206d7.edf filter=lfs diff=lfs merge=lfs -text
|
00852babc64b23ad2a0cee69cd01b44f.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4fb62bf2ba651e04a7f03e6180974cc46737f4d9c3b71ba72d46c6e2010ae3d6
|
| 3 |
+
size 4797965
|
0459eb8508fa7278f3397c636fb38f37.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:603b5127eacdec02f9df8b597e1cabba76293ad9a18f214397f22a449938a841
|
| 3 |
+
size 35929788
|
0e51734f4fd6bdc2a37670010bbe161e.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:82251ff730684d13b7b9ef3d86e9e14f53ae4cd3677b135dca81ae3427c52cd3
|
| 3 |
+
size 5716404
|
0fb796c440d1193727495cd5131464fc.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b4dfe03db2cab92271b9a1971486495f50345e29bd0e9d7feecafe72ea77f1ee
|
| 3 |
+
size 56511229
|
1013a7281f9b82e099f30fc6c7b7ee6a.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:67de7fdc4db78253037d74b941ec25643918c16cee18f6aae3a29162be02688a
|
| 3 |
+
size 18875261
|
1905b3bde56415edd508d9bf943a571f.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:16f800decdbdb103861227f60f15edfd6178f3b0e8418760f3aaaaaa85c09b5c
|
| 3 |
+
size 34297575
|
19fc01089689025e7fd06eae4355507d.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9321d46df0e0e056dab3c70d63d7cefefdb074f9604259bf12a453d57b3a635d
|
| 3 |
+
size 30163116
|
230c5c612a258fa4664a9b0c7991219d.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b4d6cef7f39f0af55211d7e72d20b36019d25fcf9c2e197b981b6a5e203388a3
|
| 3 |
+
size 4036364
|
253322114d04d3fe619d211da70154a7.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1de23a68d37822a88eccbc11cf1c99b051dce46cd403c1710d1c27c2be93a833
|
| 3 |
+
size 30377687
|
265360903451f7dedb717b7b9b72461e.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:476f9cded5e6ede17be04070ed6c08cad333ce860c4b1a49983f5d4efffeb122
|
| 3 |
+
size 33124100
|
3f969183b14039dad7ebf54ae6af97ca.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d5cd31d14465d9f70b1dc70e850771aa084797595e8cd074f2f0a8a61498273
|
| 3 |
+
size 30600772
|
435a6b2dc26692d83db8a638de4470c5.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:052ae93cecd8efce21a2dfa13c3f16b02e8b7af8df171e981d23b28435428314
|
| 3 |
+
size 18851011
|
444902f20f5011550ed11180c7782bfa.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca1bacc7c71e7f8d24f8058c1a8b96528b4889cc4d2c2023fd02d0cf2553b8c1
|
| 3 |
+
size 3951853
|
47122db966459854cab6e913177206d7.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe376db21936c01fd2d1b40ec1d2526bfd73a1b87c374202a45ab4fd455fea8a
|
| 3 |
+
size 57078164
|
55ca2cec49402aeb399c90a0488b46ab.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46ae60a1983554b4523b53b37b5e6ceaff3162f0a57bfa993480422fca4e8ecb
|
| 3 |
+
size 30596818
|
599ebf67ab06553d8e2eac2b218ce2b1.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7a53cca3c46ae403e7d9b4c5fead612207b2b6bcf66a826597c5469038fc54f8
|
| 3 |
+
size 30941839
|
674a22b64d0fac8be1dc1a402daa0126.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c08f0c54a202b1a4768004f6fadf8ae76f8ad59b24ac7142356a64aa654fd89d
|
| 3 |
+
size 4924546
|
6a52705628ee03d2f2142d9d2aeb4e75.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c5597a331fe6fd11f0497ef67bd79ad989aa0f6fa3047537a55e8ed85b70d18
|
| 3 |
+
size 5068798
|
6ffe692071814fe20782bfeb93ed7500.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:73b9774d575df5ce5b4a94e8f1d0165a140aad631b50d6732b945f4fcdf0ec72
|
| 3 |
+
size 17711989
|
71c090fbea34420bb7d543bbd8ca0afb.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6a7983c6a29d2244f5f47ccf547bb62954bf148c7a1383cda0336ffd1fcffce
|
| 3 |
+
size 5004740
|
7be2f7b337826bb7aa6759e059bca330.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a0cfc05f395b98f165a1990fefa9bc4ac566c2abfc29df605c49b49582c1798
|
| 3 |
+
size 4769261
|
80c7ea681548402ea828303776e8ae65.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:abf67dc8931a050f68fd09cd89c92ffcaf175a65e5cb7c6893954c2680b7a645
|
| 3 |
+
size 30247421
|
9539f966acbc53e10b456267925123b5.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c59ab500ee3ba1da291abab7ac896238a0109db6897fe79c13fc626992fafb2b
|
| 3 |
+
size 17306945
|
96b29272fb158c073e0688c7eabc25c2.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4d60300c95c3e5f7c31a3bd57daee283e8a3e4f10b4ec62ff3ea1d82fd83191
|
| 3 |
+
size 19403203
|
9b03bfbe480a8f08895c480d5f27ac1e.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e3ed5d494c73fb62b61674ccf7878915cc945aa32e204caefdbeb03c0aef7ef8
|
| 3 |
+
size 4714752
|
9e5396080f97fe6a301ebc83f98b99db.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c7d591a4f961fdc86f1bd95a4fbe0fb6a419dc491e98bf100d68584c112bde3
|
| 3 |
+
size 3472839
|
LICENSE
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
MIT License
|
| 2 |
+
|
| 3 |
+
Copyright (c) 2023 DeepSeek
|
| 4 |
+
|
| 5 |
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
| 6 |
+
of this software and associated documentation files (the "Software"), to deal
|
| 7 |
+
in the Software without restriction, including without limitation the rights
|
| 8 |
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
| 9 |
+
copies of the Software, and to permit persons to whom the Software is
|
| 10 |
+
furnished to do so, subject to the following conditions:
|
| 11 |
+
|
| 12 |
+
The above copyright notice and this permission notice shall be included in all
|
| 13 |
+
copies or substantial portions of the Software.
|
| 14 |
+
|
| 15 |
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
| 16 |
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
| 17 |
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
| 18 |
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
| 19 |
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
| 20 |
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
| 21 |
+
SOFTWARE.
|
README.md
ADDED
|
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
base_model: deepseek-ai/DeepSeek-R1-Distill-Llama-70B
|
| 3 |
+
license: mit
|
| 4 |
+
pipeline_tag: text-generation
|
| 5 |
+
library_name: furiosa-llm
|
| 6 |
+
tags:
|
| 7 |
+
- furiosa-ai
|
| 8 |
+
---
|
| 9 |
+
# Model Overview
|
| 10 |
+
- **Model Architecture:** Meta-Llama-3
|
| 11 |
+
- **Input:** Text
|
| 12 |
+
- **Output:** Text
|
| 13 |
+
- **Model Optimizations:**
|
| 14 |
+
- **Context Length:** 32k tokens
|
| 15 |
+
- Maximum Prompt Length: 32768 tokens
|
| 16 |
+
- Maximum Generation Length: 32768 tokens
|
| 17 |
+
- **Intended Use Cases:** Intended for commercial and non-commercial use. Same as [DeepSeek-R1-Distill-Llama-70B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Llama-70B), this model is intended for assistant-like chat.
|
| 18 |
+
- **Release Date:** 07/28/2025
|
| 19 |
+
- **Version:** v2025.3
|
| 20 |
+
- **License(s):** [MIT License](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Llama-70B/blob/main/LICENSE)
|
| 21 |
+
- **Supported Inference Engine(s):** Furiosa LLM
|
| 22 |
+
- **Supported Hardware Compatibility:** FuriosaAI RNGD
|
| 23 |
+
- **Preferred Operating System(s):** Linux
|
| 24 |
+
- **Quantization:** No
|
| 25 |
+
|
| 26 |
+
## Description:
|
| 27 |
+
This model is the pre-compiled version of [DeepSeek-R1-Distill-Llama-70B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Llama-70B), which is an auto-regressive language model that uses an optimized transformer architecture.
|
| 28 |
+
|
| 29 |
+
## Usage
|
| 30 |
+
|
| 31 |
+
To run this model with [Furiosa-LLM](https://developer.furiosa.ai/latest/en/furiosa_llm/intro.html), follow the example command below after [installing Furiosa-LLM and its prerequisites](https://developer.furiosa.ai/latest/en/getting_started/furiosa_llm.html#installing-furiosa-llm).
|
| 32 |
+
|
| 33 |
+
```sh
|
| 34 |
+
furiosa-llm serve furiosa-ai/DeepSeek-R1-Distill-Llama-70B \
|
| 35 |
+
--enable-reasoning --reasoning-parser deepseek_r1
|
| 36 |
+
```
|
b7dfdc6a0adbb5c49cd22d7bf4d9e3ad.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:77157789b1e8a7d413ec304ab3469ead9b18452308a9bda2a649748b8eaee1ff
|
| 3 |
+
size 3451274
|
bce17aca74c04d95e0f97b7690751257.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c329a199da2b5505cda6eea07e2b837766111f75aae94ec0634e11cca55f2de1
|
| 3 |
+
size 18929574
|
bed798118b103c5e3adbdd3b53134ade.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b150bf14435e31c212617943ba30eb294f3fc4aab5c2688f081f302a9198109
|
| 3 |
+
size 4499479
|
c1780f91b2117f234e1b266fde202c96.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb0dd55da6e0ca287aaea03992337f59d60c394e9ab49496553973a67398d4cc
|
| 3 |
+
size 56579945
|
c2002116d6922d70217f6fce6ed5bb10.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c202a3d9b79707e318ce9704ea37091c47cfafcab32bd7399af46a3e00076fe0
|
| 3 |
+
size 34880297
|
c36a0cf94961335dd45464ccc7741873.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:984371e7f76092a471546e499d468e7a983d8a9e13cdd6a0cf9e8bfd68914825
|
| 3 |
+
size 17363289
|
c694752a40ba26ae630abc2ca947fe22.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c763c2b4a28c12f6f446478e78259fea8e900976a5e9f0597f7c60c20b2d30c3
|
| 3 |
+
size 7550233
|
c957c6744fe2374d152a48eb7d769f64.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4fc45ecbbf1663399ab8bd146620d0b783dafc1e9db3d8fc9e225ac44366533b
|
| 3 |
+
size 31085735
|
config.json
ADDED
|
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_name_or_path": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
|
| 3 |
+
"architectures": [
|
| 4 |
+
"LlamaForCausalLM"
|
| 5 |
+
],
|
| 6 |
+
"attention_bias": false,
|
| 7 |
+
"attention_dropout": 0.0,
|
| 8 |
+
"bos_token_id": 128000,
|
| 9 |
+
"eos_token_id": [
|
| 10 |
+
128001,
|
| 11 |
+
128008,
|
| 12 |
+
128009
|
| 13 |
+
],
|
| 14 |
+
"head_dim": 128,
|
| 15 |
+
"hidden_act": "silu",
|
| 16 |
+
"hidden_size": 8192,
|
| 17 |
+
"initializer_range": 0.02,
|
| 18 |
+
"intermediate_size": 28672,
|
| 19 |
+
"inv_freq_config": {
|
| 20 |
+
"factor": 8.0,
|
| 21 |
+
"high_freq_factor": 4.0,
|
| 22 |
+
"low_freq_factor": 1.0,
|
| 23 |
+
"original_max_position_embeddings": 8192,
|
| 24 |
+
"rope_type": "llama3"
|
| 25 |
+
},
|
| 26 |
+
"max_position_embeddings": 131072,
|
| 27 |
+
"mlp_bias": false,
|
| 28 |
+
"model_type": "llama",
|
| 29 |
+
"num_attention_heads": 64,
|
| 30 |
+
"num_hidden_layers": 80,
|
| 31 |
+
"num_key_value_heads": 8,
|
| 32 |
+
"pretraining_tp": 1,
|
| 33 |
+
"rms_norm_eps": 1e-05,
|
| 34 |
+
"rope_scaling": null,
|
| 35 |
+
"rope_theta": 500000.0,
|
| 36 |
+
"tie_word_embeddings": false,
|
| 37 |
+
"torch_dtype": "bfloat16",
|
| 38 |
+
"transformers_version": "4.48.1",
|
| 39 |
+
"use_cache": true,
|
| 40 |
+
"vocab_size": 128256
|
| 41 |
+
}
|
d33f69ccba0e6862bc39698e4515ffd0.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19958b09cd1f260114fd877b87442845d655af8e676c95819a34691c77a7a082
|
| 3 |
+
size 21762241
|
e8673bbd23f98c234d46131ebbcb0440.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:219ed9a8bb383d1cc2fb0636c05162b7d4553540e6d650597bedda49af31ac44
|
| 3 |
+
size 5229866
|
ea6cc401d5a2d6ba2adffdaa7188cdc0.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c88548d84bbf58117ebe1a1c50b688c432265d4ef9aded4bafe313e5a8e84b6
|
| 3 |
+
size 31057901
|
f05457e46dbf735daf839c9d05ce977d.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:740c0c0506b6f2cf4bb32d04d25e999c05e4a359c5a4b4538b1540d5f198780a
|
| 3 |
+
size 30768543
|
f193f4bf4443b5b3a841edb7593ff2bd.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a675b90d5574a22d5bf8e3d87455844556d83128e7a4f46863dcadc15da2224f
|
| 3 |
+
size 23668557
|
f1e5c26a5a48f68501f1ab424ec7b0c1.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6ccdf68150b43032089712088f824ce96c15406f43580cb93e58abb54b902a2e
|
| 3 |
+
size 4690840
|
f45aebdf48dd270d96d2b4bfb704f5e2.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5815d7e69a669b3c01d6e30142883ac13bacfe9fe11a3c01d5a3ea95d24e5053
|
| 3 |
+
size 16960679
|
f844b65bd62eb3e3865a7883276620c0.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09b4fa635037abbf30c1355b00118ae8f1d0bee89a99396d0c1c7a13e5178e1f
|
| 3 |
+
size 5293200
|
f9a330e5d73ac3cf6ed0d0579c14f5e5.edf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:433210280d817d6bb9d25348904fa0748e743edb0e36de1d4a479fd1615b3b91
|
| 3 |
+
size 4545294
|
furiosa_config.json
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"config_version": "1.0.0",
|
| 3 |
+
"model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
|
| 4 |
+
"model_kinds": [
|
| 5 |
+
"ARTIFACT"
|
| 6 |
+
],
|
| 7 |
+
"model_class": {
|
| 8 |
+
"module": "furiosa_llm_models.llama3.symbolic.aramco_specdec",
|
| 9 |
+
"name": "LlamaForCausalLM"
|
| 10 |
+
},
|
| 11 |
+
"llm_config": {
|
| 12 |
+
"optimization_config": {
|
| 13 |
+
"attention_type": "PAGED_ATTENTION",
|
| 14 |
+
"optimize_rope": true,
|
| 15 |
+
"optimize_packed": true,
|
| 16 |
+
"decompose_layernorm": false,
|
| 17 |
+
"optimize_furiosa": false,
|
| 18 |
+
"use_unsplit_packed": false,
|
| 19 |
+
"compact_causal_mask": false,
|
| 20 |
+
"use_rngd_gelu": false,
|
| 21 |
+
"causal_mask_free_decoding": true,
|
| 22 |
+
"kv_cache_sharing_across_beams": false,
|
| 23 |
+
"inbound_beamsearch_softmax": false,
|
| 24 |
+
"calculate_logit_only_for_last_token": false,
|
| 25 |
+
"optimized_for_speculative_decoding": true,
|
| 26 |
+
"use_2d_masks": false,
|
| 27 |
+
"merged_kv_indices": false
|
| 28 |
+
},
|
| 29 |
+
"quantization_config": {
|
| 30 |
+
"weight": "bf16",
|
| 31 |
+
"activation": "bf16",
|
| 32 |
+
"kv_cache": "bf16",
|
| 33 |
+
"use_mcp": true
|
| 34 |
+
}
|
| 35 |
+
},
|
| 36 |
+
"components_versions": {
|
| 37 |
+
"furiosa_llm": {
|
| 38 |
+
"version": "0.1.0-dev",
|
| 39 |
+
"git_hash": "f8deb1c",
|
| 40 |
+
"build_time": null
|
| 41 |
+
},
|
| 42 |
+
"furiosa_ir": {
|
| 43 |
+
"version": "0.11.0-dev",
|
| 44 |
+
"git_hash": "8c5160b804",
|
| 45 |
+
"build_time": "2025-07-30T04:23:32Z"
|
| 46 |
+
},
|
| 47 |
+
"furiosa_runtime": {
|
| 48 |
+
"version": "2025.3.0",
|
| 49 |
+
"git_hash": "834ab6188",
|
| 50 |
+
"build_time": "2025-07-30T04:27:48Z"
|
| 51 |
+
},
|
| 52 |
+
"furiosa_model_compressor": {
|
| 53 |
+
"version": "2025.3.0 (rev: 4cd9804)",
|
| 54 |
+
"git_hash": null,
|
| 55 |
+
"build_time": null
|
| 56 |
+
}
|
| 57 |
+
}
|
| 58 |
+
}
|
params-DeepSeek-R1-Distill-Llama-70B-aramco_specdec-80L-W16A16KV16-allow_bfloat16_cast_with_mcp-shard_size=5000000000-4d741bdc3970366668c076b824e5e349f6c9e492c6da3e4fec20bbfa6f0eb7fc.safetensors/model-00032-of-00032.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b963d599436fc2a583f43872389a5e804f5c5af7111609437d8334492df8955
|
| 3 |
+
size 2571660128
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<|begin▁of▁sentence|>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"eos_token": {
|
| 10 |
+
"content": "<|end▁of▁sentence|>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": "<|end▁of▁sentence|>"
|
| 17 |
+
}
|