Spaces:

markqiu
/

prinvest_mate

Sleeping

johnsmith253325 committed on Sep 16, 2023

Commit

7d0f396

1 Parent(s): 52cd289

feat: 加入LLaMA-7B-Chat

Files changed (5) hide show

modules/models/LLaMA.py CHANGED Viewed

@@ -15,6 +15,13 @@ import json
 from llama_cpp import Llama
 from huggingface_hub import hf_hub_download
 def download(repo_id, filename, retry=10):
     if os.path.exists("./models/downloaded_models.json"):
         with open("./models/downloaded_models.json", "r") as f:
@@ -70,18 +77,15 @@ class LLaMA_Client(BaseLLMModel):
             #     lora_path = f"lora/{lora_path}"
     def _get_llama_style_input(self):
-        history = []
-        instruction = ""
-        if self.system_prompt:
-            instruction = (f"Instruction: {self.system_prompt}\n")
-        for x in self.history:
-            if x["role"] == "user":
-                history.append(f"{instruction}Input: {x['content']}")
             else:
-                history.append(f"Output: {x['content']}")
-        context = "\n\n".join(history)
-        context += "\n\nOutput: "
-        return context
     def get_answer_at_once(self):
         context = self._get_llama_style_input()

 from llama_cpp import Llama
 from huggingface_hub import hf_hub_download
+SYS_PREFIX = "<<SYS>>\n"
+SYS_POSTFIX = "\n<</SYS>>\n\n"
+INST_PREFIX = "<s>[INST] "
+INST_POSTFIX = " "
+OUTPUT_PREFIX = "[/INST] "
+OUTPUT_POSTFIX = "</s>"
 def download(repo_id, filename, retry=10):
     if os.path.exists("./models/downloaded_models.json"):
         with open("./models/downloaded_models.json", "r") as f:
             #     lora_path = f"lora/{lora_path}"
     def _get_llama_style_input(self):
+        context = []
+        for conv in self.history:
+            if conv["role"] == "system":
+                context.append(SYS_PREFIX+conv["content"]+SYS_POSTFIX)
+            elif conv["role"] == "user":
+                context.append(INST_PREFIX+conv["content"]+INST_POSTFIX+OUTPUT_PREFIX)
             else:
+                context.append(conv["content"]+OUTPUT_POSTFIX)
+        return "".join(context)
     def get_answer_at_once(self):
         context = self._get_llama_style_input()

modules/presets.py CHANGED Viewed

@@ -83,9 +83,21 @@ LOCAL_MODELS = [
     "chatglm2-6b-int4",
     "StableLM",
     "MOSS",
-    "Llama-2-7B",
 ]
 if os.environ.get('HIDE_LOCAL_MODELS', 'false') == 'true':
     MODELS = ONLINE_MODELS
 else:
@@ -262,11 +274,3 @@ small_and_beautiful_theme = gr.themes.Soft(
         # gradio 会把这个几个chatbot打头的变量应用到其他md渲染的地方，鬼晓得怎么想的。。。
         chatbot_code_background_color_dark="*neutral_950",
     )
-# Additional metadate for local models
-MODEL_METADATA = {
-    "Llama-2-7B":{
-        "repo_id": "TheBloke/Llama-2-7B-GGUF",
-        "filelist": ["llama-2-7b.Q6_K.gguf"],
-    }
-}

     "chatglm2-6b-int4",
     "StableLM",
     "MOSS",
+    "Llama-2-7B-Chat",
 ]
+# Additional metadata for local models
+MODEL_METADATA = {
+    "Llama-2-7B":{
+        "repo_id": "TheBloke/Llama-2-7B-GGUF",
+        "filelist": ["llama-2-7b.Q6_K.gguf"],
+    },
+    "Llama-2-7B-Chat":{
+        "repo_id": "TheBloke/Llama-2-7b-Chat-GGUF",
+        "filelist": ["llama-2-7b-chat.Q6_K.gguf"],
+    }
+}
 if os.environ.get('HIDE_LOCAL_MODELS', 'false') == 'true':
     MODELS = ONLINE_MODELS
 else:
         # gradio 会把这个几个chatbot打头的变量应用到其他md渲染的地方，鬼晓得怎么想的。。。
         chatbot_code_background_color_dark="*neutral_950",
     )

requirements_advanced.txt CHANGED Viewed

@@ -1,11 +1,8 @@
 transformers
 huggingface_hub
 torch
-icetk
-protobuf==3.19.0
-git+https://github.com/OptimalScale/LMFlow.git
 cpm-kernels
 sentence_transformers
 accelerate
 sentencepiece
-datasets

 transformers
 huggingface_hub
 torch
 cpm-kernels
 sentence_transformers
 accelerate
 sentencepiece
+llama-cpp-python

run_Linux.sh CHANGED Viewed

File without changes

run_macOS.command CHANGED Viewed

File without changes