chat-ggml

Runtime error

App Files Community

faisalhr1997 committed on Jul 20, 2023

Commit

2b5b254

1 Parent(s): f3fb74e

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -15

app.py CHANGED Viewed

@@ -8,9 +8,9 @@ from huggingface_hub import hf_hub_download
 _ = """
 snapshot_download(
-  repo_id="TheBloke/falcon-7b-instruct-GGML",
-  allow_patterns="falcon7b-instruct.ggmlv3.q4_0.bin",
-  revision="ggmlv3",
   local_dir="models",
   local_dir_use_symlinks=False,  # default "auto"
 )
@@ -26,16 +26,16 @@ hf_hub_download(
 _ = """
 llm = AutoModelForCausalLM.from_pretrained(
-    "TheBloke/falcon-7b-instruct-GGML",
-    model_file="falcon7b-instruct.ggmlv3.q4_0.bin",
-    model_type="falcon", gpu_layers=32, threads=2,
 )
 # """
-# _ = Path("models", "falcon7b-instruct.ggmlv3.q4_0.bin").absolute().as_posix()
 # assert Path(_).exists(), f"{_} does not exist, perhaps snapshot_download failed?"
-URL = "https://huggingface.co/TheBloke/falcon-7b-instruct-GGML/blob/main/falcon-7b-instruct.ggccv1.q4_1.bin"
-URL = "https://huggingface.co/TheBloke/falcon-7b-instruct-GGML/blob/ggmlv3/falcon7b-instruct.ggmlv3.q4_1.bin"
 repo_id = "/".join(urlparse(URL).path.strip("/").split("/")[:2])
@@ -43,7 +43,7 @@ model_file = Path(URL).name
 _ = hf_hub_download(
     repo_id=repo_id,
-    revision="ggmlv3",
     filename=model_file,
     local_dir="models",
     # local_dir_use_symlinks=True,
@@ -54,14 +54,14 @@ llm = AutoModelForCausalLM.from_pretrained(
     # model_file=model_file,
     # model_file=_,
     _,
-    model_type="falcon",
     threads=psutil.cpu_count(logical=False),
 )
-TITLE = f"""<h2 align="center">🦅 Falcon-Chat ggml ({model_file}) 🦅"""
 USER_NAME = "User"
-BOT_NAME = "Falcon"
-DEFAULT_INSTRUCTIONS = """The following is a conversation between a highly knowledgeable and intelligent AI assistant, called Falcon, and a human user, called User. In the following interactions, User and Falcon will converse in natural language, and Falcon will answer User's questions. Falcon was built to be respectful, polite and inclusive. Falcon was built by the Technology Innovation Institute in Abu Dhabi. Falcon will never decline to answer a question, and always attempts to give an answer that User would be satisfied with. It knows a lot, and always tells the truth. The conversation begins.
 """
 RETRY_COMMAND = "/retry"
 STOP_STR = f"\n{USER_NAME}:"
@@ -165,7 +165,7 @@ def chat():
         chat_history = chat_history + [[message, ""]]
         stream = llm(
             prompt,
-            max_new_tokens=1024,
             stop=[STOP_STR, "<|endoftext|>"],
             temperature=temperature,
             top_p=top_p,

 _ = """
 snapshot_download(
+  repo_id="TheBloke/Luna-AI-Llama2-Uncensored-GGML",
+  allow_patterns="luna-ai-llama2-uncensored.ggmlv3.q2_K.bin",
+  revision="main",
   local_dir="models",
   local_dir_use_symlinks=False,  # default "auto"
 )
 _ = """
 llm = AutoModelForCausalLM.from_pretrained(
+    "TheBloke/Luna-AI-Llama2-Uncensored-GGML",
+    model_file="luna-ai-llama2-uncensored.ggmlv3.q2_K.bin",
+    model_type="llama", gpu_layers=32, threads=2,
 )
 # """
+# _ = Path("models", "luna-ai-llama2-uncensored.ggmlv3.q2_K.bin").absolute().as_posix()
 # assert Path(_).exists(), f"{_} does not exist, perhaps snapshot_download failed?"
+# URL = "https://huggingface.co/TheBloke/falcon-7b-instruct-GGML/blob/main/falcon-7b-instruct.ggccv1.q4_1.bin"
+URL = "https://huggingface.co/TheBloke/Luna-AI-Llama2-Uncensored-GGML/resolve/main/luna-ai-llama2-uncensored.ggmlv3.q2_K.bin"
 repo_id = "/".join(urlparse(URL).path.strip("/").split("/")[:2])
 _ = hf_hub_download(
     repo_id=repo_id,
+    revision="main",
     filename=model_file,
     local_dir="models",
     # local_dir_use_symlinks=True,
     # model_file=model_file,
     # model_file=_,
     _,
+    model_type="llama",
     threads=psutil.cpu_count(logical=False),
 )
+TITLE = f"""<h2 align="center"> chat-ggml ({model_file})"""
 USER_NAME = "User"
+BOT_NAME = "Assistant"
+DEFAULT_INSTRUCTIONS = """The following is a conversation between a highly knowledgeable and intelligent AI assistant and a human User. In the following interactions, User and Assistant will converse and Assistant will answer User's questions.
 """
 RETRY_COMMAND = "/retry"
 STOP_STR = f"\n{USER_NAME}:"
         chat_history = chat_history + [[message, ""]]
         stream = llm(
             prompt,
+            max_new_tokens=2048,
             stop=[STOP_STR, "<|endoftext|>"],
             temperature=temperature,
             top_p=top_p,