Update app.py
app.py CHANGED
@@ -6,12 +6,12 @@ import openai
 
 print(os.environ)
 openai.api_base = os.environ.get("OPENAI_API_BASE")
-openai.api_key = os.environ.get("OPENAI_API_KEY")
+#openai.api_key = os.environ.get("OPENAI_API_KEY")
 
 BASE_SYSTEM_MESSAGE = """### System Prompt\n"""
 
 def make_prediction(prompt, max_tokens=None, temperature=None, top_p=None, top_k=None, repetition_penalty=None):
-    completion = openai.Completion.create(model="
+    completion = openai.Completion.create(model="/workspace/text-generation-webui/models/wizardcoder-python-34b-v1.0.Q5_K_M.gguf", prompt=prompt, max_tokens=max_tokens, temperature=temperature, top_p=top_p, top_k=top_k, repetition_penalty=repetition_penalty, stream=True, stop=["</s>", "<|im_end|>"], stream=True)
     for chunk in completion:
         yield chunk["choices"][0]["text"]
 
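For context, here is a minimal sketch of the streaming path this hunk changes, assuming the legacy openai<1.0 SDK and an OpenAI-compatible backend (such as text-generation-webui) reachable at OPENAI_API_BASE. The fallback URL and dummy key below are placeholders, not values from this Space; note that the pre-1.0 SDK also picks up OPENAI_API_KEY from the environment on its own, so commenting out the explicit assignment does not necessarily remove authentication.

import os
import openai

# Point the legacy SDK at a local OpenAI-compatible server (placeholder default URL).
openai.api_base = os.environ.get("OPENAI_API_BASE", "http://localhost:5000/v1")
openai.api_key = "none"  # many local servers ignore the key, but the SDK wants a value

def stream_completion(prompt, max_tokens=512, temperature=0.7):
    # stream=True makes create() return an iterator of partial chunks
    completion = openai.Completion.create(
        model="/workspace/text-generation-webui/models/wizardcoder-python-34b-v1.0.Q5_K_M.gguf",
        prompt=prompt,
        max_tokens=max_tokens,
        temperature=temperature,
        stream=True,
        stop=["</s>", "<|im_end|>"],
    )
    for chunk in completion:
        # each chunk carries a small text delta
        yield chunk["choices"][0]["text"]

if __name__ == "__main__":
    prompt = "###Instruction\nWrite a hello-world in Python.\n\n###Response\n"
    for piece in stream_completion(prompt):
        print(piece, end="", flush=True)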
@@ -33,7 +33,7 @@ def chat(history, system_message, max_tokens, temperature, top_p, top_k, repetit
     history = history or []
 
     messages = BASE_SYSTEM_MESSAGE + system_message.strip() + "\n" + \
-        "\n".join(["\n".join(["###
+        "\n".join(["\n".join(["###Instruction\n"+item[0]+"\n\n", "###Response\n"+item[1]+"\n\n"])
                    for item in history])
     # strip the last `<|end_of_turn|>` from the messages
     #messages = messages.rstrip("<|end_of_turn|>")
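To show what the new join produces, a small worked example of the prompt assembly, assuming history is a list of [user_message, assistant_message] pairs as Gradio's Chatbot passes them; the sample messages are made up.

BASE_SYSTEM_MESSAGE = """### System Prompt\n"""

def build_prompt(history, system_message):
    # Mirrors the assembly in chat(): system prompt first, then one
    # ###Instruction / ###Response pair per turn in the history.
    history = history or []
    return BASE_SYSTEM_MESSAGE + system_message.strip() + "\n" + \
        "\n".join(["\n".join(["###Instruction\n" + item[0] + "\n\n",
                              "###Response\n" + item[1] + "\n\n"])
                   for item in history])

history = [
    ["Write a hello-world in Python.", "print('hello world')"],
    ["Now add a docstring.", ""],  # empty slot for the reply being generated
]
print(build_prompt(history, "You are a helpful coding assistant."))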
@@ -75,11 +75,11 @@ with gr.Blocks(css=CSS) as demo:
     with gr.Row():
         with gr.Column():
             gr.Markdown(f"""
-                    ## This demo is an unquantized GPU chatbot of [
+                    ## This demo is an unquantized GPU chatbot of [WizardCoder-Python-34B-V1.0-GGUF](https://huggingface.co/TheBloke/WizardCoder-Python-34B-V1.0-GGUF)
                     Brought to you by your friends at Alignment Lab AI, garage-bAInd, Open Access AI Collective, and OpenChat!
                     """)
     with gr.Row():
-        gr.Markdown("# π
+        gr.Markdown("# π WizardCoder-Python-34B-V1.0-GGUF Playground Space! π")
     with gr.Row():
         #chatbot = gr.Chatbot().style(height=500)
         chatbot = gr.Chatbot(elem_id="chatbot")
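For completeness, a self-contained sketch of the Blocks layout this hunk touches, assuming Gradio 3.x. The CSS string, header text, and echo-style handler are placeholders standing in for the Space's real CSS and its streaming chat() function.

import gradio as gr

CSS = "#chatbot { min-height: 500px; }"  # placeholder style

def respond(message, history):
    # Placeholder handler: the real Space streams tokens from make_prediction()
    history = history or []
    history.append((message, "..."))
    return "", history

with gr.Blocks(css=CSS) as demo:
    with gr.Row():
        with gr.Column():
            gr.Markdown("## Demo header goes here")
    with gr.Row():
        chatbot = gr.Chatbot(elem_id="chatbot")
    with gr.Row():
        message = gr.Textbox(label="Your message", placeholder="Ask something")
    # Submitting the textbox clears it and appends the new turn to the chatbot
    message.submit(respond, inputs=[message, chatbot], outputs=[message, chatbot])

if __name__ == "__main__":
    demo.launch()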