PythonAIPairProgrammer

Runtime error

App Files Community

awacke1 committed on Nov 17, 2023

Commit

8bb28e6

1 Parent(s): d900de3

Update app.py

Browse files

Files changed (1) hide show

app.py +45 -43

app.py CHANGED Viewed

@@ -152,50 +152,52 @@ def readitaloud(result):
     #return result
 def chat_with_model(prompt, document_section, model_choice='Llama-2-7b-chat-hf'):
-        endpoint_url = 'https://qe55p8afio98s0u3.us-east-1.aws.endpoints.huggingface.cloud'  # Dr Llama
-        hf_token = os.getenv('HF_KEY')
-        client = InferenceClient(endpoint_url, token=hf_token)
-        gen_kwargs = dict(
-            max_new_tokens=512,
-            top_k=30,
-            top_p=0.9,
-            temperature=0.2,
-            repetition_penalty=1.02,
-            stop_sequences=["\nUser:", "<|endoftext|>", "</s>"],
-        )
-        stream = client.text_generation(prompt, stream=True, details=True, **gen_kwargs)
-        report=[]
-        res_box = st.empty()
-        collected_chunks=[]
-        collected_messages=[]
-        allresults=''
-        for r in stream:
-            if r.token.special:
-                continue
-            if r.token.text in gen_kwargs["stop_sequences"]:
-                break
-            collected_chunks.append(r.token.text)
-            chunk_message = r.token.text
-            collected_messages.append(chunk_message)
-            try:
-                report.append(r.token.text)
-                if len(r.token.text) > 0:
-                    result="".join(report).strip()
-                    res_box.markdown(f'*{result}*')
-            except:
-                st.write('.')
-        full_reply_content = result
-        st.write("Elapsed time:")
-        st.write(time.time() - start_time)
-        filename = generate_filename(full_reply_content, prompt)
-        create_file(filename, prompt, full_reply_content, should_save)
-        readitaloud(full_reply_content)
-        return result
 # Chat and Chat with files
 def chat_with_model2(prompt, document_section, model_choice='gpt-3.5-turbo'):

     #return result
 def chat_with_model(prompt, document_section, model_choice='Llama-2-7b-chat-hf'):
+    start_time = time.time()
+    endpoint_url = 'https://qe55p8afio98s0u3.us-east-1.aws.endpoints.huggingface.cloud'  # Dr Llama
+    hf_token = os.getenv('HF_KEY')
+    client = InferenceClient(endpoint_url, token=hf_token)
+    gen_kwargs = dict(
+        max_new_tokens=512,
+        top_k=30,
+        top_p=0.9,
+        temperature=0.2,
+        repetition_penalty=1.02,
+        stop_sequences=["\nUser:", "<|endoftext|>", "</s>"],
+    )
+    stream = client.text_generation(prompt, stream=True, details=True, **gen_kwargs)
+    report=[]
+    res_box = st.empty()
+    collected_chunks=[]
+    collected_messages=[]
+    allresults=''
+    for r in stream:
+        if r.token.special:
+            continue
+        if r.token.text in gen_kwargs["stop_sequences"]:
+            break
+        collected_chunks.append(r.token.text)
+        chunk_message = r.token.text
+        collected_messages.append(chunk_message)
+        try:
+            report.append(r.token.text)
+            if len(r.token.text) > 0:
+                result="".join(report).strip()
+                res_box.markdown(f'*{result}*')
+        except:
+            st.write('.')
+    full_reply_content = result
+    st.write("Elapsed time:")
+    st.write(time.time() - start_time)
+    filename = generate_filename(full_reply_content, prompt)
+    create_file(filename, prompt, full_reply_content, should_save)
+    readitaloud(full_reply_content)
+    return result
 # Chat and Chat with files
 def chat_with_model2(prompt, document_section, model_choice='gpt-3.5-turbo'):