File size: 6,108 Bytes
bcee819
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6047652
 
bcee819
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
722ad62
bcee819
 
 
 
 
722ad62
bcee819
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
d5a518b
bcee819
 
 
 
702bf74
 
 
 
 
 
 
 
 
 
7e07c33
 
 
90f373a
702bf74
 
 
bcee819
 
 
 
 
 
 
 
 
 
 
 
 
 
3ba4c57
bcee819
 
 
 
 
 
3ba4c57
bcee819
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
efd893d
bcee819
 
 
 
0207b81
bcee819
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
import hmac
import re
import time
from io import BytesIO

import ibm_watsonx_ai
import requests
import streamlit as st
from ibm_watsonx_ai import Credentials, APIClient
from ibm_watsonx_ai.foundation_models import ModelInference
from ibm_watsonx_ai.metanames import GenTextParamsMetaNames as GenParams
from ibm_watsonx_ai.metanames import GenTextReturnOptMetaNames as RetParams

import genparam
import secretsload
from secretsload import load_stsecrets

# Load deployment secrets through the project's secretsload helper.
# NOTE(review): the returned value is not read again in this file
# (setup_client builds its own Credentials from st.secrets) -- presumably the
# call is kept for the helper's side effects; confirm before removing.
credentials = load_stsecrets()

# NOTE(review): Streamlit documents set_page_config as a call that should run
# before other st.* commands, so keep it ahead of the password gate.
st.set_page_config(
    page_title="Jimmy",
    # The icon was stored as mis-decoded UTF-8 bytes; restored to the emoji
    # those bytes encode (U+1F612).
    page_icon="😒",
    initial_sidebar_state="collapsed",
)

# Password protection
def check_password():
    """Gate the app behind a shared password kept in Streamlit secrets.

    Renders a password field until the visitor submits the value stored under
    ``st.secrets["app_password"]``. The outcome of the last attempt is kept in
    ``st.session_state["password_correct"]``.

    Returns:
        bool: True when the password has already been accepted in this
        session; False otherwise, after the password form (and, following a
        failed attempt, an error banner) has been rendered.
    """

    def password_entered():
        """Validate the submitted password and record the outcome."""
        entered = st.session_state["password"]
        expected = str(st.secrets["app_password"])
        # Constant-time comparison avoids leaking how many leading characters
        # matched; comparing bytes keeps non-ASCII passwords working, since
        # compare_digest rejects non-ASCII str arguments.
        if hmac.compare_digest(entered.encode("utf-8"), expected.encode("utf-8")):
            st.session_state["password_correct"] = True
            # Do not keep the plaintext password in session state.
            del st.session_state["password"]
        else:
            st.session_state["password_correct"] = False

    if st.session_state.get("password_correct", False):
        return True

    # The same form is shown on the first visit and after a failed attempt.
    st.markdown("\n\n")
    st.text_input("Enter the password", type="password", on_change=password_entered, key="password")
    st.divider()
    st.info("Developed by Milan Mrdenovic © IBM Norway 2025")
    # The key only exists once an attempt has been made, and reaching this
    # point means that attempt failed.
    if "password_correct" in st.session_state:
        st.error("😕 Password incorrect")
    return False

# Halt this script run until the visitor has passed the password check.
password_ok = check_password()
if not password_ok:
    st.stop()


# Seed the page index the first time a session reaches this point.
if "current_page" not in st.session_state:
    st.session_state["current_page"] = 0

def initialize_session_state():
    """Create an empty ``chat_history`` list in session state if it is missing."""
    if 'chat_history' in st.session_state:
        return
    st.session_state['chat_history'] = []

def setup_client():
    """Build an ``APIClient`` from the values stored in Streamlit secrets.

    Reads ``url``, ``api_key`` and ``project_id`` from ``st.secrets``.

    Returns:
        APIClient: client constructed with those credentials and project id.
    """
    secrets = st.secrets
    creds = Credentials(url=secrets["url"], api_key=secrets["api_key"])
    client = APIClient(creds, project_id=secrets["project_id"])
    return client

def prepare_prompt(prompt, chat_history):
    """Prefix the prompt with the conversation transcript when in chat mode.

    Args:
        prompt: The new user message.
        chat_history: Sequence of dicts with ``role`` and ``content`` keys.

    Returns:
        The prompt unchanged when ``genparam.TYPE`` is not ``"chat"`` or the
        history is empty; otherwise a string holding one line per history
        entry followed by the new prompt.
    """
    if genparam.TYPE != "chat" or not chat_history:
        return prompt

    transcript = "\n".join(
        f"{turn['role']}: \"{turn['content']}\"" for turn in chat_history
    )
    return f"Conversation History:\n{transcript}\n\n New User Prompt: {prompt}"

# Prompt templates keyed by model-family name. Each template is filled with
# str.format using the named fields {prompt} and, where present,
# {system_prompt}. Built once at import time instead of on every call.
_MODEL_FAMILY_SYNTAX = {
    ### Llama Models
    "llama3_instruct - system": """<|begin_of_text|><|start_header_id|>system<|end_header_id|>\n\n{system_prompt}<|eot_id|><|start_header_id|>user<|end_header_id|>\n\n{prompt}<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n""",
    "llama3_instruct - user": """<|begin_of_text|><|start_header_id|>user<|end_header_id|>\n\n{prompt}<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n""",
    ### Granite Models
    "granite_3 - system": """<|start_of_role|>system<|end_of_role|>{system_prompt}<|end_of_text|>\n<|start_of_role|>user<|end_of_role|>{prompt}<|end_of_text|>\n<|start_of_role|>assistant<|end_of_role|>""",
    "granite_3 - user": """<|start_of_role|>user<|end_of_role|>{prompt}<|end_of_text|>\n<|start_of_role|>assistant<|end_of_role|>""",
    ### Granite Code Only
    "granite_code - with system": """System:\n{system_prompt}\n\nQuestion:\n{prompt}\n\nAnswer:\n""",
    "granite_code - instruction only": """Question:\n{prompt}\n\nAnswer:\n""",
    ### Mistral Models
    "mistral_ai_models_sys": """<s>[INST]System Prompt: {system_prompt} \n\n User Prompt: {prompt}[/INST]""",
    "mistral_ai_models": """<s>[INST]{prompt}[/INST]""",
    "mistral_ai_small_sys": """<s>[SYSTEM_PROMPT]{system_prompt}[/SYSTEM_PROMPT][INST]{prompt}[/INST]""",
    "mistral_ai_small_raw": """[SYSTEM_PROMPT]{system_prompt}[/SYSTEM_PROMPT][INST]{prompt}[/INST]""",
    ### No Syntax
    "no syntax - system": """{system_prompt}\n\n{prompt}""",
    "no syntax - user": """{prompt}""",
}


def apply_prompt_syntax(prompt, system_prompt, prompt_template, bake_in_prompt_syntax):
    """Wrap a prompt in the chat markup of the selected model family.

    Args:
        prompt: The user prompt text to embed.
        system_prompt: System instructions; may be empty or None.
        prompt_template: Key naming one of the known templates.
        bake_in_prompt_syntax: When falsy, the prompt is returned untouched
            and ``prompt_template`` is not looked up.

    Returns:
        str: The formatted prompt, or ``prompt`` itself when baking is off.

    Raises:
        KeyError: If baking is on and ``prompt_template`` is not a known key.
    """
    if not bake_in_prompt_syntax:
        return prompt

    template = _MODEL_FAMILY_SYNTAX[prompt_template]
    # Always honour the selected template. Previously an empty system prompt
    # caused the raw prompt to be returned, so the "- user" templates (which
    # have no {system_prompt} field) were skipped exactly when they were
    # meant to be used. str.format ignores unused keyword arguments, and a
    # missing system prompt is rendered as an empty string.
    return template.format(system_prompt=system_prompt or "", prompt=prompt)

def generate_response(watsonx_llm, prompt_data, params):
    """Yield the chunks produced by the model's text stream, one at a time.

    Args:
        watsonx_llm: Object exposing ``generate_text_stream(prompt=, params=)``.
        prompt_data: The fully prepared prompt passed as ``prompt``.
        params: Generation parameters passed as ``params``.

    Yields:
        Each chunk from ``generate_text_stream``, in order and unmodified.
    """
    yield from watsonx_llm.generate_text_stream(prompt=prompt_data, params=params)

def chat_interface():
    """Render the chat input and stream the model's reply for one user turn.

    On a run where the user submitted a message, this builds the prompt from
    the turns already in ``st.session_state.chat_history``, records the new
    user message, streams the model output into a chat bubble, and records
    the reply. On runs without a submitted message only the header and the
    input box are rendered.
    """
    st.subheader("Jimmy")

    # User input
    user_input = st.chat_input("You:", key="user_input")
    if not user_input:
        return

    history = st.session_state.chat_history

    # Build the prompt from PRIOR turns only, then record the new message.
    # Appending first (as before) put the current message into the
    # "Conversation History" section and repeated it as "New User Prompt",
    # and meant the very first turn was never sent as a plain prompt.
    prompt = prepare_prompt(user_input, history)
    history.append({"role": "user", "content": user_input})

    # Apply prompt syntax
    prompt_data = apply_prompt_syntax(
        prompt,
        genparam.SYSTEM_PROMPT,
        genparam.PROMPT_TEMPLATE,
        genparam.BAKE_IN_PROMPT_SYNTAX,
    )

    # Setup client and model
    client = setup_client()
    watsonx_llm = ModelInference(
        api_client=client,
        model_id=genparam.SELECTED_MODEL,
        verify=genparam.VERIFY,
    )

    # Prepare parameters
    params = {
        GenParams.DECODING_METHOD: genparam.DECODING_METHOD,
        GenParams.MAX_NEW_TOKENS: genparam.MAX_NEW_TOKENS,
        GenParams.MIN_NEW_TOKENS: genparam.MIN_NEW_TOKENS,
        GenParams.REPETITION_PENALTY: genparam.REPETITION_PENALTY,
        GenParams.STOP_SEQUENCES: genparam.STOP_SEQUENCES,
    }

    # Generate and stream response. The avatar was stored as mis-decoded
    # UTF-8 bytes; restored to the emoji those bytes encode (U+1F612).
    with st.chat_message("Jimmy", avatar="😒"):
        stream = generate_response(watsonx_llm, prompt_data, params)
        response = st.write_stream(stream)

    # Add AI response to chat history
    history.append({"role": "Jimmy", "content": response})

def main():
    """Run the app: ensure session state exists, then render the chat UI."""
    for step in (initialize_session_state, chat_interface):
        step()


# Script entry point.
if __name__ == "__main__":
    main()