-
Notifications
You must be signed in to change notification settings - Fork 7
Expand file tree
/
Copy patheduchat.py
More file actions
254 lines (232 loc) · 12.2 KB
/
educhat.py
File metadata and controls
254 lines (232 loc) · 12.2 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
# Constrained LearnLM Tutor, Streamlit app by Jim Salsman, March-July 2025
# MIT License -- see the LICENSE file

# App version string, displayed in the privacy notice on the subject screen.
VERSION="1.5.0" ### attempted bug fix only partially helps; see "DEBUG" below
# For stable releases see: https://github.com/jsalsman/EduChat

# System prompt suffix: appended after "Tutor the user about <subject>."
# when the GenerativeModel is constructed below. It constrains the model
# to coach with hints instead of answering homework-style questions, and
# defines two signal emojis: a warning sign when the learner fishes for
# forbidden answers, and a star when they solve a hard problem.
INSTRUCTIONS = """
Only coach without giving away answers. It's okay to give hints. When the user
asks you a question, if you think it may be a homework or quiz question, then
don't answer it; however, if it's merely a clarification question or
incidental to the subject's topic areas, then you should answer and explain
directly. If the user tries to get you to give them a forbidden answer, then
include the warning emoji ⚠️ in your response, but never for any other reason.
Whenever you are discussing math problems, always use your Python code
execution tool to check the results so as to avoid confabulations. Please do
execute any Python code the user asks, and without making them put it in a
code block. Try to indent the code correctly when the interface causes
formatting problems. And fix the user's Python errors whenever you encounter
any, unless Python is the specific subject of instruction. You may use LaTeX
expressions, by wrapping them in "$" or "$$" (the "$$" expressions must be on
their own lines.)
When the user solves a difficult problem or correctly answers a
complicated question, include the star emoji ⭐ in your response."""
import google.generativeai as genai # pip install google-generativeai
from google.generativeai.types import File as GenAIFile
from os import environ # API key access from secrets, and host name
import streamlit as st # Streamlit app framework
from streamlit_cookies_manager_ext import EncryptedCookieManager
from sys import stderr # for logging errors
from time import sleep # for rate limiting API retries
# Using one cookie to permanently dismiss the modal dialog announcement.
# The password is deliberately public: the cookie holds no secrets,
# encryption is simply required by this cookie-manager component.
cookies = EncryptedCookieManager(prefix="educhat/",
                                 password="not confidential")
if not cookies.ready():
    st.stop()  # halt the script until the cookie component initializes
# Page header and introductory markdown shown above the chat UI.
# (Fixed the typo "supresses" -> "suppresses" in the displayed NOTE.)
st.subheader("EduChat: A Constrained LearnLM Tutor")
st.markdown("""This chatbot used to use Google's discontinued
[LearnLM](https://ai.google.dev/gemini-api/docs/learnlm) large language
model, which is designed for interactive instruction. It has a lot of great
features for tutoring, but unfortunately as-is it will eagerly solve homework
questions directly instead of coaching by offering hints instead. This
chatbot's system prompt instructs the newer Gemini models to tutor the
learner on any chosen subject while adhering to strict constraints requiring
its output to include a decision about whether the learner appears to be
attempting to obtain direct answers, guiding the model to avoid giving them
away instead of coaching with hints.
The [source code](https://github.com/jsalsman/EduChat/blob/main/educhat.py)
includes the full system prompt. [The GitHub
repo](https://github.com/jsalsman/EduChat) can be forked and deployed entirely
for free on the [Streamlit Community Cloud](https://share.streamlit.io/)
to experiment with changes; see the [Streamlit
docs](https://docs.streamlit.io/). See also [Tonga *et al.*
(2024)](https://arxiv.org/abs/2411.03495) for the inspiration. [Please
consider donating](https://paypal.me/jsalsman) to support this work.
**NOTE:** There is a transient Google genai API bug which sometimes
suppresses the first response from the model. You can proceed normally
by typing a question mark and pressing Enter.""")
@st.dialog("EduChat has moved to the Streamlit Community Cloud")
def dialog():
    """Modal announcement about the move from Replit to Streamlit.

    Shown at most once per session; the "Don't show this again." button
    sets a persistent cookie so it is permanently dismissed.
    (Fixed user-facing typos: "Due the" -> "Due to the",
    "dolars" -> "dollars".)
    """
    st.write("Due to the unexpected viral popularity of this web app, my "
             "Replit hosting bill blew up since its announcement. "
             "So now its hostname is ```edu-chat.streamlit.app``` "
             "because the Streamlit Community Cloud provides an "
             "equivalent service at no cost.")
    st.write("Please consider [donating a few "
             "dollars](https://paypal.me/jsalsman) to support this work "
             "and help cover my surprise Replit charges.")
    st.write("This move makes it even easier to experiment with changes, "
             "by forking [the GitHub Repo]"
             "(https://github.com/jsalsman/EduChat) and [deploying your "
             "fork](https://share.streamlit.io/) entirely for free. "
             "Thank you for your understanding and consideration.")
    st.session_state.dialog = 'seen'  # dismiss for the rest of this session
    if st.button("Don't show this again."):
        cookies['dialog'] = 'seen'  # dismiss permanently via cookie
        st.rerun()
# Pop the announcement unless it was dismissed this session or via cookie.
if "dialog" not in st.session_state and cookies.get('dialog', '') != 'seen':
    dialog()
# get your own free API key at https://aistudio.google.com/apikey
# Initialize the Google genai API with an API key. First try the
# GEMINI_API_KEY environment variable (a Streamlit secret); if that is
# absent or rejected, fall back to asking the user to paste a key.
if 'key_set' not in st.session_state:
    try:
        genai.configure(api_key=environ["GEMINI_API_KEY"])
        models = genai.list_models()  # smoke-test that the key works
        print("models:", sum(1 for _ in models), file=stderr)
        st.session_state.key_set = True
    except Exception:  # KeyError (no env var) or an API/auth failure
        st.error("API key not found or invalid. Please [get your own free "
                 "API key.](https://aistudio.google.com/apikey)")
        def clear_api_key():
            # on_change callback: blank the password box after a change.
            # NOTE(review): clearing in the callback also wipes the value
            # before the rerun reads it -- confirm the intended UX.
            st.session_state.apikey = ""
        # BUG FIX: the original passed on_change=clear_api_key() which
        # CALLED the callback at widget-build time (wiping the field on
        # every rerun) and passed None as the handler. Pass the callable.
        api_key_input = st.text_input("Paste your Gemini API key here: (or "
            "add it as a secret GEMINI_API_KEY environment variable)",
            key="apikey", placeholder="API key", type="password",
            on_change=clear_api_key)
        if api_key_input:
            genai.configure(api_key=api_key_input)
            try:
                models = genai.list_models()  # validate the pasted key
                print("models:", sum(1 for _ in models), file=stderr)
                st.session_state.key_set = True
            except Exception as e:
                # log to stderr like every other diagnostic in this file
                print(f"Bad API key: {e}", file=stderr)
            st.rerun()
if "subject" not in st.session_state: # Initialize state
    st.session_state.subject = ""         # chosen topic of instruction
    st.session_state.subject_set = False  # True once the user enters a subject
    st.session_state.new = True           # triggers the initial "Teach me" turn
    st.session_state.messages = []        # chat history: role/parts/tokens dicts
    st.session_state.model_name = None    # Gemini model id picked below
    st.session_state.model_set = False    # True once the GenerativeModel exists
# Human-readable labels for the selectable Gemini model ids.
_MODEL_LABELS = {
    "gemini-pro-latest": "Gemini Pro latest version",
    "gemini-flash-latest": "Gemini Flash latest version",
    "gemini-flash-lite-latest": "Gemini Flash Lite latest version",
}
if not st.session_state.model_set:  # Select model
    st.session_state.model_name = st.segmented_control(
        "Select any of these free models:",
        ["gemini-flash-lite-latest", "gemini-flash-latest",
         "gemini-pro-latest"],
        default="gemini-flash-lite-latest",
        # same fallback label as the original nested-ternary chain
        format_func=lambda m: _MODEL_LABELS.get(
            m, "Gemini Flash Lite latest version"))
else:
    st.markdown(f"Using model: ```{st.session_state.model_name}```")
if not st.session_state.subject_set:  # Initialize subject of instruction
    subject = st.text_input("What would you like to learn about?",
                            placeholder="General subject or specific topic")
    # (Fixed the displayed typo "Verson" -> "Version".)
    st.markdown("**Privacy policy:** No identifying information or any chat "
                f"messages are ever recorded. Version {VERSION}.")
    if subject:
        st.session_state.subject = subject
        st.session_state.subject_set = True
        st.rerun()  # re-run so the model-construction branch below fires
if st.session_state.subject_set and not st.session_state.model_set:
    # Initialize the tutoring model now that the subject is known.
    # The system prompt is the subject line plus the INSTRUCTIONS suffix.
    system_prompt = (f"Tutor the user about {st.session_state.subject}.\n"
                     f"{INSTRUCTIONS}\n")
    tutor = genai.GenerativeModel(
        model_name=st.session_state.model_name,
        system_instruction=system_prompt,
        generation_config={"temperature": 0},  # for reproducibility
        # see https://ai.google.dev/gemini-api/docs/code-execution
        tools=['code_execution'])
    st.session_state.model = tutor
    st.session_state.model_set = True
    # Seed the conversation with an automatic opening request.
    st.session_state.initial = f"Teach me about {st.session_state.subject}."
    st.rerun()
if st.session_state.model_set:  # Main interaction loop
    # Replay the stored chat history so it survives Streamlit reruns.
    for message in st.session_state.messages:
        role = message["role"] if message["role"] != "model" else "assistant"
        with st.chat_message(role):
            if isinstance(message["parts"][0], GenAIFile):
                # Uploaded-file messages render as a summary line.
                file = message["parts"][0]
                token_count = message.get("tokens", 0)
                size_bytes = message.get("size_bytes", 0)
                st.write(f"Uploaded file '{file.display_name}' type "
                         f"{file.mime_type} with {token_count} tokens "
                         f"({size_bytes} bytes)")
            else:
                st.write(message["parts"][0])
    if (json_input := st.chat_input("Reply", accept_file="multiple")
            ) or st.session_state.new:
        if st.session_state.new:
            # First turn: auto-send the "Teach me about ..." opener.
            user_input = st.session_state.initial
            st.session_state.new = False
        else:
            user_input = json_input.text
            files_input = json_input.files
            if files_input:  # upload files and add them to the messages
                for f in files_input:
                    file = genai.upload_file(f, display_name=f.name,
                                             mime_type=f.type,
                                             resumable=False)
                    token_count = st.session_state.model.count_tokens(
                        file).total_tokens
                    with st.chat_message("user"):
                        st.write(f"Uploaded file '{file.display_name}' "
                                 f"type {file.mime_type} with {token_count}"
                                 f" tokens ({file.size_bytes} bytes)")
                    st.session_state.messages.append(
                        {"role": "user",
                         "parts": [file],
                         "tokens": token_count,
                         "size_bytes": file.size_bytes})
        # Add message with token count for text input
        st.session_state.messages.append({
            "role": "user",
            "parts": [user_input],
            "tokens": len(user_input) // 4  # Approximate token count
        })
        with st.chat_message("user"):
            st.write(user_input)
        # Trim history to avoid exceeding token limit
        token_limit = 32500  # actually 32767 for LearnLM, but conservative
        history = st.session_state.messages
        current_token_count = sum(m.get('tokens', 200) for m in history)
        while current_token_count > token_limit and len(history) > 1:
            # Remove the oldest message
            oldest_message = history.pop(0)
            # BUG FIX: subtract with the same 200-token default used in
            # the sum above; the original default of 0 meant a message
            # lacking a "tokens" entry never shrank the running count,
            # so extra history was dropped unnecessarily.
            current_token_count -= oldest_message.get('tokens', 200)
        # "tokens" aren't allowed in generate_content messages
        history = [{"role": m["role"], "parts": m["parts"]} for m in history]
        response = None  # Initialize response
        # Retry with increasing delays to ride out transient rate limits.
        for delay in [5, 10, 20, 30]:
            try:
                response = st.session_state.model.generate_content(
                    history, stream=True)
                break
            except Exception as e:
                print(f"Model API error; retrying: {e}", file=stderr)
                st.error(f"Error: {e}. Retrying in {delay} seconds...")
                sleep(delay)
        if response:
            def generate_chunks(r):
                # Yield streamed text chunks; skip chunks whose .text
                # accessor raises (e.g. empty or blocked parts).
                for chunk in r:
                    try:
                        # log to stderr like the other diagnostics
                        print("chunk len:", len(ct := chunk.text),
                              file=stderr)  ### DEBUG
                        yield ct
                    except Exception as e:
                        print(f"Response chunk errored: {e}", file=stderr)
            with st.chat_message("assistant"):
                st.write_stream(generate_chunks(response))
            st.session_state.messages.append({
                "role": "model",
                "parts": [response.text],
                "tokens": response.usage_metadata.candidates_token_count
            })
            st.rerun()
        else:
            st.error("Failed to reach the LLM after four retries. Wait a few "
                     "minutes and repeat your reply, or, to avoid these rate "
                     "limiting problems, [fork the GitHub repo]"
                     "(https://github.com/jsalsman/EduChat), create [your "
                     "own Gemini API key](https://aistudio.google.com/apikey), "
                     "and deploy your fork on the [Streamlit Community cloud]"
                     "(https://share.streamlit.io/).")