Skip to content
This repository has been archived by the owner on Jun 17, 2023. It is now read-only.

Concurrency and exponential backoff. 3.5 turbo 16k #1

Open
wants to merge 1 commit into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 6 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
chromadb/*
db_logs/*
chat_logs/*
api_logs/*
user_profile.txt
key_openai.txt
313 changes: 199 additions & 114 deletions chat.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,36 @@
import yaml
from time import time, sleep
from uuid import uuid4


import backoff
import concurrent.futures
import tiktoken
import sys

def token_count(messages=None, message=None, model="gpt-3.5-turbo-16k-0613"):
    """Estimate the number of tokens a chat request will consume.

    Args:
        messages: Optional list of chat-message dicts ({'role': ..., 'content': ...});
            counted with the per-message framing overhead OpenAI documents.
        message: Optional single string; when given, its raw token length is
            returned and *messages* is ignored.
        model: Model name used to pick the tiktoken encoding and framing constants.

    Returns:
        int: the estimated token count.
    """
    try:
        encoding = tiktoken.encoding_for_model(model)
    except KeyError:
        print("Warning: model not found for token count. Using cl100k_base encoding.")
        encoding = tiktoken.get_encoding("cl100k_base")
    if message is not None:
        return len(encoding.encode(message))
    # Avoid the mutable-default pitfall: build the empty list per call.
    if messages is None:
        messages = []
    if "gpt-3.5" in model:
        tokens_per_message = 4  # every message follows <|start|>{role/name}\n{content}<|end|>\n
        tokens_per_name = -1  # if there's a name, the role is omitted
    elif "gpt-4" in model:
        tokens_per_message = 3
        tokens_per_name = 1
    else:
        # Previously this path raised NameError (constants unbound). Fall back to
        # the modern framing constants used by current chat models.
        tokens_per_message = 3
        tokens_per_name = 1
    num_tokens = 0
    # Use a distinct loop name so the *message* parameter is not shadowed.
    for msg in messages:
        num_tokens += tokens_per_message
        for key, value in msg.items():
            num_tokens += len(encoding.encode(value))
            if key == "name":
                num_tokens += tokens_per_name
    num_tokens += 3  # every reply is primed with <|start|>assistant<|message|>
    return num_tokens


def save_yaml(filepath, data):
    """Serialize *data* to *filepath* as UTF-8 YAML, keeping non-ASCII text readable."""
    with open(filepath, 'w', encoding='utf-8') as handle:
        yaml.dump(data, handle, allow_unicode=True)
Expand All @@ -21,7 +49,7 @@ def open_file(filepath):
return infile.read()


def chatbot(messages, model="gpt-4", temperature=0):
def chatbot(messages, model="gpt-3.5-turbo-16k-0613", temperature=0):
max_retry = 7
retry = 0
while True:
Expand All @@ -32,10 +60,7 @@ def chatbot(messages, model="gpt-4", temperature=0):
### trim message object
debug_object = [i['content'] for i in messages]
debug_object.append(text)
save_yaml('api_logs/convo_%s.yaml' % time(), debug_object)
if response['usage']['total_tokens'] >= 7000:
a = messages.pop(1)

save_yaml('api_logs/convo_%s.yaml' % time(), debug_object)
return text
except Exception as oops:
print(f'\n\nError communicating with OpenAI: "{oops}"')
Expand All @@ -51,115 +76,175 @@ def chatbot(messages, model="gpt-4", temperature=0):
sleep(2 ** (retry - 1) * 5)


# Retried with exponential backoff on any OpenAI API error (up to 7 attempts).
@backoff.on_exception(backoff.expo, openai.error.OpenAIError, max_tries=7)
def chatbot_stream(messages, model="gpt-3.5-turbo-16k-0613", temperature=0):
    """Stream a chat completion, yielding each content chunk as it arrives.

    After the stream is fully consumed, the prompt contents plus the complete
    reply are logged to a timestamped YAML file under api_logs/.
    """
    response = openai.ChatCompletion.create(
        model=model, messages=messages, temperature=temperature, stream=True)
    collected = []
    for chunk in response:
        delta = chunk['choices'][0]['delta']
        if 'content' in delta:
            piece = delta['content']
            collected.append(piece)
            yield piece

    # Trimmed debug transcript: every prompt message followed by the full reply.
    transcript = [m['content'] for m in messages]
    transcript.append(''.join(collected))
    save_yaml('api_logs/convo_%s.yaml' % time(), transcript)




if __name__ == '__main__':
# instantiate ChromaDB
persist_directory = "chromadb"
chroma_client = chromadb.Client(Settings(persist_directory=persist_directory,chroma_db_impl="duckdb+parquet",))
collection = chroma_client.get_or_create_collection(name="knowledge_base")


# instantiate chatbot
openai.api_key = open_file('key_openai.txt')
conversation = list()
conversation.append({'role': 'system', 'content': open_file('system_default.txt')})
user_messages = list()
all_messages = list()

while True:
# get user input
text = input('\n\nUSER: ')
user_messages.append(text)
all_messages.append('USER: %s' % text)
conversation.append({'role': 'user', 'content': text})
save_file('chat_logs/chat_%s_user.txt' % time(), text)


# update main scratchpad
if len(all_messages) > 5:
all_messages.pop(0)
main_scratchpad = '\n\n'.join(all_messages).strip()


# search KB, update default system
current_profile = open_file('user_profile.txt')
kb = 'No KB articles yet'
if collection.count() > 0:
results = collection.query(query_texts=[main_scratchpad], n_results=1)
kb = results['documents'][0][0]
#print('\n\nDEBUG: Found results %s' % results)
default_system = open_file('system_default.txt').replace('<<PROFILE>>', current_profile).replace('<<KB>>', kb)
#print('SYSTEM: %s' % default_system)
conversation[0]['content'] = default_system


# generate a response
response = chatbot(conversation)
save_file('chat_logs/chat_%s_chatbot.txt' % time(), response)
conversation.append({'role': 'assistant', 'content': response})
all_messages.append('CHATBOT: %s' % response)
print('\n\nCHATBOT: %s' % response)


# update user scratchpad
if len(user_messages) > 3:
user_messages.pop(0)
user_scratchpad = '\n'.join(user_messages).strip()


# update user profile
print('\n\nUpdating user profile...')
profile_length = len(current_profile.split(' '))
profile_conversation = list()
profile_conversation.append({'role': 'system', 'content': open_file('system_update_user_profile.txt').replace('<<UPD>>', current_profile).replace('<<WORDS>>', str(profile_length))})
profile_conversation.append({'role': 'user', 'content': user_scratchpad})
profile = chatbot(profile_conversation)
save_file('user_profile.txt', profile)


# update main scratchpad
if len(all_messages) > 5:
all_messages.pop(0)
main_scratchpad = '\n\n'.join(all_messages).strip()


# Update the knowledge base
print('\n\nUpdating KB...')
if collection.count() == 0:
# yay first KB!
kb_convo = list()
kb_convo.append({'role': 'system', 'content': open_file('system_instantiate_new_kb.txt')})
kb_convo.append({'role': 'user', 'content': main_scratchpad})
article = chatbot(kb_convo)
new_id = str(uuid4())
collection.add(documents=[article],ids=[new_id])
save_file('db_logs/log_%s_add.txt' % time(), 'Added document %s:\n%s' % (new_id, article))
else:
results = collection.query(query_texts=[main_scratchpad], n_results=1)
kb = results['documents'][0][0]
kb_id = results['ids'][0][0]

# Expand current KB
kb_convo = list()
kb_convo.append({'role': 'system', 'content': open_file('system_update_existing_kb.txt').replace('<<KB>>', kb)})
kb_convo.append({'role': 'user', 'content': main_scratchpad})
article = chatbot(kb_convo)
collection.update(ids=[kb_id],documents=[article])
save_file('db_logs/log_%s_update.txt' % time(), 'Updated document %s:\n%s' % (kb_id, article))
# TODO - save more info in DB logs, probably as YAML file (original article, new info, final article)
# wrapper function for nonlocal keywords referencing
def main():
# instantiate ChromaDB
persist_directory = "chromadb"
chroma_client = chromadb.Client(Settings(persist_directory=persist_directory,chroma_db_impl="duckdb+parquet",))
collection = chroma_client.get_or_create_collection(name="knowledge_base")
model = "gpt-3.5-turbo-16k-0613"
conversation_token_pop_threshold = 12000
approximate_output_line_length = 120

# instantiate chatbot
openai.api_key = open_file('key_openai.txt')
conversation = list()
conversation.append({'role': 'system', 'content': open_file('system_default.txt')})
user_messages = list()
all_messages = list()

# Create a ThreadPoolExecutor with one worker thread
with concurrent.futures.ThreadPoolExecutor(max_workers=2) as executor:
while True:
# get user input
text = input('\n\nUSER: ')
user_messages.append(text)
all_messages.append('USER: %s' % text)
conversation.append({'role': 'user', 'content': text})
save_file('chat_logs/chat_%s_user.txt' % time(), text)


# update main scratchpad
if len(all_messages) > 5:
all_messages.pop(0)
main_scratchpad = '\n\n'.join(all_messages).strip()


# search KB, update default system
current_profile = open_file('user_profile.txt')
kb = 'No KB articles yet'
if collection.count() > 0:
results = collection.query(query_texts=[main_scratchpad], n_results=1)
kb = results['documents'][0][0]
#print('\n\nDEBUG: Found results %s' % results)
default_system = open_file('system_default.txt').replace('<<PROFILE>>', current_profile).replace('<<KB>>', kb)
#print('SYSTEM: %s' % default_system)
conversation[0]['content'] = default_system


# generate a response
# Initialize the line length to zero
line_length = 0
response = ''
sys.stdout.write("\n\nCHATBOT: ")
# Loop through each word from the generator
for text in chatbot_stream(conversation, model=model):
response += text
# If adding the word and a space exceeds 80 characters
if line_length + len(text) + 1 > approximate_output_line_length:
sys.stdout.write("\n")
line_length = 0
# Print the word and a space on the same line
sys.stdout.write(text)
# Flush the output
sys.stdout.flush()
# Update the line length by adding the word length and one space
line_length += len(text) + 1
else:
sys.stdout.write("\n\n")
sys.stdout.flush()


# Save response and update conversation variables
save_file('chat_logs/chat_%s_chatbot.txt' % time(), response)
conversation.append({'role': 'assistant', 'content': response})
current_usage = token_count(messages=conversation, model=model)
if current_usage >= conversation_token_pop_threshold:
_ = conversation.pop(1)
all_messages.append('CHATBOT: %s' % response)

# Update the user's profile function
def update_user_profile():
nonlocal user_messages
nonlocal current_profile
nonlocal model

# Split KB if too large
kb_len = len(article.split(' '))
if kb_len > 1000:
kb_convo = list()
kb_convo.append({'role': 'system', 'content': open_file('system_split_kb.txt')})
kb_convo.append({'role': 'user', 'content': article})
articles = chatbot(kb_convo).split('ARTICLE 2:')
a1 = articles[0].replace('ARTICLE 1:', '').strip()
a2 = articles[1].strip()
collection.update(ids=[kb_id],documents=[a1])
new_id = str(uuid4())
collection.add(documents=[a2],ids=[new_id])
save_file('db_logs/log_%s_split.txt' % time(), 'Split document %s, added %s:\n%s\n\n%s' % (kb_id, new_id, a1, a2))
chroma_client.persist()
# update user scratchpad
if len(user_messages) > 3:
user_messages.pop(0)
user_scratchpad = '\n'.join(user_messages).strip()

# update user profile
print('Updating user profile...')
profile_length = len(current_profile.split(' '))
profile_conversation = list()
profile_conversation.append({'role': 'system', 'content': open_file('system_update_user_profile.txt').replace('<<UPD>>', current_profile).replace('<<WORDS>>', str(profile_length))})
profile_conversation.append({'role': 'user', 'content': user_scratchpad})
profile = chatbot(profile_conversation, model=model)
save_file('user_profile.txt', profile)

# Update the knowledge base function
def update_knowledge_base():
nonlocal main_scratchpad
nonlocal collection
nonlocal model

# update main scratchpad
if len(all_messages) > 5:
all_messages.pop(0)
main_scratchpad = '\n\n'.join(all_messages).strip()

print('Updating KB...')
if collection.count() == 0:
# yay first KB!
kb_convo = list()
kb_convo.append({'role': 'system', 'content': open_file('system_instantiate_new_kb.txt')})
kb_convo.append({'role': 'user', 'content': main_scratchpad})
article = chatbot(kb_convo, model=model)
new_id = str(uuid4())
collection.add(documents=[article],ids=[new_id])
save_file('db_logs/log_%s_add.txt' % time(), 'Added document %s:\n%s' % (new_id, article))
else:
results = collection.query(query_texts=[main_scratchpad], n_results=1)
kb = results['documents'][0][0]
kb_id = results['ids'][0][0]

# Expand current KB
kb_convo = list()
kb_convo.append({'role': 'system', 'content': open_file('system_update_existing_kb.txt').replace('<<KB>>', kb)})
kb_convo.append({'role': 'user', 'content': main_scratchpad})
article = chatbot(kb_convo, model=model)
collection.update(ids=[kb_id],documents=[article])
save_file('db_logs/log_%s_update.txt' % time(), 'Updated document %s:\n%s' % (kb_id, article))
# TODO - save more info in DB logs, probably as YAML file (original article, new info, final article)

# Split KB if too large
kb_len = len(article.split(' '))
if kb_len > 1000:
kb_convo = list()
kb_convo.append({'role': 'system', 'content': open_file('system_split_kb.txt')})
kb_convo.append({'role': 'user', 'content': article})
articles = chatbot(kb_convo, model=model).split('ARTICLE 2:')
a1 = articles[0].replace('ARTICLE 1:', '').strip()
a2 = articles[1].strip()
collection.update(ids=[kb_id],documents=[a1])
new_id = str(uuid4())
collection.add(documents=[a2],ids=[new_id])
save_file('db_logs/log_%s_split.txt' % time(), 'Split document %s, added %s:\n%s\n\n%s' % (kb_id, new_id, a1, a2))

# Background Concurrency to update user profile and knowledge base
_1 = executor.submit(update_user_profile)
_2 = executor.submit(update_knowledge_base)
chroma_client.persist()

main()
4 changes: 3 additions & 1 deletion requirements.txt
Original file line number Diff line number Diff line change
@@ -1,2 +1,4 @@
openai
chromadb
chromadb
backoff
tiktoken