From d4e1120b22f0a866ef85408c240f9f6d69f04a39 Mon Sep 17 00:00:00 2001 From: Debanjum Singh Solanky Date: Fri, 26 Nov 2021 17:23:03 +0530 Subject: [PATCH 1/4] Add GPT based conversation processor to understand intent and converse with user - Allow conversing with user using GPT's contextually aware, generative capability - Extract metadata, user intent from user's messages using GPT's general understanding --- environment.yml | 3 +- src/processor/conversation/gpt.py | 70 +++++++++++++++++++++++++++++++ tests/test_chatbot.py | 63 ++++++++++++++++++++++++++++ 3 files changed, 135 insertions(+), 1 deletion(-) create mode 100644 src/processor/conversation/gpt.py create mode 100644 tests/test_chatbot.py diff --git a/environment.yml b/environment.yml index e0691da8..aedf5358 100644 --- a/environment.yml +++ b/environment.yml @@ -12,4 +12,5 @@ dependencies: - pyyaml=5.* - pytest=6.* - pillow=8.* - - torchvision=0.* \ No newline at end of file + - torchvision=0.* + - openai=0.* \ No newline at end of file diff --git a/src/processor/conversation/gpt.py b/src/processor/conversation/gpt.py new file mode 100644 index 00000000..8418ff44 --- /dev/null +++ b/src/processor/conversation/gpt.py @@ -0,0 +1,70 @@ +# Standard Packages +import os + +# External Packages +import openai + + +def understand(text, api_key=None, temperature=0.5, max_tokens=100): + """ + Understand user input using OpenAI's GPT + """ + # Initialize Variables + openai.api_key = api_key or os.getenv("OPENAI_API_KEY") + understand_primer="Extract information from each chat message\n\nremember(memory-type, data);\nmemory-type=[\"companion\", \"notes\", \"ledger\", \"image\", \"music\"]\nsearch(search-type, data);\nsearch-type=[\"google\", \"youtube\"]\ngenerate(activity);\nactivity=[\"paint\",\"write\", \"chat\"]\ntrigger-emotion(emotion);\nemotion=[\"happy\",\"confidence\",\"fear\",\"surprise\",\"sadness\",\"disgust\",\"anger\", \"curiosity\", \"calm\"]\n\nQ: How are you doing?\nA: activity(\"chat\"); trigger-emotion(\"surprise\")\nQ: Do you remember what I told you about my brother Antoine when we were at the beach?\nA: remember(\"notes\", \"Brother Antoine when we were at the beach\"); trigger-emotion(\"curiosity\");\nQ: what did we talk about last time?\nA: remember(\"notes\", \"talk last time\"); trigger-emotion(\"curiosity\");\nQ: Let's make some drawings!\nA: generate(\"paint\"); trigger-emotion(\"happy\");\nQ: Do you know anything about Lebanon?\nA: search(\"google\", \"lebanon\"); trigger-emotion(\"confidence\");\nQ: Find a video about a panda rolling in the grass\nA: search(\"youtube\",\"panda rolling in the grass\"); trigger-emotion(\"happy\"); \nQ: Tell me a scary story\nA: generate(\"write\" \"A story about some adventure\"); trigger-emotion(\"fear\");\nQ: What fiction book was I reading last week about AI starship?\nA: remember(\"notes\", \"read fiction book about AI starship last week\"); trigger-emotion(\"curiosity\");\nQ: How much did I spend at Subway for dinner last time?\nA: remember(\"ledger\", \"last Subway dinner\"); trigger-emotion(\"curiosity\");\nQ: I'm feeling sleepy\nA: activity(\"chat\"); trigger-emotion(\"calm\")\nQ: What was that popular Sri lankan song that Alex showed me recently?\nA: remember(\"music\", \"popular Sri lankan song that Alex showed recently\"); trigger-emotion(\"curiosity\"); \nQ: You're pretty funny!\nA: activity(\"chat\"); trigger-emotion(\"pride\")" + + # Setup Prompt with Understand Primer + prompt = message_to_prompt(text, understand_primer, start_sequence="\nA:", 
restart_sequence="\nQ:") + + # Get Reponse from GPT + response = openai.Completion.create( + engine="davinci", + prompt=prompt, + temperature=temperature, + max_tokens=max_tokens, + top_p=1, + frequency_penalty=0.2, + presence_penalty=0, + stop=["\n"]) + + # Extract, Clean Message from GPT's Response + story = response['choices'][0]['text'] + return str(story) + + +def converse(text, conversation_history=None, api_key=None, temperature=0.9, max_tokens=150): + """ + Converse with user using OpenAI's GPT + """ + # Initialize Variables + openai.api_key = api_key or os.getenv("OPENAI_API_KEY") + + start_sequence = "\nAI:" + restart_sequence = "\nHuman:" + conversation_primer = f"The following is a conversation with an AI assistant. The assistant is helpful, creative, clever, and very friendly companion.\n{restart_sequence} Hello, who are you?{start_sequence} Hi, I am an AI conversational companion created by OpenAI. How can I help you today?" + + # Setup Prompt with Primer or Conversation History + prompt = message_to_prompt(text, conversation_history or conversation_primer, start_sequence=start_sequence, restart_sequence=restart_sequence) + + # Get Response from GPT + response = openai.Completion.create( + engine="davinci", + prompt=prompt, + temperature=temperature, + max_tokens=max_tokens, + top_p=1, + frequency_penalty=0, + presence_penalty=0.6, + stop=["\n", " Human:", " AI:"]) + + # Extract, Clean Message from GPT's Response + story = response['choices'][0]['text'] + return str(story).strip() + + +def message_to_prompt(user_message, conversation_history="", gpt_message=None, start_sequence="\nAI:", restart_sequence="\nHuman:"): + """Create prompt for GPT from message""" + if gpt_message: + return f"{conversation_history}{restart_sequence} {user_message}{start_sequence} {gpt_message}" + else: + return f"{conversation_history}{restart_sequence} {user_message}{start_sequence}" \ No newline at end of file diff --git a/tests/test_chatbot.py b/tests/test_chatbot.py new file mode 100644 index 00000000..ca207d02 --- /dev/null +++ b/tests/test_chatbot.py @@ -0,0 +1,63 @@ +# External Packages +import pytest + +# Internal Packages +from src.processor.conversation.gpt import converse, understand, message_to_prompt + +# Input your OpenAI API key to run the tests below +api_key = None + + +# Test +# ---------------------------------------------------------------------------------------------------- +def test_message_to_understand_prompt(): + # Setup + understand_primer = "Extract information from each chat message\n\nremember(memory-type, data);\nmemory-type=[\"companion\", \"notes\", \"ledger\", \"image\", \"music\"]\nsearch(search-type, data);\nsearch-type=[\"google\", \"youtube\"]\ngenerate(activity);\nactivity=[\"paint\",\"write\", \"chat\"]\ntrigger-emotion(emotion);\nemotion=[\"happy\",\"confidence\",\"fear\",\"surprise\",\"sadness\",\"disgust\",\"anger\", \"curiosity\", \"calm\"]\n\nQ: How are you doing?\nA: activity(\"chat\"); trigger-emotion(\"surprise\")\nQ: Do you remember what I told you about my brother Antoine when we were at the beach?\nA: remember(\"notes\", \"Brother Antoine when we were at the beach\"); trigger-emotion(\"curiosity\");\nQ: what did we talk about last time?\nA: remember(\"notes\", \"talk last time\"); trigger-emotion(\"curiosity\");\nQ: Let's make some drawings!\nA: generate(\"paint\"); trigger-emotion(\"happy\");\nQ: Do you know anything about Lebanon?\nA: search(\"google\", \"lebanon\"); trigger-emotion(\"confidence\");\nQ: Find a video about a panda rolling in the 
grass\nA: search(\"youtube\",\"panda rolling in the grass\"); trigger-emotion(\"happy\"); \nQ: Tell me a scary story\nA: generate(\"write\" \"A story about some adventure\"); trigger-emotion(\"fear\");\nQ: What fiction book was I reading last week about AI starship?\nA: remember(\"notes\", \"read fiction book about AI starship last week\"); trigger-emotion(\"curiosity\");\nQ: How much did I spend at Subway for dinner last time?\nA: remember(\"ledger\", \"last Subway dinner\"); trigger-emotion(\"curiosity\");\nQ: I'm feeling sleepy\nA: activity(\"chat\"); trigger-emotion(\"calm\")\nQ: What was that popular Sri lankan song that Alex showed me recently?\nA: remember(\"music\", \"popular Sri lankan song that Alex showed recently\"); trigger-emotion(\"curiosity\"); \nQ: You're pretty funny!\nA: activity(\"chat\"); trigger-emotion(\"pride\")" + expected_response = "Extract information from each chat message\n\nremember(memory-type, data);\nmemory-type=[\"companion\", \"notes\", \"ledger\", \"image\", \"music\"]\nsearch(search-type, data);\nsearch-type=[\"google\", \"youtube\"]\ngenerate(activity);\nactivity=[\"paint\",\"write\", \"chat\"]\ntrigger-emotion(emotion);\nemotion=[\"happy\",\"confidence\",\"fear\",\"surprise\",\"sadness\",\"disgust\",\"anger\", \"curiosity\", \"calm\"]\n\nQ: How are you doing?\nA: activity(\"chat\"); trigger-emotion(\"surprise\")\nQ: Do you remember what I told you about my brother Antoine when we were at the beach?\nA: remember(\"notes\", \"Brother Antoine when we were at the beach\"); trigger-emotion(\"curiosity\");\nQ: what did we talk about last time?\nA: remember(\"notes\", \"talk last time\"); trigger-emotion(\"curiosity\");\nQ: Let's make some drawings!\nA: generate(\"paint\"); trigger-emotion(\"happy\");\nQ: Do you know anything about Lebanon?\nA: search(\"google\", \"lebanon\"); trigger-emotion(\"confidence\");\nQ: Find a video about a panda rolling in the grass\nA: search(\"youtube\",\"panda rolling in the grass\"); trigger-emotion(\"happy\"); \nQ: Tell me a scary story\nA: generate(\"write\" \"A story about some adventure\"); trigger-emotion(\"fear\");\nQ: What fiction book was I reading last week about AI starship?\nA: remember(\"notes\", \"read fiction book about AI starship last week\"); trigger-emotion(\"curiosity\");\nQ: How much did I spend at Subway for dinner last time?\nA: remember(\"ledger\", \"last Subway dinner\"); trigger-emotion(\"curiosity\");\nQ: I'm feeling sleepy\nA: activity(\"chat\"); trigger-emotion(\"calm\")\nQ: What was that popular Sri lankan song that Alex showed me recently?\nA: remember(\"music\", \"popular Sri lankan song that Alex showed recently\"); trigger-emotion(\"curiosity\"); \nQ: You're pretty funny!\nA: activity(\"chat\"); trigger-emotion(\"pride\")\nQ: When did I last dine at Burger King?\nA:" + + # Act + actual_response = message_to_prompt("When did I last dine at Burger King?", understand_primer, start_sequence="\nA:", restart_sequence="\nQ:") + + # Assert + assert actual_response == expected_response + + +# ---------------------------------------------------------------------------------------------------- +@pytest.mark.skipif(api_key is None, + reason="Set api_key variable to your OpenAI API key from https://beta.openai.com/account/api-keys") +def test_minimal_chat_with_gpt(): + # Act + response = converse("What will happen when the stars go out?", api_key=api_key) + + # Assert + assert len(response) > 0 + + +# ---------------------------------------------------------------------------------------------------- 
+@pytest.mark.skipif(api_key is None, + reason="Set api_key variable to your OpenAI API key from https://beta.openai.com/account/api-keys") +def test_chat_with_history(): + # Act + start_sequence="\nAI:" + restart_sequence="\nHuman:" + + conversation_primer = f"The following is a conversation with an AI assistant. The assistant is helpful, creative, clever, and very friendly companion.\n{restart_sequence} Hello, I am testatron. Who are you?{start_sequence} Hi, I am an AI conversational companion created by OpenAI. How can I help you today?" + conversation_history = conversation_primer + + response = converse("Can you tell me my name?", conversation_history=conversation_history, api_key=api_key, temperature=0, max_tokens=50) + + # Assert + assert len(response) > 0 + assert "Testatron" in response or "testatron" in response + + +# ---------------------------------------------------------------------------------------------------- +@pytest.mark.skipif(api_key is None, + reason="Set api_key variable to your OpenAI API key from https://beta.openai.com/account/api-keys") +def test_understand_message_using_gpt(): + # Act + response = understand("When did I last dine at Subway?", api_key=api_key) + + # Assert + assert len(response) > 0 + assert "remember(\"ledger\", " in response From a99b4b3434c67ee2151d28c5ac41a4ee979d1cbd Mon Sep 17 00:00:00 2001 From: Debanjum Singh Solanky Date: Sat, 27 Nov 2021 01:26:26 +0530 Subject: [PATCH 2/4] Make conversation processor configurable --- sample_config.yml | 6 ++++++ src/utils/cli.py | 11 ++++++++++- src/utils/config.py | 24 ++++++++++++++++++++++++ 3 files changed, 40 insertions(+), 1 deletion(-) diff --git a/sample_config.yml b/sample_config.yml index 2fb447ab..fc04918f 100644 --- a/sample_config.yml +++ b/sample_config.yml @@ -30,3 +30,9 @@ search-type: image: encoder: "clip-ViT-B-32" + +processor: + conversation: + openai-api-key: null + conversation-logfile: "tests/data/.conversation_logs.json" + conversation-history: null \ No newline at end of file diff --git a/src/utils/cli.py b/src/utils/cli.py index b8c725f4..6891463a 100644 --- a/src/utils/cli.py +++ b/src/utils/cli.py @@ -80,6 +80,15 @@ default_config = { 'image': { 'encoder': "clip-ViT-B-32" - } + }, + }, + 'processor': + { + 'conversation': + { + 'openai-api-key': "", + 'conversation-logfile': ".conversation_logs.json", + 'conversation-history': "" + }, } } diff --git a/src/utils/config.py b/src/utils/config.py index 16328e37..7627697a 100644 --- a/src/utils/config.py +++ b/src/utils/config.py @@ -93,3 +93,27 @@ class SearchConfig(): ledger: TextSearchConfig = None music: TextSearchConfig = None image: ImageSearchConfig = None + + +class ConversationProcessorConfig(): + def __init__(self, conversation_logfile, conversation_history, openai_api_key, verbose): + self.openai_api_key = openai_api_key + self.conversation_logfile = conversation_logfile + self.conversation_history = conversation_history + self.verbose = verbose + + def create_from_dictionary(config, key_tree, verbose): + conversation_config = get_from_dict(config, *key_tree) + if not conversation_config: + return None + + return ConversationProcessorConfig( + openai_api_key = conversation_config['openai-api-key'], + conversation_history = '', + conversation_logfile = Path(conversation_config['conversation-logfile']), + verbose = verbose) + + +@dataclass +class ProcessorConfig(): + conversation: ConversationProcessorConfig = None \ No newline at end of file From ccfb97e1a7da444b3ac1c3acba1e9aa77f293554 Mon Sep 17 00:00:00 2001 From: 
Debanjum Singh Solanky Date: Sat, 27 Nov 2021 01:27:46 +0530 Subject: [PATCH 3/4] Wire up minimal conversation processor. Expose it over /chat API endpoint Ensure conversation history persists across application restart --- src/main.py | 57 +++++++++++++++++++++++++++++++++++++++++++++++++++-- 1 file changed, 55 insertions(+), 2 deletions(-) diff --git a/src/main.py b/src/main.py index bf2f819f..5d0a83d5 100644 --- a/src/main.py +++ b/src/main.py @@ -1,5 +1,6 @@ # Standard Packages import sys +import json from typing import Optional # External Packages @@ -8,14 +9,16 @@ from fastapi import FastAPI # Internal Packages from src.search_type import asymmetric, symmetric_ledger, image_search -from src.utils.helpers import get_from_dict +from src.utils.helpers import get_absolute_path from src.utils.cli import cli -from src.utils.config import SearchType, SearchModels, TextSearchConfig, ImageSearchConfig, SearchConfig +from src.utils.config import SearchType, SearchModels, TextSearchConfig, ImageSearchConfig, SearchConfig, ProcessorConfig, ConversationProcessorConfig +from src.processor.conversation.gpt import converse, message_to_prompt # Application Global State model = SearchModels() search_config = SearchConfig() +processor_config = ProcessorConfig() app = FastAPI() @@ -85,6 +88,20 @@ def regenerate(t: Optional[SearchType] = None): return {'status': 'ok', 'message': 'regeneration completed'} +@app.get('/chat') +def chat(q: str): + # Load Conversation History + conversation_history = processor_config.conversation.conversation_history + + # Converse with OpenAI GPT + gpt_response = converse(q, conversation_history, api_key=processor_config.conversation.openai_api_key) + + # Update Conversation History + processor_config.conversation.conversation_history = message_to_prompt(q, conversation_history, gpt_response) + + return {'status': 'ok', 'response': gpt_response} + + def initialize_search(config, regenerate, verbose): model = SearchModels() search_config = SearchConfig() @@ -112,6 +129,39 @@ def initialize_search(config, regenerate, verbose): return model, search_config +def initialize_processor(config, verbose): + processor_config = ProcessorConfig() + + # Initialize Conversation Processor + processor_config.conversation = ConversationProcessorConfig.create_from_dictionary(config, ('processor', 'conversation'), verbose) + + # Load or Initialize Conversation History from Disk + conversation_logfile = processor_config.conversation.conversation_logfile + if processor_config.conversation.verbose: + print('Saving conversation logs to disk...') + + if conversation_logfile.expanduser().absolute().is_file(): + with open(get_absolute_path(conversation_logfile), 'r') as f: + processor_config.conversation.conversation_history = json.load(f).get('chat', '') + else: + processor_config.conversation.conversation_history = '' + + return processor_config + + +@app.on_event('shutdown') +def shutdown_event(): + if processor_config.conversation.verbose: + print('Saving conversation logs to disk...') + + # Save Conversation History to Disk + conversation_logfile = get_absolute_path(processor_config.conversation.conversation_logfile) + with open(conversation_logfile, "w+", encoding='utf-8') as logfile: + json.dump({"chat": processor_config.conversation.conversation_history}, logfile) + + print('Conversation logs saved to disk.') + + if __name__ == '__main__': # Load config from CLI args = cli(sys.argv[1:]) @@ -119,6 +169,9 @@ if __name__ == '__main__': # Initialize Search from Config model, search_config = 
initialize_search(args.config, args.regenerate, args.verbose) + # Initialize Processor from Config + processor_config = initialize_processor(args.config, args.verbose) + # Start Application Server if args.socket: uvicorn.run(app, proxy_headers=True, uds=args.socket) From 882e0f81b4fa42b83ceebb8493ac0b07fcd4540c Mon Sep 17 00:00:00 2001 From: Debanjum Singh Solanky Date: Sat, 27 Nov 2021 18:14:29 +0530 Subject: [PATCH 4/4] Skip running the inconsistent image search test --- tests/test_image_search.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/tests/test_image_search.py b/tests/test_image_search.py index 5d1155e5..943d6bec 100644 --- a/tests/test_image_search.py +++ b/tests/test_image_search.py @@ -1,3 +1,6 @@ +# External Packages +import pytest + # Internal Packages from src.main import model from src.search_type import image_search @@ -17,6 +20,7 @@ def test_image_search_setup(search_config): # ---------------------------------------------------------------------------------------------------- +@pytest.mark.skip(reason="results inconsistent currently") def test_image_search(search_config): # Arrange model.image_search = image_search.setup(search_config.image, regenerate=False)
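
A note on consuming understand()'s output: the primer in PATCH 1/4 steers GPT toward a small command DSL (remember(...), search(...), generate(...), trigger-emotion(...)), and test_understand_message_using_gpt only asserts that the raw text contains remember("ledger", ...). Nothing in this series parses that text yet; the sketch below is a hypothetical helper (parse_understand_response does not exist in the patches) showing one naive way a caller could split such a response into (action, arguments) pairs.

# Hypothetical helper, NOT part of the patches: naive parse of understand()'s
# DSL-style output, e.g. 'remember("ledger", "last Subway dinner"); trigger-emotion("curiosity");'
# Arguments containing commas inside quotes would need a real parser.
import re

def parse_understand_response(response: str):
    """Split GPT's DSL-style response into (action, arguments) tuples."""
    actions = []
    for match in re.finditer(r'([\w-]+)\(([^)]*)\)', response):
        name = match.group(1)
        args = [arg.strip().strip('"') for arg in match.group(2).split(',')]
        actions.append((name, args))
    return actions

print(parse_understand_response(
    'remember("ledger", "last Subway dinner"); trigger-emotion("curiosity");'))
# [('remember', ['ledger', 'last Subway dinner']), ('trigger-emotion', ['curiosity'])]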
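
For reference, the conversation history that PATCH 3/4 persists to the conversation logfile is just the running prompt built by repeated calls to message_to_prompt: the /chat handler appends each user message and GPT reply to the transcript, then feeds the whole transcript back to converse() on the next turn. A minimal offline illustration, using the real message_to_prompt but a hard-coded stand-in for GPT's reply (so no API key is needed):

# Offline illustration of how /chat accumulates conversation history.
# The GPT reply below is a hard-coded stand-in; no OpenAI call is made.
from src.processor.conversation.gpt import message_to_prompt

history = ""

# Turn 1: append the user message and the (stand-in) GPT reply to the transcript,
# mirroring what chat() in src/main.py does after calling converse()
history = message_to_prompt("Hello, who are you?", history,
                            gpt_message="Hi, I am your AI conversational companion.")

# Turn 2: the next user message is prompted with everything said so far,
# ending in "\nAI:" so GPT completes the assistant's side of the dialogue
prompt = message_to_prompt("Can you tell me my name?", history)
print(prompt)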
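
Finally, a quick way to exercise the new /chat endpoint end to end once the server from PATCH 3/4 is running. The snippet assumes the app is served at http://localhost:8000 (uvicorn's default; the visible hunk only shows the unix-socket branch of the startup code, so adjust host and port to your setup) and that openai-api-key is set under processor.conversation in the config:

# Smoke test for the /chat endpoint using only the standard library.
# Assumes the FastAPI app from src/main.py is reachable at localhost:8000.
import json
import urllib.parse
import urllib.request

query = urllib.parse.urlencode({"q": "Hello, who are you?"})
with urllib.request.urlopen(f"http://localhost:8000/chat?{query}") as response:
    reply = json.load(response)

print(reply["status"])    # "ok" on success
print(reply["response"])  # GPT's reply text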