Fix #11 -- Add thread locking, to avoid premature assistant runs

voiio · Dec 17, 2023 · 700805b · 700805b
1 parent bdd4b48
commit 700805b
Show file tree

Hide file tree

Showing 2 changed files with 133 additions and 117 deletions.
diff --git a/sam/config.py b/sam/config.py
@@ -5,4 +5,4 @@
 OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
 OPENAI_ASSISTANT_ID = os.getenv("OPENAI_ASSISTANT_ID")
 REDIS_URL = os.getenv("REDIS_URL", "redis:///")
-RANDOM_RUN_RATIO = float(os.getenv("RANDOM_RUN_RATIO"))
+RANDOM_RUN_RATIO = float(os.getenv("RANDOM_RUN_RATIO", "0"))
diff --git a/sam/slack.py b/sam/slack.py
@@ -1,6 +1,7 @@
 import json
 import logging
 import random  # nosec
+import threading
 import time
 import urllib.request
 from typing import Any
@@ -34,47 +35,59 @@ def handle_message(event: {str, Any}, say: Say):
     text = event["text"]
     text = text.replace(f"<@{USER_HANDLE}>", "Sam")
     thread_id = utils.get_thread_id(channel_id)
-    file_ids = []
-    voice_prompt = False
-    if "files" in event:
-        for file in event["files"]:
-            req = urllib.request.Request(
-                file["url_private"],
-                headers={"Authorization": f"Bearer {config.SLACK_BOT_TOKEN}"},
-            )
-            with urllib.request.urlopen(req) as response:  # nosec
-                if file["filetype"] in AUDIO_FORMATS:
-                    text += "\n" + client.audio.transcriptions.create(
-                        model="whisper-1",
-                        file=(file["name"], response.read()),
-                        response_format="text",
-                    )
-                    logger.info(f"User={user_id} added Audio={file['id']}")
-                    voice_prompt = True
-                else:
-                    file_ids.append(
-                        client.files.create(
-                            file=(file["name"], response.read()), purpose="assistants"
-                        ).id
-                    )
-                    logger.info(
-                        f"User={user_id} added File={file_ids[-1]} to Thread={thread_id}"
-                    )
-    client.beta.threads.messages.create(
-        thread_id=thread_id,
-        content=text,
-        role="user",
-        file_ids=file_ids,
-    )
-    logger.info(
-        f"User={user_id} added Message={client_msg_id} added to Thread={thread_id}"
-    )
-    if (
-        channel_type == "im"
-        or event.get("parent_user_id") == USER_HANDLE
-        or random.random() < config.RANDOM_RUN_RATIO  # nosec
-    ):
-        process_run(event, say, voice_prompt=voice_prompt)
+    # We may only add messages to a thread while the assistant is not running
+    with utils.storage.lock(
+        thread_id, timeout=10 * 60, thread_local=False
+    ):  # 10 minutes
+        file_ids = []
+        voice_prompt = False
+        if "files" in event:
+            for file in event["files"]:
+                req = urllib.request.Request(
+                    file["url_private"],
+                    headers={"Authorization": f"Bearer {config.SLACK_BOT_TOKEN}"},
+                )
+                with urllib.request.urlopen(req) as response:  # nosec
+                    if file["filetype"] in AUDIO_FORMATS:
+                        text += "\n" + client.audio.transcriptions.create(
+                            model="whisper-1",
+                            file=(file["name"], response.read()),
+                            response_format="text",
+                        )
+                        logger.info(f"User={user_id} added Audio={file['id']}")
+                        voice_prompt = True
+                    else:
+                        file_ids.append(
+                            client.files.create(
+                                file=(file["name"], response.read()),
+                                purpose="assistants",
+                            ).id
+                        )
+                        logger.info(
+                            f"User={user_id} added File={file_ids[-1]} to Thread={thread_id}"
+                        )
+        client.beta.threads.messages.create(
+            thread_id=thread_id,
+            content=text,
+            role="user",
+            file_ids=file_ids,
+        )
+        logger.info(
+            f"User={user_id} added Message={client_msg_id} added to Thread={thread_id}"
+        )
+        if (
+            channel_type == "im"
+            or event.get("parent_user_id") == USER_HANDLE
+            or random.random() < config.RANDOM_RUN_RATIO  # nosec
+        ):
+            # we need to run the assistant in a separate thread, otherwise we will
+            # block the main thread:
+            # process_run(event, say, voice_prompt=voice_prompt)
+            threading.Thread(
+                target=process_run,
+                args=(event, say),
+                kwargs={"voice_prompt": voice_prompt},
+            ).start()
 
 
 def process_run(event: {str, Any}, say: Say, voice_prompt: bool = False):
@@ -83,88 +96,91 @@ def process_run(event: {str, Any}, say: Say, voice_prompt: bool = False):
     user_id = event["user"]
     thread_ts = event.get("thread_ts")
     thread_id = utils.get_thread_id(channel_id)
-    run = client.beta.threads.runs.create(
-        thread_id=thread_id,
-        assistant_id=config.OPENAI_ASSISTANT_ID,
-    )
-    msg = say(f":speech_balloon:", mrkdwn=True, thread_ts=thread_ts)
-    logger.info(f"User={user_id} started Run={run.id} for Thread={thread_id}")
-    for i in range(14):  # ~ 10 minutes
-        if run.status not in ["queued", "in_progress"]:
-            break
-        time.sleep(min(2**i, 60))  # exponential backoff capped at 60 seconds
-        run = client.beta.threads.runs.retrieve(thread_id=thread_id, run_id=run.id)
-    if run.status == "failed":
-        logger.error(run.last_error)
-        say.client.chat_update(
-            channel=say.channel,
-            ts=msg["ts"],
-            text=f"🤖 {run.last_error.message}",
-            mrkdwn=True,
-        )
-        logger.error(f"Run {run.id} {run.status} for Thread {thread_id}")
-        logger.error(run.last_error.message)
-        return
-    elif run.status != "completed":
-        logger.error(f"Run={run.id} {run.status} for Thread {thread_id}")
-        say.client.chat_update(
-            channel=say.channel,
-            ts=msg["ts"],
-            text=f"🤯",
-            mrkdwn=True,
+    # We may wait for the messages being processed, before starting a new run
+    with utils.storage.lock(thread_id, timeout=10 * 60):  # 10 minutes
+        run = client.beta.threads.runs.create(
+            thread_id=thread_id,
+            assistant_id=config.OPENAI_ASSISTANT_ID,
         )
-        return
-    logger.info(f"Run={run.id} {run.status} for Thread={thread_id}")
-
-    messages = client.beta.threads.messages.list(thread_id=thread_id)
-    for message in messages:
-        if message.role == "assistant":
-            message_content = message.content[0].text
-            if voice_prompt:
-                response = client.audio.speech.create(
-                    model="tts-1-hd",
-                    voice="alloy",
-                    input=message_content.value,
-                )
-                say.client.files_upload(
-                    content=response.read(),
-                    channels=say.channel,
-                    ts=msg["ts"],
-                )
-                logger.info(
-                    f"Sam responded to the User={user_id} in Channel={channel_id} via Voice"
-                )
-            else:
-                annotations = message_content.annotations
-                citations = []
-
-                # Iterate over the annotations and add footnotes
-                for index, annotation in enumerate(annotations):
-                    message_content.value = message_content.value.replace(
-                        annotation.text, f" [{index}]"
-                    )
-
-                    if file_citation := getattr(annotation, "file_citation", None):
-                        cited_file = client.files.retrieve(file_citation.file_id)
-                        citations.append(
-                            f"[{index}] {file_citation.quote} — {cited_file.filename}"
-                        )
-                    elif file_path := getattr(annotation, "file_path", None):
-                        cited_file = client.files.retrieve(file_path.file_id)
-                        citations.append(f"[{index}]({cited_file.filename})")
-
-                # Add footnotes to the end of the message before displaying to user
-                message_content.value += "\n" + "\n".join(citations)
+        msg = say(f":speech_balloon:", mrkdwn=True, thread_ts=thread_ts)
+        logger.info(f"User={user_id} started Run={run.id} for Thread={thread_id}")
+        for i in range(14):  # ~ 10 minutes
+            if run.status not in ["queued", "in_progress"]:
+                break
+            time.sleep(min(2**i, 60))  # exponential backoff capped at 60 seconds
+            run = client.beta.threads.runs.retrieve(thread_id=thread_id, run_id=run.id)
+        if run.status == "failed":
+            logger.error(run.last_error)
             say.client.chat_update(
                 channel=say.channel,
                 ts=msg["ts"],
-                text=message_content.value,
+                text=f"🤖 {run.last_error.message}",
                 mrkdwn=True,
             )
-            logger.info(
-                f"Sam responded to the User={user_id} in Channel={channel_id} via Text"
+            logger.error(f"Run {run.id} {run.status} for Thread {thread_id}")
+            logger.error(run.last_error.message)
+            return
+        elif run.status != "completed":
+            logger.error(f"Run={run.id} {run.status} for Thread {thread_id}")
+            say.client.chat_update(
+                channel=say.channel,
+                ts=msg["ts"],
+                text=f"🤯",
+                mrkdwn=True,
             )
-            break
+            return
+        logger.info(f"Run={run.id} {run.status} for Thread={thread_id}")
+
+        messages = client.beta.threads.messages.list(thread_id=thread_id)
+        for message in messages:
+            if message.role == "assistant":
+                message_content = message.content[0].text
+                if voice_prompt:
+                    response = client.audio.speech.create(
+                        model="tts-1-hd",
+                        voice="alloy",
+                        input=message_content.value,
+                    )
+                    say.client.files_upload(
+                        content=response.read(),
+                        channels=say.channel,
+                        thread_ts=thread_ts,
+                        ts=msg["ts"],
+                    )
+                    logger.info(
+                        f"Sam responded to the User={user_id} in Channel={channel_id} via Voice"
+                    )
+                else:
+                    annotations = message_content.annotations
+                    citations = []
+
+                    # Iterate over the annotations and add footnotes
+                    for index, annotation in enumerate(annotations):
+                        message_content.value = message_content.value.replace(
+                            annotation.text, f" [{index}]"
+                        )
+
+                        if file_citation := getattr(annotation, "file_citation", None):
+                            cited_file = client.files.retrieve(file_citation.file_id)
+                            citations.append(
+                                f"[{index}] {file_citation.quote} — {cited_file.filename}"
+                            )
+                        elif file_path := getattr(annotation, "file_path", None):
+                            cited_file = client.files.retrieve(file_path.file_id)
+                            citations.append(f"[{index}]({cited_file.filename})")
+
+                    # Add footnotes to the end of the message before displaying to user
+                    message_content.value += "\n" + "\n".join(citations)
+                say.client.chat_update(
+                    channel=say.channel,
+                    ts=msg["ts"],
+                    text=message_content.value,
+                    mrkdwn=True,
+                )
+                logger.info(
+                    f"Sam responded to the User={user_id} in Channel={channel_id} via Text"
+                )
+                break
 
 
 app.event("message")(handle_message)