Commit

Initial app commit v0.1.0.
dylanhogg committed Feb 6, 2024
1 parent 12479f1 commit 6feb99b
Showing 18 changed files with 3,251 additions and 21 deletions.
3 changes: 3 additions & 0 deletions .gitignore
@@ -11,6 +11,9 @@ _temp/
.DS_Store
.pypirc

mp3/
conversation_transcripts/

# Byte-compiled / optimized / DLL files
__pycache__/
*.py[cod]
3 changes: 2 additions & 1 deletion Makefile
@@ -1,6 +1,7 @@
run:
# Executes the given command inside the virtualenv
poetry run llmvsllm "llm1" "llm2" --llm-use-localhost 0
# poetry run llmvsllm python_language_evangelist java_language_evangelist # --speak
poetry run llmvsllm chatgpt_llm_evangelist bard_llm_evangelist # --speak

build:
# Build the source and wheels archives
2 changes: 2 additions & 0 deletions README.md
@@ -4,3 +4,5 @@
[![Build](https://github.com/dylanhogg/llmvsllm/workflows/build/badge.svg)](https://github.com/dylanhogg/llmvsllm/actions/workflows/python-poetry-app.yml)

LLM vs. LLM: Simulates a rap battle or debate between two Large Language Models (LLMs)

Currently a WIP.
59 changes: 59 additions & 0 deletions llmvsllm/arena/bot_base.py
@@ -0,0 +1,59 @@
from abc import ABC, abstractmethod

from joblib import Memory

memory = Memory(".joblib_cache", verbose=0)


class BotBase(ABC):
def __init__(
self,
name: str,
system: str,
opener: str,
first_bot: bool = False,
voice: str = "onyx",
debug: bool = False,
attr_name: str = "",
):
self.name = name
self.system = system
self.opener = opener
self.first_bot = first_bot
self.attr_name = attr_name
self.voice = voice
self.debug = debug

self.conversation = []
self.total_prompt_tokens = 0
self.total_completion_tokens = 0

@abstractmethod
    def respond_to(self, user_input: str) -> tuple[int, list, str, int, int]:
pass

@abstractmethod
def cost_estimate_cents(self):
pass

def is_human(self):
return False

def get_opener(self):
return self.opener

    def pair_with(self, other: "BotBase") -> None:
def talking_with_statement(name):
return "You are talking with " + name.replace("_", " ") + " (only address them by name once, not more)\n"

self.system = talking_with_statement(other.name) + self.system
other.system = talking_with_statement(self.name) + other.system
self.first_bot = True
other.first_bot = False

@property
def display_name(self):
return self.name.lower().replace(" ", "_").replace("(", "").replace(")", "")[0:15]

def __repr__(self) -> str:
return f"{type(self).__name__} {self.attr_name} '{self.name}' {self.model}@{self.temperature}{' (1st)' if self.first_bot else ' (2nd)'}"
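As an orientation to the interface above, here is a minimal illustrative subclass. It is not part of this commit; the EchoBot class and its canned behaviour are invented for demonstration only.

# Illustrative sketch only (not part of this commit): a minimal BotBase subclass.
from llmvsllm.arena.bot_base import BotBase


class EchoBot(BotBase):  # hypothetical example class
    def __init__(self, name: str, opener: str = "Hello there."):
        super().__init__(name=name, system="You echo the other speaker.", opener=opener)
        self.model = "n/a"        # __repr__ above expects model and temperature to exist
        self.temperature = 0.0

    def respond_to(self, user_input: str) -> tuple[int, list, str, int, int]:
        response = f"You said: {user_input}"
        self.conversation.append({"role": "assistant", "content": response})
        # (turn index, conversation so far, response text, prompt tokens, completion tokens)
        return len(self.conversation), self.conversation, response, 0, 0

    def cost_estimate_cents(self):
        return 0


# pair_with() prepends a "You are talking with ..." line to each system prompt
# and marks the calling bot as the opening bot:
bot_a, bot_b = EchoBot("Alice"), EchoBot("Bob")
bot_a.pair_with(bot_b)
print(bot_a, bot_b)  # bot_a is tagged (1st), bot_b (2nd)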
55 changes: 55 additions & 0 deletions llmvsllm/arena/bot_pair.py
@@ -0,0 +1,55 @@
import copy
import inspect

from llmvsllm.arena.bot_base import BotBase
from llmvsllm.bots.generic_llm_bots import GenericLLMBots
from llmvsllm.bots.system_bots import SystemBots
from llmvsllm.library.classes import AppUsageException


class AllBots(
GenericLLMBots,
SystemBots,
):
pass


class BotPair:
def get_all_bot_names(self) -> list[str]:
result = [
m[0] for m in inspect.getmembers(AllBots()) if not m[0].startswith("_") and not inspect.ismethod(m[1])
]
return sorted(result)

def get_bot(self, bot_name) -> BotBase:
try:
found_bot = getattr(AllBots(), bot_name)
found_bot.attr_name = bot_name
return copy.deepcopy(found_bot)
except AttributeError as e:
# print(f"Bot name {bot_name} not found. Try one of: {self.get_all_bot_names()}")
raise AppUsageException(f"Bot name {bot_name} not found. Try one of: {self.get_all_bot_names()}") from e

def __init__(
self, bot1_name: str, bot2_name: str, model1: str, model2: str, temperature1: float, temperature2: float
):
assert bot1_name, "bot1_name required"
assert bot2_name, "bot2_name required"
assert model1, "model1 required"
assert model2, "model2 required"

# Initialization
self.bot1 = self.get_bot(bot1_name)
self.bot1.model = model1
if self.bot1.temperature is None:
self.bot1.temperature = temperature1
assert isinstance(self.bot1.system, str), f"system must be a string, not {type(self.bot1.system)=}"

self.bot2 = self.get_bot(bot2_name)
self.bot2.model = model2
if self.bot2.temperature is None:
self.bot2.temperature = temperature2
        assert isinstance(self.bot2.system, str), f"system must be a string, not {type(self.bot2.system)=}"

# Pair bots
self.bot1.pair_with(self.bot2)
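A brief illustrative construction of a BotPair follows; it is not part of this commit. The bot names come from the Makefile above, while the model ids and temperatures are placeholder assumptions.

# Illustrative usage only (not part of this commit).
from llmvsllm.arena.bot_pair import BotPair

bots = BotPair(
    bot1_name="chatgpt_llm_evangelist",   # bot names as used in the Makefile run target
    bot2_name="bard_llm_evangelist",
    model1="gpt-3.5-turbo",               # assumed model id, not specified in this commit
    model2="gpt-3.5-turbo",               # assumed model id, not specified in this commit
    temperature1=0.7,
    temperature2=0.7,
)
print(bots.bot1)  # first (opening) bot, shown with "(1st)" in its repr
print(bots.bot2)  # second bot, shown with "(2nd)"

BotPair.get_all_bot_names() lists every available bot attribute, which is also what the AppUsageException message reports when a requested bot name is not found.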
158 changes: 158 additions & 0 deletions llmvsllm/arena/conversation.py
@@ -0,0 +1,158 @@
import hashlib
import os
from datetime import datetime
from pathlib import Path

from loguru import logger
from rich import print

from llmvsllm.arena.bot_pair import AllBots, BotPair
from llmvsllm.library.sound import Sound


class Conversation:
def __init__(
self,
bot1: str,
bot2: str,
model1: str,
model2: str,
temperature1: float = 0.7,
temperature2: float = 0.7,
speak: bool = False,
debug: bool = False,
):
self.bot1 = bot1
self.bot2 = bot2
self.model1 = model1
self.model2 = model2
self.temperature1 = temperature1
self.temperature2 = temperature2
self.speak = speak
self.debug = debug

def _pprint(self, text: str):
print(text)
logger.info(text)

def _initialise_bots(self):
return BotPair(self.bot1, self.bot2, self.model1, self.model2, self.temperature1, self.temperature2)

def _parse_pause_input(self, bots: BotPair):
if not bots.bot1.is_human() and not bots.bot2.is_human():
while True:
pause_input = input("...") # Pause if both bots are non-human
# Parse pause input
if pause_input == "%human1":
print("Switching bot1 to human...")
human_bot = AllBots().human
human_bot.system = bots.bot1.system
human_bot.conversation = bots.bot1.conversation
human_bot.first_bot = bots.bot1.first_bot
bots.bot1 = human_bot
break
elif pause_input == "%human2":
print("Switching bot2 to human...")
human_bot = AllBots().human
human_bot.system = bots.bot2.system
human_bot.conversation = bots.bot2.conversation
human_bot.first_bot = bots.bot2.first_bot
bots.bot2 = human_bot
break
elif pause_input == "%system1":
self._pprint(f"Bot 1 system:\n{bots.bot1.augmented_conversation_system()}")
                elif pause_input == "%system2":
self._pprint(f"Bot 2 system:\n{bots.bot2.augmented_conversation_system()}")
else:
break

def _get_conversation_details(self, bots) -> tuple[Path, str, str]:
transcript_header = f"{bots.bot1.attr_name} '{bots.bot1.name}' {bots.bot1.model}@{bots.bot1.temperature} <-> {bots.bot2.attr_name} '{bots.bot2.name}' {bots.bot2.model}@{bots.bot2.temperature}"
hash = hashlib.md5(transcript_header.encode("utf-8")).hexdigest()[0:7]
folder = Path("./conversation_transcripts/")
folder.mkdir(parents=True, exist_ok=True)
filename = (
folder
/ f"{bots.bot1.attr_name}#{bots.bot1.model}@{bots.bot1.temperature}___{bots.bot2.attr_name}#{bots.bot2.model}@{bots.bot2.temperature}_{hash}_{datetime.today().strftime('%Y%m%d.%H%M%S')}.txt"
)
return filename, hash, transcript_header

def start(self):
if self.model1.startswith("gpt-4") or self.model2.startswith("gpt-4"):
self._pprint("[red]WARNING: GPT-4 model activated, watch your costs.[/red]")

api_key = os.environ.get("OPENAI_API_KEY", None)
assert api_key, "OPENAI_API_KEY environment variable must be set"

bots = self._initialise_bots()
self._pprint("Conversation set up:")
self._pprint(f"Bot1: {bots.bot1} <-> Bot2: {bots.bot2}")
self._pprint(f"{self.speak=}, {self.debug=}")
self._pprint(f"{bots.bot1=}\n{bots.bot2=}")
print()

total_prompt_tokens = 0
total_completion_tokens = 0
total_chars = 0
total_mp3_cents = 0

# Bot1 opener
response1 = bots.bot1.get_opener()
self._pprint("Conversation:\n[white]1.[/white]")
self._pprint(f"[u][white]{bots.bot1.display_name} (opener):[/white][/u] [cyan2]{response1}[/cyan2]")
if self.speak and not bots.bot1.is_human():
mp3_file, total_mp3_cents, mp3_from_cache = Sound.to_mp3(response1, bots.bot1.voice, bots.bot1.name)
Sound.play_mp3(mp3_file)

# Start conversation
mp3_from_cache1, mp3_from_cache2 = False, False
filename, hash, transcript_header = self._get_conversation_details(bots)
with open(filename, "w") as f:
f.write(f"Conversation {datetime.today().strftime('%Y-%m-%d %H:%M:%S')} @{hash}\n")
f.write(f"{transcript_header}\n")
while True:
# Bot 2 responds to Bot 1 opener
i, conversation2, response2, prompt_tokens2, completion_tokens2 = bots.bot2.respond_to(response1)
self._pprint(f"[u][white]{bots.bot2.display_name}:[/white][/u] [magenta1]{response2}[/magenta1]")
f.write(f"\n{'-'*80}\n{bots.bot2.display_name}: {response2}\n")
f.flush()
if self.speak and not bots.bot2.is_human():
mp3_file2, estimated_cost_cents2, mp3_from_cache2 = Sound.to_mp3(
response2, bots.bot2.voice, bots.bot2.name
)
Sound.play_mp3(mp3_file2)
total_mp3_cents += estimated_cost_cents2
total_prompt_tokens += prompt_tokens2
total_completion_tokens += completion_tokens2
total_chars += len(response2)

# Debug info
total_bot_cents = bots.bot1.cost_estimate_cents() + bots.bot2.cost_estimate_cents()
total_cents = total_mp3_cents + total_bot_cents
self._pprint(
f"[bright_black]({total_prompt_tokens=}, {total_completion_tokens=}, {total_chars=}, "
f"{total_mp3_cents=:.1f}, {total_bot_cents=:.2f}, {total_cents=:.2f}) "
f"{'*' if mp3_from_cache2 else ''}{'^' if mp3_from_cache1 else ''}[/bright_black]"
)

# Pause if both bots are non-human
self._parse_pause_input(bots)

print()
self._pprint(f"[white]{i+1}.[/white]")

# Bot 1 responds to Bot 2
i, conversation1, response1, prompt_tokens1, completion_tokens1 = bots.bot1.respond_to(response2)
self._pprint(f"[u][white]{bots.bot1.display_name}:[/white][/u] [cyan2]{response1}[/cyan2]")

f.write(f"\n{'-'*80}\n{bots.bot1.display_name}: {response1}\n")
f.flush()
if self.speak and not bots.bot1.is_human():
mp3_file1, estimated_cost_cents1, mp3_from_cache1 = Sound.to_mp3(
response1, bots.bot1.voice, bots.bot1.name
)
Sound.play_mp3(mp3_file1)
total_mp3_cents += estimated_cost_cents1
total_prompt_tokens += prompt_tokens1
total_completion_tokens += completion_tokens1
total_chars += len(response1)
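For context, here is an illustrative way to drive the loop above; it is not part of this commit, and the bot and model names mirror the earlier examples and are assumptions.

# Illustrative usage only (not part of this commit).
# start() asserts that OPENAI_API_KEY is set in the environment before running.
from llmvsllm.arena.conversation import Conversation

Conversation(
    bot1="chatgpt_llm_evangelist",
    bot2="bard_llm_evangelist",
    model1="gpt-3.5-turbo",   # assumed model id
    model2="gpt-3.5-turbo",   # assumed model id
    temperature1=0.7,
    temperature2=0.7,
    speak=False,              # True would synthesise and play an MP3 for each non-human turn
    debug=False,
).start()

Note that start() loops indefinitely, writing each exchange to a transcript file under conversation_transcripts/ and pausing for keyboard input between rounds; at that pause, the %human1, %human2, %system1 and %system2 commands swap a bot for a human or print a bot's system prompt.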
37 changes: 37 additions & 0 deletions llmvsllm/arena/fixed_response_bot.py
@@ -0,0 +1,37 @@
from llmvsllm.arena.bot_base import BotBase


class FixedResponseBot(BotBase):
def __init__(
self,
name: str,
system: str,
opener: str,
response_list: list,
first_bot: bool = False,
voice: str = "onyx",
debug: bool = False,
):
super().__init__(name, system, opener, first_bot, voice, debug)

self.i = 0
self.system = ""
self.temperature = ""
self.model = ""
self.conversation = ["Not applicable, this bot has a fixed response list."]
self.response_list = response_list

    def respond_to(self, user_input: str) -> tuple[int, list, str, int, int]:
if self.first_bot and self.i == 0:
            # Include the opener at the start of the conversation (applies only to the first, initiating bot)
assert (
self.opener
), f"first_bot was True but no opener provided for bot {self.name}. {self.i=}, {self.first_bot=}, {self.opener=}"
self.conversation.append({"role": "assistant", "content": self.opener})

response = self.response_list[self.i % len(self.response_list)]
self.i += 1
return self.i, self.conversation, response, 0, 0

def cost_estimate_cents(self):
return 0
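Finally, an illustrative use of the fixed-response bot, not part of this commit; the name, opener and responses are invented for demonstration.

# Illustrative usage only (not part of this commit).
from llmvsllm.arena.fixed_response_bot import FixedResponseBot

bot = FixedResponseBot(
    name="Scripted Bot",
    system="",                 # the constructor resets system to "" regardless
    opener="Let's begin.",
    response_list=["First canned reply.", "Second canned reply."],
    first_bot=True,
)
_, _, response, _, _ = bot.respond_to("Hi there")
print(response)  # "First canned reply."; later calls cycle through response_list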