From 5a1bd48d94b97480bf654ff4156fea10f275626e Mon Sep 17 00:00:00 2001 From: Rene Teigen Date: Sun, 5 Feb 2023 11:36:23 +0000 Subject: [PATCH] Fix regression in full discord server indexing Add back response mode, only on vector index queries Added the llmpredictor to queries Fix docker build Update requirements --- Dockerfile | 6 +++--- cogs/commands.py | 20 +++++++++++++------- cogs/index_service_cog.py | 22 ++++++++++++++++++++-- models/autocomplete_model.py | 24 +++++++++++++++++++++--- models/index_model.py | 31 +++++++++++++++++-------------- requirements.txt | 2 +- 6 files changed, 75 insertions(+), 30 deletions(-) diff --git a/Dockerfile b/Dockerfile index 3260cf2..5e7b98a 100644 --- a/Dockerfile +++ b/Dockerfile @@ -9,9 +9,9 @@ COPY . . RUN mkdir /install /src WORKDIR /install RUN pip install --target="/install" --upgrade pip setuptools wheel -RUN pip install setuptools_rust -RUN pip install torch==1.9.1+cpu torchvision==0.10.1+cpu -f https://download.pytorch.org/whl/torch_stable.html -RUN pip install git+https://github.com/openai/whisper.git +RUN pip install --target="/install" --upgrade setuptools_rust +RUN pip install --target="/install" --upgrade torch==1.9.1+cpu torchvision==0.10.1+cpu -f https://download.pytorch.org/whl/torch_stable.html +RUN pip install --target="/install" --upgrade git+https://github.com/openai/whisper.git COPY requirements.txt /install RUN pip install --target="/install" -r requirements.txt COPY README.md /src diff --git a/cogs/commands.py b/cogs/commands.py index 2fc30ca..63acc24 100644 --- a/cogs/commands.py +++ b/cogs/commands.py @@ -532,13 +532,19 @@ class Commands(discord.Cog, name="Commands"): ) @discord.guild_only() @discord.option( - name="index", - description="Which file to load the index from", - required=True, - autocomplete=File_autocompleter.get_indexes, + name="user_index", + description="Which user file to load the index from", + required=False, + autocomplete=File_autocompleter.get_user_indexes, + ) + 
@discord.option( + name="server_index", + description="Which server file to load the index from", + required=False, + autocomplete=File_autocompleter.get_server_indexes, ) - async def load_index(self, ctx: discord.ApplicationContext, index: str): - await self.index_cog.load_index_command(ctx, index) + async def load_index(self, ctx: discord.ApplicationContext, user_index: str, server_index: str): + await self.index_cog.load_index_command(ctx, user_index, server_index) @add_to_group("index") @discord.slash_command( @@ -624,7 +630,7 @@ class Commands(discord.Cog, name="Commands"): @discord.option(name="query", description="What to query the index", required=True) @discord.option( name="response_mode", - description="Response mode", + description="Response mode, doesn't work on deep composed indexes", guild_ids=ALLOWED_GUILDS, required=False, default="default", diff --git a/cogs/index_service_cog.py b/cogs/index_service_cog.py index 14fee92..ef0b4a2 100644 --- a/cogs/index_service_cog.py +++ b/cogs/index_service_cog.py @@ -95,8 +95,26 @@ class IndexService(discord.Cog, name="IndexService"): await ctx.defer(ephemeral=True) await self.index_handler.backup_discord(ctx, user_api_key=user_api_key) - async def load_index_command(self, ctx, index): + async def load_index_command(self, ctx, user_index, server_index): """Command handler to backup the entire server""" + + if not user_index and not server_index: + await ctx.respond("Please provide a user or server index") + return + + if user_index and server_index: + await ctx.respond( + "Please provide only one user index or server index. Only one or the other." 
+ ) + return + + if server_index: + index = server_index + server = True + else: + index = user_index + server = False + user_api_key = None if USER_INPUT_API_KEYS: user_api_key = await TextService.get_user_api_key( @@ -106,7 +124,7 @@ class IndexService(discord.Cog, name="IndexService"): return await ctx.defer(ephemeral=True) - await self.index_handler.load_index(ctx, index, user_api_key) + await self.index_handler.load_index(ctx, index, server, user_api_key) async def query_command(self, ctx, query, response_mode): """Command handler to query your index""" diff --git a/models/autocomplete_model.py b/models/autocomplete_model.py index bde41ef..7a38481 100644 --- a/models/autocomplete_model.py +++ b/models/autocomplete_model.py @@ -150,8 +150,8 @@ class File_autocompleter: except Exception: return ["No 'openers' folder"] - async def get_indexes(ctx: discord.AutocompleteContext): - """get all files in the openers folder""" + async def get_user_indexes(ctx: discord.AutocompleteContext): + """get all files in the indexes folder""" try: return [ file @@ -165,4 +165,22 @@ class File_autocompleter: :25 ] # returns the 25 first files from your current input except Exception: - return ["No 'indexes' folder"] + return ["No user indexes found, add an index"] + + + async def get_server_indexes(ctx: discord.AutocompleteContext): + """get all files in the indexes folder""" + try: + return [ + file + for file in os.listdir( + EnvService.find_shared_file( + f"indexes/{str(ctx.interaction.guild.id)}/" + ) + ) + if file.startswith(ctx.value.lower()) + ][ + :25 + ] # returns the 25 first files from your current input + except Exception: + return ["No server indexes found, add an index"] diff --git a/models/index_model.py b/models/index_model.py index 786e66d..21737d3 100644 --- a/models/index_model.py +++ b/models/index_model.py @@ -8,7 +8,8 @@ import aiofiles from functools import partial from typing import List, Optional from pathlib import Path -from datetime import date, 
datetime +from datetime import date +from langchain import OpenAI from gpt_index.readers import YoutubeTranscriptReader from gpt_index.readers.schema.base import Document @@ -17,12 +18,12 @@ from gpt_index import ( SimpleDirectoryReader, QuestionAnswerPrompt, BeautifulSoupWebReader, - GPTFaissIndex, GPTListIndex, QueryMode, GPTTreeIndex, GoogleDocsReader, MockLLMPredictor, + LLMPredictor, QueryConfig, IndexStructType, ) @@ -35,15 +36,14 @@ from services.environment_service import EnvService, app_root_path SHORT_TO_LONG_CACHE = {} -def get_and_query(user_id, index_storage, query, llm_predictor): - # TODO Do prediction here for token usage +def get_and_query(user_id, index_storage, query, response_mode, llm_predictor): index: [GPTSimpleVectorIndex, ComposableGraph] = index_storage[ user_id ].get_index_or_throw() if isinstance(index, GPTTreeIndex): - response = index.query(query, verbose=True, child_branch_factor=2) + response = index.query(query, verbose=True, child_branch_factor=2, llm_predictor=llm_predictor) else: - response = index.query(query, verbose=True) + response = index.query(query, response_mode=response_mode, verbose=True, llm_predictor=llm_predictor) return response @@ -66,7 +66,7 @@ class IndexData: def has_indexes(self, user_id): try: return len(os.listdir(f"{app_root_path()}/indexes/{user_id}")) > 0 - except: + except Exception: return False def add_index(self, index, user_id, file_name): @@ -93,9 +93,8 @@ class IndexData: for file in os.listdir(f"{app_root_path()}/indexes/{user_id}"): os.remove(f"{app_root_path()}/indexes/{user_id}/{file}") - except: + except Exception: traceback.print_exc() - pass class Index_handler: @@ -271,14 +270,17 @@ class Index_handler: await ctx.respond("Failed to set index") traceback.print_exc() - async def load_index(self, ctx: discord.ApplicationContext, index, user_api_key): + async def load_index(self, ctx: discord.ApplicationContext, index, server, user_api_key): if not user_api_key: os.environ["OPENAI_API_KEY"] = 
self.openai_key else: os.environ["OPENAI_API_KEY"] = user_api_key try: - index_file = EnvService.find_shared_file(f"indexes/{ctx.user.id}/{index}") + if server: + index_file = EnvService.find_shared_file(f"indexes/{ctx.guild.id}/{index}") + else: + index_file = EnvService.find_shared_file(f"indexes/{ctx.user.id}/{index}") index = await self.loop.run_in_executor( None, partial(self.index_load_file, index_file) ) @@ -353,10 +355,11 @@ class Index_handler: index = await self.loop.run_in_executor( None, partial(self.index_discord, document) ) - Path(app_root_path() / "indexes").mkdir(parents=True, exist_ok=True) + Path(app_root_path() / "indexes" / str(ctx.guild.id)).mkdir(parents=True, exist_ok=True) index.save_to_disk( app_root_path() / "indexes" + / str(ctx.guild.id) / f"{ctx.guild.name.replace(' ', '-')}_{date.today().month}_{date.today().day}.json" ) @@ -374,11 +377,11 @@ class Index_handler: os.environ["OPENAI_API_KEY"] = user_api_key try: - llm_predictor = MockLLMPredictor(max_tokens=256) + llm_predictor = LLMPredictor(llm=OpenAI(model_name="text-davinci-003")) response = await self.loop.run_in_executor( None, partial( - get_and_query, ctx.user.id, self.index_storage, query, llm_predictor + get_and_query, ctx.user.id, self.index_storage, query, response_mode, llm_predictor ), ) print("The last token usage was ", llm_predictor.last_token_usage) diff --git a/requirements.txt b/requirements.txt index d0ac6f3..7acee75 100644 --- a/requirements.txt +++ b/requirements.txt @@ -10,7 +10,7 @@ sqlitedict==2.1.0 backoff==2.2.1 flask==2.2.2 beautifulsoup4==4.11.1 -gpt-index==0.3.4 +gpt-index==0.3.5 PyPDF2==3.0.1 youtube_transcript_api==0.5.0 sentencepiece==0.1.97