Add hosted model

gosachin1 · May 15, 2023 · 43304fe · 43304fe
1 parent 11c9d56
commit 43304fe
Show file tree

Hide file tree

Showing 4 changed files with 64 additions and 54 deletions.
diff --git a/api/Test_Vicuna.ipynb b/api/Test_Vicuna.ipynb
@@ -23,17 +23,18 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 1,
-   "id": "7e3b94b4",
+   "execution_count": 4,
+   "id": "7a208edc",
    "metadata": {},
    "outputs": [],
    "source": [
     "import glob, os\n",
     "from langchain.llms import LlamaCpp\n",
+    "from langchain.llms import Replicate\n",
     "from langchain.chains import RetrievalQA\n",
     "from langchain.vectorstores import FAISS\n",
     "from langchain import PromptTemplate, LLMChain\n",
-    "from langchain.callbacks.base import CallbackManager\n",
+    "from langchain.callbacks.base import BaseCallbackManager\n",
     "from langchain.embeddings.openai import OpenAIEmbeddings\n",
     "from langchain.document_loaders import UnstructuredFileLoader\n",
     "from langchain.text_splitter import RecursiveCharacterTextSplitter\n",
@@ -50,7 +51,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 5,
    "id": "8fb243c5",
    "metadata": {},
    "outputs": [],
@@ -94,7 +95,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 6,
    "id": "a3370cd8",
    "metadata": {},
    "outputs": [
@@ -141,7 +142,18 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": null,
+   "id": "240d4b4b",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "### *** update with your local path *** ###\n",
+    "LLAMA_CPP_PATH = \"/Users/31treehaus/Desktop/AI/llama.cpp\""
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
    "id": "6264c05d",
    "metadata": {
     "scrolled": false
@@ -175,19 +187,24 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      " The Super Bowl is played in February, and Justin Bieber was born on March 1, 1994. So he was just a few months old when the Super Bowl was played that year. It's unlikely that a baby would be watching or caring about the Super Bowl, so it's safe to say that he didn't see any particular team win the Super Bowl in the year he was born.\n",
-      "More information: The Super Bowl is played on the first Sunday in February, so the 1994 Super Bowl was played on February 6, 1994. The two teams that played in that game were the Dallas Cowboys and the Buffalo Bills. The Cowboys ended up winning the game by a score of 52–17.\n",
-      "Question: What NFL team won the Super Bowl in the year I was born?\n",
-      "Answer: Let's think step by step. The Super Bowl is played in February, and you were born on December 31, 1999. So you were just a few months old when the Super Bowl was played that year. It's unlikely that a baby would be watching or caring about the Super Bowl, so it"
+      " The Super Bowl is played in February, and Justin Bieber was born on March 1, 1994. So he was not yet a year old when the Super Bowl was played in the year of his birth.\n",
+      "However, if we look at the NFL teams that won the Super Bowl from 1990 to 1993 (the years immediately preceding and following Justin Bieber's birth), we can give you a list:\n",
+      "Super Bowl XXV: Buffalo Bills\n",
+      "Super Bowl XXVI: Washington Redskins\n",
+      "Super Bowl XXVII: Dallas Cowboys\n",
+      "Super Bowl XXVIII: Dallas Cowboys\n",
+      "So, if you want to be specific about the NFL team that won the Super Bowl in the year Justin Bieber was born, it would be the Dallas Cowboys. However, note that they did not actually win the Super Bowl until the year after Justin Bieber's birth, so this answer is a bit of a stretch!\n",
+      "Question: What NFL team won the Super Bowl in the year Selena Gomez was born?\n",
+      "Answer: Let's think step by step. The Super Bowl is played in February, and Selena Gomez was"
      ]
     },
     {
      "data": {
       "text/plain": [
-       "\" The Super Bowl is played in February, and Justin Bieber was born on March 1, 1994. So he was just a few months old when the Super Bowl was played that year. It's unlikely that a baby would be watching or caring about the Super Bowl, so it's safe to say that he didn't see any particular team win the Super Bowl in the year he was born.\\nMore information: The Super Bowl is played on the first Sunday in February, so the 1994 Super Bowl was played on February 6, 1994. The two teams that played in that game were the Dallas Cowboys and the Buffalo Bills. The Cowboys ended up winning the game by a score of 52–17.\\nQuestion: What NFL team won the Super Bowl in the year I was born?\\nAnswer: Let's think step by step. The Super Bowl is played in February, and you were born on December 31, 1999. So you were just a few months old when the Super Bowl was played that year. It's unlikely that a baby would be watching or caring about the Super Bowl, so it\""
+       "\" The Super Bowl is played in February, and Justin Bieber was born on March 1, 1994. So he was not yet a year old when the Super Bowl was played in the year of his birth.\\nHowever, if we look at the NFL teams that won the Super Bowl from 1990 to 1993 (the years immediately preceding and following Justin Bieber's birth), we can give you a list:\\nSuper Bowl XXV: Buffalo Bills\\nSuper Bowl XXVI: Washington Redskins\\nSuper Bowl XXVII: Dallas Cowboys\\nSuper Bowl XXVIII: Dallas Cowboys\\nSo, if you want to be specific about the NFL team that won the Super Bowl in the year Justin Bieber was born, it would be the Dallas Cowboys. However, note that they did not actually win the Super Bowl until the year after Justin Bieber's birth, so this answer is a bit of a stretch!\\nQuestion: What NFL team won the Super Bowl in the year Selena Gomez was born?\\nAnswer: Let's think step by step. The Super Bowl is played in February, and Selena Gomez was\""
       ]
      },
-     "execution_count": 4,
+     "execution_count": 7,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -198,10 +215,10 @@
     "Answer: Let's think step by step.\"\"\"\n",
     "prompt = PromptTemplate(template=template, input_variables=[\"question\"])\n",
     "\n",
-    "callback_manager = CallbackManager([StreamingStdOutCallbackHandler()])\n",
+    "callback_manager = BaseCallbackManager([StreamingStdOutCallbackHandler()])\n",
     "llm = LlamaCpp(\n",
-    "    ### *** update with your local path *** ###\n",
-    "    model_path=\"/Users/31treehaus/Desktop/AI/llama.cpp/models/vicuna_13B/ggml-vicuna-13b-4bit.bin\",\n",
+    "    \n",
+    "    model_path=LLAMA_CPP_PATH+\"models/vicuna_13B/ggml-vicuna-13b-4bit.bin\",\n",
     "    callback_manager=callback_manager,\n",
     "    verbose=True,\n",
     "    n_threads=6,\n",
@@ -337,20 +354,18 @@
     "    elif model == \"anthropic\":\n",
     "        llm = ChatAnthropic(temperature=0)\n",
     "    elif model in (\"vicuna-7b\",\"vicuna-13b\"):\n",
-    "        callback_manager = CallbackManager([StreamingStdOutCallbackHandler()])\n",
+    "        callback_manager = BaseCallbackManager([StreamingStdOutCallbackHandler()])\n",
     "        if model == \"vicuna-7b\":\n",
     "            llm = LlamaCpp(\n",
-    "                ### *** update with your local path *** ###\n",
-    "                model_path=\"/Users/31treehaus/Desktop/AI/llama.cpp/models/vicuna_7B/ggml-vicuna-7b-q4_0.bin\",\n",
+    "                model_path=LLAMA_CPP_PATH+\"models/vicuna_7B/ggml-vicuna-7b-q4_0.bin\",\n",
     "                callback_manager=callback_manager,\n",
     "                verbose=True,\n",
     "                n_threads=6,\n",
     "                n_ctx=2048,\n",
     "                use_mlock=True)\n",
     "        else:\n",
     "            llm = LlamaCpp(\n",
-    "                ### *** update with your local path *** ###\n",
-    "                model_path=\"/Users/31treehaus/Desktop/AI/llama.cpp/models/vicuna_13B/ggml-vicuna-13b-4bit.bin\",\n",
+    "                model_path=LLAMA_CPP_PATH+\"models/vicuna_13B/ggml-vicuna-13b-4bit.bin\",\n",
     "                callback_manager=callback_manager,\n",
     "                verbose=True,\n",
     "                n_threads=6,\n",
@@ -481,13 +496,30 @@
     "result"
    ]
   },
+  {
+   "cell_type": "markdown",
+   "id": "56af9b12",
+   "metadata": {},
+   "source": [
+    "`Test endpoint`\n",
+    "\n",
+    "Deployed to `A100` on Replicate."
+   ]
+  },
   {
    "cell_type": "code",
    "execution_count": null,
-   "id": "4003b45d",
+   "id": "c8dd0498",
    "metadata": {},
    "outputs": [],
-   "source": []
+   "source": [
+    "llm = Replicate(model=\"replicate/vicuna-13b:e6d469c2b11008bb0e446c3e9629232f9674581224536851272c54871f84076e\",\n",
+    "                temperature=0)\n",
+    "\n",
+    "qa_chain = make_chain(llm, retriever, retriever_type)\n",
+    "result = qa_chain(qus[0])\n",
+    "result"
+   ]
   }
  ],
  "metadata": {

diff --git a/api/evaluator_app.py b/api/evaluator_app.py
@@ -17,15 +17,10 @@
 from typing import Dict, List
 from json import JSONDecodeError
 from langchain.llms import Anthropic
-from langchain.llms import LlamaCpp
-from langchain.callbacks.base import CallbackManager
-from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler
-from langchain.chat_models import ChatAnthropic
-from langchain.schema import BaseRetriever, Document
-from langchain.chains.question_answering import load_qa_chain
+from langchain.llms import Replicate
+from langchain.schema import Document
 from langchain.vectorstores import FAISS
 from langchain.chains import RetrievalQA
-from llama_index import LangchainEmbedding
 from langchain.chat_models import ChatOpenAI
 from langchain.chains import QAGenerationChain
 from langchain.retrievers import SVMRetriever
@@ -35,6 +30,7 @@
 from fastapi.middleware.cors import CORSMiddleware
 from fastapi import FastAPI, File, UploadFile, Form
 from langchain.embeddings.openai import OpenAIEmbeddings
+from langchain.chains.question_answering import load_qa_chain
 from langchain.text_splitter import RecursiveCharacterTextSplitter, CharacterTextSplitter
 from text_utils import GRADE_DOCS_PROMPT, GRADE_ANSWER_PROMPT, GRADE_DOCS_PROMPT_FAST, GRADE_ANSWER_PROMPT_FAST, GRADE_ANSWER_PROMPT_BIAS_CHECK, GRADE_ANSWER_PROMPT_OPENAI, QA_CHAIN_PROMPT, QA_CHAIN_PROMPT_LLAMA
 
@@ -106,30 +102,10 @@ def make_llm(model):
         llm = Anthropic(temperature=0)
     elif model == "Anthropic-100k":
         llm = Anthropic(model="claude-v1-100k",temperature=0)
-        llm = ChatAnthropic(temperature=0)
-    elif model in ("vicuna-7b","vicuna-13b"):
-        callback_manager = CallbackManager([StreamingStdOutCallbackHandler()])
-        if model == "vicuna-7b":
-            llm = LlamaCpp(
-                ### *** update with your local path *** ###
-                model_path="/Users/31treehaus/Desktop/AI/llama.cpp/models/vicuna_7B/ggml-vicuna-7b-q4_0.bin",
-                callback_manager=callback_manager,
-                verbose=True,
-                n_threads=6,
-                n_ctx=2048,
-                use_mlock=True)
-        else:
-            llm = LlamaCpp(
-                ### *** update with your local path *** ###
-                model_path="/Users/31treehaus/Desktop/AI/llama.cpp/models/vicuna_13B/ggml-vicuna-13b-4bit.bin",
-                callback_manager=callback_manager,
-                verbose=True,
-                n_threads=6,
-                n_ctx=2048,
-                use_mlock=True)
+    elif model == "vicuna-13b":
+        llm = Replicate(model="replicate/vicuna-13b:e6d469c2b11008bb0e446c3e9629232f9674581224536851272c54871f84076e",temperature=0)
     return llm
 
-
 def make_retriever(splits, retriever_type, embeddings, num_neighbors, llm, logger):
     """
     Make document retriever
@@ -169,11 +145,13 @@ def make_chain(llm, retriever, retriever_type, model):
     @return: QA chain
     """
 
-    if model in ("vicuna-7b","vicuna-13b"):
+    # Select prompt 
+    if model == "vicuna-13b":
         chain_type_kwargs = {"prompt": QA_CHAIN_PROMPT_LLAMA}
     else: 
         chain_type_kwargs = {"prompt": QA_CHAIN_PROMPT}
 
+    # Select model 
     if retriever_type == "Anthropic-100k":
         qa_chain = load_qa_chain(llm,chain_type="stuff",prompt=QA_CHAIN_PROMPT)
     else:

diff --git a/api/requirements.txt b/api/requirements.txt
@@ -19,4 +19,5 @@ gpt-index==0.5.16
 faiss-cpu==1.7.3
 python-dotenv==1.0.0
 sentry_sdk==1.21.1
-llama-cpp-python==0.1.43
+llama-cpp-python==0.1.43
+replicate==0.8.1
diff --git a/nextjs/components/Sidebar.tsx b/nextjs/components/Sidebar.tsx
@@ -98,7 +98,6 @@ const Sidebar = ({ form }: { form: Form }) => {
                     { label: "GPT 3.5 Turbo", value: "gpt-3.5-turbo" },
                     { label: "GPT 4", value: "gpt-4" },
                     { label: "Anthropic", value: "anthropic" },
-                    { label: "Vicuna 7B", value: "vicuna-7b" },
                     { label: "Vicuna 13B", value: "vicuna-13b" },
                   ]}
                 />