Spaces:

calmgoose
/

Talk2Book

Running

calmgoose committed on Mar 17, 2023

Commit

e48d6fc

1 Parent(s): 3d3bae7

Use the Hugging Face Inference API instead of loading the pipeline, since that wasn't working

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,7 +9,7 @@ from langchain.chains import VectorDBQA
 from huggingface_hub import snapshot_download
 from langchain import OpenAI
 from langchain import PromptTemplate
-from langchain.llms import HuggingFacePipeline
 BOOK_NAME = "1984"
@@ -84,11 +84,16 @@ def load_chain(model: Literal["openai", "GPT-NeoXT-Chat-Base-20B"] ="openai"):
         llm = OpenAI(temperature=0.2)
     if model=="GPT-NeoXT-Chat-Base-20B":
-        llm = HuggingFacePipeline.from_model_id(
-            model_id="togethercomputer/GPT-NeoXT-Chat-Base-20B",
             task="text-generation",
             model_kwargs={"temperature":0.2, "max_length":400}
-        )
     # load chain
     chain = VectorDBQA.from_chain_type(
@@ -153,6 +158,14 @@ with st.sidebar:
                                )
         os.environ["OPENAI_API_KEY"] = api_key
     st.markdown("---")
     st.info("Based on [Talk2Book](https://github.com/batmanscode/Talk2Book)")
@@ -174,7 +187,7 @@ ask = col2.button("Ask")
 if ask:
-    if choice=="OpenAI" and api_key is "":
         st.write(f"**{BOOK_NAME}:** Whoops looks like you forgot your API key buddy")
         st.stop()
     else:

 from huggingface_hub import snapshot_download
 from langchain import OpenAI
 from langchain import PromptTemplate
+from langchain.llms import HuggingFacePipeline, HuggingFaceHub
 BOOK_NAME = "1984"
         llm = OpenAI(temperature=0.2)
     if model=="GPT-NeoXT-Chat-Base-20B":
+        # llm = HuggingFacePipeline.from_model_id(
+        #     model_id="togethercomputer/GPT-NeoXT-Chat-Base-20B",
+        #     task="text-generation",
+        #     model_kwargs={"temperature":0.2, "max_length":400}
+        # )
+        llm = HuggingFaceHub(
+            repo_id="togethercomputer/GPT-NeoXT-Chat-Base-20B",
             task="text-generation",
             model_kwargs={"temperature":0.2, "max_length":400}
+        )
     # load chain
     chain = VectorDBQA.from_chain_type(
                                )
         os.environ["OPENAI_API_KEY"] = api_key
+    if choice == "togethercomputer/GPT-NeoXT-Chat-Base-20B":
+        api_key = st.text_input(label = "Paste your Hugging Face Hub API key here to get started",
+                                type = "password",
+                                help = "This isn't saved 🙈"
+                               )
+        os.environ["HUGGINGFACEHUB_API_TOKEN"] = api_key
     st.markdown("---")
     st.info("Based on [Talk2Book](https://github.com/batmanscode/Talk2Book)")
 if ask:
+    if api_key is "":
         st.write(f"**{BOOK_NAME}:** Whoops looks like you forgot your API key buddy")
         st.stop()
     else: