src/pdfchatbot.py (+5 -2)
@@ -36,6 +36,7 @@ class PDFChatBot:
         self.chunk_size = None
         self.current_context = None
         self.format_seperator="""\n\n--\n\n"""
+        self.pipe = None
         #self.chunk_size_slider = chunk_size_slider

     def load_embeddings(self):
@@ -59,7 +60,7 @@

     @spaces.GPU
     def create_organic_pipeline(self):
-        self.
+        self.pipe = pipeline(
             "text-generation",
             model="meta-llama/Meta-Llama-3-8B-Instruct",
             model_kwargs={"torch_dtype": torch.bfloat16},
@@ -78,12 +79,14 @@
     def create_organic_response(self, history, query):
         self.get_organic_context(query)
         tokenizer = AutoTokenizer.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct")
+        """
         pipe = pipeline(
             "text-generation",
             model="meta-llama/Meta-Llama-3-8B-Instruct",
             model_kwargs={"torch_dtype": torch.bfloat16},
             device="cuda",
         )
+        """
         messages = [
             {"role": "system", "content": "From the the contained given below, answer the question of user \n " + self.current_context},
             {"role": "user", "content": query},
@@ -95,7 +98,7 @@
             add_generation_prompt=True
         )
         temp = 0.1
-        outputs = pipe(
+        outputs = self.pipe(
             prompt,
             max_new_tokens=1024,
             do_sample=True,