Spaces:

helal94hb1
/

backend_chatbot

Sleeping

App Files Files Community

helal94hb1 committed on Sep 13

Commit

101cdda

1 Parent(s): ffe6d33

fix: new embeddings and rerankh4

Browse files

Files changed (1) hide show

app/models/expert_judge_model.py +20 -16

app/models/expert_judge_model.py CHANGED Viewed

@@ -1,8 +1,7 @@
 # expert_judge_model.py
 import torch.nn as nn
-# --- MODIFIED: Import AutoTokenizer for a more robust helper ---
-from transformers import AutoModelForSequenceClassification, AutoTokenizer, BertTokenizer
 class ExpertJudgeCrossEncoder(nn.Module):
     """
@@ -18,30 +17,35 @@ class ExpertJudgeCrossEncoder(nn.Module):
             num_labels=1
         )
-    # --- MODIFIED: The forward method now accepts token_type_ids ---
     def forward(self, input_ids, attention_mask, token_type_ids=None):
         """
-        Forward pass for the cross-encoder.
         Args:
             input_ids (Tensor): Token IDs for the concatenated sequence.
             attention_mask (Tensor): Attention mask for the input sequence.
             token_type_ids (Tensor, optional): Segment IDs to distinguish query from chunk. Defaults to None.
         """
-        # Pass all arguments to the underlying Hugging Face model.
-        # It will use token_type_ids if the model architecture supports it (like BERT).
-        outputs = self.model(
-            input_ids=input_ids,
-            attention_mask=attention_mask,
-            token_type_ids=token_type_ids
-        )
         return outputs.logits
-# --- MODIFIED: A more robust tokenizer helper function ---
 def get_tokenizer(model_name='bert-base-uncased'):
     """
     Helper function to get the tokenizer corresponding to the model.

 # expert_judge_model.py
 import torch.nn as nn
+from transformers import AutoModelForSequenceClassification, AutoTokenizer
 class ExpertJudgeCrossEncoder(nn.Module):
     """
             num_labels=1
         )
+    # --- CORRECTED: The forward method is now model-aware ---
     def forward(self, input_ids, attention_mask, token_type_ids=None):
         """
         Forward pass for the cross-encoder.

         Builds the keyword arguments for the wrapped model dynamically so the
         same class works with architectures whose ``forward`` declares a
         ``token_type_ids`` parameter (e.g. BERT) and with those that do not
         (e.g. Qwen2).

         Args:
             input_ids (Tensor): Token IDs for the concatenated sequence.
             attention_mask (Tensor): Attention mask for the input sequence.
             token_type_ids (Tensor, optional): Segment IDs to distinguish query from chunk.
                 Forwarded only when it is not None AND the wrapped model's
                 ``forward`` explicitly declares a parameter with that name.
                 Defaults to None.

         Returns:
             The ``logits`` attribute of the wrapped model's output.
         """
         # Function-scope import keeps this method self-contained.
         import inspect

         # 1. Arguments that are always passed.
         model_inputs = {
             'input_ids': input_ids,
             'attention_mask': attention_mask,
         }

         # 2. Decide whether the optional segment IDs can be forwarded.
         if token_type_ids is not None:
             # Inspect the real signature instead of ``__code__.co_varnames``:
             # ``co_varnames`` also lists *local variables* of the function, and
             # for a decorator-wrapped ``forward`` it describes the wrapper
             # (``*args, **kwargs``) rather than the wrapped function.
             # ``inspect.signature`` looks only at parameters and follows
             # ``__wrapped__``.
             try:
                 forward_params = inspect.signature(self.model.forward).parameters
             except (TypeError, ValueError):
                 # Signature not introspectable: stay conservative and do not
                 # pass an argument the model may reject.
                 forward_params = {}

             # A bare ``**kwargs`` is deliberately NOT treated as acceptance;
             # only an explicitly named parameter counts.
             if 'token_type_ids' in forward_params:
                 model_inputs['token_type_ids'] = token_type_ids

         # 3. Call the wrapped model with the dynamically built arguments.
         outputs = self.model(**model_inputs)
         return outputs.logits
 def get_tokenizer(model_name='bert-base-uncased'):
     """
     Helper function to get the tokenizer corresponding to the model.