Spaces:

mic3333
/

summllama-demo

Sleeping

App Files Files Community

mic3333 committed on Nov 3

Commit

8bbf9e2

verified ·

1 Parent(s): c3564f5

Update app.py

Browse files

Files changed (1) hide show

app.py +1 -39

app.py CHANGED Viewed

@@ -3,7 +3,6 @@ from transformers import pipeline, AutoTokenizer
 import torch
 import spaces
-# Load model and tokenizer globally
 model_name = "DISLab/SummLlama3.2-3B"
 print(f"Loading model: {model_name}")
@@ -19,8 +18,6 @@ pipe = pipeline(
 print("Model loaded successfully!")
 def format_chat_template(instruction, document):
-    """Format input using the recommended template with timestamp awareness built-in"""
-    # Enhanced instruction that always includes timestamp awareness
     enhanced_instruction = f"{instruction} If the input contains timestamps, preserve them and note when key topics were discussed."
     row_json = [{
@@ -31,12 +28,9 @@ def format_chat_template(instruction, document):
 @spaces.GPU
 def summarize(instruction, text):
-    """Generate summary using the model with custom instruction"""
     try:
-        # Format input with enhanced instruction
         formatted_input = format_chat_template(instruction, text)
-        # Generate summary
         output = pipe(
             formatted_input,
             max_new_tokens=512,
@@ -46,14 +40,12 @@ def summarize(instruction, text):
             return_full_text=False
         )
-        # Extract the generated summary
         summary = output[0]['generated_text'].strip()
         return summary
     except Exception as e:
         return f"Error: {str(e)}"
-# Create Gradio interface
 demo = gr.Interface(
     fn=summarize,
     inputs=[
@@ -105,34 +97,4 @@ John (9:27): Sure, I'll review it tomorrow and get back to you."""
 )
 if __name__ == "__main__":
-    demo.launch()
-```
-## Key Changes:
-**What's different:**
-1. The `format_chat_template` function now automatically appends: `"If the input contains timestamps, preserve them and note when key topics were discussed."` to ANY instruction
-2. Default instruction is now simpler: `"Please provide a concise summary of this meeting transcript."`
-3. Users don't need to mention timestamps anymore
-**Now you can use simple instructions like:**
-- "Provide a concise summary"
-- "Extract action items"
-- "Summarize technical discussions"
-- "Focus on decisions made"
-**The system will automatically:**
-- ✅ Preserve timestamps when present
-- ✅ Note when topics were discussed
-- ✅ Keep chronological flow
-**For OpenWebUI, the equivalent system prompt would be:**
-```
-You are a summarization assistant. Always follow these rules:
-1. If the input contains timestamps, preserve them and note when key topics were discussed
-2. Identify speakers and their contributions
-3. Maintain chronological order
-4. Follow the user's specific instruction for the summary style
-The user will provide their custom instruction followed by the document/transcript.

 import torch
 import spaces
 model_name = "DISLab/SummLlama3.2-3B"
 print(f"Loading model: {model_name}")
 print("Model loaded successfully!")
 def format_chat_template(instruction, document):
     enhanced_instruction = f"{instruction} If the input contains timestamps, preserve them and note when key topics were discussed."
     row_json = [{
 @spaces.GPU
 def summarize(instruction, text):
     try:
         formatted_input = format_chat_template(instruction, text)
         output = pipe(
             formatted_input,
             max_new_tokens=512,
             return_full_text=False
         )
         summary = output[0]['generated_text'].strip()
         return summary
     except Exception as e:
         return f"Error: {str(e)}"
 demo = gr.Interface(
     fn=summarize,
     inputs=[
 )
 if __name__ == "__main__":
+    demo.launch()