Hrushi02 committed
Commit 3dcc254 · verified · 1 Parent(s): ea305a2

Update app.py

Files changed (1):
  1. app.py +10 -16
app.py CHANGED
@@ -5,7 +5,7 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
 
 """
 🧮 Root_Math full model chat app
-Auto-detects GPU/CPU and loads appropriate base model.
+Supports private/public repo and GPU/CPU auto-detection.
 """
 
 # ✅ Load Hugging Face API token
@@ -13,29 +13,23 @@ api_token = os.getenv("HUGGINGFACEHUB_API_TOKEN")
 if not api_token:
     raise ValueError("❌ ERROR: Hugging Face API token is not set. Please set it as an environment variable.")
 
-# ✅ Detect environment
-use_cuda = torch.cuda.is_available()
+# ✅ Correct model repo name (case-sensitive)
+model_name = "Hrushi02/Root_Math"  # double-check on HF website
 
-if use_cuda:
-    print("🚀 GPU detected — using float16 model for efficiency.")
-    dtype = torch.float16
-else:
-    print("💻 CPU detected — using float32 model.")
-    dtype = torch.float32
+# ✅ Device and dtype
+device = "cuda" if torch.cuda.is_available() else "cpu"
+dtype = torch.float16 if device == "cuda" else torch.float32
+print(f"⚡ Loading model on {device.upper()} with dtype={dtype}")
 
-# ✅ Load your full fine-tuned model directly
-model_name = "Hrushi02/Root_Math"  # Your repo
-
-print(f"🔄 Loading full model: {model_name} ...")
+# ✅ Load the model (directly, full fine-tuned)
 model = AutoModelForCausalLM.from_pretrained(
     model_name,
     torch_dtype=dtype,
     device_map="auto",
-    token=api_token
+    token=api_token  # required for private repo
 )
 
 # ✅ Load tokenizer
-print("🔄 Loading tokenizer...")
 tokenizer = AutoTokenizer.from_pretrained(model_name, token=api_token)
 
 
@@ -68,7 +62,7 @@ def respond(message, history, system_message, max_tokens, temperature, top_p):
     yield response
 
 
-# ✅ Gradio UI
+# ✅ Gradio ChatInterface
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
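
The body of respond sits outside these hunks, so the commit only shows its `yield response` tail. For context, here is a minimal sketch of how such a streaming chat callback is commonly written with transformers' TextIteratorStreamer; the background thread and the chat-template prompt construction are illustrative assumptions rather than the actual app.py implementation, and the sketch reuses the model and tokenizer loaded above.

from threading import Thread
from transformers import TextIteratorStreamer

def respond(message, history, system_message, max_tokens, temperature, top_p):
    # Rebuild the conversation in the role/content format expected by chat templates.
    messages = [{"role": "system", "content": system_message}]
    for user_msg, bot_msg in history:  # Gradio history: list of (user, assistant) pairs
        if user_msg:
            messages.append({"role": "user", "content": user_msg})
        if bot_msg:
            messages.append({"role": "assistant", "content": bot_msg})
    messages.append({"role": "user", "content": message})

    input_ids = tokenizer.apply_chat_template(
        messages, add_generation_prompt=True, return_tensors="pt"
    ).to(model.device)

    # Run generation in a background thread so tokens can be yielded as they arrive.
    streamer = TextIteratorStreamer(tokenizer, skip_prompt=True, skip_special_tokens=True)
    Thread(target=model.generate, kwargs=dict(
        input_ids=input_ids,
        streamer=streamer,
        max_new_tokens=max_tokens,
        temperature=temperature,
        top_p=top_p,
        do_sample=True,
    )).start()

    response = ""
    for new_text in streamer:
        response += new_text
        yield response  # matches the `yield response` visible in the diff

Yielding the accumulated string rather than each token is what gr.ChatInterface expects from a generator callback: each yielded value replaces the assistant message shown so far.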
 
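The diff is truncated inside additional_inputs, and this commit does not show the rest of the UI wiring. A plausible completion, modeled on the stock Hugging Face Spaces chat template whose parameters match the respond signature above; the specific controls and their default values are assumptions, since the actual list in app.py is not shown.

import gradio as gr

demo = gr.ChatInterface(
    respond,
    additional_inputs=[
        # Hypothetical controls; they mirror respond's extra parameters.
        gr.Textbox(value="You are a helpful math assistant.", label="System message"),
        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
        gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature"),
        gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p"),
    ],
)

if __name__ == "__main__":
    demo.launch()

Gradio passes each additional input to respond positionally after message and history, so the order of these controls has to match the parameter order in the callback's signature.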