Spaces:
Runtime error
Runtime error
import os

import gradio as gr
import safetensors.torch
import spaces
from transformers import AutoModelForCausalLM, AutoTokenizer
# Load base model and tokenizer
base_model_name = "AIDC-AI/Marco-o1"
tokenizer = AutoTokenizer.from_pretrained(base_model_name)
model = AutoModelForCausalLM.from_pretrained(base_model_name)

# Load the lightweight fine-tuned weights on top of the base model.
safetensor_path = "MegaTronX/Odyssey-SelectolaxQLoRA"
if os.path.isfile(safetensor_path):
    # A real file on disk: copy in whichever tensors match the base model's
    # parameter names (strict=False tolerates a partial checkpoint).
    model.load_state_dict(
        safetensors.torch.load_file(safetensor_path), strict=False
    )
else:
    # `safetensors.torch.load_file` only opens local files, so handing it a
    # Hub repo id fails at startup. Treat any non-file value as an adapter
    # repo and let transformers download and attach it instead.
    # NOTE(review): this needs the `peft` package installed at runtime and
    # assumes the repo is a PEFT (LoRA/QLoRA) adapter -- confirm against the
    # repo contents and the Space's requirements.
    model.load_adapter(safetensor_path)
@spaces.GPU
def predict(text, max_new_tokens=256):
    """Generate a continuation of *text* with the module-level model.

    Args:
        text: Prompt string supplied by the caller (the Gradio text input).
        max_new_tokens: Upper bound on the number of tokens generated after
            the prompt.

    Returns:
        The decoded output sequence (the prompt followed by the generated
        tokens) with special tokens removed, or an empty string when the
        prompt is blank.
    """
    # A blank prompt gives the model nothing to condition on; skip generation.
    if not text or not text.strip():
        return ""

    # Calling the tokenizer (instead of `encode`) returns the attention mask
    # alongside the input ids; both are moved to the device the model is on.
    inputs = tokenizer(text, return_tensors="pt").to(model.device)
    # Without an explicit budget, generation falls back to the model's
    # configured length limit, which may be very short.
    outputs = model.generate(**inputs, max_new_tokens=max_new_tokens)
    prediction = tokenizer.decode(outputs[0], skip_special_tokens=True)
    return prediction
# Wrap `predict` in a single text-in / text-out Gradio interface and serve it.
demo = gr.Interface(
    fn=predict,
    inputs="text",
    outputs="text",
)
demo.launch()