import gradio as gr
import spaces
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

# Load the OpenCoder-8B-Instruct model and tokenizer once at startup.
model_name = "infly/OpenCoder-8B-Instruct"
tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
model = AutoModelForCausalLM.from_pretrained(
    model_name, torch_dtype=torch.bfloat16, trust_remote_code=True
)
model.to("cuda")  # ZeroGPU attaches the GPU when a @spaces.GPU function runs


@spaces.GPU
def generate_text(prompt):
    # Tokenize the prompt and move the tensors to the model's device.
    inputs = tokenizer(prompt, return_tensors="pt", truncation=True, padding=True).to(model.device)
    # Generate up to 100 new tokens; **inputs also passes the attention mask.
    outputs = model.generate(**inputs, max_new_tokens=100, num_return_sequences=1)
    return tokenizer.decode(outputs[0], skip_special_tokens=True)


interface = gr.Interface(
    fn=generate_text,
    inputs=gr.Textbox(lines=2, placeholder="Enter your prompt here..."),
    outputs=gr.Textbox(label="Generated Text"),
)

if __name__ == "__main__":
    interface.launch()