gokulraj121 committed on
Commit
ce48ad3
·
verified ·
1 Parent(s): e01fdda

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +19 -0
app.py ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ from transformers import AutoModelForCausalLM, AutoTokenizer
3
+ from peft import PeftModel
4
+
5
# Hub identifiers: the base checkpoint and the LoRA adapter applied on top of it.
base_model = "microsoft/phi-2"
adapter_path = "your-username/brahma-lora"  # Placeholder: replace with your adapter repo

# The tokenizer is taken from the base checkpoint.
tokenizer = AutoTokenizer.from_pretrained(base_model)

# Load the base weights first, then wrap them with the LoRA adapter.
model = PeftModel.from_pretrained(
    AutoModelForCausalLM.from_pretrained(base_model, device_map="auto"),
    adapter_path,
)
12
+
13
def generate_response(prompt):
    """Generate text for ``prompt`` using the module-level model and tokenizer.

    Args:
        prompt: Text submitted through the Gradio text input.

    Returns:
        The first generated sequence decoded to a string with special tokens
        removed, or an empty string when ``prompt`` is ``None``, empty, or
        contains only whitespace.
    """
    # A blank prompt gives the model nothing to condition on (and may
    # tokenize to an empty tensor), so answer with an empty string instead of
    # calling the model.
    if not prompt or not prompt.strip():
        return ""

    # Move the encoded prompt to the device the model lives on.
    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
    # Cap the continuation at 100 newly generated tokens.
    output = model.generate(**inputs, max_new_tokens=100)
    # Only the first returned sequence is decoded.
    # NOTE(review): for a causal LM the sequence returned by generate()
    # normally starts with the prompt tokens, so the prompt is echoed in the
    # result — confirm this is the intended UX.
    return tokenizer.decode(output[0], skip_special_tokens=True)
17
+
18
# Minimal UI: one text input wired to generate_response, one text output.
demo = gr.Interface(
    fn=generate_response,
    inputs="text",
    outputs="text",
)
demo.launch()