bipulsardar421 committed on
Commit
df5ee62
·
1 Parent(s): 0f9537d
Files changed (2) hide show
  1. app.py +20 -0
  2. requirements.txt +4 -0
app.py ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ from transformers import AutoTokenizer, AutoModelForCausalLM
3
+
4
# Model identifier passed to both from_pretrained() calls below.
+ MODEL = "google/gemma-3-270m"
5
+
6
# The tokenizer and model are created once at module import time; chat() reads
# them as module-level globals on every call.
+ tokenizer = AutoTokenizer.from_pretrained(MODEL)
7
+ model = AutoModelForCausalLM.from_pretrained(MODEL)
8
+
9
def chat(message, history):
    """Generate a reply to ``message`` using the module-level model.

    Args:
        message: The user's prompt text.
        history: Conversation state supplied by the Gradio UI. It is accepted
            so the function matches the UI callback signature, but it is not
            used when building the prompt.

    Returns:
        The newly generated text only, with special tokens removed.
    """
    inputs = tokenizer(message, return_tensors="pt")
    outputs = model.generate(**inputs, max_new_tokens=128)

    # For a causal LM, generate() returns the prompt tokens followed by the
    # continuation. Decode only the continuation so the reply does not echo
    # the user's own message back at them.
    prompt_length = inputs["input_ids"].shape[-1]
    new_tokens = outputs[0][prompt_length:]
    return tokenizer.decode(new_tokens, skip_special_tokens=True)
14
+
15
# chat(message, history) -> str is exactly the callback shape ChatInterface
# expects, and ChatInterface manages the conversation history itself.
# A plain gr.Interface with a "state" input also requires a matching "state"
# output (and a function that returns the updated state), which chat() does
# not provide.
gr.ChatInterface(
    fn=chat,
    title="Gemma 3 (270M)",
).launch()
requirements.txt ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ transformers
2
+ accelerate
3
+ torch
4
+ gradio