OzoneAsai commited on
Commit
7b50948
1 Parent(s): b6dc5c9

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +27 -0
app.py ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ import os
3
+ os.system("pip install torch sentencepiece transformers Xformers")
4
+ import torch
5
+ from transformers import AutoModelForCausalLM, AutoTokenizer
6
+
7
+ model = AutoModelForCausalLM.from_pretrained("cyberagent/open-calm-1b", device_map="auto", torch_dtype=torch.float16)
8
+ tokenizer = AutoTokenizer.from_pretrained("cyberagent/open-calm-1b")
9
+
10
+ def generate_text(prompt, max_new_tokens, do_sample, temperature, top_p, repetition_penalty, pad_token_id):
11
+ inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
12
+ with torch.no_grad():
13
+ tokens = model.generate(
14
+ **inputs,
15
+ max_new_tokens=max_new_tokens,
16
+ do_sample=do_sample,
17
+ temperature=temperature,
18
+ top_p=top_p,
19
+ repetition_penalty=repetition_penalty,
20
+ pad_token_id=pad_token_id,
21
+ )
22
+
23
+ output = tokenizer.decode(tokens[0], skip_special_tokens=True)
24
+ return output
25
+
26
+ app = gr.Interface(generate_text, inputs=[gr.Input(label="Prompt", type="text"), gr.IntSlider(label="Max new tokens", min=1, max=1024, step=1), gr.Checkbox(label="Do sample"), gr.FloatSlider(label="Temperature", min=0.1, max=1.0, step=0.1), gr.FloatSlider(label="Top P", min=0.0, max=1.0, step=0.01), gr.FloatSlider(label="Repetition penalty", min=0.0, max=2.0, step=0.1), gr.IntSlider(label="Pad token ID", min=0, max=1023, step=1)], outputs=[gr.Output(label="Output", type="text")])
27
+ app.launch()