Update app.py
app.py CHANGED
@@ -2,6 +2,9 @@ from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
 from transformers import pipeline
 import torch
 import gradio as gr
+from huggingface_hub import InferenceClient
+
+client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
 
 # chatgpt-gpt4-prompts-bart-large-cnn-samsum
 tokenizer = AutoTokenizer.from_pretrained(
@@ -10,7 +13,7 @@ model = AutoModelForSeq2SeqLM.from_pretrained(
     "Kaludi/chatgpt-gpt4-prompts-bart-large-cnn-samsum", from_tf=True)
 
 # zephyr
-pipe = pipeline("text-generation", model="HuggingFaceH4/zephyr-7b-alpha",torch_dtype=torch.bfloat16, device_map="auto")
+# pipe = pipeline("text-generation", model="HuggingFaceH4/zephyr-7b-alpha",torch_dtype=torch.bfloat16, device_map="auto")
 
 def generate(inputuno, inputdos, max_new_tokens=3556, top_p=0.95, repetition_penalty=1.0):
     top_p = float(top_p)
@@ -35,15 +38,15 @@ def generate(inputuno, inputdos, max_new_tokens=3556, top_p=0.95, repetition_pen
         "role": "user", "content": str(promptdos)
         },
     ]
-
-    stream =
+
+    stream = client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
     output = ""
 
     for response in stream:
         output += response.token.text
         yield output
     return output
-
+
 
 def generatePrompt(inputuno, inputdos):
 
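For context on the change: the commit swaps the local pipeline("text-generation", ...) call (commented out above) for huggingface_hub's InferenceClient, which streams tokens from the hosted zephyr-7b-beta endpoint instead of loading the model inside the Space. A minimal sketch of that streaming pattern, assuming a recent huggingface_hub release; the function name, prompt, and parameter values below are illustrative, not taken from app.py:

from huggingface_hub import InferenceClient

client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")

def stream_completion(prompt):
    # stream=True yields one chunk per generated token; details=True makes each
    # chunk a TextGenerationStreamResponse whose .token.text holds the token text.
    stream = client.text_generation(
        prompt,
        max_new_tokens=256,      # illustrative; app.py defaults to 3556
        stream=True,
        details=True,
        return_full_text=False,  # don't echo the prompt back in the output
    )
    output = ""
    for response in stream:
        output += response.token.text
        yield output  # yield the accumulated text so far, not just the new token

Yielding the accumulated string on every token, as the app's generate() also does, matches what a Gradio generator callback expects: each yield replaces the displayed value, so the output textbox fills in progressively.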