Spaces:

sagar007
/

lama_storm_8b

Runtime error

App Files Files Community

sagar007 committed on Aug 28, 2024

Commit

2848e2c

verified ·

1 Parent(s): 15967e4

Update app.py

Browse files

Files changed (1) hide show

app.py +37 -149

app.py CHANGED Viewed

@@ -1,18 +1,26 @@
 import gradio as gr
-import spaces
 import torch
-from transformers import AutoTokenizer, AutoModelForCausalLM
 # Load the model and tokenizer
 model_name = "akjindal53244/Llama-3.1-Storm-8B"
 tokenizer = AutoTokenizer.from_pretrained(model_name)
-model = AutoModelForCausalLM.from_pretrained(
-    model_name,
     torch_dtype=torch.bfloat16,
     device_map="auto"
 )
-@spaces.GPU(duration=120)
 def generate_text(prompt, max_length, temperature):
     messages = [
         {"role": "system", "content": "You are a helpful assistant."},
@@ -20,10 +28,8 @@ def generate_text(prompt, max_length, temperature):
     ]
     formatted_prompt = tokenizer.apply_chat_template(messages, add_generation_prompt=True, tokenize=False)
-    inputs = tokenizer(formatted_prompt, return_tensors="pt").to(model.device)
-    outputs = model.generate(
-        **inputs,
         max_new_tokens=max_length,
         do_sample=True,
         temperature=temperature,
@@ -31,151 +37,33 @@ def generate_text(prompt, max_length, temperature):
         top_p=0.95,
     )
-    return tokenizer.decode(outputs[0][inputs['input_ids'].shape[1]:], skip_special_tokens=True)
-# Custom CSS
-css = """
-body {
-    background-color: #1a1a2e;
-    color: #e0e0e0;
-    font-family: 'Arial', sans-serif;
-}
-.container {
-    max-width: 900px;
-    margin: auto;
-    padding: 20px;
-}
-.gradio-container {
-    background-color: #16213e;
-    border-radius: 15px;
-    box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1);
-}
-.header {
-    background-color: #0f3460;
-    padding: 20px;
-    border-radius: 15px 15px 0 0;
-    text-align: center;
-    margin-bottom: 20px;
-}
-.header h1 {
-    color: #e94560;
-    font-size: 2.5em;
-    margin-bottom: 10px;
-}
-.header p {
-    color: #a0a0a0;
-}
-.header img {
-    max-width: 300px;
-    border-radius: 10px;
-    margin: 15px auto;
-    display: block;
-}
-.input-group, .output-group {
-    background-color: #1a1a2e;
-    padding: 20px;
-    border-radius: 10px;
-    margin-bottom: 20px;
-}
-.input-group label, .output-group label {
-    color: #e94560;
-    font-weight: bold;
-}
-.generate-btn {
-    background-color: #e94560 !important;
-    color: white !important;
-    border: none !important;
-    border-radius: 5px !important;
-    padding: 10px 20px !important;
-    font-size: 16px !important;
-    cursor: pointer !important;
-    transition: background-color 0.3s ease !important;
-}
-.generate-btn:hover {
-    background-color: #c81e45 !important;
-}
-.example-prompts {
-    background-color: #1f2b47;
-    padding: 15px;
-    border-radius: 10px;
-    margin-bottom: 20px;
-}
-.example-prompts h3 {
-    color: #e94560;
-    margin-bottom: 10px;
-}
-.example-prompts ul {
-    list-style-type: none;
-    padding-left: 0;
-}
-.example-prompts li {
-    margin-bottom: 5px;
-    cursor: pointer;
-    transition: color 0.3s ease;
-}
-.example-prompts li:hover {
-    color: #e94560;
-}
-"""
-# Example prompts
-example_prompts = [
-    "Write a Python function to find the n-th Fibonacci number.",
-    "Explain the concept of recursion in programming.",
-    "What are the key differences between Python and JavaScript?",
-    "Tell me a short story about a time-traveling robot.",
-    "Describe the process of photosynthesis in simple terms."
 ]
-# Gradio interface
-with gr.Blocks(css=css) as iface:
-    gr.HTML(
-        """
-        <div class="header">
-            <h1>Llama-3.1-Storm-8B Text Generation</h1>
-            <p>Generate text using the powerful Llama-3.1-Storm-8B model. Enter a prompt and let the AI create!</p>
-            <img src="https://cdn-uploads.huggingface.co/production/uploads/64c75c1237333ccfef30a602/tmOlbERGKP7JSODa6T06J.jpeg" alt="Llama">
-        </div>
-        """
-    )
-    with gr.Group():
-        gr.HTML(
-            """
-            <div class="example-prompts">
-                <h3>Example Prompts:</h3>
-                <ul>
-                    """ + "".join([f"<li>{prompt}</li>" for prompt in example_prompts]) + """
-                </ul>
-            </div>
-            """
-        )
-        with gr.Group(elem_classes="input-group"):
-            prompt = gr.Textbox(label="Prompt", placeholder="Enter your prompt here...", lines=5)
             max_length = gr.Slider(minimum=1, maximum=500, value=128, step=1, label="Max Length")
             temperature = gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature")
-            generate_btn = gr.Button("Generate", elem_classes="generate-btn")
-        with gr.Group(elem_classes="output-group"):
             output = gr.Textbox(label="Generated Text", lines=10)
-    generate_btn.click(generate_text, inputs=[prompt, max_length, temperature], outputs=output)
-    # JavaScript to make example prompts clickable
-    gr.HTML(
-        """
-        <script>
-        document.addEventListener('DOMContentLoaded', (event) => {
-            document.querySelectorAll('.example-prompts li').forEach(item => {
-                item.addEventListener('click', event => {
-                    document.querySelector('textarea[data-testid="textbox"]').value = event.target.textContent;
-                });
-            });
-        });
-        </script>
-        """
     )
-# Launch the app
-iface.launch()

 import gradio as gr
 import torch
+from transformers import AutoTokenizer, pipeline
 # Load the model and tokenizer
 model_name = "akjindal53244/Llama-3.1-Storm-8B"
 tokenizer = AutoTokenizer.from_pretrained(model_name)
+pipe = pipeline(
+    "text-generation",
+    model=model_name,
     torch_dtype=torch.bfloat16,
     device_map="auto"
 )
+# HTML content
+HTML_CONTENT = """
+<h1 style="text-align: center;">Llama-3.1-Storm-8B Text Generation</h1>
+<p style="text-align: center;">Generate text using the powerful Llama-3.1-Storm-8B model. Enter a prompt or select an example, and let the AI create!</p>
+<div style="display: flex; justify-content: center; margin-bottom: 20px;">
+    <img src="https://cdn-uploads.huggingface.co/production/uploads/64c75c1237333ccfef30a602/tmOlbERGKP7JSODa6T06J.jpeg" alt="Llama" style="width:200px; border-radius:10px;">
+</div>
+"""
 def generate_text(prompt, max_length, temperature):
     messages = [
         {"role": "system", "content": "You are a helpful assistant."},
     ]
     formatted_prompt = tokenizer.apply_chat_template(messages, add_generation_prompt=True, tokenize=False)
+    outputs = pipe(
+        formatted_prompt,
         max_new_tokens=max_length,
         do_sample=True,
         temperature=temperature,
         top_p=0.95,
     )
+    return outputs[0]['generated_text'][len(formatted_prompt):]
+examples = [
+    "Write a short story about a magical llama.",
+    "Explain the concept of machine learning to a 10-year-old.",
+    "Describe the process of making the perfect cup of coffee.",
+    "What are the main differences between Python and JavaScript?"
 ]
+with gr.Blocks() as demo:
+    gr.HTML(HTML_CONTENT)
+    with gr.Row():
+        with gr.Column(scale=2):
+            prompt = gr.Textbox(label="Prompt", lines=5)
             max_length = gr.Slider(minimum=1, maximum=500, value=128, step=1, label="Max Length")
             temperature = gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature")
+            submit_button = gr.Button("Generate")
+        with gr.Column(scale=2):
             output = gr.Textbox(label="Generated Text", lines=10)
+    gr.Examples(
+        examples=examples,
+        inputs=prompt,
+        label="Click on an example to load it into the prompt box:"
     )
+    submit_button.click(generate_text, inputs=[prompt, max_length, temperature], outputs=[output])
+if __name__ == "__main__":
+    demo.launch()