rgreenberg1 committed
Commit 1d4a7a3 · verified · 1 Parent(s): 55b009f

Update app.py

Files changed (1):
  app.py (+46 -1)
app.py CHANGED
@@ -58,7 +58,52 @@ with gr.Blocks() as demo:
     "James decides to run 3 sprints 3 times a week. He runs 60 meters each sprint. How many total meters does he run a week?",
     "Claire makes a 3 egg omelet every morning for breakfast. How many dozens of eggs will she eat in 4 weeks?",
     "Gretchen has 110 coins. There are 30 more gold coins than silver coins. How many gold coins does Gretchen have?",],inputs=[textbox],)
-
+
+    max_new_tokens = gr.Slider(
+        label="Max new tokens",
+        value=DEFAULT_MAX_NEW_TOKENS,
+        minimum=0,
+        maximum=MAX_MAX_NEW_TOKENS,
+        step=1,
+        interactive=True,
+        info="The maximum numbers of new tokens",)
+    temperature = gr.Slider(
+        label="Temperature",
+        value=0.3,
+        minimum=0.05,
+        maximum=1.0,
+        step=0.05,
+        interactive=True,
+        info="Higher values produce more diverse outputs",
+    )
+    top_p = gr.Slider(
+        label="Top-p (nucleus) sampling",
+        value=0.40,
+        minimum=0.0,
+        maximum=1,
+        step=0.05,
+        interactive=True,
+        info="Higher values sample more low-probability tokens",
+    )
+    top_k = gr.Slider(
+        label="Top-k sampling",
+        value=20,
+        minimum=1,
+        maximum=100,
+        step=1,
+        interactive=True,
+        info="Sample from the top_k most likely tokens",
+    )
+    repetition_penalty = gr.Slider(
+        label="Repetition penalty",
+        value=1.2,
+        minimum=1.0,
+        maximum=2.0,
+        step=0.05,
+        interactive=True,
+        info="Penalize repeated tokens",
+    )
+
 
 # Generation inference
 def generate(
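
Note: this hunk only creates the sliders; DEFAULT_MAX_NEW_TOKENS and MAX_MAX_NEW_TOKENS are constants defined elsewhere in app.py, and the sliders only affect generation once they are passed as inputs to an event handler that calls generate(). The snippet below is a minimal sketch of that wiring under assumptions not shown in this commit: run_button, output, and the exact parameter order of generate() are hypothetical.

    # Sketch only (not part of this commit): wiring the new sliders into the
    # generation call inside the same `with gr.Blocks() as demo:` block.
    run_button = gr.Button("Generate")           # hypothetical trigger component
    output = gr.Textbox(label="Model output")    # hypothetical output component

    run_button.click(
        fn=generate,                 # the app's generation function
        inputs=[
            textbox,                 # prompt textbox defined earlier in app.py
            max_new_tokens,          # sliders added in this commit
            temperature,
            top_p,
            top_k,
            repetition_penalty,
        ],
        outputs=output,
    )

With this wiring, moving a slider changes the value Gradio passes to generate() on the next click, so the decoding parameters can be tuned from the UI without editing code.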