Smart_LLM

Running on Zero

App Files Community

Daemontatox committed on Dec 22, 2024

Commit

c44cbfe

verified ·

1 Parent(s): 9440edf

Update app.py

Browse files

Files changed (1) hide show

app.py +41 -18

app.py CHANGED Viewed

@@ -16,7 +16,7 @@ from threading import Thread
 HF_TOKEN = os.environ.get("HF_TOKEN", None)
 MODEL = "Daemontatox/SphinX"
-TITLE = "<h1><center>Reason</center></h1>"
 PLACEHOLDER = """
 <center>
@@ -79,8 +79,8 @@ def stream_chat(
     message: str,
     history: list,
     system_prompt: str,
-    temperature: float = 0.8,
-    max_new_tokens: int = 128000,
     top_p: float = 1.0,
     top_k: int = 20,
     penalty: float = 1.2,
@@ -138,23 +138,46 @@ with gr.Blocks(css=CSS, theme="soft") as demo:
         additional_inputs_accordion=gr.Accordion(label="⚙️ Parameters", open=False, render=False),
         additional_inputs=[
             gr.Textbox(
-                value="""You are a Sentient AI expert at providing high-quality answers by using chain of Thought reasoning. Your process involves these steps:
-1. **Initial Thought:** First, reason step-by-step to generate your best possible response to the following request: [User's Request Here]
-2. **Self-Critique:** Now, critically evaluate your initial response. Specifically consider:
-    * **Accuracy:** Is it factually correct and verifiable?
-    * **Clarity:** Is it easy to understand and free of ambiguity?
-    * **Completeness:** Does it fully address the user's request?
-    * **Improvement:** What specific aspects could be better?
-3. **Revision:** Based on your self-critique, revise your initial response to address the identified areas for improvement.
-4. **Final Response:** Present your improved, final response.
-Ensure you think out loud and include your thoughts in <Thinking> Tag
-If you reflecting on your actions or thoughts use the <Reflecting> Tag
-If you need a new Tag create on and use it .""",
                 label="System Prompt",
                 lines=5,
                 render=False,
@@ -169,7 +192,7 @@ If you need a new Tag create on and use it .""",
             ),
             gr.Slider(
                 minimum=128,
-                maximum=128000,
                 step=1,
                 value= 8192,
                 label="Max new tokens",
@@ -195,7 +218,7 @@ If you need a new Tag create on and use it .""",
                 minimum=0.0,
                 maximum=2.0,
                 step=0.1,
-                value=0.1,
                 label="Repetition penalty",
                 render=False,
             ),
@@ -203,7 +226,7 @@ If you need a new Tag create on and use it .""",
         examples=[
             ["What is meant by a Singularity? "],
             ["Explain the theory of Relativty"],
-            ["Explain how do you think"],
             ["Explain how mamba2 structure LLMs work and how do they differ from transformers? "],
         ],
         cache_examples=False,

 HF_TOKEN = os.environ.get("HF_TOKEN", None)
 MODEL = "Daemontatox/SphinX"
+TITLE = "<h1><center>Sphinx Reasoner</center></h1>"
 PLACEHOLDER = """
 <center>
     message: str,
     history: list,
     system_prompt: str,
+    temperature: float = 1.0,
+    max_new_tokens: int = 8192,
     top_p: float = 1.0,
     top_k: int = 20,
     penalty: float = 1.2,
         additional_inputs_accordion=gr.Accordion(label="⚙️ Parameters", open=False, render=False),
         additional_inputs=[
             gr.Textbox(
+                value="""You are an AI expert at providing high-quality answers. Your process involves these steps:
+1. Initial Thought: Use the <Thinking> tag to reason step-by-step and generate your best possible response to the following request: [User's Request Here].
+Example:
+<Thinking> Step 1: Understand the request. Step 2: Analyze potential solutions. Step 3: Choose the optimal response. </Thinking>
+2. Self-Critique: Critically evaluate your initial response within <Critique> tags, focusing on:
+Accuracy: Is it factually correct and verifiable?
+Clarity: Is it easy to understand and free of ambiguity?
+Completeness: Does it fully address the user's request?
+Improvement: What specific aspects could be better?
+Example:
+<Critique> Accuracy: Verified. Clarity: Needs simplification. Completeness: Add examples. </Critique>
+3. Revision: Based on your critique, use <Revising> tags to refine and improve your response.
+Example:
+<Revising> Adjusting for clarity and adding an example to improve understanding. </Revising>
+4. Final Response: Present your revised answer clearly within <Final> tags.
+Example:
+<Final> This is the improved response. </Final>
+5. Tag Innovation: If necessary, create and define new tags to better structure your reasoning or enhance clarity. Use them consistently.
+Example:
+<Definition> This tag defines a new term introduced in the response. </Definition>
+Ensure every part of your thought process and output is properly enclosed in appropriate tags for clarity and organization.
+""",
                 label="System Prompt",
                 lines=5,
                 render=False,
             ),
             gr.Slider(
                 minimum=128,
+                maximum=32000,
                 step=1,
                 value= 8192,
                 label="Max new tokens",
                 minimum=0.0,
                 maximum=2.0,
                 step=0.1,
+                value=1.2,
                 label="Repetition penalty",
                 render=False,
             ),
         examples=[
             ["What is meant by a Singularity? "],
             ["Explain the theory of Relativty"],
+            ["Explain your thought process"],
             ["Explain how mamba2 structure LLMs work and how do they differ from transformers? "],
         ],
         cache_examples=False,