Spaces: Sleeping
faelfernandes committed
Commit • 616481a • 1 Parent(s): 9792fb4
Update app.py
app.py CHANGED
@@ -1,20 +1,21 @@
 from huggingface_hub import InferenceClient
 import gradio as gr
 
-client = InferenceClient(
-def format_prompt(message, history
-    prompt += f"[INST] {message} [/INST]"
-    return prompt
+client = InferenceClient(
+    "mistralai/Mistral-7B-Instruct-v0.3"
+)
+
+def format_prompt(message, history):
+    prompt = "<s>"
+    for user_prompt, bot_response in history:
+        prompt += f"[INST] {user_prompt} [/INST]"
+        prompt += f" {bot_response}</s> "
+    prompt += f"[INST] {message} [/INST]"
+    return prompt
 
 def generate(
-    prompt, history,
+    prompt, history, temperature=0.9, max_new_tokens=256, top_p=0.95, repetition_penalty=1.0,
 ):
     temperature = float(temperature)
     if temperature < 1e-2:
@@ -30,7 +31,7 @@ def generate(
         seed=42,
     )
 
-    formatted_prompt = format_prompt(prompt, history
+    formatted_prompt = format_prompt(prompt, history)
 
     stream = client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
     output = ""
@@ -40,40 +41,50 @@ def generate(
     yield output
     return output
 
-mychatbot = gr.Chatbot(
-    avatar_images=["./user.png", "./botm.png"], bubble_full_width=False, show_label=False, show_copy_button=True, likeable=True,)
-
-demo.queue().launch(show_api=False)
+additional_inputs=[
+    gr.Slider(
+        label="Temperature",
+        value=0.9,
+        minimum=0.0,
+        maximum=1.0,
+        step=0.05,
+        interactive=True,
+        info="Higher values produce more diverse outputs",
+    ),
+    gr.Slider(
+        label="Max new tokens",
+        value=256,
+        minimum=0,
+        maximum=1048,
+        step=64,
+        interactive=True,
+        info="The maximum numbers of new tokens",
+    ),
+    gr.Slider(
+        label="Top-p (nucleus sampling)",
+        value=0.90,
+        minimum=0.0,
+        maximum=1,
+        step=0.05,
+        interactive=True,
+        info="Higher values sample more low-probability tokens",
+    ),
+    gr.Slider(
+        label="Repetition penalty",
+        value=1.2,
+        minimum=1.0,
+        maximum=2.0,
+        step=0.05,
+        interactive=True,
+        info="Penalize repeated tokens",
+    )
+]
 
+gr.ChatInterface(
+    fn=generate,
+    chatbot=gr.Chatbot(show_label=False, show_share_button=False, show_copy_button=True, likeable=True, layout="panel"),
+    additional_inputs=additional_inputs,
+    title="""Mistral 7B v0.3"""
+).launch(show_api=False)
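
For reference, a minimal self-contained sketch of the prompt string the new format_prompt builds for Mistral's [INST] chat template (the function body is copied from the updated app.py; the one-turn history is made up for illustration):

def format_prompt(message, history):
    prompt = "<s>"
    for user_prompt, bot_response in history:
        prompt += f"[INST] {user_prompt} [/INST]"
        prompt += f" {bot_response}</s> "
    prompt += f"[INST] {message} [/INST]"
    return prompt

history = [("Hi!", "Hello! How can I help?")]  # (user, bot) pairs as Gradio supplies them
print(format_prompt("What is Mistral 7B?", history))
# -> <s>[INST] Hi! [/INST] Hello! How can I help?</s> [INST] What is Mistral 7B? [/INST]

Note that gr.ChatInterface calls generate(message, history, *additional_inputs), so the four sliders feed temperature, max_new_tokens, top_p, and repetition_penalty positionally, in the order they are declared.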