File size: 1,528 Bytes
67553c2
f71c677
d83b1aa
e16bfa2
f71c677
e16bfa2
f71c677
67553c2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
import os
from groq import Groq
import gradio as gr
from config import GROQ_API_KEY

# Publish the key from the local config module into the process environment
# before the client is built; Groq() is constructed with no arguments, so it
# presumably reads the key from there (confirm against the SDK).
os.environ.update({"GROQ_API_KEY": GROQ_API_KEY})
client = Groq()

# System message placed at the head of every conversation sent to the model.
system_prompt = dict(
    role="system",
    content="You are a useful assistant. You reply with efficient answers. ",
)

async def chat_groq(message, history):
    """Stream a chat completion for ``message`` given the prior ``history``.

    Args:
        message: Latest user input; converted with ``str()`` before sending.
        history: Iterable of earlier turns, each indexable so that item 0 is
            the user text and item 1 is the assistant text.

    Yields:
        The assistant reply accumulated so far, once per received stream
        chunk (the same text is re-yielded when a chunk carries no content).
    """
    # Local import so this function carries its own dependency.
    import asyncio

    messages = [system_prompt]
    for turn in history:
        messages.append({"role": "user", "content": str(turn[0])})
        messages.append({"role": "assistant", "content": str(turn[1])})
    messages.append({"role": "user", "content": str(message)})

    # `client` is driven through plain (non-awaited) calls, i.e. it blocks
    # while waiting on the network. Calling it directly inside this coroutine
    # would stall the event loop for every other request, so both the initial
    # request and each chunk fetch are pushed to the default thread executor.
    loop = asyncio.get_running_loop()
    stream = await loop.run_in_executor(
        None,
        lambda: client.chat.completions.create(
            model="llama3-70b-8192",
            messages=messages,
            max_tokens=1024,
            temperature=1.3,
            stream=True,
        ),
    )

    chunks = iter(stream)
    # Sentinel returned by next() at exhaustion; StopIteration itself cannot
    # be propagated through an executor future.
    exhausted = object()
    response_content = ''

    while True:
        chunk = await loop.run_in_executor(None, next, chunks, exhausted)
        if chunk is exhausted:
            break
        content = chunk.choices[0].delta.content
        if content:
            response_content += content
        yield response_content

# Build the page: one chat interface backed by chat_groq, with None passed
# for the clear, undo and retry buttons.
with gr.Blocks(theme=gr.themes.Monochrome(), fill_height=True) as demo:
    gr.ChatInterface(
        fn=chat_groq,
        clear_btn=None,
        undo_btn=None,
        retry_btn=None,
    )

# Set up the request queue, then start serving the app.
demo.queue()
demo.launch()