LATS_powered_by_SambaNova

Runtime error

App Files Files Community

Etash Guha committed on Jul 9

Commit

d4db51c

•

1 Parent(s): 7936375

changed key

Browse files

Files changed (1) hide show

generators/model.py +20 -13

generators/model.py CHANGED Viewed

@@ -125,13 +125,7 @@ class Samba():
         resps = []
         for i in range(num_comps):
-            url = "kjddazcq2e2wzvzv.snova.ai"
-            api_key = "bGlnaHRuaW5nOlUyM3pMcFlHY3dmVzRzUGFy"
-            url = f'https://{url}/api/v1/chat/completion'
-            headers = {
-                'Authorization': f'Basic {api_key}',
-                'Content-Type': 'application/json',
-            }
             payload = {
                 "inputs": [dataclasses.asdict(message) for message in messages],
                 "params": {
@@ -142,22 +136,26 @@ class Samba():
                 },
                 "model": "llama3-8b"
             }
-            post_response = requests.post(url, headers=headers, data=payload)
             response_text = ""
             for line in post_response.iter_lines():
                 if line.startswith(b"data: "):
                     data_str = line.decode('utf-8')[6:]
                     try:
                         line_json = json.loads(data_str)
-                        content = line_json['0'].get("stream_token", "")
                         if content:
                             response_text += content
                     except json.JSONDecodeError as e:
                         pass
-            breakpoint()
             resps.append(response_text)
         if num_comps == 1:
             return resps[0]
@@ -339,3 +337,12 @@ If a question does not make any sense, or is not factually coherent, explain why
     def extract_output(self, output: str) -> str:
         """Return the reply portion of a raw model output string.

         Keeps the text after the last "[/INST]" marker and before the first
         "</s>" marker that follows it, with surrounding whitespace stripped.
         When a marker is absent, the corresponding split leaves the text
         unchanged on that side.
         """
         out = output.split("[/INST]")[-1].split("</s>")[0].strip()
         return out

         resps = []
         for i in range(num_comps):
             payload = {
                 "inputs": [dataclasses.asdict(message) for message in messages],
                 "params": {
                 },
                 "model": "llama3-8b"
             }
+            url = "kjddazcq2e2wzvzv.snova.ai"
+            key = "bGlnaHRuaW5nOlUyM3pMcFlHY3dmVzRzUGFy"
+            headers = {
+                "Authorization": f"Basic {key}",
+                "Content-Type": "application/json"
+            }
+            post_response = requests.post(f'https://{url}/api/v1/chat/completion', json=payload, headers=headers, stream=True)
             response_text = ""
             for line in post_response.iter_lines():
                 if line.startswith(b"data: "):
                     data_str = line.decode('utf-8')[6:]
                     try:
                         line_json = json.loads(data_str)
+                        content = line_json.get('completion')
                         if content:
                             response_text += content
                     except json.JSONDecodeError as e:
                         pass
+                    except:
+                        pass
             resps.append(response_text)
         if num_comps == 1:
             return resps[0]
     def extract_output(self, output: str) -> str:
         """Return the reply portion of a raw model output string.

         Keeps the text after the last "[/INST]" marker and before the first
         "</s>" marker that follows it, with surrounding whitespace stripped.
         When a marker is absent, the corresponding split leaves the text
         unchanged on that side.
         """
         out = output.split("[/INST]")[-1].split("</s>")[0].strip()
         return out
+if __name__ == "__main__":
+    model = Samba()
+    messages = [Message(
+                    role="user", # TODO: check this
+                    content="say something",
+                )]
+    out= model.generate_chat(messages)
+    breakpoint()