Spaces:
Sleeping
Sleeping
srijaydeshpande
committed on
Commit
•
31fecb2
1
Parent(s):
178388d
Update app.py
Browse files
app.py
CHANGED
@@ -101,7 +101,7 @@ def deidentify_doc(pdftext, maxtokens, temperature, top_probability):
|
|
101 |
# n_ctx=8192,
|
102 |
# )
|
103 |
|
104 |
-
chat_template = MessagesFormatterType.LLAMA_3
|
105 |
|
106 |
llm = Llama(
|
107 |
model_path="models/Meta-Llama-3-70B-Instruct-Q3_K_M.gguf",
|
@@ -111,51 +111,51 @@ def deidentify_doc(pdftext, maxtokens, temperature, top_probability):
|
|
111 |
n_ctx=8192,
|
112 |
)
|
113 |
|
114 |
-
provider = LlamaCppPythonProvider(llm)
|
115 |
|
116 |
-
agent = LlamaCppAgent(
|
117 |
-
|
118 |
-
|
119 |
-
|
120 |
-
|
121 |
-
)
|
122 |
|
123 |
-
settings = provider.get_provider_default_settings()
|
124 |
-
settings.temperature = 0.7
|
125 |
-
settings.top_k = 40
|
126 |
-
settings.top_p = 0.95
|
127 |
-
settings.max_tokens = 2048
|
128 |
-
settings.repeat_penalty = 1.1
|
129 |
-
settings.stream = True
|
130 |
-
|
131 |
-
messages = BasicChatHistory()
|
132 |
-
|
133 |
-
stream = agent.get_chat_response(
|
134 |
-
|
135 |
-
|
136 |
-
|
137 |
-
|
138 |
-
|
139 |
-
)
|
140 |
|
141 |
-
outputs = ""
|
142 |
-
for output in stream:
|
143 |
-
|
144 |
|
145 |
-
return outputs
|
146 |
|
147 |
-
|
148 |
-
|
149 |
-
|
150 |
-
|
151 |
-
|
152 |
-
|
153 |
-
|
154 |
-
|
155 |
-
|
156 |
-
|
157 |
-
|
158 |
-
|
159 |
|
160 |
# prompt = "Perform the following actions on given text: 1. Replace any person age with term [redacted] 2. DO NOT REPLACE ANY MEDICAL MEASUREMENTS 3. Replace only the CALENDAR DATES of format 'day/month/year' with term [redacted]"
|
161 |
# output = model.create_chat_completion(
|
@@ -175,7 +175,7 @@ def deidentify_doc(pdftext, maxtokens, temperature, top_probability):
|
|
175 |
# print(output)
|
176 |
# print('-------------------------------------------------------')
|
177 |
|
178 |
-
|
179 |
|
180 |
def pdf_to_text(files, maxtokens=2048, temperature=0, top_probability=0.95):
|
181 |
print('Control 0-----------------------------------')
|
@@ -204,7 +204,7 @@ output_text = gr.Textbox()
|
|
204 |
output_path_component = gr.File(label="Select Output Path")
|
205 |
iface = gr.Interface(
|
206 |
fn=pdf_to_text,
|
207 |
-
inputs='file',
|
208 |
# inputs=["textbox", input_folder_text, "textbox", max_tokens, temp_slider, prob_slider],
|
209 |
outputs=output_text,
|
210 |
title='COBIx Endoscopy Report De-Identification',
|
|
|
101 |
# n_ctx=8192,
|
102 |
# )
|
103 |
|
104 |
+
# chat_template = MessagesFormatterType.LLAMA_3
|
105 |
|
106 |
llm = Llama(
|
107 |
model_path="models/Meta-Llama-3-70B-Instruct-Q3_K_M.gguf",
|
|
|
111 |
n_ctx=8192,
|
112 |
)
|
113 |
|
114 |
+
# provider = LlamaCppPythonProvider(llm)
|
115 |
|
116 |
+
# agent = LlamaCppAgent(
|
117 |
+
# provider,
|
118 |
+
# system_prompt="You are a helpful assistant.",
|
119 |
+
# predefined_messages_formatter_type=chat_template,
|
120 |
+
# debug_output=True
|
121 |
+
# )
|
122 |
|
123 |
+
# settings = provider.get_provider_default_settings()
|
124 |
+
# settings.temperature = 0.7
|
125 |
+
# settings.top_k = 40
|
126 |
+
# settings.top_p = 0.95
|
127 |
+
# settings.max_tokens = 2048
|
128 |
+
# settings.repeat_penalty = 1.1
|
129 |
+
# settings.stream = True
|
130 |
+
|
131 |
+
# messages = BasicChatHistory()
|
132 |
+
|
133 |
+
# stream = agent.get_chat_response(
|
134 |
+
# prompt + ' : ' + pdftext,
|
135 |
+
# llm_sampling_settings=settings,
|
136 |
+
# chat_history=messages,
|
137 |
+
# returns_streaming_generator=True,
|
138 |
+
# print_output=False
|
139 |
+
# )
|
140 |
|
141 |
+
# outputs = ""
|
142 |
+
# for output in stream:
|
143 |
+
# outputs += output
|
144 |
|
145 |
+
# return outputs
|
146 |
|
147 |
+
output = model.create_chat_completion(
|
148 |
+
messages=[
|
149 |
+
{"role": "assistant", "content": prompt},
|
150 |
+
{
|
151 |
+
"role": "user",
|
152 |
+
"content": pdftext
|
153 |
+
}
|
154 |
+
],
|
155 |
+
max_tokens=maxtokens,
|
156 |
+
temperature=temperature
|
157 |
+
)
|
158 |
+
output = output['choices'][0]['message']['content']
|
159 |
|
160 |
# prompt = "Perform the following actions on given text: 1. Replace any person age with term [redacted] 2. DO NOT REPLACE ANY MEDICAL MEASUREMENTS 3. Replace only the CALENDAR DATES of format 'day/month/year' with term [redacted]"
|
161 |
# output = model.create_chat_completion(
|
|
|
175 |
# print(output)
|
176 |
# print('-------------------------------------------------------')
|
177 |
|
178 |
+
return output
|
179 |
|
180 |
def pdf_to_text(files, maxtokens=2048, temperature=0, top_probability=0.95):
|
181 |
print('Control 0-----------------------------------')
|
|
|
204 |
output_path_component = gr.File(label="Select Output Path")
|
205 |
iface = gr.Interface(
|
206 |
fn=pdf_to_text,
|
207 |
+
inputs=['file', max_tokens, temp_slider, prob_slider],
|
208 |
# inputs=["textbox", input_folder_text, "textbox", max_tokens, temp_slider, prob_slider],
|
209 |
outputs=output_text,
|
210 |
title='COBIx Endoscopy Report De-Identification',
|