Arxiv-CS-RAG

Running

App Files Community

bishmoy committed on Mar 5

Commit

5628a76

•

1 Parent(s): 2e45345

code clean up

Browse files

Files changed (1) hide show

app.py +11 -4

app.py CHANGED Viewed

@@ -24,11 +24,13 @@ try:
   gr.Info("Setting up retriever, please wait...")
   rag_initial_output = RAG.search("what is Mistral?", k = 1)
   gr.Info("Retriever working successfully!")
 except:
   gr.Warning("Retriever not working!")
 mark_text = '# 🔍 Search Results\n'
 header_text = "# ArXivCS RAG \n"
 try:
   with open("README.md", "r") as f:
       mdfile = f.read()
@@ -37,6 +39,7 @@ try:
   date = match.group().split(': ')[1]
   formatted_date = datetime.strptime(date, '%Y-%m-%d').strftime('%d %b %Y')
   header_text += f'Index Last Updated: {formatted_date}\n'
 except:
   pass
@@ -45,6 +48,7 @@ if show_examples:
       sample_outputs = json.load(f)
     output_placeholder = sample_outputs['output_placeholder']
     md_text_initial = sample_outputs['search_placeholder']
 else:
     output_placeholder = None
     md_text_initial = ''
@@ -61,6 +65,7 @@ def get_prompt_text(question, context, formatted = True, llm_model_picked = 'mis
     if formatted:
       sys_instruction = f"Context:\n {context} \n Given the following scientific paper abstracts, take a deep breath and lets think step by step to answer the question. Cite the titles of your sources when answering, do not cite links or dates."
       message = f"Question: {question}"
       if 'mistralai' in llm_model_picked:
           return f"<s>" + f"[INST] {sys_instruction}" +  f" {message}[/INST]"
@@ -74,12 +79,14 @@ def get_references(question, retriever, k = retrieve_results):
     return rag_out
 def get_rag(message):
-        return get_references(message, RAG)
 with gr.Blocks(theme = gr.themes.Soft()) as demo:
     header = gr.Markdown(header_text)
     with gr.Group():
       msg = gr.Textbox(label = 'Search', placeholder = 'What is Mistral?')
       with gr.Accordion("Advanced Settings", open=False):
         with gr.Row(equal_height = True):
           llm_model = gr.Dropdown(choices = llm_models_to_choose, value = 'mistralai/Mistral-7B-Instruct-v0.2', label = 'LLM Model')
@@ -97,7 +104,6 @@ with gr.Blocks(theme = gr.themes.Soft()) as demo:
           rag_answer = rag_out[i]
           title = rag_answer['document_metadata']['title'].replace('\n','')
-          #score = round(rag_answer['score'], 2)
           date = rag_answer['document_metadata']['_time']
           paper_title = f'''### {date} | [{title}](https://arxiv.org/abs/{rag_answer['document_id']}) | [⬇️](https://arxiv.org/pdf/{rag_answer['document_id']})\n'''
           paper_abs = rag_answer['content']
@@ -111,6 +117,7 @@ with gr.Blocks(theme = gr.themes.Soft()) as demo:
     def ask_llm(prompt, llm_model_picked = 'mistralai/Mistral-7B-Instruct-v0.2', stream_outputs = False):
        model_disabled_text = "LLM Model is disabled"
        output = ""
        if llm_model_picked == 'None':
           if stream_outputs:
               for out in model_disabled_text:
@@ -123,10 +130,10 @@ with gr.Blocks(theme = gr.themes.Soft()) as demo:
        client = InferenceClient(llm_model_picked)
        try:
            stream = client.text_generation(prompt, **generate_kwargs,  stream=stream_outputs, details=False, return_full_text=False)
        except:
            gr.Warning("LLM Inference rate limit reached, try again later!")
            return ""
-       #output = output.lstrip(' \n') if output.lstrip().startswith('\n') else output
        if stream_outputs:
            for response in stream:
@@ -139,4 +146,4 @@ with gr.Blocks(theme = gr.themes.Soft()) as demo:
     msg.submit(update_with_rag_md, [msg, llm_results, llm_model], [gr_md, input]).success(ask_llm, [input, llm_model, stream_results], output_text)
-demo.queue(default_concurrency_limit=10).launch()

   gr.Info("Setting up retriever, please wait...")
   rag_initial_output = RAG.search("what is Mistral?", k = 1)
   gr.Info("Retriever working successfully!")
 except:
   gr.Warning("Retriever not working!")
 mark_text = '# 🔍 Search Results\n'
 header_text = "# ArXivCS RAG \n"
 try:
   with open("README.md", "r") as f:
       mdfile = f.read()
   date = match.group().split(': ')[1]
   formatted_date = datetime.strptime(date, '%Y-%m-%d').strftime('%d %b %Y')
   header_text += f'Index Last Updated: {formatted_date}\n'
 except:
   pass
       sample_outputs = json.load(f)
     output_placeholder = sample_outputs['output_placeholder']
     md_text_initial = sample_outputs['search_placeholder']
 else:
     output_placeholder = None
     md_text_initial = ''
     if formatted:
       sys_instruction = f"Context:\n {context} \n Given the following scientific paper abstracts, take a deep breath and lets think step by step to answer the question. Cite the titles of your sources when answering, do not cite links or dates."
       message = f"Question: {question}"
       if 'mistralai' in llm_model_picked:
           return f"<s>" + f"[INST] {sys_instruction}" +  f" {message}[/INST]"
     return rag_out
 def get_rag(message):
+    return get_references(message, RAG)
 with gr.Blocks(theme = gr.themes.Soft()) as demo:
     header = gr.Markdown(header_text)
     with gr.Group():
       msg = gr.Textbox(label = 'Search', placeholder = 'What is Mistral?')
       with gr.Accordion("Advanced Settings", open=False):
         with gr.Row(equal_height = True):
           llm_model = gr.Dropdown(choices = llm_models_to_choose, value = 'mistralai/Mistral-7B-Instruct-v0.2', label = 'LLM Model')
           rag_answer = rag_out[i]
           title = rag_answer['document_metadata']['title'].replace('\n','')
           date = rag_answer['document_metadata']['_time']
           paper_title = f'''### {date} | [{title}](https://arxiv.org/abs/{rag_answer['document_id']}) | [⬇️](https://arxiv.org/pdf/{rag_answer['document_id']})\n'''
           paper_abs = rag_answer['content']
     def ask_llm(prompt, llm_model_picked = 'mistralai/Mistral-7B-Instruct-v0.2', stream_outputs = False):
        model_disabled_text = "LLM Model is disabled"
        output = ""
        if llm_model_picked == 'None':
           if stream_outputs:
               for out in model_disabled_text:
        client = InferenceClient(llm_model_picked)
        try:
            stream = client.text_generation(prompt, **generate_kwargs,  stream=stream_outputs, details=False, return_full_text=False)
        except:
            gr.Warning("LLM Inference rate limit reached, try again later!")
            return ""
        if stream_outputs:
            for response in stream:
     msg.submit(update_with_rag_md, [msg, llm_results, llm_model], [gr_md, input]).success(ask_llm, [input, llm_model, stream_results], output_text)
+demo.queue().launch()