Spaces:

Ritvik19
/

Zeta

Sleeping

App Files Files Community

Ritvik19 committed on Mar 6

Commit

eed34fa

•

1 Parent(s): c323312

synopsis / insight bullets

Browse files

Files changed (4) hide show

app.py +47 -3
autoqa_chains.py +6 -3
insights_bullet_chain.py +17 -0
synopsis_chain.py +29 -0

app.py CHANGED Viewed

@@ -17,6 +17,8 @@ from chat_chains import (
 )
 from autoqa_chains import auto_qa_chain, auto_qa_output_parser
 from chain_of_density import chain_of_density_chain
 from custom_exceptions import InvalidArgumentError, InvalidCommandError
 st.set_page_config(layout="wide")
@@ -34,9 +36,11 @@ Here's a quick guide to getting started with me:
 | `/library` | View an index of processed documents to easily navigate your research. |
 | `/session-expense` | Calculate the cost of our conversation, ensuring transparency in resource usage. |
 | `/export` | Download conversation data for your records or further analysis. |
-| `/auto-insight <document id>` | Automatically generate questions and answers for a document. |
-| `/deep-dive [<list of document ids>] <query>` | Query the AI with a specific document context. |
-| `/condense-summary <document id>` | Generate increasingly concise, entity-dense summaries of a document. |
 <br>
@@ -185,6 +189,44 @@ def chain_of_density_wrapper(inputs):
     return (summary, "identity")
 def auto_qa_chain_wrapper(inputs):
     if inputs == "":
         raise InvalidArgumentError("Please provide a document id")
@@ -256,6 +298,8 @@ if __name__ == "__main__":
         ("/auto-insight", str, auto_qa_chain_wrapper),
         ("/deep-dive", str, query_llm_wrapper),
         ("/condense-summary", str, chain_of_density_wrapper),
     ]
     command_center = CommandCenter(
         default_input_type=str,

 )
 from autoqa_chains import auto_qa_chain, auto_qa_output_parser
 from chain_of_density import chain_of_density_chain
+from insights_bullet_chain import insights_bullet_chain
+from synopsis_chain import synopsis_chain
 from custom_exceptions import InvalidArgumentError, InvalidCommandError
 st.set_page_config(layout="wide")
 | `/library` | View an index of processed documents to easily navigate your research. |
 | `/session-expense` | Calculate the cost of our conversation, ensuring transparency in resource usage. |
 | `/export` | Download conversation data for your records or further analysis. |
+| `/auto-insight <document id>` | Automatically generate questions and answers for the paper. |
+| `/deep-dive [<list of document ids>] <query>` | Query me with a specific context. |
+| `/condense-summary <document id>` | Generate increasingly concise, entity-dense summaries of the paper. |
+| `/insight-bullets <list of document ids>` | Extract and summarize key insights, methods, results, and conclusions. |
+| `/paper-synopsis <document id>` | Generate a synopsis of the paper. |
 <br>
     return (summary, "identity")
+def synopsis_wrapper(inputs):
+    """Handle `/paper-synopsis`: generate a synopsis of one stored document.
+
+    Args:
+        inputs: Document id, used as a key into `st.session_state.documents`.
+
+    Returns:
+        A `(summary, "identity")` tuple, where `summary` is the chain output.
+
+    Raises:
+        InvalidArgumentError: If `inputs` is the empty string.
+    """
+    if inputs == "":
+        raise InvalidArgumentError("Please provide a document id")
+    paper_text = st.session_state.documents[inputs].page_content
+    model = ChatOpenAI(model="gpt-4-turbo-preview", temperature=0)
+    # Token counts and cost are read from the callback once the call has finished.
+    with get_openai_callback() as usage:
+        synopsis = synopsis_chain(model).invoke({"paper": paper_text})
+    response = (synopsis, "identity")
+    # Record the exchange in the chat history under the command that produced it.
+    st.session_state.messages.append(("/paper-synopsis", *response))
+    usage_record = {
+        "prompt tokens": usage.prompt_tokens,
+        "completion tokens": usage.completion_tokens,
+        "cost": usage.total_cost,
+    }
+    st.session_state.costing.append(usage_record)
+    return response
+def insights_bullet_wrapper(inputs):
+    """Handle `/insight-bullets`: extract bullet-point insights from documents.
+
+    Args:
+        inputs: Document ids (the command is registered with input type `list`);
+            each id is used as a key into `st.session_state.documents`.
+
+    Returns:
+        An `(insights, "identity")` tuple, where `insights` is the chain output.
+
+    Raises:
+        InvalidArgumentError: If no document id was supplied.
+    """
+    # `not inputs` rejects an empty list as well as ""; a list never compares
+    # equal to "", so an id-less command would otherwise send an empty paper
+    # to the model.
+    if not inputs:
+        raise InvalidArgumentError("Please provide a document id")
+    # Concatenate the selected documents, separated by a blank line.
+    document = "\n\n".join(
+        st.session_state.documents[doc_id].page_content for doc_id in inputs
+    )
+    llm = ChatOpenAI(model="gpt-4-turbo-preview", temperature=0)
+    # Token counts and cost are read from the callback once the call has finished.
+    with get_openai_callback() as cb:
+        insights = insights_bullet_chain(llm).invoke({"paper": document})
+    st.session_state.messages.append(("/insight-bullets", insights, "identity"))
+    st.session_state.costing.append(
+        {
+            "prompt tokens": cb.prompt_tokens,
+            "completion tokens": cb.completion_tokens,
+            "cost": cb.total_cost,
+        }
+    )
+    return (insights, "identity")
 def auto_qa_chain_wrapper(inputs):
     if inputs == "":
         raise InvalidArgumentError("Please provide a document id")
         ("/auto-insight", str, auto_qa_chain_wrapper),
         ("/deep-dive", str, query_llm_wrapper),
         ("/condense-summary", str, chain_of_density_wrapper),
+        ("/insight-bullets", list, insights_bullet_wrapper),
+        ("/paper-synopsis", str, synopsis_wrapper),
     ]
     command_center = CommandCenter(
         default_input_type=str,

autoqa_chains.py CHANGED Viewed

@@ -14,9 +14,12 @@ class AutoQA(BaseModel):
 qa_prompt_template = """
-Come up with the 10 questions and answers that could be commonly asked by people about the following research paper.
-The question and answers should capture the whole essence of the research paper
-The answers should be a bit detailed and strictly based on the research paper.
 Your response should be recorded in the following json format: {format_instructions}.
 here is the research paper: ####{paper}####

 qa_prompt_template = """
+Generate 10 insightful questions and their corresponding detailed answers about the key aspects of a specific machine learning research paper.
+The focus should be on the paper's objectives, methodology, key findings, and implications for future research or application.
+The answers must be based on the content of the research paper, offering clear and comprehensive insights for readers who may not be experts in the field.
+Ensure that the questions cover a broad range of topics related to the paper, including but not limited to the introduction, literature review, \
+methodology, results, discussion, and conclusions.
+The goal is to capture the essence of the paper in a way that is accessible to a broad audience.
 Your response should be recorded in the following json format: {format_instructions}.
 here is the research paper: ####{paper}####

insights_bullet_chain.py ADDED Viewed

	@@ -0,0 +1,17 @@

+from langchain_core.prompts import PromptTemplate
+from langchain_core.output_parsers import StrOutputParser
+# Prompt text for the insight-bullets chain; `{paper}` is its only placeholder.
+insights_bullet_prompt_template = """
+Draw the key insights about objective, method, results and conclusions from the given excerpt in the form of bullet points. Also mention the figure or tables referred to along-with the corresponding bullet points
+Note: if results and conclusions are not much different, feel free to combine them to avoid duplication of information
+excerpt: {paper}
+"""
+# Parser applied to the model output at the end of the chain.
+insights_bullet_output_parser = StrOutputParser()
+insights_bullet_prompt = PromptTemplate(
+    input_variables=["paper"],
+    template=insights_bullet_prompt_template,
+)
+def insights_bullet_chain(model):
+    """Return the pipeline prompt -> `model` -> string output parser."""
+    return insights_bullet_prompt | model | insights_bullet_output_parser

synopsis_chain.py ADDED Viewed

	@@ -0,0 +1,29 @@

+from langchain_core.prompts import PromptTemplate
+from langchain_core.output_parsers import StrOutputParser
+# Prompt text for the synopsis chain; `{paper}` is its only placeholder.
+synopsis_prompt_template = """
+Research Paper: {paper}
+Could you provide a concise summary of this paper, highlighting the following key points:
+Objective: Begin by briefly describing the primary goal of the research. What problem is the paper trying to solve, or what hypothesis is it testing? Mention the specific domain of machine learning it pertains to (e.g., supervised learning, unsupervised learning, reinforcement learning, deep learning, etc.).
+Background: Provide a concise overview of the context and motivation behind the research. Why is this problem important? What are the key challenges that previous studies have not addressed, which this paper seeks to overcome?
+Methods: Summarize the methodology used in the study. What are the key techniques, algorithms, or models proposed or evaluated? Mention any novel approach or significant modification to existing methods. Include information on the dataset(s) used, if applicable.
+Results: Highlight the main findings of the paper. What were the outcomes of applying the proposed methods? Include key metrics or statistics that demonstrate the effectiveness, efficiency, or advancements over previous approaches.
+Discussion and Implications: Discuss the significance of the results. What do these findings imply for the field of machine learning? How can they be applied in practice, or what future research directions do they suggest?
+Limitations: Briefly note any limitations or caveats of the study. Are there any specific conditions under which the findings may not hold? What aspects of the research could be improved upon?
+Conclusion: Conclude with a summary of the research paper's contributions to the field of machine learning. Reiterate the importance of the problem addressed and the impact of the findings.
+"""
+# Parser applied to the model output at the end of the chain.
+synopsis_output_parser = StrOutputParser()
+synopsis_prompt = PromptTemplate(
+    input_variables=["paper"],
+    template=synopsis_prompt_template,
+)
+def synopsis_chain(model):
+    """Return the pipeline prompt -> `model` -> string output parser."""
+    return synopsis_prompt | model | synopsis_output_parser