Spaces:

Perunio
/

galis

Running

App Files Community

Perunio committed on Aug 23

Commit

8400bf2

1 Parent(s): 73669ab

improve llm prompt

Browse files

Files changed (2) hide show

galis_app.py +2 -0
llm/related_work_generator.py +45 -18

galis_app.py CHANGED Viewed

@@ -114,6 +114,8 @@ def app():
                 with related_work_placeholder.container():
                     with st.spinner("Generating related work section..."):
                         related_work = generate_related_work(
                             st.session_state.references
                         )
                         st.session_state.related_work = related_work

                 with related_work_placeholder.container():
                     with st.spinner("Generating related work section..."):
                         related_work = generate_related_work(
+                            st.session_state.abstract_title,
+                            st.session_state.abstract_text,
                             st.session_state.references
                         )
                         st.session_state.related_work = related_work

llm/related_work_generator.py CHANGED Viewed

@@ -16,12 +16,18 @@ logger = structlog.get_logger()
 load_dotenv()
 PROMPT_TEXT = """
-You are a research assistant AI specializing in academic writing. Your task is to generate a "Related Work" section
-for a research paper. You will be given a list of citations.
 Your goal is to synthesize the provided citations into a coherent and well-structured "Related Work" section that
 contextualizes the user's project within the existing academic literature.
 **PROVIDED CITATIONS:**
 {citations}
@@ -49,8 +55,12 @@ work introduces...", or "Building upon the foundation laid by [Author, Year], we
 transitions between paragraphs and ideas to create a coherent narrative that logically leads the reader to understand
 the novelty and importance of the user's project.
-6.  **Output Format:** Generate only the text for the "Related Work" section. Do not include headers like
-"INSTRUCTIONS" or "PROVIDED CITATIONS" in the final output. The entire response should be the section text itself.
 """
@@ -67,12 +77,12 @@ def create_related_work_pipeline():
     """Creates a ready-to-use pipeline for generating the Related Work section."""
     llm = ChatGoogleGenerativeAI(
-        model="gemini-1.5-flash",
         temperature=0.3
     )
     prompt = PromptTemplate(
-        input_variables=["citations"],
         template=PROMPT_TEXT
     )
@@ -83,24 +93,42 @@ def create_related_work_pipeline():
     return chain
-def generate_related_work(citations_text: str) -> str:
     """
-    Main function - pass citations, get Related Work
     Args:
         citations_text: Text with citations (can be a list or a string)
     Returns:
         The generated Related Work section
     """
     pipeline = create_related_work_pipeline()
-    result = pipeline.invoke({"citations": citations_text})
     return result
 if __name__ == "__main__":
-    my_citations = """
 Top 5 Citation Predictions:
   - Title: 'deterministic construction of rip matrices in compressed sensing from constant weight codes'
   - Title: 'mizar items exploring fine grained dependencies in the mizar mathematical library'
@@ -109,16 +137,15 @@ Top 5 Citation Predictions:
   - Title: 'anonymization with worst case distribution based background knowledge'
     """
-    print("Generuję Related Work...")
-    print("=" * 50)
     try:
-        related_work = generate_related_work(my_citations)
         print(related_work)
     except Exception as e:
-        print(f"Błąd: {e}")
-        print("\n=== INSTRUKCJE KONFIGURACJI ===")
-        print("1. Stwórz plik .env w tym samym folderze co skrypt")
-        print("2. Dodaj do niego linię: GOOGLE_API_KEY=twój_klucz")
-        print("3. Uzyskaj klucz na: https://makersuite.google.com/app/apikey")
         check_api_key()

 load_dotenv()
 PROMPT_TEXT = """
+You are a research assistant specializing in academic writing. Your task is to generate a "Related Work" section
+for a research paper. You will be given the paper's title, abstract, and a list of citations.
 Your goal is to synthesize the provided citations into a coherent and well-structured "Related Work" section that
 contextualizes the user's project within the existing academic literature.
+**PROVIDED TITLE**
+{title}
+**PROVIDED ABSTRACT**
+{abstract}
 **PROVIDED CITATIONS:**
 {citations}
 transitions between paragraphs and ideas to create a coherent narrative that logically leads the reader to understand
 the novelty and importance of the user's project.
+6.  **Domain Sensitivity:** Adapt the discussion to the specific research domain indicated by the title and abstract.
+Use appropriate terminology and focus on concepts, methods, and challenges relevant to that particular field of study.
+7.  **Output Format:** Generate only the text for the "Related Work" section. Do not include headers like
+"INSTRUCTIONS," "PAPER TITLE," or "PROVIDED CITATIONS" in the final output. The entire response should be the
+section text itself, ready to be inserted into an academic paper.
 """
     """Creates a ready-to-use pipeline for generating the Related Work section."""
     llm = ChatGoogleGenerativeAI(
+        model="gemini-2.0-flash-exp",
         temperature=0.3
     )
     prompt = PromptTemplate(
+        input_variables=["title", "abstract", "citations"],
         template=PROMPT_TEXT
     )
     return chain
+def generate_related_work(title:str, abstract:str, citations_text: str) -> str:
     """
+    Main function - pass title, abstract, and citations, get Related Work
     Args:
+        title: The paper's title
+        abstract: The paper's abstract
         citations_text: Text with citations (can be a list or a string)
     Returns:
         The generated Related Work section
     """
     pipeline = create_related_work_pipeline()
+    result = pipeline.invoke({
+        "title": title,
+        "abstract": abstract,
+        "citations": citations_text
+    })
     return result
 if __name__ == "__main__":
+    title = "Privacy-Preserving Data Analysis in Distributed Systems: A Comprehensive Framework"
+    abstract = """
+    This paper presents a novel framework for privacy-preserving data analysis in distributed computing environments.
+    We propose a hybrid approach that combines differential privacy mechanisms with secure multi-party computation
+    to enable statistical analysis while maintaining strong privacy guarantees. Our framework addresses key challenges
+    in distributed data processing, including data heterogeneity, communication overhead, and scalability constraints.
+    Through extensive experiments on real-world datasets, we demonstrate that our approach achieves comparable accuracy
+    to centralized methods while providing provable privacy protection. The proposed system shows significant improvements
+    in computational efficiency compared to existing privacy-preserving solutions, making it practical for large-scale
+    deployment in enterprise environments.
+    """
+    citations = """
 Top 5 Citation Predictions:
   - Title: 'deterministic construction of rip matrices in compressed sensing from constant weight codes'
   - Title: 'mizar items exploring fine grained dependencies in the mizar mathematical library'
   - Title: 'anonymization with worst case distribution based background knowledge'
     """
+    print("Generating Related Work...")
+    print("-" * 50)
     try:
+        related_work = generate_related_work(title, abstract, citations)
         print(related_work)
     except Exception as e:
+        print(f"Error: {e}")
+        print("1. Create a .env file in the same folder as the script")
+        print("2. Add the line: GOOGLE_API_KEY=your_key")
+        print("3. Get the key at: https://makersuite.google.com/app/apikey")
         check_api_key()