Spaces:

dolphinium
/

pc-ai-data-analyst-dup

Running

App Files Files Community

dolphinium committed 30 days ago

Commit

c13e67b

1 Parent(s): a811652

Run analysis only when the external API returns the 'search_list' intent

Browse files

Files changed (3) hide show

data_processing.py +13 -7
extract_results.py +11 -4
ui.py +8 -4

data_processing.py CHANGED Viewed

@@ -1,4 +1,3 @@
 """
 Core data processing and analysis logic for the PharmaCircle AI Data Analyst.
@@ -44,11 +43,18 @@ def llm_generate_analysis_plan_with_history(llm_model, natural_language_query, c
     and dynamic field suggestions from an external API.
     """
     search_fields, search_name, field_mappings = [], "", {}
     try:
-        search_fields, search_name, field_mappings = get_search_list_params(natural_language_query)
-        print(f"API returned core: '{search_name}' with {len(search_fields)} fields and {len(field_mappings)} mappings.")
     except Exception as e:
         print(f"Warning: Could not retrieve dynamic search fields. Proceeding without them. Error: {e}")
     core_name = search_name if search_name else 'news'
@@ -70,15 +76,15 @@ def llm_generate_analysis_plan_with_history(llm_model, natural_language_query, c
         response = llm_model.generate_content(prompt)
         cleaned_text = re.sub(r'```json\s*|\s*```', '', response.text, flags=re.MULTILINE | re.DOTALL).strip()
         plan = json.loads(cleaned_text)
-        return plan, mapped_search_fields, core_name
     except json.JSONDecodeError as e:
         raw_response_text = response.text if 'response' in locals() else 'N/A'
         print(f"Error decoding JSON from LLM response: {e}\nRaw Response:\n{raw_response_text}")
-        return None, mapped_search_fields, core_name
     except Exception as e:
         raw_response_text = response.text if 'response' in locals() else 'N/A'
         print(f"Error in llm_generate_analysis_plan_with_history: {e}\nRaw Response:\n{raw_response_text}")
-        return None, mapped_search_fields, core_name
 def execute_quantitative_query(solr_client, plan):
     """Executes the facet query to get aggregate data."""
@@ -194,4 +200,4 @@ def execute_viz_code_and_get_path(viz_code, facet_data):
         print(f"Error: {e}")
         print(f"--- Code---\n{viz_code}")
         print("-----------------------------------------")
-        return None

 """
 Core data processing and analysis logic for the PharmaCircle AI Data Analyst.
     and dynamic field suggestions from an external API.
     """
     search_fields, search_name, field_mappings = [], "", {}
+    intent = None
     try:
+        intent, search_fields, search_name, field_mappings = get_search_list_params(natural_language_query)
+        print(f"API returned intent: '{intent}', core: '{search_name}' with {len(search_fields)} fields and {len(field_mappings)} mappings.")
+        if intent != 'search_list':
+            print(f"API returned intent '{intent}' which is not 'search_list'. Aborting analysis.")
+            return None, None, None, intent
     except Exception as e:
         print(f"Warning: Could not retrieve dynamic search fields. Proceeding without them. Error: {e}")
+        return None, [], None, 'api_error'
     core_name = search_name if search_name else 'news'
         response = llm_model.generate_content(prompt)
         cleaned_text = re.sub(r'```json\s*|\s*```', '', response.text, flags=re.MULTILINE | re.DOTALL).strip()
         plan = json.loads(cleaned_text)
+        return plan, mapped_search_fields, core_name, intent
     except json.JSONDecodeError as e:
         raw_response_text = response.text if 'response' in locals() else 'N/A'
         print(f"Error decoding JSON from LLM response: {e}\nRaw Response:\n{raw_response_text}")
+        return None, mapped_search_fields, core_name, intent
     except Exception as e:
         raw_response_text = response.text if 'response' in locals() else 'N/A'
         print(f"Error in llm_generate_analysis_plan_with_history: {e}\nRaw Response:\n{raw_response_text}")
+        return None, mapped_search_fields, core_name, intent
 def execute_quantitative_query(solr_client, plan):
     """Executes the facet query to get aggregate data."""
         print(f"Error: {e}")
         print(f"--- Code---\n{viz_code}")
         print("-----------------------------------------")
+        return None

extract_results.py CHANGED Viewed

@@ -19,10 +19,10 @@ def _parse_mappings(mapping_str: str) -> dict:
 def get_search_list_params(query, k=20):
     """
-    Connects to the external API, parses the stream, and returns the core name,
     search fields, and field mappings.
-    Returns tuple: (search_fields, search_name, field_mappings)
     """
     url = "https://aitest.ebalina.com/stream"
@@ -39,6 +39,7 @@ def get_search_list_params(query, k=20):
         search_fields = []
         search_name = ""
         field_mappings_str = ""
         for line in response.iter_lines():
             if line and line.startswith(b'data: '):
@@ -50,6 +51,12 @@ def get_search_list_params(query, k=20):
                     data = json.loads(line_str)
                     log_title = data.get('log_title')
                     if log_title == 'Search List Result':
                         content = data.get('content', '')
                         if content:
@@ -68,8 +75,8 @@ def get_search_list_params(query, k=20):
         field_mappings = _parse_mappings(field_mappings_str)
-        return search_fields, search_name, field_mappings
     except requests.exceptions.RequestException as e:
         print(f"Error connecting to the external API: {e}")
-        return [], "", {}

 def get_search_list_params(query, k=20):
     """
+    Connects to the external API, parses the stream, and returns the intent, core name,
     search fields, and field mappings.
+    Returns tuple: (intent, search_fields, search_name, field_mappings)
     """
     url = "https://aitest.ebalina.com/stream"
         search_fields = []
         search_name = ""
         field_mappings_str = ""
+        intent = None
         for line in response.iter_lines():
             if line and line.startswith(b'data: '):
                     data = json.loads(line_str)
                     log_title = data.get('log_title')
+                    if log_title == 'NER Succeded':
+                        content = data.get('content', {})
+                        if 'intent' in content and content['intent']:
+                            intent = content['intent'][0]
+                            print(f"DEBUG: Intent detected: {intent}")
                     if log_title == 'Search List Result':
                         content = data.get('content', '')
                         if content:
         field_mappings = _parse_mappings(field_mappings_str)
+        return intent, search_fields, search_name, field_mappings
     except requests.exceptions.RequestException as e:
         print(f"Error connecting to the external API: {e}")
+        return None, [], "", {}

ui.py CHANGED Viewed

@@ -96,8 +96,8 @@ def create_ui(llm_model, solr_client):
             history.append((user_input, f"Analyzing: '{query_context}'\n\n*Generating analysis plan...*"))
             yield (history, state, None, None, None, None, None, None, None, None)
-            # Generate plan and get search field suggestions. This now returns the core name.
-            analysis_plan, mapped_search_fields, core_name = llm_generate_analysis_plan_with_history(llm_model, query_context, history)
             # Update and display search field suggestions in its own accordion
             if mapped_search_fields:
@@ -107,7 +107,11 @@ def create_ui(llm_model, solr_client):
                 suggestions_display_update = gr.update(value="No suggestions were returned from the external API.", visible=True)
             if not analysis_plan:
-                history.append((None, "I'm sorry, I couldn't generate a valid analysis plan. Please try rephrasing."))
                 yield (history, state, None, None, None, None, None, None, None, suggestions_display_update)
                 return
@@ -225,4 +229,4 @@ def create_ui(llm_model, solr_client):
             queue=False
         )
-    return demo

             history.append((user_input, f"Analyzing: '{query_context}'\n\n*Generating analysis plan...*"))
             yield (history, state, None, None, None, None, None, None, None, None)
+            # Generate plan, get search field suggestions, and intent.
+            analysis_plan, mapped_search_fields, core_name, intent = llm_generate_analysis_plan_with_history(llm_model, query_context, history)
             # Update and display search field suggestions in its own accordion
             if mapped_search_fields:
                 suggestions_display_update = gr.update(value="No suggestions were returned from the external API.", visible=True)
             if not analysis_plan:
+                if intent and intent != 'search_list':
+                    message = f"I am sorry, I can only perform analysis for 'search_list' type queries. Your query was identified as a '{intent}', which is not supported."
+                else:
+                    message = "I'm sorry, I couldn't generate a valid analysis plan. Please try rephrasing your question."
+                history.append((None, message))
                 yield (history, state, None, None, None, None, None, None, None, suggestions_display_update)
                 return
             queue=False
         )
+    return demo