Canner · paopa · Mar 13, 2025 · Mar 7, 2025 · Mar 7, 2025 · Mar 10, 2025
diff --git a/wren-ai-service/src/config.py b/wren-ai-service/src/config.py
@@ -36,6 +36,7 @@ class Settings(BaseSettings):
     # generation config
     allow_intent_classification: bool = Field(default=True)
     allow_sql_generation_reasoning: bool = Field(default=True)
+    max_histories: int = Field(default=10)
 
     # engine config
     engine_timeout: float = Field(default=30.0)

diff --git a/wren-ai-service/src/globals.py b/wren-ai-service/src/globals.py
@@ -117,6 +117,7 @@ def create_service_container(
             },
             allow_intent_classification=settings.allow_intent_classification,
             allow_sql_generation_reasoning=settings.allow_sql_generation_reasoning,
+            max_histories=settings.max_histories,
             **query_cache,
         ),
         chart_service=services.ChartService(

diff --git a/wren-ai-service/src/pipelines/generation/data_assistance.py b/wren-ai-service/src/pipelines/generation/data_assistance.py
@@ -53,15 +53,11 @@ def prompt(
     db_schemas: list[str],
     language: str,
     prompt_builder: PromptBuilder,
-    history: Optional[AskHistory] = None,
+    histories: Optional[list[AskHistory]] = None,
 ) -> dict:
-    if history:
-        previous_query_summaries = [
-            step.summary for step in history.steps if step.summary
-        ]
-    else:
-        previous_query_summaries = []
-
+    previous_query_summaries = (
+        [history.question for history in histories] if histories else []
+    )
     query = "\n".join(previous_query_summaries) + "\n" + query
 
     return prompt_builder.run(
@@ -106,9 +102,9 @@ def __init__(
 
     def _streaming_callback(self, chunk, query_id):
         if query_id not in self._user_queues:
-            self._user_queues[
-                query_id
-            ] = asyncio.Queue()  # Create a new queue for the user if it doesn't exist
+            self._user_queues[query_id] = (
+                asyncio.Queue()
+            )  # Create a new queue for the user if it doesn't exist
         # Put the chunk content into the user's queue
         asyncio.create_task(self._user_queues[query_id].put(chunk.content))
         if chunk.meta.get("finish_reason"):
@@ -119,9 +115,9 @@ async def _get_streaming_results(query_id):
             return await self._user_queues[query_id].get()
 
         if query_id not in self._user_queues:
-            self._user_queues[
-                query_id
-            ] = asyncio.Queue()  # Ensure the user's queue exists
+            self._user_queues[query_id] = (
+                asyncio.Queue()
+            )  # Ensure the user's queue exists
         while True:
             try:
                 # Wait for an item from the user's queue
@@ -146,7 +142,7 @@ async def run(
         db_schemas: list[str],
         language: str,
         query_id: Optional[str] = None,
-        history: Optional[AskHistory] = None,
+        histories: Optional[list[AskHistory]] = None,
     ):
         logger.info("Data Assistance pipeline is running...")
         return await self._pipe.execute(
@@ -156,7 +152,7 @@ async def run(
                 "db_schemas": db_schemas,
                 "language": language,
                 "query_id": query_id or "",
-                "history": history,
+                "histories": histories,
                 **self._components,
             },
         )

diff --git a/wren-ai-service/src/pipelines/generation/followup_sql_generation.py b/wren-ai-service/src/pipelines/generation/followup_sql_generation.py
@@ -48,11 +48,11 @@
 {% endif %}
 
 ### CONTEXT ###
-Previous SQL Summary:
-{% for summary in previous_query_summaries %}
-    {{ summary }}
+User's query history:
+{% for history in histories %}
+    {{ history.question }}
+    {{ history.sql }}
 {% endfor %}
-Previous SQL Query: {{ history.sql }}
 
 ### QUESTION ###
 User's Follow-up Question: {{ query }}
@@ -71,20 +71,20 @@ def prompt(
     query: str,
     documents: List[str],
     sql_generation_reasoning: str,
-    history: AskHistory,
+    histories: list[AskHistory],
     configuration: Configuration,
     prompt_builder: PromptBuilder,
     sql_samples: List[Dict] | None = None,
     has_calculated_field: bool = False,
     has_metric: bool = False,
 ) -> dict:
-    previous_query_summaries = [step.summary for step in history.steps if step.summary]
+    previous_query_summaries = [history.question for history in histories]
 
     return prompt_builder.run(
         query=query,
         documents=documents,
         sql_generation_reasoning=sql_generation_reasoning,
-        history=history,
+        histories=histories,
         previous_query_summaries=previous_query_summaries,
         instructions=construct_instructions(
             configuration,
@@ -152,7 +152,7 @@ async def run(
         query: str,
         contexts: List[str],
         sql_generation_reasoning: str,
-        history: AskHistory,
+        histories: list[AskHistory],
         configuration: Configuration = Configuration(),
         sql_samples: List[Dict] | None = None,
         project_id: str | None = None,
@@ -166,7 +166,7 @@ async def run(
                 "query": query,
                 "documents": contexts,
                 "sql_generation_reasoning": sql_generation_reasoning,
-                "history": history,
+                "histories": histories,
                 "project_id": project_id,
                 "configuration": configuration,
                 "sql_samples": sql_samples,

diff --git a/wren-ai-service/src/pipelines/generation/intent_classification.py b/wren-ai-service/src/pipelines/generation/intent_classification.py
@@ -103,7 +103,11 @@
 
 ### INPUT ###
 {% if query_history %}
-User's previous SQLs: {{ query_history }}
+User's query history:
+{% for history in query_history %}
+{{ history.question }}
+{{ history.sql }}
+{% endfor %}
 {% endif %}
 User's question: {{query}}
 Current Time: {{ current_time }}
@@ -116,10 +120,10 @@
 ## Start of Pipeline
 @observe(capture_input=False, capture_output=False)
 async def embedding(
-    query: str, embedder: Any, history: Optional[AskHistory] = None
+    query: str, embedder: Any, histories: Optional[list[AskHistory]] = None
 ) -> dict:
     previous_query_summaries = (
-        [step.summary for step in history.steps if step.summary] if history else []
+        [history.question for history in histories] if histories else []
     )
 
     query = "\n".join(previous_query_summaries) + "\n" + query
@@ -222,14 +226,14 @@ def prompt(
     query: str,
     construct_db_schemas: list[str],
     prompt_builder: PromptBuilder,
-    history: Optional[AskHistory] = None,
+    histories: Optional[list[AskHistory]] = None,
     configuration: Configuration | None = None,
 ) -> dict:
     return prompt_builder.run(
         query=query,
         language=configuration.language,
         db_schemas=construct_db_schemas,
-        query_history=history.sql if history else [],
+        query_history=histories,
         current_time=configuration.show_current_time(),
     )
 
@@ -316,7 +320,7 @@ async def run(
         self,
         query: str,
         id: Optional[str] = None,
-        history: Optional[AskHistory] = None,
+        histories: Optional[list[AskHistory]] = None,
         configuration: Configuration = Configuration(),
     ):
         logger.info("Intent Classification pipeline is running...")
@@ -325,7 +329,7 @@ async def run(
             inputs={
                 "query": query,
                 "id": id or "",
-                "history": history,
+                "histories": histories,
                 "configuration": configuration,
                 **self._components,
             },

diff --git a/wren-ai-service/src/pipelines/generation/sql_expansion.py b/wren-ai-service/src/pipelines/generation/sql_expansion.py
@@ -149,6 +149,6 @@ async def run(
         "sql_expansion",
         query="query",
         contexts=[],
-        history=AskHistory(sql="SELECT * FROM table", summary="Summary", steps=[]),
+        history=AskHistory(sql="SELECT * FROM table", question="user question"),
         configuration=Configuration(),
     )
diff --git a/wren-ai-service/src/pipelines/retrieval/retrieval.py b/wren-ai-service/src/pipelines/retrieval/retrieval.py
@@ -116,12 +116,12 @@ def _build_view_ddl(content: dict) -> str:
 ## Start of Pipeline
 @observe(capture_input=False, capture_output=False)
 async def embedding(
-    query: str, embedder: Any, history: Optional[AskHistory] = None
+    query: str, embedder: Any, histories: Optional[list[AskHistory]] = None
 ) -> dict:
     if query:
-        if history:
+        if histories:
             previous_query_summaries = [
-                step.summary for step in history.steps if step.summary
+                history.question for history in histories
             ]
         else:
             previous_query_summaries = []
@@ -292,7 +292,7 @@ def prompt(
     construct_db_schemas: list[dict],
     prompt_builder: PromptBuilder,
     check_using_db_schemas_without_pruning: dict,
-    history: Optional[AskHistory] = None,
+    histories: Optional[list[AskHistory]] = None,
 ) -> dict:
     if not check_using_db_schemas_without_pruning["db_schemas"]:
         logger.info(
@@ -303,12 +303,9 @@ def prompt(
             for construct_db_schema in construct_db_schemas
         ]
 
-        if history:
-            previous_query_summaries = [
-                step.summary for step in history.steps if step.summary
-            ]
-        else:
-            previous_query_summaries = []
+        previous_query_summaries = (
+            [history.question for history in histories] if histories else []
+        )
 
         query = "\n".join(previous_query_summaries) + "\n" + query
         return prompt_builder.run(question=query, db_schemas=db_schemas)
@@ -482,7 +479,7 @@ async def run(
         query: str = "",
         tables: Optional[list[str]] = None,
         id: Optional[str] = None,
-        history: Optional[AskHistory] = None,
+        histories: Optional[list[AskHistory]] = None,
     ):
         logger.info("Ask Retrieval pipeline is running...")
         return await self._pipe.execute(
@@ -491,7 +488,7 @@ async def run(
                 "query": query,
                 "tables": tables,
                 "id": id or "",
-                "history": history,
+                "histories": histories,
                 **self._components,
                 **self._configs,
             },

diff --git a/wren-ai-service/src/web/v1/routers/ask.py b/wren-ai-service/src/web/v1/routers/ask.py
@@ -152,10 +152,10 @@ async def ask_feedback(
 ) -> AskFeedbackResponse:
     query_id = str(uuid.uuid4())
     ask_feedback_request.query_id = query_id
-    service_container.ask_service._ask_feedback_results[
-        query_id
-    ] = AskFeedbackResultResponse(
-        status="searching",
+    service_container.ask_service._ask_feedback_results[query_id] = (
+        AskFeedbackResultResponse(
+            status="searching",
+        )
     )
 
     background_tasks.add_task(

diff --git a/wren-ai-service/src/web/v1/routers/sql_expansions.py b/wren-ai-service/src/web/v1/routers/sql_expansions.py
@@ -88,13 +88,13 @@
 
 @router.post("/sql-expansions")
 async def sql_expansion(
-    sql_expansion_request: SqlExpansionRequest,
+    request: SqlExpansionRequest,
     background_tasks: BackgroundTasks,
     service_container: ServiceContainer = Depends(get_service_container),
     service_metadata: ServiceMetadata = Depends(get_service_metadata),
 ) -> SqlExpansionResponse:
     query_id = str(uuid.uuid4())
-    sql_expansion_request.query_id = query_id
+    request.query_id = query_id
     service_container.sql_expansion_service._sql_expansion_results[
         query_id
     ] = SqlExpansionResultResponse(
@@ -103,7 +103,7 @@ async def sql_expansion(
 
     background_tasks.add_task(
         service_container.sql_expansion_service.sql_expansion,
-        sql_expansion_request,
+        request,
         service_metadata=asdict(service_metadata),
     )
     return SqlExpansionResponse(query_id=query_id)

diff --git a/wren-ai-service/src/web/v1/services/ask.py b/wren-ai-service/src/web/v1/services/ask.py
@@ -9,14 +9,13 @@
 from src.core.pipeline import BasicPipeline
 from src.utils import trace_metadata
 from src.web.v1.services import Configuration, SSEEvent
-from src.web.v1.services.ask_details import SQLBreakdown
 
 logger = logging.getLogger("wren-ai-service")
 
 
 class AskHistory(BaseModel):
     sql: str
-    steps: List[SQLBreakdown]
+    question: str
 
 
 # POST /v1/asks
@@ -29,7 +28,7 @@ class AskRequest(BaseModel):
     # so we need to support as a choice, and will remove it in the future
     mdl_hash: Optional[str] = Field(validation_alias=AliasChoices("mdl_hash", "id"))
     thread_id: Optional[str] = None
-    history: Optional[AskHistory] = None
+    histories: Optional[list[AskHistory]] = Field(default_factory=list)
     configurations: Optional[Configuration] = Configuration()
 
     @property
@@ -166,6 +165,7 @@ def __init__(
         pipelines: Dict[str, BasicPipeline],
         allow_intent_classification: bool = True,
         allow_sql_generation_reasoning: bool = True,
+        max_histories: int = 10,
         maxsize: int = 1_000_000,
         ttl: int = 120,
     ):
@@ -178,6 +178,7 @@ def __init__(
         )
         self._allow_sql_generation_reasoning = allow_sql_generation_reasoning
         self._allow_intent_classification = allow_intent_classification
+        self._max_histories = max_histories
 
     def _is_stopped(self, query_id: str, container: dict):
         if (
@@ -205,6 +206,7 @@ async def ask(
         }
 
         query_id = ask_request.query_id
+        histories = ask_request.histories[: self._max_histories]
         rephrased_question = None
         intent_reasoning = None
         sql_generation_reasoning = None
@@ -250,7 +252,7 @@ async def ask(
                     intent_classification_result = (
                         await self._pipelines["intent_classification"].run(
                             query=user_query,
-                            history=ask_request.history,
+                            histories=histories,
                             id=ask_request.project_id,
                             configuration=ask_request.configurations,
                         )
@@ -278,7 +280,7 @@ async def ask(
                         asyncio.create_task(
                             self._pipelines["data_assistance"].run(
                                 query=user_query,
-                                history=ask_request.history,
+                                histories=histories,
                                 db_schemas=intent_classification_result.get(
                                     "db_schemas"
                                 ),
@@ -315,7 +317,7 @@ async def ask(
 
                 retrieval_result = await self._pipelines["retrieval"].run(
                     query=user_query,
-                    history=ask_request.history,
+                    histories=histories,
                     id=ask_request.project_id,
                 )
                 _retrieval_result = retrieval_result.get(
@@ -403,14 +405,14 @@ async def ask(
                 )
                 has_metric = (_retrieval_result.get("has_metric", False),)
 
-                if ask_request.history:
+                if histories:
                     text_to_sql_generation_results = await self._pipelines[
                         "followup_sql_generation"
                     ].run(
                         query=user_query,
                         contexts=table_ddls,
                         sql_generation_reasoning=sql_generation_reasoning,
-                        history=ask_request.history,
+                        histories=histories,
                         project_id=ask_request.project_id,
                         configuration=ask_request.configurations,
                         sql_samples=sql_samples,