Commit 292517b

committed

Refactor, please mypy

1 parent 33b5295 commit 292517b (Copy full SHA for 292517b)

File tree

19 files changed

+283

-93

lines changed

.vscode
- settings.json
requirements-dev.txt
src/backend
tests
- conftest.py
- snapshots/test_api_routes
  - test_advanced_chat_flow
    - advanced_chat_flow_response.json
  - test_advanced_chat_streaming_flow
    - advanced_chat_streaming_flow_response.jsonlines
  - test_simple_chat_flow_message_history
    - simple_chat_flow_message_history_response.json
  - test_simple_chat_flow
    - simple_chat_flow_response.json
  - test_simple_chat_streaming_flow
    - simple_chat_streaming_flow_response.jsonlines
- test_api_routes.py
- test_postgres_searcher.py

19 files changed

+283

-93

lines changed

`‎.vscode/settings.json`

Lines changed: 2 additions & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -36,5 +36,6 @@`
`36`	`36`	`"htmlcov": true,`
`37`	`37`	`".mypy_cache": true,`
`38`	`38`	`".coverage": true`
`39`		`- }`
	`39`	`+ },`
	`40`	`+ "python.REPL.enableREPLSmartSend": false`
`40`	`41`	`}`

`‎requirements-dev.txt`

Lines changed: 1 addition & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -14,3 +14,4 @@ pytest-snapshot`
`14`	`14`	`locust`
`15`	`15`	`psycopg2`
`16`	`16`	`dotenv-azd`
	`17`	`+freezegun`

`‎src/backend/fastapi_app/__init__.py`

Lines changed: 1 addition & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -38,7 +38,7 @@ async def lifespan(app: fastapi.FastAPI) -> AsyncIterator[State]:`
`38`	`38`	`if (`
`39`	`39`	`os.getenv("OPENAI_CHAT_HOST") == "azure"`
`40`	`40`	`or os.getenv("OPENAI_EMBED_HOST") == "azure"`
`41`		`- or os.getenv("POSTGRES_HOST").endswith(".database.azure.com")`
	`41`	`+ or os.getenv("POSTGRES_HOST", "").endswith(".database.azure.com")`
`42`	`42`	`):`
`43`	`43`	`azure_credential = await get_azure_credential()`
`44`	`44`	`engine = await create_postgres_engine_from_env(azure_credential)`

`‎src/backend/fastapi_app/api_models.py`

Lines changed: 33 additions & 3 deletions

Original file line number	Diff line number	Diff line change
`@@ -1,8 +1,9 @@`
`1`	`1`	`from enum import Enum`
`2`		`-from typing import Any, Optional`
	`2`	`+from typing import Any, Optional, Union`
`3`	`3`
`4`	`4`	`from openai.types.chat import ChatCompletionMessageParam`
`5`		`-from pydantic import BaseModel`
	`5`	`+from pydantic import BaseModel, Field`
	`6`	`+from pydantic_ai.messages import ModelRequest, ModelResponse`
`6`	`7`
`7`	`8`
`8`	`9`	`class AIChatRoles(str, Enum):`
`@@ -95,4 +96,33 @@ class ChatParams(ChatRequestOverrides):`
`95`	`96`	`enable_text_search: bool`
`96`	`97`	`enable_vector_search: bool`
`97`	`98`	`original_user_query: str`
`98`		`- past_messages: list[ChatCompletionMessageParam]`
	`99`	`+ past_messages: list[Union[ModelRequest, ModelResponse]]`
	`100`	`+`
	`101`	`+`
	`102`	`+class Filter(BaseModel):`
	`103`	`+ column: str`
	`104`	`+ comparison_operator: str`
	`105`	`+ value: Any`
	`106`	`+`
	`107`	`+`
	`108`	`+class PriceFilter(Filter):`
	`109`	`+ column: str = Field(default="price", description="The column to filter on (always 'price' for this filter)")`
	`110`	`+ comparison_operator: str = Field(description="The operator for price comparison ('>', '<', '>=', '<=', '=')")`
	`111`	`+ value: float = Field(description="The price value to compare against (e.g., 30.00)")`
	`112`	`+`
	`113`	`+`
	`114`	`+class BrandFilter(Filter):`
	`115`	`+ column: str = Field(default="brand", description="The column to filter on (always 'brand' for this filter)")`
	`116`	`+ comparison_operator: str = Field(description="The operator for brand comparison ('=' or '!=')")`
	`117`	`+ value: str = Field(description="The brand name to compare against (e.g., 'AirStrider')")`
	`118`	`+`
	`119`	`+`
	`120`	`+class SearchResults(BaseModel):`
	`121`	`+ query: str`
	`122`	`+ """The original search query"""`
	`123`	`+`
	`124`	`+ items: list[ItemPublic]`
	`125`	`+ """List of items that match the search query and filters"""`
	`126`	`+`
	`127`	`+ filters: list[Filter]`
	`128`	`+ """List of filters applied to the search results"""`

`‎src/backend/fastapi_app/openai_clients.py`

Lines changed: 8 additions & 4 deletions

Original file line number	Diff line number	Diff line change
`@@ -9,7 +9,7 @@`
`9`	`9`
`10`	`10`
`11`	`11`	`async def create_openai_chat_client(`
`12`		`- azure_credential: Union[azure.identity.AzureDeveloperCliCredential, azure.identity.ManagedIdentityCredential],`
	`12`	`+ azure_credential: Union[azure.identity.AzureDeveloperCliCredential, azure.identity.ManagedIdentityCredential, None],`
`13`	`13`	`) -> Union[openai.AsyncAzureOpenAI, openai.AsyncOpenAI]:`
`14`	`14`	`openai_chat_client: Union[openai.AsyncAzureOpenAI, openai.AsyncOpenAI]`
`15`	`15`	`OPENAI_CHAT_HOST = os.getenv("OPENAI_CHAT_HOST")`
`@@ -29,7 +29,7 @@ async def create_openai_chat_client(`
`29`	`29`	`azure_deployment=azure_deployment,`
`30`	`30`	`api_key=api_key,`
`31`	`31`	`)`
`32`		`- else:`
	`32`	`+ elif azure_credential:`
`33`	`33`	`logger.info(`
`34`	`34`	`"Setting up Azure OpenAI client for chat completions using Azure Identity, endpoint %s, deployment %s",`
`35`	`35`	`azure_endpoint,`
`@@ -44,6 +44,8 @@ async def create_openai_chat_client(`
`44`	`44`	`azure_deployment=azure_deployment,`
`45`	`45`	`azure_ad_token_provider=token_provider,`
`46`	`46`	`)`
	`47`	`+ else:`
	`48`	`+ raise ValueError("Azure OpenAI client requires either an API key or Azure Identity credential.")`
`47`	`49`	`elif OPENAI_CHAT_HOST == "ollama":`
`48`	`50`	`logger.info("Setting up OpenAI client for chat completions using Ollama")`
`49`	`51`	`openai_chat_client = openai.AsyncOpenAI(`
`@@ -67,7 +69,7 @@ async def create_openai_chat_client(`
`67`	`69`
`68`	`70`
`69`	`71`	`async def create_openai_embed_client(`
`70`		`- azure_credential: Union[azure.identity.AzureDeveloperCliCredential, azure.identity.ManagedIdentityCredential],`
	`72`	`+ azure_credential: Union[azure.identity.AzureDeveloperCliCredential, azure.identity.ManagedIdentityCredential, None],`
`71`	`73`	`) -> Union[openai.AsyncAzureOpenAI, openai.AsyncOpenAI]:`
`72`	`74`	`openai_embed_client: Union[openai.AsyncAzureOpenAI, openai.AsyncOpenAI]`
`73`	`75`	`OPENAI_EMBED_HOST = os.getenv("OPENAI_EMBED_HOST")`
`@@ -87,7 +89,7 @@ async def create_openai_embed_client(`
`87`	`89`	`azure_deployment=azure_deployment,`
`88`	`90`	`api_key=api_key,`
`89`	`91`	`)`
`90`		`- else:`
	`92`	`+ elif azure_credential:`
`91`	`93`	`logger.info(`
`92`	`94`	`"Setting up Azure OpenAI client for embeddings using Azure Identity, endpoint %s, deployment %s",`
`93`	`95`	`azure_endpoint,`
`@@ -102,6 +104,8 @@ async def create_openai_embed_client(`
`102`	`104`	`azure_deployment=azure_deployment,`
`103`	`105`	`azure_ad_token_provider=token_provider,`
`104`	`106`	`)`
	`107`	`+ else:`
	`108`	`+ raise ValueError("Azure OpenAI client requires either an API key or Azure Identity credential.")`
`105`	`109`	`elif OPENAI_EMBED_HOST == "ollama":`
`106`	`110`	`logger.info("Setting up OpenAI client for embeddings using Ollama")`
`107`	`111`	`openai_embed_client = openai.AsyncOpenAI(`

`‎src/backend/fastapi_app/postgres_searcher.py`

Lines changed: 10 additions & 6 deletions

Original file line number	Diff line number	Diff line change
`@@ -5,6 +5,7 @@`
`5`	`5`	`from sqlalchemy import Float, Integer, column, select, text`
`6`	`6`	`from sqlalchemy.ext.asyncio import AsyncSession`
`7`	`7`
	`8`	`+from fastapi_app.api_models import Filter`
`8`	`9`	`from fastapi_app.embeddings import compute_text_embedding`
`9`	`10`	`from fastapi_app.postgres_models import Item`
`10`	`11`
`@@ -26,21 +27,24 @@ def __init__(`
`26`	`27`	`self.embed_dimensions = embed_dimensions`
`27`	`28`	`self.embedding_column = embedding_column`
`28`	`29`
`29`		`- def build_filter_clause(self, filters) -> tuple[str, str]:`
	`30`	`+ def build_filter_clause(self, filters: Optional[list[Filter]]) -> tuple[str, str]:`
`30`	`31`	`if filters is None:`
`31`	`32`	`return "", ""`
`32`	`33`	`filter_clauses = []`
`33`	`34`	`for filter in filters:`
`34`		`- if isinstance(filter["value"], str):`
`35`		`- filter["value"] = f"'{filter['value']}'"`
`36`		`- filter_clauses.append(f"{filter['column']} {filter['comparison_operator']} {filter['value']}")`
	`35`	`+ filter_value = f"'{filter.value}'" if isinstance(filter.value, str) else filter.value`
	`36`	`+ filter_clauses.append(f"{filter.column} {filter.comparison_operator} {filter_value}")`
`37`	`37`	`filter_clause = " AND ".join(filter_clauses)`
`38`	`38`	`if len(filter_clause) > 0:`
`39`	`39`	`return f"WHERE {filter_clause}", f"AND {filter_clause}"`
`40`	`40`	`return "", ""`
`41`	`41`
`42`	`42`	`async def search(`
`43`		`- self, query_text: Optional[str], query_vector: list[float], top: int = 5, filters: Optional[list[dict]] = None`
	`43`	`+ self,`
	`44`	`+ query_text: Optional[str],`
	`45`	`+ query_vector: list[float],`
	`46`	`+ top: int = 5,`
	`47`	`+ filters: Optional[list[Filter]] = None,`
`44`	`48`	`):`
`45`	`49`	`filter_clause_where, filter_clause_and = self.build_filter_clause(filters)`
`46`	`50`	`table_name = Item.__tablename__`
`@@ -106,7 +110,7 @@ async def search_and_embed(`
`106`	`110`	`top: int = 5,`
`107`	`111`	`enable_vector_search: bool = False,`
`108`	`112`	`enable_text_search: bool = False,`
`109`		`- filters: Optional[list[dict]] = None,`
	`113`	`+ filters: Optional[list[Filter]] = None,`
`110`	`114`	`) -> list[Item]:`
`111`	`115`	`"""`
`112`	`116`	`Search rows by query text. Optionally converts the query text to a vector if enable_vector_search is True.`

`‎src/backend/fastapi_app/rag_advanced.py`

Lines changed: 17 additions & 42 deletions

Original file line number	Diff line number	Diff line change
`@@ -1,5 +1,5 @@`
`1`	`1`	`from collections.abc import AsyncGenerator`
`2`		`-from typing import Optional, TypedDict, Union`
	`2`	`+from typing import Optional, Union`
`3`	`3`
`4`	`4`	`from openai import AsyncAzureOpenAI, AsyncOpenAI`
`5`	`5`	`from openai.types.chat import ChatCompletionMessageParam`
`@@ -11,51 +11,22 @@`
`11`	`11`
`12`	`12`	`from fastapi_app.api_models import (`
`13`	`13`	`AIChatRoles,`
	`14`	`+ BrandFilter,`
`14`	`15`	`ChatRequestOverrides,`
	`16`	`+ Filter,`
`15`	`17`	`ItemPublic,`
`16`	`18`	`Message,`
	`19`	`+ PriceFilter,`
`17`	`20`	`RAGContext,`
`18`	`21`	`RetrievalResponse,`
`19`	`22`	`RetrievalResponseDelta,`
	`23`	`+ SearchResults,`
`20`	`24`	`ThoughtStep,`
`21`	`25`	`)`
`22`	`26`	`from fastapi_app.postgres_searcher import PostgresSearcher`
`23`	`27`	`from fastapi_app.rag_base import ChatParams, RAGChatBase`
`24`	`28`
`25`	`29`
`26`		`-class PriceFilter(TypedDict):`
`27`		`- column: str = "price"`
`28`		`- """The column to filter on (always 'price' for this filter)"""`
`29`		`-`
`30`		`- comparison_operator: str`
`31`		`- """The operator for price comparison ('>', '<', '>=', '<=', '=')"""`
`32`		`-`
`33`		`- value: float`
`34`		`- """ The price value to compare against (e.g., 30.00) """`
`35`		`-`
`36`		`-`
`37`		`-class BrandFilter(TypedDict):`
`38`		`- column: str = "brand"`
`39`		`- """The column to filter on (always 'brand' for this filter)"""`
`40`		`-`
`41`		`- comparison_operator: str`
`42`		`- """The operator for brand comparison ('=' or '!=')"""`
`43`		`-`
`44`		`- value: str`
`45`		`- """The brand name to compare against (e.g., 'AirStrider')"""`
`46`		`-`
`47`		`-`
`48`		`-class SearchResults(TypedDict):`
`49`		`- query: str`
`50`		`- """The original search query"""`
`51`		`-`
`52`		`- items: list[ItemPublic]`
`53`		`- """List of items that match the search query and filters"""`
`54`		`-`
`55`		`- filters: list[Union[PriceFilter, BrandFilter]]`
`56`		`- """List of filters applied to the search results"""`
`57`		`-`
`58`		`-`
`59`	`30`	`class AdvancedRAGChat(RAGChatBase):`
`60`	`31`	`query_prompt_template = open(RAGChatBase.prompts_dir / "query.txt").read()`
`61`	`32`	`query_fewshots = open(RAGChatBase.prompts_dir / "query_fewshots.json").read()`
`@@ -79,9 +50,13 @@ def __init__(`
`79`	`50`	`chat_model if chat_deployment is None else chat_deployment,`
`80`	`51`	`provider=OpenAIProvider(openai_client=openai_chat_client),`
`81`	`52`	`)`
`82`		`- self.search_agent = Agent(`
	`53`	`+ self.search_agent = Agent[ChatParams, SearchResults](`
`83`	`54`	`pydantic_chat_model,`
`84`		`- model_settings=ModelSettings(temperature=0.0, max_tokens=500, seed=self.chat_params.seed),`
	`55`	`+ model_settings=ModelSettings(`
	`56`	`+ temperature=0.0,`
	`57`	`+ max_tokens=500,`
	`58`	`+ **({"seed": self.chat_params.seed} if self.chat_params.seed is not None else {}),`
	`59`	`+ ),`
`85`	`60`	`system_prompt=self.query_prompt_template,`
`86`	`61`	`tools=[self.search_database],`
`87`	`62`	`output_type=SearchResults,`
`@@ -92,7 +67,7 @@ def __init__(`
`92`	`67`	`model_settings=ModelSettings(`
`93`	`68`	`temperature=self.chat_params.temperature,`
`94`	`69`	`max_tokens=self.chat_params.response_token_limit,`
`95`		`- seed=self.chat_params.seed,`
	`70`	`+ **({"seed": self.chat_params.seed} if self.chat_params.seed is not None else {}),`
`96`	`71`	`),`
`97`	`72`	`)`
`98`	`73`
`@@ -115,7 +90,7 @@ async def search_database(`
`115`	`90`	`List of formatted items that match the search query and filters`
`116`	`91`	`"""`
`117`	`92`	`# Only send non-None filters`
`118`		`- filters = []`
	`93`	`+ filters: list[Filter] = []`
`119`	`94`	`if price_filter:`
`120`	`95`	`filters.append(price_filter)`
`121`	`96`	`if brand_filter:`
`@@ -134,12 +109,12 @@ async def search_database(`
`134`	`109`	`async def prepare_context(self) -> tuple[list[ItemPublic], list[ThoughtStep]]:`
`135`	`110`	`few_shots = ModelMessagesTypeAdapter.validate_json(self.query_fewshots)`
`136`	`111`	`user_query = f"Find search results for user query: {self.chat_params.original_user_query}"`
`137`		`- results = await self.search_agent.run(`
	`112`	`+ results = await self.search_agent.run(  # type: ignore[call-overload]`
`138`	`113`	`user_query,`
`139`	`114`	`message_history=few_shots + self.chat_params.past_messages,`
`140`	`115`	`deps=self.chat_params,`
`141`	`116`	`)`
`142`		`- items = results.output["items"]`
	`117`	`+ items = results.output.items`
`143`	`118`	`thoughts = [`
`144`	`119`	`ThoughtStep(`
`145`	`120`	`title="Prompt to generate search arguments",`
`@@ -148,12 +123,12 @@ async def prepare_context(self) -> tuple[list[ItemPublic], list[ThoughtStep]]:`
`148`	`123`	`),`
`149`	`124`	`ThoughtStep(`
`150`	`125`	`title="Search using generated search arguments",`
`151`		`- description=results.output["query"],`
	`126`	`+ description=results.output.query,`
`152`	`127`	`props={`
`153`	`128`	`"top": self.chat_params.top,`
`154`	`129`	`"vector_search": self.chat_params.enable_vector_search,`
`155`	`130`	`"text_search": self.chat_params.enable_text_search,`
`156`		`- "filters": results.output["filters"],`
	`131`	`+ "filters": results.output.filters,`
`157`	`132`	`},`
`158`	`133`	`),`
`159`	`134`	`ThoughtStep(`

`‎src/backend/fastapi_app/rag_base.py`

Lines changed: 18 additions & 11 deletions

Original file line number	Diff line number	Diff line change
`@@ -1,8 +1,10 @@`
`1`	`1`	`import pathlib`
`2`	`2`	`from abc import ABC, abstractmethod`
`3`	`3`	`from collections.abc import AsyncGenerator`
	`4`	`+from typing import Union`
`4`	`5`
`5`	`6`	`from openai.types.chat import ChatCompletionMessageParam`
	`7`	`+from pydantic_ai.messages import ModelRequest, ModelResponse, TextPart, UserPromptPart`
`6`	`8`
`7`	`9`	`from fastapi_app.api_models import (`
`8`	`10`	`ChatParams,`
`@@ -12,7 +14,6 @@`
`12`	`14`	`RetrievalResponseDelta,`
`13`	`15`	`ThoughtStep,`
`14`	`16`	`)`
`15`		`-from fastapi_app.postgres_models import Item`
`16`	`17`
`17`	`18`
`18`	`19`	`class RAGChatBase(ABC):`
`@@ -31,7 +32,19 @@ def get_chat_params(`
`31`	`32`	`original_user_query = messages[-1]["content"]`
`32`	`33`	`if not isinstance(original_user_query, str):`
`33`	`34`	`raise ValueError("The most recent message content must be a string.")`
`34`		`- past_messages = messages[:-1]`
	`35`	`+`
	`36`	`+ # Convert to PydanticAI format:`
	`37`	`+ past_messages: list[Union[ModelRequest, ModelResponse]] = []`
	`38`	`+ for message in messages[:-1]:`
	`39`	`+ content = message["content"]`
	`40`	`+ if not isinstance(content, str):`
	`41`	`+ raise ValueError("All messages must have string content.")`
	`42`	`+ if message["role"] == "user":`
	`43`	`+ past_messages.append(ModelRequest(parts=[UserPromptPart(content=content)]))`
	`44`	`+ elif message["role"] == "assistant":`
	`45`	`+ past_messages.append(ModelResponse(parts=[TextPart(content=content)]))`
	`46`	`+ else:`
	`47`	`+ raise ValueError(f"Cannot convert message: {message}")`
`35`	`48`
`36`	`49`	`return ChatParams(`
`37`	`50`	`top=overrides.top,`
`@@ -48,9 +61,7 @@ def get_chat_params(`
`48`	`61`	`)`
`49`	`62`
`50`	`63`	`@abstractmethod`
`51`		`- async def prepare_context(`
`52`		`- self, chat_params: ChatParams`
`53`		`- ) -> tuple[list[ChatCompletionMessageParam], list[Item], list[ThoughtStep]]:`
	`64`	`+ async def prepare_context(self) -> tuple[list[ItemPublic], list[ThoughtStep]]:`
`54`	`65`	`raise NotImplementedError`
`55`	`66`
`56`	`67`	`def prepare_rag_request(self, user_query, items: list[ItemPublic]) -> str:`
`@@ -60,19 +71,15 @@ def prepare_rag_request(self, user_query, items: list[ItemPublic]) -> str:`
`60`	`71`	`@abstractmethod`
`61`	`72`	`async def answer(`
`62`	`73`	`self,`
`63`		`- chat_params: ChatParams,`
`64`		`- contextual_messages: list[ChatCompletionMessageParam],`
`65`		`- results: list[Item],`
	`74`	`+ items: list[ItemPublic],`
`66`	`75`	`earlier_thoughts: list[ThoughtStep],`
`67`	`76`	`) -> RetrievalResponse:`
`68`	`77`	`raise NotImplementedError`
`69`	`78`
`70`	`79`	`@abstractmethod`
`71`	`80`	`async def answer_stream(`
`72`	`81`	`self,`
`73`		`- chat_params: ChatParams,`
`74`		`- contextual_messages: list[ChatCompletionMessageParam],`
`75`		`- results: list[Item],`
	`82`	`+ items: list[ItemPublic],`
`76`	`83`	`earlier_thoughts: list[ThoughtStep],`
`77`	`84`	`) -> AsyncGenerator[RetrievalResponseDelta, None]:`
`78`	`85`	`raise NotImplementedError`

`‎src/backend/fastapi_app/rag_simple.py`

Lines changed: 1 addition & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -48,7 +48,7 @@ def __init__(`
`48`	`48`	`model_settings=ModelSettings(`
`49`	`49`	`temperature=self.chat_params.temperature,`
`50`	`50`	`max_tokens=self.chat_params.response_token_limit,`
`51`		`- seed=self.chat_params.seed,`
	`51`	`+ **({"seed": self.chat_params.seed} if self.chat_params.seed is not None else {}),`
`52`	`52`	`),`
`53`	`53`	`)`
`54`	`54`

`‎src/backend/pyproject.toml`

Lines changed: 1 addition & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -19,7 +19,7 @@ dependencies = [`
`19`	`19`	`"opentelemetry-instrumentation-sqlalchemy",`
`20`	`20`	`"opentelemetry-instrumentation-aiohttp-client",`
`21`	`21`	`"opentelemetry-instrumentation-openai",`
`22`		`- "pydantic-ai"`
	`22`	`+ "pydantic-ai-slim[openai]"`
`23`	`23`	`]`
`24`	`24`
`25`	`25`	`[build-system]`

0 commit comments

Comments

(0)

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commit 292517b

File tree

19 files changed

19 files changed

`‎.vscode/settings.json`

`‎requirements-dev.txt`

`‎src/backend/fastapi_app/__init__.py`

`‎src/backend/fastapi_app/api_models.py`

`‎src/backend/fastapi_app/openai_clients.py`

`‎src/backend/fastapi_app/postgres_searcher.py`

`‎src/backend/fastapi_app/rag_advanced.py`

`‎src/backend/fastapi_app/rag_base.py`

`‎src/backend/fastapi_app/rag_simple.py`

`‎src/backend/pyproject.toml`

0 commit comments