diff --git a/servers/fastapi/api/main.py b/servers/fastapi/api/main.py
index 93517b12..80eea709 100644
--- a/servers/fastapi/api/main.py
+++ b/servers/fastapi/api/main.py
@@ -1,10 +1,8 @@
 from fastapi import FastAPI
 from fastapi.middleware.cors import CORSMiddleware
-from fastapi.staticfiles import StaticFiles
 from api.lifespan import app_lifespan
 from api.middlewares import UserConfigEnvUpdateMiddleware
 from api.v1.ppt.router import API_V1_PPT_ROUTER
-from utils.asset_directory_utils import get_exports_directory, get_images_directory, get_uploads_directory
 
 
 app = FastAPI(lifespan=app_lifespan)
@@ -13,25 +11,6 @@ app = FastAPI(lifespan=app_lifespan)
 # Routers
 app.include_router(API_V1_PPT_ROUTER)
 
-# Static files
-app.mount("/static", StaticFiles(directory="static"), name="static")
-app.mount(
-    "/app_data/images",
-    StaticFiles(directory=get_images_directory()),
-    name="app_data/images",
-)
-app.mount(
-    "/app_data/exports",
-    StaticFiles(directory=get_exports_directory()),
-    name="app_data/exports",
-)
-app.mount(
-    "/app_data/uploads",
-    StaticFiles(directory=get_uploads_directory()),
-    name="app_data/uploads",
-)
-
-
 # Middlewares
 origins = ["*"]
 app.add_middleware(
diff --git a/servers/fastapi/api/v1/ppt/endpoints/anthropic.py b/servers/fastapi/api/v1/ppt/endpoints/anthropic.py
index ff41e223..e3e1d569 100644
--- a/servers/fastapi/api/v1/ppt/endpoints/anthropic.py
+++ b/servers/fastapi/api/v1/ppt/endpoints/anthropic.py
@@ -1,20 +1,16 @@
-from typing import Annotated, List, Optional
-import anthropic
+from typing import Annotated, List
 from fastapi import APIRouter, Body, HTTPException
 
-from utils.get_env import get_anthropic_api_key_env
+from utils.available_models import list_available_anthropic_models
 
 ANTHROPIC_ROUTER = APIRouter(prefix="/anthropic", tags=["Anthropic"])
 
 
 @ANTHROPIC_ROUTER.post("/models/available", response_model=List[str])
 async def get_available_models(
-    api_key: Annotated[Optional[str], Body(embed=True)] = None,
+    api_key: Annotated[str, Body(embed=True)],
 ):
-    anthropic_api_key = api_key or get_anthropic_api_key_env()
-    if not anthropic_api_key:
-        raise HTTPException(status_code=400, detail="Anthropic API key is required")
-
-    client = anthropic.Anthropic(api_key=anthropic_api_key)
-    models = client.models.list(limit=20)
-    return [model.id for model in models]
+    try:
+        return await list_available_anthropic_models(api_key)
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
diff --git a/servers/fastapi/api/v1/ppt/endpoints/custom_llm.py b/servers/fastapi/api/v1/ppt/endpoints/custom_llm.py
deleted file mode 100644
index 146ef3b2..00000000
--- a/servers/fastapi/api/v1/ppt/endpoints/custom_llm.py
+++ /dev/null
@@ -1,18 +0,0 @@
-from typing import Annotated, List, Optional
-from fastapi import APIRouter, Body, HTTPException
-
-from utils.custom_llm_provider import list_available_custom_models
-
-CUSTOM_LLM_ROUTER = APIRouter(prefix="/custom_llm", tags=["Custom LLM"])
-
-
-@CUSTOM_LLM_ROUTER.post("/models/available", response_model=List[str])
-async def get_available_models(
-    url: Annotated[Optional[str], Body()] = None,
-    api_key: Annotated[Optional[str], Body()] = None,
-):
-    try:
-        return await list_available_custom_models(url, api_key)
-    except Exception as e:
-        print(e)
-        raise HTTPException(status_code=500, detail=str(e))
diff --git a/servers/fastapi/api/v1/ppt/endpoints/google.py b/servers/fastapi/api/v1/ppt/endpoints/google.py
new file mode 100644
index 00000000..4c83627f
--- /dev/null
+++ b/servers/fastapi/api/v1/ppt/endpoints/google.py
@@ -0,0 +1,14 @@
+from typing import Annotated, List
+from fastapi import APIRouter, Body, HTTPException
+
+from utils.available_models import list_available_google_models
+
+GOOGLE_ROUTER = APIRouter(prefix="/google", tags=["Google"])
+
+
+@GOOGLE_ROUTER.post("/models/available", response_model=List[str])
+async def get_available_models(api_key: Annotated[str, Body(embed=True)]):
+    try:
+        return await list_available_google_models(api_key)
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
diff --git a/servers/fastapi/api/v1/ppt/endpoints/openai.py b/servers/fastapi/api/v1/ppt/endpoints/openai.py
new file mode 100644
index 00000000..8e2f00e6
--- /dev/null
+++ b/servers/fastapi/api/v1/ppt/endpoints/openai.py
@@ -0,0 +1,17 @@
+from typing import Annotated, List
+from fastapi import APIRouter, Body, HTTPException
+
+from utils.available_models import list_available_openai_compatible_models
+
+OPENAI_ROUTER = APIRouter(prefix="/openai", tags=["OpenAI"])
+
+
+@OPENAI_ROUTER.post("/models/available", response_model=List[str])
+async def get_available_models(
+    url: Annotated[str, Body()],
+    api_key: Annotated[str, Body()],
+):
+    try:
+        return await list_available_openai_compatible_models(url, api_key)
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
diff --git a/servers/fastapi/api/v1/ppt/endpoints/presentation.py b/servers/fastapi/api/v1/ppt/endpoints/presentation.py
index 31207b95..b8eaf018 100644
--- a/servers/fastapi/api/v1/ppt/endpoints/presentation.py
+++ b/servers/fastapi/api/v1/ppt/endpoints/presentation.py
@@ -28,7 +28,7 @@ from utils.export_utils import export_presentation
 from utils.llm_calls.generate_presentation_outlines import generate_ppt_outline
 from models.sql.slide import SlideModel
 from models.sse_response import SSECompleteResponse, SSEResponse
-from services import SCHEMA_TO_MODEL_SERVICE, TEMP_FILE_SERVICE
+from services import TEMP_FILE_SERVICE
 from services.database import get_async_session
 from services.documents_loader import DocumentsLoader
 from models.sql.presentation import PresentationModel
@@ -43,7 +43,6 @@ from utils.llm_calls.generate_slide_content import (
 )
 from utils.process_slides import process_slide_and_fetch_assets
 from utils.randomizers import get_random_uuid
-from utils.schema_utils import remove_fields_from_schema
 from utils.validators import validate_files
 
 PRESENTATION_ROUTER = APIRouter(prefix="/presentation", tags=["Presentation"])
@@ -220,20 +219,8 @@ async def stream_presentation(
         for i, slide_layout_index in enumerate(structure.slides):
             slide_layout = layout.slides[slide_layout_index]
 
-            # Generate Pydantic model from slide layout schema
-            schema_model_id = f"{layout.name}/{slide_layout.id}"
-            response_schema = remove_fields_from_schema(
-                slide_layout.json_schema, ["image_url_", "icon_url_"]
-            )
-            schema_model_path = (
-                await SCHEMA_TO_MODEL_SERVICE.get_pydantic_model_path_from_schema(
-                    schema_model_id, response_schema
-                )
-            )
-            module = importlib.import_module(schema_model_path)
-            response_model = module.GeneratedModel
             slide_content = await get_slide_content_from_type_and_outline(
-                response_model, outline.slides[i], presentation.language
+                slide_layout, outline.slides[i], presentation.language
             )
 
             slide = SlideModel(
@@ -252,9 +239,6 @@ async def stream_presentation(
                 )
             )
 
-            # Give control to the event loop
-            await asyncio.sleep(0)
-
             yield SSEResponse(
                 event="response",
                 data=json.dumps({"type": "chunk", "chunk": slide.model_dump_json()}),
@@ -491,7 +475,6 @@ async def from_template(
         new_slide_data = list(filter(lambda x: x.index == each_slide.index, data.data))
         if new_slide_data:
             updated_content = deep_update(each_slide.content, new_slide_data[0].content)
-            print(f"Updated content for slide {each_slide.index}: {updated_content}")
         new_slides.append(
             each_slide.get_new_slide(new_presentation.id, updated_content)
         )
diff --git a/servers/fastapi/api/v1/ppt/endpoints/slide.py b/servers/fastapi/api/v1/ppt/endpoints/slide.py
index 3e0dfcce..a0c81107 100644
--- a/servers/fastapi/api/v1/ppt/endpoints/slide.py
+++ b/servers/fastapi/api/v1/ppt/endpoints/slide.py
@@ -5,7 +5,6 @@ from sqlalchemy.ext.asyncio import AsyncSession
 
 from models.sql.presentation import PresentationModel
 from models.sql.slide import SlideModel
-from services import SCHEMA_TO_MODEL_SERVICE
 from services.database import get_async_session
 from services.icon_finder_service import IconFinderService
 from services.image_generation_service import ImageGenerationService
@@ -35,25 +34,12 @@ async def edit_slide(
         raise HTTPException(status_code=404, detail="Presentation not found")
 
     presentation_layout = presentation.get_layout()
-
     slide_layout = await get_slide_layout_from_prompt(
         prompt, presentation_layout, slide
     )
 
-    # Generate Pydantic model from slide layout schema
-    schema_model_id = f"{presentation_layout.name}/{slide_layout.id}"
-    response_schema = remove_fields_from_schema(
-        slide_layout.json_schema, ["image_url_", "icon_url_"]
-    )
-    schema_model_path = (
-        await SCHEMA_TO_MODEL_SERVICE.get_pydantic_model_path_from_schema(
-            schema_model_id, response_schema
-        )
-    )
-    module = importlib.import_module(schema_model_path)
-    response_model = module.GeneratedModel
     edited_slide_content = await get_edited_slide_content(
-        prompt, slide, presentation.language, response_model
+        prompt, slide, presentation.language, slide_layout
     )
 
     image_generation_service = ImageGenerationService(get_images_directory())
diff --git a/servers/fastapi/api/v1/ppt/router.py b/servers/fastapi/api/v1/ppt/router.py
index 928a9354..2f22e1b5 100644
--- a/servers/fastapi/api/v1/ppt/router.py
+++ b/servers/fastapi/api/v1/ppt/router.py
@@ -1,7 +1,8 @@
 from fastapi import APIRouter
 
 from api.v1.ppt.endpoints.anthropic import ANTHROPIC_ROUTER
-from api.v1.ppt.endpoints.custom_llm import CUSTOM_LLM_ROUTER
+from api.v1.ppt.endpoints.google import GOOGLE_ROUTER
+from api.v1.ppt.endpoints.openai import OPENAI_ROUTER
 from api.v1.ppt.endpoints.files import FILES_ROUTER
 from api.v1.ppt.endpoints.icons import ICONS_ROUTER
 from api.v1.ppt.endpoints.images import IMAGES_ROUTER
@@ -20,5 +21,6 @@ API_V1_PPT_ROUTER.include_router(SLIDE_ROUTER)
 API_V1_PPT_ROUTER.include_router(IMAGES_ROUTER)
 API_V1_PPT_ROUTER.include_router(ICONS_ROUTER)
 API_V1_PPT_ROUTER.include_router(OLLAMA_ROUTER)
-API_V1_PPT_ROUTER.include_router(CUSTOM_LLM_ROUTER)
+API_V1_PPT_ROUTER.include_router(OPENAI_ROUTER)
 API_V1_PPT_ROUTER.include_router(ANTHROPIC_ROUTER)
+API_V1_PPT_ROUTER.include_router(GOOGLE_ROUTER)
diff --git a/servers/fastapi/chroma/chroma.sqlite3 b/servers/fastapi/chroma/chroma.sqlite3
index 7398b74c..30b90af8 100644
Binary files a/servers/fastapi/chroma/chroma.sqlite3 and b/servers/fastapi/chroma/chroma.sqlite3 differ
diff --git a/servers/fastapi/constants/llm.py b/servers/fastapi/constants/llm.py
new file mode 100644
index 00000000..ac4bd527
--- /dev/null
+++ b/servers/fastapi/constants/llm.py
@@ -0,0 +1,6 @@
+OPENAI_URL = "https://api.openai.com/v1"
+
+# Default models
+DEFAULT_OPENAI_MODEL = "gpt-4.1"
+DEFAULT_GOOGLE_MODEL = "models/gemini-2.0-flash"
+DEFAULT_ANTHROPIC_MODEL = "claude-3-5-sonnet-20240620"
diff --git a/servers/fastapi/constants/supported_ollama_models.py b/servers/fastapi/constants/supported_ollama_models.py
index a46b5774..6ae3ac4e 100644
--- a/servers/fastapi/constants/supported_ollama_models.py
+++ b/servers/fastapi/constants/supported_ollama_models.py
@@ -7,7 +7,6 @@ SUPPORTED_OLLAMA_MODELS = {
         value="llama3:8b",
         description="❌ Graphs not supported.",
         size="4.7GB",
-        supports_graph=False,
         icon="/static/icons/meta.png",
     ),
     "llama3:70b": OllamaModelMetadata(
@@ -15,7 +14,6 @@ SUPPORTED_OLLAMA_MODELS = {
         value="llama3:70b",
         description="✅ Graphs supported.",
         size="40GB",
-        supports_graph=True,
         icon="/static/icons/meta.png",
     ),
     "llama3.1:8b": OllamaModelMetadata(
@@ -23,7 +21,6 @@ SUPPORTED_OLLAMA_MODELS = {
         value="llama3.1:8b",
         description="❌ Graphs not supported.",
         size="4.9GB",
-        supports_graph=False,
         icon="/static/icons/meta.png",
     ),
     "llama3.1:70b": OllamaModelMetadata(
@@ -31,7 +28,6 @@ SUPPORTED_OLLAMA_MODELS = {
         value="llama3.1:70b",
         description="✅ Graphs supported.",
         size="43GB",
-        supports_graph=True,
         icon="/static/icons/meta.png",
     ),
     "llama3.1:405b": OllamaModelMetadata(
@@ -39,7 +35,6 @@ SUPPORTED_OLLAMA_MODELS = {
         value="llama3.1:405b",
         description="✅ Graphs supported.",
         size="243GB",
-        supports_graph=True,
         icon="/static/icons/meta.png",
     ),
     "llama3.2:1b": OllamaModelMetadata(
@@ -47,7 +42,6 @@ SUPPORTED_OLLAMA_MODELS = {
         value="llama3.2:1b",
         description="❌ Graphs not supported.",
         size="1.3GB",
-        supports_graph=False,
         icon="/static/icons/meta.png",
     ),
     "llama3.2:3b": OllamaModelMetadata(
@@ -55,7 +49,6 @@ SUPPORTED_OLLAMA_MODELS = {
         value="llama3.2:3b",
         description="❌ Graphs not supported.",
         size="2GB",
-        supports_graph=False,
         icon="/static/icons/meta.png",
     ),
     "llama3.3:70b": OllamaModelMetadata(
@@ -63,7 +56,6 @@ SUPPORTED_OLLAMA_MODELS = {
         value="llama3.3:70b",
         description="✅ Graphs supported.",
         size="43GB",
-        supports_graph=True,
         icon="/static/icons/meta.png",
     ),
     "llama4:16x17b": OllamaModelMetadata(
@@ -71,7 +63,6 @@ SUPPORTED_OLLAMA_MODELS = {
         value="llama4:16x17b",
         description="✅ Graphs supported.",
         size="67GB",
-        supports_graph=True,
         icon="/static/icons/meta.png",
     ),
     "llama4:128x17b": OllamaModelMetadata(
@@ -79,7 +70,6 @@ SUPPORTED_OLLAMA_MODELS = {
         value="llama4:128x17b",
         description="✅ Graphs supported.",
         size="245GB",
-        supports_graph=True,
         icon="/static/icons/meta.png",
     ),
 }
@@ -90,7 +80,6 @@ SUPPORTED_GEMMA_MODELS = {
         value="gemma3:1b",
         description="❌ Graphs not supported.",
         size="815MB",
-        supports_graph=False,
         icon="/static/icons/gemma.png",
     ),
     "gemma3:4b": OllamaModelMetadata(
@@ -98,7 +87,6 @@ SUPPORTED_GEMMA_MODELS = {
         value="gemma3:4b",
         description="❌ Graphs not supported.",
         size="3.3GB",
-        supports_graph=False,
         icon="/static/icons/gemma.png",
     ),
     "gemma3:12b": OllamaModelMetadata(
@@ -106,7 +94,6 @@ SUPPORTED_GEMMA_MODELS = {
         value="gemma3:12b",
         description="❌ Graphs not supported.",
         size="8.1GB",
-        supports_graph=False,
         icon="/static/icons/gemma.png",
     ),
     "gemma3:27b": OllamaModelMetadata(
@@ -114,7 +101,6 @@ SUPPORTED_GEMMA_MODELS = {
         value="gemma3:27b",
         description="✅ Graphs supported.",
         size="17GB",
-        supports_graph=True,
         icon="/static/icons/gemma.png",
     ),
 }
@@ -125,7 +111,6 @@ SUPPORTED_DEEPSEEK_MODELS = {
         value="deepseek-r1:1.5b",
         description="❌ Graphs not supported.",
         size="1.1GB",
-        supports_graph=False,
         icon="/static/icons/deepseek.png",
     ),
     "deepseek-r1:7b": OllamaModelMetadata(
@@ -133,7 +118,6 @@ SUPPORTED_DEEPSEEK_MODELS = {
         value="deepseek-r1:7b",
         description="❌ Graphs not supported.",
         size="4.7GB",
-        supports_graph=False,
         icon="/static/icons/deepseek.png",
     ),
     "deepseek-r1:8b": OllamaModelMetadata(
@@ -141,7 +125,6 @@ SUPPORTED_DEEPSEEK_MODELS = {
         value="deepseek-r1:8b",
         description="❌ Graphs not supported.",
         size="5.2GB",
-        supports_graph=False,
         icon="/static/icons/deepseek.png",
     ),
     "deepseek-r1:14b": OllamaModelMetadata(
@@ -149,7 +132,6 @@ SUPPORTED_DEEPSEEK_MODELS = {
         value="deepseek-r1:14b",
         description="❌ Graphs not supported.",
         size="9GB",
-        supports_graph=False,
         icon="/static/icons/deepseek.png",
     ),
     "deepseek-r1:32b": OllamaModelMetadata(
@@ -157,7 +139,6 @@ SUPPORTED_DEEPSEEK_MODELS = {
         value="deepseek-r1:32b",
         description="✅ Graphs supported.",
         size="20GB",
-        supports_graph=True,
         icon="/static/icons/deepseek.png",
     ),
     "deepseek-r1:70b": OllamaModelMetadata(
@@ -165,7 +146,6 @@ SUPPORTED_DEEPSEEK_MODELS = {
         value="deepseek-r1:70b",
         description="✅ Graphs supported.",
         size="43GB",
-        supports_graph=True,
         icon="/static/icons/deepseek.png",
     ),
     "deepseek-r1:671b": OllamaModelMetadata(
@@ -173,7 +153,6 @@ SUPPORTED_DEEPSEEK_MODELS = {
         value="deepseek-r1:671b",
         description="✅ Graphs supported.",
         size="404GB",
-        supports_graph=True,
         icon="/static/icons/deepseek.png",
     ),
 }
@@ -184,7 +163,6 @@ SUPPORTED_QWEN_MODELS = {
         value="qwen3:0.6b",
         description="❌ Graphs not supported.",
         size="523MB",
-        supports_graph=False,
         icon="/static/icons/qwen.png",
     ),
     "qwen3:1.7b": OllamaModelMetadata(
@@ -192,7 +170,6 @@ SUPPORTED_QWEN_MODELS = {
         value="qwen3:1.7b",
         description="❌ Graphs not supported.",
         size="1.4GB",
-        supports_graph=False,
         icon="/static/icons/qwen.png",
     ),
     "qwen3:4b": OllamaModelMetadata(
@@ -200,7 +177,6 @@ SUPPORTED_QWEN_MODELS = {
         value="qwen3:4b",
         description="❌ Graphs not supported.",
         size="2.6GB",
-        supports_graph=False,
         icon="/static/icons/qwen.png",
     ),
     "qwen3:8b": OllamaModelMetadata(
@@ -208,7 +184,6 @@ SUPPORTED_QWEN_MODELS = {
         value="qwen3:8b",
         description="❌ Graphs not supported.",
         size="5.2GB",
-        supports_graph=False,
         icon="/static/icons/qwen.png",
     ),
     "qwen3:14b": OllamaModelMetadata(
@@ -216,7 +191,6 @@ SUPPORTED_QWEN_MODELS = {
         value="qwen3:14b",
         description="❌ Graphs not supported.",
         size="9.3GB",
-        supports_graph=False,
         icon="/static/icons/qwen.png",
     ),
     "qwen3:30b": OllamaModelMetadata(
@@ -224,7 +198,6 @@ SUPPORTED_QWEN_MODELS = {
         value="qwen3:30b",
         description="✅ Graphs supported.",
         size="19GB",
-        supports_graph=True,
         icon="/static/icons/qwen.png",
     ),
     "qwen3:32b": OllamaModelMetadata(
@@ -232,7 +205,6 @@ SUPPORTED_QWEN_MODELS = {
         value="qwen3:32b",
         description="✅ Graphs supported.",
         size="20GB",
-        supports_graph=True,
         icon="/static/icons/qwen.png",
     ),
     "qwen3:235b": OllamaModelMetadata(
@@ -240,7 +212,6 @@ SUPPORTED_QWEN_MODELS = {
         value="qwen3:235b",
         description="✅ Graphs supported.",
         size="142GB",
-        supports_graph=True,
         icon="/static/icons/qwen.png",
     ),
 }
diff --git a/servers/fastapi/get_test_schema.py b/servers/fastapi/get_test_schema.py
index f03966d4..0ae458b3 100644
--- a/servers/fastapi/get_test_schema.py
+++ b/servers/fastapi/get_test_schema.py
@@ -17,8 +17,8 @@ class ContactInfoModel(BaseModel):
 
 
 class ImageModel(BaseModel):
-    image_url_: str = Field(description="Image URL")
-    image_prompt_: str = Field(description="Image prompt")
+    __image_url__: str = Field(description="Image URL")
+    __image_prompt__: str = Field(description="Image prompt")
 
 
 # First Slide Layout
diff --git a/servers/fastapi/models/ollama_model_metadata.py b/servers/fastapi/models/ollama_model_metadata.py
index ce2abae3..766924db 100644
--- a/servers/fastapi/models/ollama_model_metadata.py
+++ b/servers/fastapi/models/ollama_model_metadata.py
@@ -7,4 +7,3 @@ class OllamaModelMetadata(BaseModel):
     description: str
     icon: str
     size: str
-    supports_graph: bool
diff --git a/servers/fastapi/models/presentation_layout.py b/servers/fastapi/models/presentation_layout.py
index fe462554..784e41fc 100644
--- a/servers/fastapi/models/presentation_layout.py
+++ b/servers/fastapi/models/presentation_layout.py
@@ -1,4 +1,5 @@
 from typing import List, Optional
+from fastapi import HTTPException
 from pydantic import BaseModel, Field
 
 from models.presentation_structure_model import PresentationStructureModel
@@ -16,6 +17,14 @@ class PresentationLayoutModel(BaseModel):
     ordered: bool = Field(default=False)
     slides: List[SlideLayoutModel]
 
+    def get_slide_layout_index(self, slide_layout_id: str) -> int:
+        for index, slide in enumerate(self.slides):
+            if slide.id == slide_layout_id:
+                return index
+        raise HTTPException(
+            status_code=404, detail=f"Slide layout {slide_layout_id} not found"
+        )
+
     def to_presentation_structure(self):
         return PresentationStructureModel(
             slides=[index for index in range(len(self.slides))]
diff --git a/servers/fastapi/models/user_config.py b/servers/fastapi/models/user_config.py
index 03b12fcf..4f8f5e53 100644
--- a/servers/fastapi/models/user_config.py
+++ b/servers/fastapi/models/user_config.py
@@ -4,16 +4,32 @@ from pydantic import BaseModel
 
 class UserConfig(BaseModel):
     LLM: Optional[str] = None
+
+    # OpenAI
     OPENAI_API_KEY: Optional[str] = None
+    OPENAI_MODEL: Optional[str] = None
+
+    # Google
     GOOGLE_API_KEY: Optional[str] = None
+    GOOGLE_MODEL: Optional[str] = None
+
+    # Anthropic
     ANTHROPIC_API_KEY: Optional[str] = None
     ANTHROPIC_MODEL: Optional[str] = None
+
+    # Ollama
     OLLAMA_URL: Optional[str] = None
     OLLAMA_MODEL: Optional[str] = None
+
+    # Custom LLM
     CUSTOM_LLM_URL: Optional[str] = None
     CUSTOM_LLM_API_KEY: Optional[str] = None
     CUSTOM_MODEL: Optional[str] = None
-    PEXELS_API_KEY: Optional[str] = None
+
+    # Image Provider
     IMAGE_PROVIDER: Optional[str] = None
+    PEXELS_API_KEY: Optional[str] = None
     PIXABAY_API_KEY: Optional[str] = None
+
+    # Reasoning
     EXTENDED_REASONING: Optional[bool] = None
diff --git a/servers/fastapi/requirements.txt b/servers/fastapi/requirements.txt
index 75a5b248..7ccb1000 100644
--- a/servers/fastapi/requirements.txt
+++ b/servers/fastapi/requirements.txt
@@ -22,7 +22,6 @@ chromadb==1.0.15
 click==8.2.1
 coloredlogs==15.0.1
 cryptography==45.0.5
-datamodel-code-generator==0.32.0
 distro==1.9.0
 dnspython==2.7.0
 durationpy==0.10
diff --git a/servers/fastapi/services/__init__.py b/servers/fastapi/services/__init__.py
index bcf11e3c..2c4366c5 100644
--- a/servers/fastapi/services/__init__.py
+++ b/servers/fastapi/services/__init__.py
@@ -1,8 +1,6 @@
 from services.redis_service import RedisService
-from services.schema_to_model_service import SchemaToModelService
 from services.temp_file_service import TempFileService
 
 
 TEMP_FILE_SERVICE = TempFileService()
 REDIS_SERVICE = RedisService()
-SCHEMA_TO_MODEL_SERVICE = SchemaToModelService(TEMP_FILE_SERVICE)
diff --git a/servers/fastapi/services/image_generation_service.py b/servers/fastapi/services/image_generation_service.py
index 667425ac..a0159b68 100644
--- a/servers/fastapi/services/image_generation_service.py
+++ b/servers/fastapi/services/image_generation_service.py
@@ -3,12 +3,12 @@ import os
 import aiohttp
 from google import genai
 from google.genai.types import GenerateContentConfig
+from openai import AsyncOpenAI
 from models.image_prompt import ImagePrompt
 from models.sql.image_asset import ImageAsset
 from utils.download_helpers import download_file
 from utils.get_env import get_pexels_api_key_env
 from utils.get_env import get_pixabay_api_key_env
-from utils.llm_provider import get_llm_client
 from utils.image_provider import (
     is_pixels_selected,
     is_pixabay_selected,
@@ -80,7 +80,7 @@ class ImageGenerationService:
             return "/static/images/placeholder.jpg"
 
     async def generate_image_openai(self, prompt: str, output_directory: str) -> str:
-        client = get_llm_client()
+        client = AsyncOpenAI()
         result = await client.images.generate(
             model="dall-e-3",
             prompt=prompt,
diff --git a/servers/fastapi/services/llm_client.py b/servers/fastapi/services/llm_client.py
index 4184b18e..e75545a4 100644
--- a/servers/fastapi/services/llm_client.py
+++ b/servers/fastapi/services/llm_client.py
@@ -1,6 +1,6 @@
 import asyncio
 import json
-from typing import List, Optional
+from typing import List
 from fastapi import HTTPException
 from openai import AsyncOpenAI
 from google import genai
@@ -8,7 +8,6 @@ from google.genai.types import GenerateContentConfig
 from anthropic import AsyncAnthropic
 from anthropic.types import Message as AnthropicMessage
 from anthropic import MessageStreamEvent as AnthropicMessageStreamEvent
-from pydantic import BaseModel
 from enums.llm_provider import LLMProvider
 from models.llm_message import LLMMessage
 from utils.async_iterator import iterator_to_async
@@ -21,6 +20,7 @@ from utils.get_env import (
     get_openai_api_key_env,
 )
 from utils.llm_provider import get_llm_provider
+from utils.schema_utils import ensure_strict_json_schema
 
 
 class LLMClient:
@@ -173,43 +173,45 @@ class LLMClient:
 
     # ? Generate Structured Content
     async def _generate_openai_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
+        strict: bool = False,
     ):
         client: AsyncOpenAI = self._client
-        is_response_format_dict = isinstance(response_format, dict)
-        if is_response_format_dict:
-            response = await client.chat.completions.create(
-                model=model,
-                messages=[message.model_dump() for message in messages],
-                response_format={
-                    "type": "json_schema",
-                    "json_schema": (
-                        {
-                            "name": "ResponseSchema",
-                            "schema": response_format,
-                        }
-                    ),
-                },
-                max_completion_tokens=self.max_tokens,
+        response_schema = response_format
+        if strict:
+            response_schema = ensure_strict_json_schema(
+                response_schema,
+                path=(),
+                root=response_schema,
             )
-            content = response.choices[0].message.content
-            if content:
-                return json.loads(content)
-            return None
-        else:
-            response = await client.chat.completions.parse(
-                model=model,
-                messages=[message.model_dump() for message in messages],
-                response_format=response_format,
-                max_completion_tokens=self.max_tokens,
-            )
-            content = response.choices[0].message.parsed
-            if content:
-                return content.model_dump(mode="json")
-            return None
+        response = await client.chat.completions.create(
+            model=model,
+            messages=[message.model_dump() for message in messages],
+            response_format={
+                "type": "json_schema",
+                "json_schema": (
+                    {
+                        "name": "ResponseSchema",
+                        "strict": strict,
+                        "schema": response_schema,
+                    }
+                ),
+            },
+            max_completion_tokens=self.max_tokens,
+        )
+        content = response.choices[0].message.content
+        if content:
+            return json.loads(content)
+        return None
 
     async def _generate_google_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
     ):
         client: genai.Client = self._client
         response = await asyncio.to_thread(
@@ -219,7 +221,7 @@ class LLMClient:
             config=GenerateContentConfig(
                 system_instruction=self._get_system_prompt(messages),
                 response_mime_type="application/json",
-                response_schema=response_format,
+                response_json_schema=response_format,
                 max_output_tokens=self.max_tokens,
             ),
         )
@@ -230,10 +232,12 @@ class LLMClient:
         return content
 
     async def _generate_anthropic_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
     ):
         client: AsyncAnthropic = self._client
-        is_response_format_dict = isinstance(response_format, dict)
         response: AnthropicMessage = await client.messages.create(
             model=model,
             system=self._get_system_prompt(messages),
@@ -246,11 +250,7 @@ class LLMClient:
                 {
                     "name": "ResponseSchema",
                     "description": "A response to the user's message",
-                    "input_schema": (
-                        response_format
-                        if is_response_format_dict
-                        else response_format.model_json_schema()
-                    ),
+                    "input_schema": response_format,
                 }
             ],
         )
@@ -262,23 +262,39 @@ class LLMClient:
         return content
 
     async def _generate_ollama_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
+        strict: bool = False,
     ):
-        return await self._generate_openai_structured(model, messages, response_format)
+        return await self._generate_openai_structured(
+            model, messages, response_format, strict
+        )
 
     async def _generate_custom_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
+        strict: bool = False,
     ):
-        return await self._generate_openai_structured(model, messages, response_format)
+        return await self._generate_openai_structured(
+            model, messages, response_format, strict
+        )
 
     async def generate_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
+        strict: bool = False,
     ) -> dict:
         content = None
         match self.llm_provider:
             case LLMProvider.OPENAI:
                 content = await self._generate_openai_structured(
-                    model, messages, response_format
+                    model, messages, response_format, strict
                 )
             case LLMProvider.GOOGLE:
                 content = await self._generate_google_structured(
@@ -290,11 +306,11 @@ class LLMClient:
                 )
             case LLMProvider.OLLAMA:
                 content = await self._generate_ollama_structured(
-                    model, messages, response_format
+                    model, messages, response_format, strict
                 )
             case LLMProvider.CUSTOM:
                 content = await self._generate_custom_structured(
-                    model, messages, response_format
+                    model, messages, response_format, strict
                 )
         if content is None:
             raise HTTPException(
@@ -366,10 +382,20 @@ class LLMClient:
 
     # ? Stream Structured Content
     async def _stream_openai_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
+        strict: bool = False,
     ):
         client: AsyncOpenAI = self._client
-        is_response_format_dict = isinstance(response_format, dict)
+        response_schema = response_format
+        if strict:
+            response_schema = ensure_strict_json_schema(
+                response_schema,
+                path=(),
+                root=response_schema,
+            )
         async with client.chat.completions.stream(
             model=model,
             messages=[message.model_dump() for message in messages],
@@ -379,11 +405,10 @@ class LLMClient:
                     "type": "json_schema",
                     "json_schema": {
                         "name": "ResponseSchema",
-                        "schema": response_format,
+                        "strict": strict,
+                        "schema": response_schema,
                     },
                 }
-                if is_response_format_dict
-                else response_format
             ),
         ) as stream:
             async for event in stream:
@@ -391,7 +416,10 @@ class LLMClient:
                     yield event.delta
 
     async def _stream_google_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
     ):
         client: genai.Client = self._client
         async for event in iterator_to_async(client.models.generate_content_stream)(
@@ -400,7 +428,7 @@ class LLMClient:
             config=GenerateContentConfig(
                 system_instruction=self._get_system_prompt(messages),
                 response_mime_type="application/json",
-                response_schema=response_format,
+                response_json_schema=response_format,
                 max_output_tokens=self.max_tokens,
             ),
         ):
@@ -408,10 +436,12 @@ class LLMClient:
                 yield event.text
 
     async def _stream_anthropic_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
     ):
         client: AsyncAnthropic = self._client
-        is_response_format_dict = isinstance(response_format, dict)
         async with client.messages.stream(
             model=model,
             system=self._get_system_prompt(messages),
@@ -424,11 +454,7 @@ class LLMClient:
                 {
                     "name": "ResponseSchema",
                     "description": "A response to the user's message",
-                    "input_schema": (
-                        response_format
-                        if is_response_format_dict
-                        else response_format.model_json_schema()
-                    ),
+                    "input_schema": response_format,
                 }
             ],
         ) as stream:
@@ -438,21 +464,35 @@ class LLMClient:
                     yield event.partial_json
 
     def _stream_ollama_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
+        strict: bool = False,
     ):
-        return self._stream_openai_structured(model, messages, response_format)
+        return self._stream_openai_structured(model, messages, response_format, strict)
 
     def _stream_custom_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
+        strict: bool = False,
     ):
-        return self._stream_openai_structured(model, messages, response_format)
+        return self._stream_openai_structured(model, messages, response_format, strict)
 
     def stream_structured(
-        self, model: str, messages: List[LLMMessage], response_format: BaseModel | dict
+        self,
+        model: str,
+        messages: List[LLMMessage],
+        response_format: dict,
+        strict: bool = False,
     ):
         match self.llm_provider:
             case LLMProvider.OPENAI:
-                return self._stream_openai_structured(model, messages, response_format)
+                return self._stream_openai_structured(
+                    model, messages, response_format, strict
+                )
             case LLMProvider.GOOGLE:
                 return self._stream_google_structured(model, messages, response_format)
             case LLMProvider.ANTHROPIC:
@@ -460,6 +500,10 @@ class LLMClient:
                     model, messages, response_format
                 )
             case LLMProvider.OLLAMA:
-                return self._stream_ollama_structured(model, messages, response_format)
+                return self._stream_ollama_structured(
+                    model, messages, response_format, strict
+                )
             case LLMProvider.CUSTOM:
-                return self._stream_custom_structured(model, messages, response_format)
+                return self._stream_custom_structured(
+                    model, messages, response_format, strict
+                )
diff --git a/servers/fastapi/services/schema_to_model_service.py b/servers/fastapi/services/schema_to_model_service.py
deleted file mode 100644
index 655329bc..00000000
--- a/servers/fastapi/services/schema_to_model_service.py
+++ /dev/null
@@ -1,78 +0,0 @@
-import asyncio
-import json
-import os
-from pathlib import Path
-from typing import Dict
-from fastapi import HTTPException
-from datamodel_code_generator import generate, InputFileType, DataModelType
-
-from services.temp_file_service import TempFileService
-from utils.randomizers import get_random_uuid
-
-
-class SchemaToModelService:
-    def __init__(self, temp_file_service: TempFileService):
-        self.temp_file_service = temp_file_service
-        self.temp_dir = self.temp_file_service.create_temp_dir()
-
-        self.generated_models_dir = "generated_models"
-        if os.path.exists(self.generated_models_dir):
-            for file in os.listdir(self.generated_models_dir):
-                if file.endswith(".py"):
-                    os.remove(os.path.join(self.generated_models_dir, file))
-        os.makedirs(self.generated_models_dir, exist_ok=True)
-
-        self._records: Dict[str, str] = {}
-        self._fetch_locks: Dict[str, asyncio.Lock] = {}
-
-    def convert_path_to_module_path(self, path: str):
-        return path.replace("/", ".").replace("\\", ".").replace(".py", "")
-
-    async def get_pydantic_model_path_from_schema(
-        self, identifier: str, schema: dict
-    ) -> str:
-        if identifier in self._fetch_locks:
-            async with self._fetch_locks[identifier]:
-                return self._records[identifier]
-        else:
-            async_lock = asyncio.Lock()
-            await async_lock.acquire()
-            self._fetch_locks[identifier] = async_lock
-            model_path = await self.generate_pydantic_model_from_schema_async(schema)
-            model_path = self.convert_path_to_module_path(model_path)
-            self._records[identifier] = model_path
-            async_lock.release()
-            return model_path
-
-    async def generate_pydantic_model_from_schema_async(self, schema: dict):
-        return await asyncio.to_thread(self.generate_pydantic_model_from_schema, schema)
-
-    def generate_pydantic_model_from_schema(self, schema: dict):
-        generated_model_path = os.path.join(
-            self.generated_models_dir, get_random_uuid() + ".py"
-        )
-        try:
-            schema_path = self.temp_file_service.create_temp_file_path(
-                get_random_uuid() + ".json", self.temp_dir
-            )
-            with open(schema_path, "w") as f:
-                json.dump(schema, f)
-
-            generate(
-                input_=Path(schema_path),
-                input_file_type=InputFileType.JsonSchema,
-                output=Path(generated_model_path),
-                output_model_type=DataModelType.PydanticV2BaseModel,
-                class_name="GeneratedModel",
-                use_annotated=False,
-                field_constraints=True,
-                extra_fields="ignore",
-            )
-        except Exception as e:
-            raise HTTPException(
-                status_code=500, detail="Failed to generate Pydantic model from schema"
-            )
-        finally:
-            self.temp_file_service.cleanup_temp_file(schema_path)
-
-        return generated_model_path
diff --git a/servers/fastapi/utils/available_models.py b/servers/fastapi/utils/available_models.py
new file mode 100644
index 00000000..539533ad
--- /dev/null
+++ b/servers/fastapi/utils/available_models.py
@@ -0,0 +1,21 @@
+from anthropic import AsyncAnthropic
+from openai import AsyncOpenAI
+from google import genai
+
+
+async def list_available_openai_compatible_models(url: str, api_key: str) -> list[str]:
+    client = AsyncOpenAI(api_key=api_key, base_url=url)
+    models = (await client.models.list()).data
+    if models:
+        return list(map(lambda x: x.id, models))
+    return []
+
+
+async def list_available_anthropic_models(api_key: str) -> list[str]:
+    client = AsyncAnthropic(api_key=api_key)
+    return list(map(lambda x: x.id, (await client.models.list(limit=50)).data))
+
+
+async def list_available_google_models(api_key: str) -> list[str]:
+    client = genai.Client(api_key=api_key)
+    return list(map(lambda x: x.name, client.models.list(config={"page_size": 50})))
diff --git a/servers/fastapi/utils/custom_llm_provider.py b/servers/fastapi/utils/custom_llm_provider.py
deleted file mode 100644
index bac0f72b..00000000
--- a/servers/fastapi/utils/custom_llm_provider.py
+++ /dev/null
@@ -1,17 +0,0 @@
-from typing import Optional
-from openai import AsyncOpenAI
-
-from utils.llm_provider import get_llm_client
-
-
-async def list_available_custom_models(
-    url: Optional[str] = None, api_key: Optional[str] = None
-) -> list[str]:
-    if not url:
-        client = get_llm_client()
-    else:
-        client = AsyncOpenAI(api_key=api_key or "null", base_url=url)
-    models = []
-    async for model in client.models.list():
-        models.append(model.id)
-    return models
diff --git a/servers/fastapi/utils/dict_utils.py b/servers/fastapi/utils/dict_utils.py
index e7e860b5..72c69c53 100644
--- a/servers/fastapi/utils/dict_utils.py
+++ b/servers/fastapi/utils/dict_utils.py
@@ -78,3 +78,12 @@ def deep_update(original: dict, updates: dict) -> dict:
             if not isinstance(value, (dict, list)):
                 original[key] = value
     return original
+
+
+def has_more_than_n_keys(obj: dict[str, object], n: int) -> bool:
+    i = 0
+    for _ in obj.keys():
+        i += 1
+        if i > n:
+            return True
+    return False
diff --git a/servers/fastapi/utils/get_env.py b/servers/fastapi/utils/get_env.py
index 93be0370..f2301b69 100644
--- a/servers/fastapi/utils/get_env.py
+++ b/servers/fastapi/utils/get_env.py
@@ -45,10 +45,18 @@ def get_openai_api_key_env():
     return os.getenv("OPENAI_API_KEY")
 
 
+def get_openai_model_env():
+    return os.getenv("OPENAI_MODEL")
+
+
 def get_google_api_key_env():
     return os.getenv("GOOGLE_API_KEY")
 
 
+def get_google_model_env():
+    return os.getenv("GOOGLE_MODEL")
+
+
 def get_custom_llm_api_key_env():
     return os.getenv("CUSTOM_LLM_API_KEY")
 
diff --git a/servers/fastapi/utils/llm_calls/edit_slide.py b/servers/fastapi/utils/llm_calls/edit_slide.py
index f572779b..a8df598a 100644
--- a/servers/fastapi/utils/llm_calls/edit_slide.py
+++ b/servers/fastapi/utils/llm_calls/edit_slide.py
@@ -1,9 +1,8 @@
-from pydantic import BaseModel
 from models.llm_message import LLMMessage
 from models.presentation_layout import SlideLayoutModel
 from models.sql.slide import SlideModel
 from services.llm_client import LLMClient
-from utils.llm_provider import get_large_model
+from utils.llm_provider import get_model
 from utils.schema_utils import remove_fields_from_schema
 
 system_prompt = """
@@ -57,14 +56,19 @@ async def get_edited_slide_content(
     prompt: str,
     slide: SlideModel,
     language: str,
-    response_model: BaseModel,
+    slide_layout: SlideLayoutModel,
 ):
-    model = get_large_model()
+    model = get_model()
+
+    response_schema = remove_fields_from_schema(
+        slide_layout.json_schema, ["__image_url__", "__icon_url__"]
+    )
 
     client = LLMClient()
     response = await client.generate_structured(
         model=model,
         messages=get_messages(prompt, slide.content, language),
-        response_format=response_model,
+        response_format=response_schema,
+        strict=False,
     )
     return response
diff --git a/servers/fastapi/utils/llm_calls/edit_slide_html.py b/servers/fastapi/utils/llm_calls/edit_slide_html.py
index 5169364d..a5e2dfad 100644
--- a/servers/fastapi/utils/llm_calls/edit_slide_html.py
+++ b/servers/fastapi/utils/llm_calls/edit_slide_html.py
@@ -1,14 +1,7 @@
-import asyncio
 from typing import Optional
-from google.genai.types import GenerateContentConfig
-from utils.llm_provider import (
-    get_anthropic_llm_client,
-    get_google_llm_client,
-    get_large_model,
-    is_anthropic_selected,
-    is_google_selected,
-    get_llm_client,
-)
+from models.llm_message import LLMMessage
+from services.llm_client import LLMClient
+from utils.llm_provider import get_model
 
 system_prompt = """
     You are an expert HTML slide editor. Your task is to modify slide HTML content based on user prompts while maintaining proper structure, styling, and functionality.
@@ -54,48 +47,17 @@ def get_user_prompt(prompt: str, html: str):
 
 
 async def get_edited_slide_html(prompt: str, html: str):
-    model = get_large_model()
-    llm_response = None
+    model = get_model()
 
-    if is_anthropic_selected():
-        client = get_anthropic_llm_client()
-        response = await client.messages.create(
-            model=model,
-            messages=[get_user_prompt(prompt, html)],
-        )
-        for each in response.content:
-            if each.type == "text":
-                llm_response = each.text
-                break
-
-    elif is_google_selected():
-        client = get_google_llm_client()
-        response = await asyncio.to_thread(
-            client.models.generate_content,
-            model=model,
-            contents=[get_user_prompt(prompt, html)],
-            config=GenerateContentConfig(
-                system_instruction=system_prompt,
-                response_mime_type="text/plain",
-            ),
-        )
-        llm_response = response.text
-
-    else:
-        client = get_llm_client()
-        response = await client.chat.completions.create(
-            model=model,
-            messages=[
-                {"role": "system", "content": system_prompt},
-                {"role": "user", "content": get_user_prompt(prompt, html)},
-            ],
-        )
-        llm_response = response.choices[0].message.content
-
-    if not llm_response:
-        return html
-
-    return extract_html_from_response(llm_response) or html
+    client = LLMClient()
+    response = await client.generate(
+        model=model,
+        messages=[
+            LLMMessage(role="system", content=system_prompt),
+            LLMMessage(role="user", content=get_user_prompt(prompt, html)),
+        ],
+    )
+    return extract_html_from_response(response) or html
 
 
 def extract_html_from_response(response_text: str) -> Optional[str]:
diff --git a/servers/fastapi/utils/llm_calls/generate_document_summary.py b/servers/fastapi/utils/llm_calls/generate_document_summary.py
index 8e3c490e..044d28e8 100644
--- a/servers/fastapi/utils/llm_calls/generate_document_summary.py
+++ b/servers/fastapi/utils/llm_calls/generate_document_summary.py
@@ -3,7 +3,7 @@ from typing import List
 
 from models.llm_message import LLMMessage
 from services.llm_client import LLMClient
-from utils.llm_provider import get_nano_model
+from utils.llm_provider import get_model
 
 
 sysmte_prompt = """
@@ -25,7 +25,7 @@ Maintain as much information as possible.
 
 async def generate_document_summary(documents: List[str]):
     client = LLMClient()
-    model = get_nano_model()
+    model = get_model()
 
     coroutines = []
     for document in documents:
diff --git a/servers/fastapi/utils/llm_calls/generate_presentation_outlines.py b/servers/fastapi/utils/llm_calls/generate_presentation_outlines.py
index f0e94c0f..54e41d61 100644
--- a/servers/fastapi/utils/llm_calls/generate_presentation_outlines.py
+++ b/servers/fastapi/utils/llm_calls/generate_presentation_outlines.py
@@ -4,7 +4,7 @@ from typing import Optional
 from models.llm_message import LLMMessage
 from services.llm_client import LLMClient
 from utils.get_dynamic_models import get_presentation_outline_model_with_n_slides
-from utils.llm_provider import get_large_model
+from utils.llm_provider import get_model
 
 system_prompt = """
 You are an expert presentation creator. Generate structured presentations based on user requirements and format them according to the specified JSON schema with markdown content.
@@ -75,7 +75,7 @@ async def generate_ppt_outline(
     language: Optional[str] = None,
     content: Optional[str] = None,
 ):
-    model = get_large_model()
+    model = get_model()
     response_model = get_presentation_outline_model_with_n_slides(n_slides)
 
     client = LLMClient()
@@ -83,6 +83,7 @@ async def generate_ppt_outline(
     async for chunk in client.stream_structured(
         model,
         get_messages(prompt, n_slides, language, content),
-        response_model,
+        response_model.model_json_schema(),
+        strict=True,
     ):
         yield chunk
diff --git a/servers/fastapi/utils/llm_calls/generate_presentation_structure.py b/servers/fastapi/utils/llm_calls/generate_presentation_structure.py
index 056dd418..47f47dba 100644
--- a/servers/fastapi/utils/llm_calls/generate_presentation_structure.py
+++ b/servers/fastapi/utils/llm_calls/generate_presentation_structure.py
@@ -2,7 +2,7 @@ from models.llm_message import LLMMessage
 from models.presentation_layout import PresentationLayoutModel
 from models.presentation_outline_model import PresentationOutlineModel
 from services.llm_client import LLMClient
-from utils.llm_provider import get_large_model
+from utils.llm_provider import get_model
 from utils.get_dynamic_models import get_presentation_structure_model_with_n_slides
 from models.presentation_structure_model import PresentationStructureModel
 
@@ -62,7 +62,7 @@ async def generate_presentation_structure(
 ) -> PresentationStructureModel:
 
     client = LLMClient()
-    model = get_large_model()
+    model = get_model()
     response_model = get_presentation_structure_model_with_n_slides(
         len(presentation_outline.slides)
     )
@@ -74,6 +74,7 @@ async def generate_presentation_structure(
             len(presentation_outline.slides),
             presentation_outline.to_string(),
         ),
-        response_format=response_model,
+        response_format=response_model.model_json_schema(),
+        strict=True,
     )
     return PresentationStructureModel(**response)
diff --git a/servers/fastapi/utils/llm_calls/generate_slide_content.py b/servers/fastapi/utils/llm_calls/generate_slide_content.py
index e69f02e0..f75ed979 100644
--- a/servers/fastapi/utils/llm_calls/generate_slide_content.py
+++ b/servers/fastapi/utils/llm_calls/generate_slide_content.py
@@ -1,8 +1,9 @@
-from pydantic import BaseModel
 from models.llm_message import LLMMessage
+from models.presentation_layout import SlideLayoutModel
 from models.presentation_outline_model import SlideOutlineModel
 from services.llm_client import LLMClient
-from utils.llm_provider import get_large_model
+from utils.llm_provider import get_model
+from utils.schema_utils import remove_fields_from_schema
 
 system_prompt = """
     Generate structured slide based on provided title and outline, follow mentioned steps and notes and provide structured output.
@@ -14,8 +15,8 @@ system_prompt = """
     # Notes
     - Slide body should not use words like "This slide", "This presentation".
     - Rephrase the slide body to make it flow naturally.
-    - Provide prompt to generate image on "image_prompt_" property.
-    - Provide query to search icon on "icon_query_" property.
+    - Provide prompt to generate image on "__image_prompt__" property.
+    - Provide query to search icon on "__icon_query__" property.
     - Do not use markdown formatting in slide body.
     - Make sure to follow language guidelines.
     **Strictly follow the max and min character limit for every property in the slide.**
@@ -53,10 +54,14 @@ def get_messages(title: str, outline: str, language: str):
 
 
 async def get_slide_content_from_type_and_outline(
-    response_model: BaseModel, outline: SlideOutlineModel, language: str
+    slide_layout: SlideLayoutModel, outline: SlideOutlineModel, language: str
 ):
     client = LLMClient()
-    model = get_large_model()
+    model = get_model()
+
+    response_schema = remove_fields_from_schema(
+        slide_layout.json_schema, ["__image_url__", "__icon_url__"]
+    )
 
     response = await client.generate_structured(
         model=model,
@@ -65,6 +70,7 @@ async def get_slide_content_from_type_and_outline(
             outline.body,
             language,
         ),
-        response_format=response_model,
+        response_format=response_schema,
+        strict=False,
     )
     return response
diff --git a/servers/fastapi/utils/llm_calls/select_slide_type_on_edit.py b/servers/fastapi/utils/llm_calls/select_slide_type_on_edit.py
index a41c717b..f3532b48 100644
--- a/servers/fastapi/utils/llm_calls/select_slide_type_on_edit.py
+++ b/servers/fastapi/utils/llm_calls/select_slide_type_on_edit.py
@@ -3,7 +3,7 @@ from models.presentation_layout import PresentationLayoutModel, SlideLayoutModel
 from models.slide_layout_index import SlideLayoutIndex
 from models.sql.slide import SlideModel
 from services.llm_client import LLMClient
-from utils.llm_provider import get_large_model
+from utils.llm_provider import get_model
 
 
 def get_messages(
@@ -44,9 +44,9 @@ async def get_slide_layout_from_prompt(
 ) -> SlideLayoutModel:
 
     client = LLMClient()
-    model = get_large_model()
+    model = get_model()
 
-    slide_layout_ids = list(map(lambda x: x.id, layout.slides))
+    slide_layout_index = layout.get_slide_layout_index(slide.layout)
 
     response = await client.generate_structured(
         model=model,
@@ -54,9 +54,10 @@ async def get_slide_layout_from_prompt(
             prompt,
             slide.content,
             layout,
-            slide_layout_ids.index(slide.layout),
+            slide_layout_index,
         ),
-        response_format=SlideLayoutIndex,
+        response_format=SlideLayoutIndex.model_json_schema(),
+        strict=True,
     )
     index = SlideLayoutIndex(**response).index
     return layout.slides[index]
diff --git a/servers/fastapi/utils/llm_provider.py b/servers/fastapi/utils/llm_provider.py
index 23e98f62..aabc8f61 100644
--- a/servers/fastapi/utils/llm_provider.py
+++ b/servers/fastapi/utils/llm_provider.py
@@ -1,21 +1,18 @@
-import os
-import anthropic
 from fastapi import HTTPException
-from openai import AsyncOpenAI
-from google import genai
 
+from constants.llm import (
+    DEFAULT_ANTHROPIC_MODEL,
+    DEFAULT_GOOGLE_MODEL,
+    DEFAULT_OPENAI_MODEL,
+)
 from enums.llm_provider import LLMProvider
 from utils.get_env import (
-    get_anthropic_api_key_env,
     get_anthropic_model_env,
-    get_custom_llm_api_key_env,
-    get_custom_llm_url_env,
     get_custom_model_env,
-    get_google_api_key_env,
+    get_google_model_env,
     get_llm_provider_env,
     get_ollama_model_env,
-    get_ollama_url_env,
-    get_openai_api_key_env,
+    get_openai_model_env,
 )
 
 
@@ -25,14 +22,10 @@ def get_llm_provider():
     except:
         raise HTTPException(
             status_code=500,
-            detail=f"Invalid LLM provider. Please select one of: openai, google, ollama, custom",
+            detail=f"Invalid LLM provider. Please select one of: openai, google, anthropic, ollama, custom",
         )
 
 
-def get_ollama_url():
-    return get_ollama_url_env() or "http://localhost:11434"
-
-
 def is_openai_selected():
     return get_llm_provider() == LLMProvider.OPENAI
 
@@ -53,100 +46,20 @@ def is_custom_llm_selected():
     return get_llm_provider() == LLMProvider.CUSTOM
 
 
-def get_model_base_url():
-    selected_llm = get_llm_provider()
-
-    if selected_llm == LLMProvider.OPENAI:
-        return "https://api.openai.com/v1"
-    elif selected_llm == LLMProvider.GOOGLE:
-        return "https://generativelanguage.googleapis.com/v1beta/openai"
-    elif selected_llm == LLMProvider.ANTHROPIC:
-        return "https://api.anthropic.com/v1"
-    elif selected_llm == LLMProvider.OLLAMA:
-        return os.path.join(get_ollama_url(), "v1")
-    elif selected_llm == LLMProvider.CUSTOM:
-        return get_custom_llm_url_env()
-    else:
-        raise HTTPException(f"LLM provider {selected_llm} is not supported")
-
-
-def get_llm_api_key():
+def get_model():
     selected_llm = get_llm_provider()
     if selected_llm == LLMProvider.OPENAI:
-        return get_openai_api_key_env()
+        return get_openai_model_env() or DEFAULT_OPENAI_MODEL
     elif selected_llm == LLMProvider.GOOGLE:
-        return get_google_api_key_env()
+        return get_google_model_env() or DEFAULT_GOOGLE_MODEL
     elif selected_llm == LLMProvider.ANTHROPIC:
-        return get_anthropic_api_key_env()
-    elif selected_llm == LLMProvider.OLLAMA:
-        return "ollama"
-    elif selected_llm == LLMProvider.CUSTOM:
-        return get_custom_llm_api_key_env() or "none"
-    else:
-        raise HTTPException(f"LLM provider {selected_llm} is not supported")
-
-
-def get_llm_client():
-    client = AsyncOpenAI(
-        base_url=get_model_base_url(),
-        api_key=get_llm_api_key(),
-    )
-    return client
-
-
-def get_google_llm_client():
-    client = genai.Client(api_key=get_google_api_key_env())
-    return client
-
-
-def get_anthropic_llm_client():
-    client = anthropic.AsyncAnthropic(api_key=get_anthropic_api_key_env())
-    return client
-
-
-def get_large_model():
-    selected_llm = get_llm_provider()
-    if selected_llm == LLMProvider.OPENAI:
-        return "gpt-4.1"
-    elif selected_llm == LLMProvider.GOOGLE:
-        return "gemini-2.0-flash"
-    elif selected_llm == LLMProvider.ANTHROPIC:
-        return get_anthropic_model_env()
+        return get_anthropic_model_env() or DEFAULT_ANTHROPIC_MODEL
     elif selected_llm == LLMProvider.OLLAMA:
         return get_ollama_model_env()
     elif selected_llm == LLMProvider.CUSTOM:
         return get_custom_model_env()
     else:
-        raise ValueError(f"Invalid LLM model")
-
-
-def get_small_model():
-    selected_llm = get_llm_provider()
-    if selected_llm == LLMProvider.OPENAI:
-        return "gpt-4.1-mini"
-    elif selected_llm == LLMProvider.GOOGLE:
-        return "gemini-2.0-flash"
-    elif selected_llm == LLMProvider.ANTHROPIC:
-        return get_anthropic_model_env()
-    elif selected_llm == LLMProvider.OLLAMA:
-        return get_ollama_model_env()
-    elif selected_llm == LLMProvider.CUSTOM:
-        return get_custom_model_env()
-    else:
-        raise ValueError(f"Invalid LLM model")
-
-
-def get_nano_model():
-    selected_llm = get_llm_provider()
-    if selected_llm == LLMProvider.OPENAI:
-        return "gpt-4.1-nano"
-    elif selected_llm == LLMProvider.GOOGLE:
-        return "gemini-2.0-flash"
-    elif selected_llm == LLMProvider.ANTHROPIC:
-        return get_anthropic_model_env()
-    elif selected_llm == LLMProvider.OLLAMA:
-        return get_ollama_model_env()
-    elif selected_llm == LLMProvider.CUSTOM:
-        return get_custom_model_env()
-    else:
-        raise ValueError(f"Invalid LLM model")
+        raise HTTPException(
+            status_code=500,
+            detail=f"Invalid LLM provider. Please select one of: openai, google, anthropic, ollama, custom",
+        )
diff --git a/servers/fastapi/utils/model_availability.py b/servers/fastapi/utils/model_availability.py
index 210fcdd2..a546640e 100644
--- a/servers/fastapi/utils/model_availability.py
+++ b/servers/fastapi/utils/model_availability.py
@@ -1,11 +1,19 @@
-import os
 from constants.supported_ollama_models import SUPPORTED_OLLAMA_MODELS
+from constants.llm import OPENAI_URL
 from enums.image_provider import ImageProvider
 from enums.llm_provider import LLMProvider
-from utils.custom_llm_provider import list_available_custom_models
+from utils.available_models import (
+    list_available_anthropic_models,
+    list_available_google_models,
+    list_available_openai_compatible_models,
+)
 from utils.get_env import (
+    get_anthropic_api_key_env,
+    get_anthropic_model_env,
     get_can_change_keys_env,
+    get_google_model_env,
     get_openai_api_key_env,
+    get_openai_model_env,
     get_pixabay_api_key_env,
     get_pexels_api_key_env,
 )
@@ -20,13 +28,7 @@ from utils.llm_provider import (
     is_ollama_selected,
 )
 from utils.ollama import pull_ollama_model
-from utils.image_provider import (
-    get_selected_image_provider,
-    is_pixels_selected,
-    is_pixabay_selected,
-    is_gemini_flash_selected,
-    is_dalle3_selected,
-)
+from utils.image_provider import get_selected_image_provider
 
 
 async def check_llm_and_image_provider_api_or_model_availability():
@@ -36,11 +38,41 @@ async def check_llm_and_image_provider_api_or_model_availability():
             openai_api_key = get_openai_api_key_env()
             if not openai_api_key:
                 raise Exception("OPENAI_API_KEY must be provided")
+            openai_model = get_openai_model_env()
+            if openai_model:
+                available_models = await list_available_openai_compatible_models(
+                    OPENAI_URL, openai_api_key
+                )
+                if openai_model not in available_models:
+                    print("-" * 50)
+                    print("Available models: ", available_models)
+                    raise Exception(f"Model {openai_model} is not available")
 
         elif get_llm_provider() == LLMProvider.GOOGLE:
             google_api_key = get_google_api_key_env()
             if not google_api_key:
                 raise Exception("GOOGLE_API_KEY must be provided")
+            google_model = get_google_model_env()
+            if google_model:
+                available_models = await list_available_google_models(google_api_key)
+                if google_model not in available_models:
+                    print("-" * 50)
+                    print("Available models: ", available_models)
+                    raise Exception(f"Model {google_model} is not available")
+
+        elif get_llm_provider() == LLMProvider.ANTHROPIC:
+            anthropic_api_key = get_anthropic_api_key_env()
+            if not anthropic_api_key:
+                raise Exception("ANTHROPIC_API_KEY must be provided")
+            anthropic_model = get_anthropic_model_env()
+            if anthropic_model:
+                available_models = await list_available_anthropic_models(
+                    anthropic_api_key
+                )
+                if anthropic_model not in available_models:
+                    print("-" * 50)
+                    print("Available models: ", available_models)
+                    raise Exception(f"Model {anthropic_model} is not available")
 
         elif is_ollama_selected():
             ollama_model = get_ollama_model_env()
@@ -67,14 +99,12 @@ async def check_llm_and_image_provider_api_or_model_availability():
                 raise Exception("CUSTOM_LLM_URL must be provided")
             if not custom_llm_api_key:
                 raise Exception("CUSTOM_LLM_API_KEY must be provided")
-            print("-" * 50)
-            print("Selecting model: ", custom_model)
-            models = await list_available_custom_models(
+            available_models = await list_available_openai_compatible_models(
                 custom_llm_url, custom_llm_api_key
             )
-            print("Available models: ", models)
             print("-" * 50)
-            if custom_model not in models:
+            print("Available models: ", available_models)
+            if custom_model not in available_models:
                 raise Exception(f"Model {custom_model} is not available")
 
         # Check for Image Provider and API keys
diff --git a/servers/fastapi/utils/ollama.py b/servers/fastapi/utils/ollama.py
index 10c8500f..928ee895 100644
--- a/servers/fastapi/utils/ollama.py
+++ b/servers/fastapi/utils/ollama.py
@@ -1,7 +1,7 @@
-from http.client import HTTPException
 import json
 from typing import AsyncGenerator
 import aiohttp
+from fastapi import HTTPException
 
 from models.ollama_model_status import OllamaModelStatus
 from utils.get_env import get_ollama_url_env
diff --git a/servers/fastapi/utils/process_slides.py b/servers/fastapi/utils/process_slides.py
index 2623f95f..81a0a6b5 100644
--- a/servers/fastapi/utils/process_slides.py
+++ b/servers/fastapi/utils/process_slides.py
@@ -17,23 +17,23 @@ async def process_slide_and_fetch_assets(
 
     async_tasks = []
 
-    image_paths = get_dict_paths_with_key(slide.content, "image_prompt_")
-    icon_paths = get_dict_paths_with_key(slide.content, "icon_query_")
+    image_paths = get_dict_paths_with_key(slide.content, "__image_prompt__")
+    icon_paths = get_dict_paths_with_key(slide.content, "__icon_query__")
 
     for image_path in image_paths:
-        image_prompt_parent = get_dict_at_path(slide.content, image_path)
+        __image_prompt__parent = get_dict_at_path(slide.content, image_path)
         async_tasks.append(
             image_generation_service.generate_image(
                 ImagePrompt(
-                    prompt=image_prompt_parent["image_prompt_"],
+                    prompt=__image_prompt__parent["__image_prompt__"],
                 )
             )
         )
 
     for icon_path in icon_paths:
-        icon_query_parent = get_dict_at_path(slide.content, icon_path)
+        __icon_query__parent = get_dict_at_path(slide.content, icon_path)
         async_tasks.append(
-            icon_finder_service.search_icons(icon_query_parent["icon_query_"])
+            icon_finder_service.search_icons(__icon_query__parent["__icon_query__"])
         )
 
     results = await asyncio.gather(*async_tasks)
@@ -45,14 +45,14 @@ async def process_slide_and_fetch_assets(
         result = results.pop()
         if isinstance(result, ImageAsset):
             return_assets.append(result)
-            image_dict["image_url_"] = result.path
+            image_dict["__image_url__"] = result.path
         else:
-            image_dict["image_url_"] = result
+            image_dict["__image_url__"] = result
         set_dict_at_path(slide.content, image_path, image_dict)
 
     for icon_path in icon_paths:
         icon_dict = get_dict_at_path(slide.content, icon_path)
-        icon_dict["icon_url_"] = results.pop()[0]
+        icon_dict["__icon_url__"] = results.pop()[0]
         set_dict_at_path(slide.content, icon_path, icon_dict)
 
     return return_assets
@@ -66,34 +66,34 @@ async def process_old_and_new_slides_and_fetch_assets(
 ) -> List[ImageAsset]:
     # Finds all old images
     old_image_dict_paths = get_dict_paths_with_key(
-        old_slide_content, "image_prompt_"
+        old_slide_content, "__image_prompt__"
     )
     old_image_dicts = [
         get_dict_at_path(old_slide_content, path) for path in old_image_dict_paths
     ]
     old_image_prompts = [
-        old_image_dict["image_prompt_"] for old_image_dict in old_image_dicts
+        old_image_dict["__image_prompt__"] for old_image_dict in old_image_dicts
     ]
 
     # Finds all old icons
-    old_icon_dict_paths = get_dict_paths_with_key(old_slide_content, "icon_query_")
+    old_icon_dict_paths = get_dict_paths_with_key(old_slide_content, "__icon_query__")
     old_icon_dicts = [
         get_dict_at_path(old_slide_content, path) for path in old_icon_dict_paths
     ]
     old_icon_queries = [
-        old_icon_dict["icon_query_"] for old_icon_dict in old_icon_dicts
+        old_icon_dict["__icon_query__"] for old_icon_dict in old_icon_dicts
     ]
 
     # Finds all new images
     new_image_dict_paths = get_dict_paths_with_key(
-        new_slide_content, "image_prompt_"
+        new_slide_content, "__image_prompt__"
     )
     new_image_dicts = [
         get_dict_at_path(new_slide_content, path) for path in new_image_dict_paths
     ]
 
     # Finds all new icons
-    new_icon_dict_paths = get_dict_paths_with_key(new_slide_content, "icon_query_")
+    new_icon_dict_paths = get_dict_paths_with_key(new_slide_content, "__icon_query__")
     new_icon_dicts = [
         get_dict_at_path(new_slide_content, path) for path in new_icon_dict_paths
     ]
@@ -109,18 +109,18 @@ async def process_old_and_new_slides_and_fetch_assets(
     # Creates async tasks for fetching new images
     # Use old image url if prompt is same
     for new_image in new_image_dicts:
-        if new_image["image_prompt_"] in old_image_prompts:
+        if new_image["__image_prompt__"] in old_image_prompts:
             old_image_url = old_image_dicts[
-                old_image_prompts.index(new_image["image_prompt_"])
-            ]["image_url_"]
-            new_image["image_url_"] = old_image_url
+                old_image_prompts.index(new_image["__image_prompt__"])
+            ]["__image_url__"]
+            new_image["__image_url__"] = old_image_url
             new_images_fetch_status.append(False)
             continue
 
         async_image_fetch_tasks.append(
             image_generation_service.generate_image(
                 ImagePrompt(
-                    prompt=new_image["image_prompt_"],
+                    prompt=new_image["__image_prompt__"],
                 )
             )
         )
@@ -129,16 +129,16 @@ async def process_old_and_new_slides_and_fetch_assets(
     # Creates async tasks for fetching new icons
     # Use old icon url if query is same
     for new_icon in new_icon_dicts:
-        if new_icon["icon_query_"] in old_icon_queries:
+        if new_icon["__icon_query__"] in old_icon_queries:
             old_icon_url = old_icon_dicts[
-                old_icon_queries.index(new_icon["icon_query_"])
-            ]["icon_url_"]
-            new_icon["icon_url_"] = old_icon_url
+                old_icon_queries.index(new_icon["__icon_query__"])
+            ]["__icon_url__"]
+            new_icon["__icon_url__"] = old_icon_url
             new_icons_fetch_status.append(False)
             continue
 
         async_icon_fetch_tasks.append(
-            icon_finder_service.search_icons(new_icon["icon_query_"])
+            icon_finder_service.search_icons(new_icon["__icon_query__"])
         )
         new_icons_fetch_status.append(True)
 
@@ -157,11 +157,11 @@ async def process_old_and_new_slides_and_fetch_assets(
                 image_url = fetched_image.path
             else:
                 image_url = fetched_image
-            new_image_dicts[i]["image_url_"] = image_url
+            new_image_dicts[i]["__image_url__"] = image_url
 
     for i, new_icon in enumerate(new_icons):
         if new_icons_fetch_status[i]:
-            new_icon_dicts[i]["icon_url_"] = new_icons[i][0]
+            new_icon_dicts[i]["__icon_url__"] = new_icons[i][0]
 
     for i, new_image_dict in enumerate(new_image_dicts):
         set_dict_at_path(new_slide_content, new_image_dict_paths[i], new_image_dict)
diff --git a/servers/fastapi/utils/schema_utils.py b/servers/fastapi/utils/schema_utils.py
index 0f2ad6d7..ae65f002 100644
--- a/servers/fastapi/utils/schema_utils.py
+++ b/servers/fastapi/utils/schema_utils.py
@@ -1,30 +1,25 @@
 from copy import deepcopy
-from typing import List
+from typing import Any, List
 
-from utils.dict_utils import get_dict_paths_with_key, get_dict_at_path
+from openai import NOT_GIVEN
 
+from utils.dict_utils import (
+    get_dict_paths_with_key,
+    get_dict_at_path,
+    has_more_than_n_keys,
+)
 
-def resolve_refs(schema, defs):
-    if isinstance(schema, dict):
-        if "$ref" in schema:
-            ref_path = schema["$ref"]
-            if ref_path.startswith("#/$defs/"):
-                def_key = ref_path.replace("#/$defs/", "")
-                return resolve_refs(defs[def_key], defs)
-            else:
-                raise ValueError(f"Unsupported $ref path: {ref_path}")
-        else:
-            return {k: resolve_refs(v, defs) for k, v in schema.items()}
-    elif isinstance(schema, list):
-        return [resolve_refs(item, defs) for item in schema]
-    else:
-        return schema
-
-
-def flatten_schema(schema):
-    schema = deepcopy(schema)
-    defs = schema.pop("$defs", {})
-    return resolve_refs(schema, defs)
+supported_string_formats = [
+    "date-time",
+    "time",
+    "date",
+    "duration",
+    "email",
+    "hostname",
+    "ipv4",
+    "ipv6",
+    "uuid",
+]
 
 
 def remove_fields_from_schema(schema: dict, fields_to_remove: List[str]):
@@ -50,6 +45,138 @@ def remove_fields_from_schema(schema: dict, fields_to_remove: List[str]):
     return schema
 
 
+# From OpenAI
+def ensure_strict_json_schema(
+    json_schema: object,
+    *,
+    path: tuple[str, ...],
+    root: dict[str, object],
+) -> dict[str, Any]:
+    """Mutates the given JSON schema to ensure it conforms to the `strict` standard
+    that the API expects.
+    """
+    if not isinstance(json_schema, dict):
+        raise TypeError(f"Expected {json_schema} to be a dictionary; path={path}")
+
+    defs = json_schema.get("$defs")
+    if isinstance(defs, dict):
+        for def_name, def_schema in defs.items():
+            ensure_strict_json_schema(
+                def_schema, path=(*path, "$defs", def_name), root=root
+            )
+
+    definitions = json_schema.get("definitions")
+    if isinstance(definitions, dict):
+        for definition_name, definition_schema in definitions.items():
+            ensure_strict_json_schema(
+                definition_schema,
+                path=(*path, "definitions", definition_name),
+                root=root,
+            )
+
+    typ = json_schema.get("type")
+    if typ == "object" and "additionalProperties" not in json_schema:
+        json_schema["additionalProperties"] = False
+
+    # object types
+    # { 'type': 'object', 'properties': { 'a':  {...} } }
+    properties = json_schema.get("properties")
+    if isinstance(properties, dict):
+        json_schema["required"] = [prop for prop in properties.keys()]
+        json_schema["properties"] = {
+            key: ensure_strict_json_schema(
+                prop_schema, path=(*path, "properties", key), root=root
+            )
+            for key, prop_schema in properties.items()
+        }
+
+    # arrays
+    # { 'type': 'array', 'items': {...} }
+    items = json_schema.get("items")
+    if isinstance(items, dict):
+        json_schema["items"] = ensure_strict_json_schema(
+            items, path=(*path, "items"), root=root
+        )
+
+    # unions
+    any_of = json_schema.get("anyOf")
+    if isinstance(any_of, list):
+        json_schema["anyOf"] = [
+            ensure_strict_json_schema(variant, path=(*path, "anyOf", str(i)), root=root)
+            for i, variant in enumerate(any_of)
+        ]
+
+    # intersections
+    all_of = json_schema.get("allOf")
+    if isinstance(all_of, list):
+        if len(all_of) == 1:
+            json_schema.update(
+                ensure_strict_json_schema(
+                    all_of[0], path=(*path, "allOf", "0"), root=root
+                )
+            )
+            json_schema.pop("allOf")
+        else:
+            json_schema["allOf"] = [
+                ensure_strict_json_schema(
+                    entry, path=(*path, "allOf", str(i)), root=root
+                )
+                for i, entry in enumerate(all_of)
+            ]
+
+    # string
+    if typ == "string":
+        if "format" in json_schema:
+            if json_schema["format"] not in supported_string_formats:
+                del json_schema["format"]
+
+    # strip `None` defaults as there's no meaningful distinction here
+    # the schema will still be `nullable` and the model will default
+    # to using `None` anyway
+    if json_schema.get("default", NOT_GIVEN) is None:
+        json_schema.pop("default")
+
+    # we can't use `$ref`s if there are also other properties defined, e.g.
+    # `{"$ref": "...", "description": "my description"}`
+    #
+    # so we unravel the ref
+    # `{"type": "string", "description": "my description"}`
+    ref = json_schema.get("$ref")
+    if ref and has_more_than_n_keys(json_schema, 1):
+        assert isinstance(ref, str), f"Received non-string $ref - {ref}"
+
+        resolved = resolve_ref(root=root, ref=ref)
+        if not isinstance(resolved, dict):
+            raise ValueError(
+                f"Expected `$ref: {ref}` to resolved to a dictionary but got {resolved}"
+            )
+
+        # properties from the json schema take priority over the ones on the `$ref`
+        json_schema.update({**resolved, **json_schema})
+        json_schema.pop("$ref")
+        # Since the schema expanded from `$ref` might not have `additionalProperties: false` applied,
+        # we call `_ensure_strict_json_schema` again to fix the inlined schema and ensure it's valid.
+        return ensure_strict_json_schema(json_schema, path=path, root=root)
+
+    return json_schema
+
+
+def resolve_ref(*, root: dict[str, object], ref: str) -> object:
+    if not ref.startswith("#/"):
+        raise ValueError(f"Unexpected $ref format {ref!r}; Does not start with #/")
+
+    path = ref[2:].split("/")
+    resolved = root
+    for key in path:
+        value = resolved[key]
+        assert isinstance(
+            value, dict
+        ), f"encountered non-dictionary entry while resolving {ref} - {resolved}"
+        resolved = value
+
+    return resolved
+
+
 # ? Not used
 def generate_constraint_sentences(schema: dict) -> str:
     """
diff --git a/servers/fastapi/utils/set_env.py b/servers/fastapi/utils/set_env.py
index 1b63f95c..5566d800 100644
--- a/servers/fastapi/utils/set_env.py
+++ b/servers/fastapi/utils/set_env.py
@@ -25,10 +25,18 @@ def set_openai_api_key_env(value):
     os.environ["OPENAI_API_KEY"] = value
 
 
+def set_openai_model_env(value):
+    os.environ["OPENAI_MODEL"] = value
+
+
 def set_google_api_key_env(value):
     os.environ["GOOGLE_API_KEY"] = value
 
 
+def set_google_model_env(value):
+    os.environ["GOOGLE_MODEL"] = value
+
+
 def set_anthropic_api_key_env(value):
     os.environ["ANTHROPIC_API_KEY"] = value
 
diff --git a/servers/fastapi/utils/user_config.py b/servers/fastapi/utils/user_config.py
index a494b340..d1ddd20a 100644
--- a/servers/fastapi/utils/user_config.py
+++ b/servers/fastapi/utils/user_config.py
@@ -9,10 +9,12 @@ from utils.get_env import (
     get_custom_llm_url_env,
     get_custom_model_env,
     get_google_api_key_env,
+    get_google_model_env,
     get_llm_provider_env,
     get_ollama_model_env,
     get_ollama_url_env,
     get_openai_api_key_env,
+    get_openai_model_env,
     get_pexels_api_key_env,
     get_user_config_path_env,
     get_image_provider_env,
@@ -27,10 +29,12 @@ from utils.set_env import (
     set_custom_model_env,
     set_extended_reasoning_env,
     set_google_api_key_env,
+    set_google_model_env,
     set_llm_provider_env,
     set_ollama_model_env,
     set_ollama_url_env,
     set_openai_api_key_env,
+    set_openai_model_env,
     set_pexels_api_key_env,
     set_image_provider_env,
     set_pixabay_api_key_env,
@@ -58,7 +62,9 @@ def get_user_config():
     return UserConfig(
         LLM=existing_config.LLM or get_llm_provider_env(),
         OPENAI_API_KEY=existing_config.OPENAI_API_KEY or get_openai_api_key_env(),
+        OPENAI_MODEL=existing_config.OPENAI_MODEL or get_openai_model_env(),
         GOOGLE_API_KEY=existing_config.GOOGLE_API_KEY or get_google_api_key_env(),
+        GOOGLE_MODEL=existing_config.GOOGLE_MODEL or get_google_model_env(),
         ANTHROPIC_API_KEY=existing_config.ANTHROPIC_API_KEY
         or get_anthropic_api_key_env(),
         ANTHROPIC_MODEL=existing_config.ANTHROPIC_MODEL or get_anthropic_model_env(),
@@ -81,8 +87,12 @@ def update_env_with_user_config():
         set_llm_provider_env(user_config.LLM)
     if user_config.OPENAI_API_KEY:
         set_openai_api_key_env(user_config.OPENAI_API_KEY)
+    if user_config.OPENAI_MODEL:
+        set_openai_model_env(user_config.OPENAI_MODEL)
     if user_config.GOOGLE_API_KEY:
         set_google_api_key_env(user_config.GOOGLE_API_KEY)
+    if user_config.GOOGLE_MODEL:
+        set_google_model_env(user_config.GOOGLE_MODEL)
     if user_config.ANTHROPIC_API_KEY:
         set_anthropic_api_key_env(user_config.ANTHROPIC_API_KEY)
     if user_config.ANTHROPIC_MODEL: