Future-House · jamesbraza · Oct 20, 2025 · Oct 20, 2025 · Oct 20, 2025 · Oct 27, 2025
diff --git a/README.md b/README.md
@@ -451,7 +451,7 @@ asyncio.run(main())
 
 ### Choosing Model
 
-By default, PaperQA2 uses OpenAI's `gpt-4o-2024-11-20` model for the
+By default, PaperQA2 uses OpenAI's `gpt-5-2025-08-07` model for the
 `summary_llm`, `llm`, and `agent_llm`.
 Please see the [Settings Cheatsheet](#settings-cheatsheet)
 for more information on these settings.
@@ -895,13 +895,13 @@ will return much faster than the first query and we'll be certain the authors ma
 
 | Setting                                      | Default                                | Description                                                                                                                   |
 | -------------------------------------------- | -------------------------------------- | ----------------------------------------------------------------------------------------------------------------------------- |
-| `llm`                                        | `"gpt-4o-2024-11-20"`                  | LLM for general use including metadata inference (see Docs.aadd) and answer generation (see Docs.aquery and gen_answer tool). |
+| `llm`                                        | `"gpt-5-2025-08-07"`                   | LLM for general use including metadata inference (see Docs.aadd) and answer generation (see Docs.aquery and gen_answer tool). |
 | `llm_config`                                 | `None`                                 | Optional configuration for `llm`.                                                                                             |
-| `summary_llm`                                | `"gpt-4o-2024-11-20"`                  | LLM for creating contextual summaries (see Docs.aget_evidence and gather_evidence tool).                                      |
+| `summary_llm`                                | `"gpt-5-2025-08-07"`                   | LLM for creating contextual summaries (see Docs.aget_evidence and gather_evidence tool).                                      |
 | `summary_llm_config`                         | `None`                                 | Optional configuration for `summary_llm`.                                                                                     |
 | `embedding`                                  | `"text-embedding-3-small"`             | Embedding model for embedding text chunks when adding papers.                                                                 |
 | `embedding_config`                           | `None`                                 | Optional configuration for `embedding`.                                                                                       |
-| `temperature`                                | `0.0`                                  | Temperature for LLMs.                                                                                                         |
+| `temperature`                                | `1.0`                                  | Temperature for LLMs.                                                                                                         |
 | `batch_size`                                 | `1`                                    | Batch size for calling LLMs.                                                                                                  |
 | `texts_index_mmr_lambda`                     | `1.0`                                  | Lambda for MMR in text index.                                                                                                 |
 | `verbosity`                                  | `0`                                    | Integer verbosity level for logging (0-3). 3 = all LLM/Embeddings calls logged.                                               |
@@ -944,7 +944,7 @@ will return much faster than the first query and we'll be certain the authors ma
 | `prompt.summary_json_system`                 | `summary_json_system_prompt`           | System prompt for JSON summaries.                                                                                             |
 | `prompt.context_outer`                       | `CONTEXT_OUTER_PROMPT`                 | Prompt for how to format all contexts in generate answer.                                                                     |
 | `prompt.context_inner`                       | `CONTEXT_INNER_PROMPT`                 | Prompt for how to format a single context in generate answer. Must contain 'name' and 'text' variables.                       |
-| `agent.agent_llm`                            | `"gpt-4o-2024-11-20"`                  | LLM inside the agent making tool selections.                                                                                  |
+| `agent.agent_llm`                            | `"gpt-5-2025-08-07"`                   | LLM inside the agent making tool selections.                                                                                  |
 | `agent.agent_llm_config`                     | `None`                                 | Optional configuration for `agent_llm`.                                                                                       |
 | `agent.agent_type`                           | `"ToolSelector"`                       | Type of agent to use.                                                                                                         |
 | `agent.agent_config`                         | `None`                                 | Optional kwarg for AGENT constructor.                                                                                         |

diff --git a/src/paperqa/agents/helpers.py b/src/paperqa/agents/helpers.py
@@ -26,9 +26,9 @@ def get_year(ts: datetime | None = None) -> str:
 
 async def litellm_get_search_query(
     question: str,
+    llm: LLMModel | str,
     count: int,
     template: str | None = None,
-    llm: LLMModel | str = "gpt-4o-mini",
     temperature: float = 1.0,
 ) -> list[str]:
     search_prompt = ""

diff --git a/src/paperqa/agents/models.py b/src/paperqa/agents/models.py
@@ -66,7 +66,7 @@ def strip_answer(
         v.filter_content_for_user()
         return v
 
-    async def get_summary(self, llm_model: LLMModel | str = "gpt-4o") -> str:
+    async def get_summary(self, llm_model: LLMModel | str) -> str:
         sys_prompt = (
             "Revise the answer to a question to be a concise SMS message. "
             "Use abbreviations or emojis if necessary."

diff --git a/src/paperqa/settings.py b/src/paperqa/settings.py
@@ -11,12 +11,7 @@
 
 import anyio
 from aviary.core import Tool, ToolSelector
-from lmi import (
-    CommonLLMNames,
-    EmbeddingModel,
-    LiteLLMModel,
-    embedding_model_factory,
-)
+from lmi import CommonLLMNames, EmbeddingModel, LiteLLMModel, embedding_model_factory
 from pydantic import (
     BaseModel,
     ConfigDict,
@@ -525,7 +520,7 @@ class AgentSettings(BaseModel):
     model_config = ConfigDict(extra="forbid")
 
     agent_llm: str = Field(
-        default=CommonLLMNames.GPT_4O.value,
+        default=CommonLLMNames.GPT_5.value,
         description="LLM inside the agent making tool selections.",
     )
 
@@ -693,7 +688,7 @@ class Settings(BaseSettings):
     model_config = SettingsConfigDict(extra="ignore")
 
     llm: str = Field(
-        default=CommonLLMNames.GPT_4O.value,
+        default=CommonLLMNames.GPT_5.value,
         description=(
             "LLM for general use including metadata inference (see Docs.aadd)"
             " and answer generation (see Docs.aquery and gen_answer tool)."
@@ -717,7 +712,7 @@ class Settings(BaseSettings):
         ),
     )
     summary_llm: str = Field(
-        default=CommonLLMNames.GPT_4O.value,
+        default=CommonLLMNames.GPT_5.value,
         description=(
             "LLM for creating contextual summaries"
             " (see Docs.aget_evidence and gather_evidence tool)."
@@ -741,7 +736,10 @@ class Settings(BaseSettings):
         default=None,
         description="Optional configuration for the embedding model.",
     )
-    temperature: float = Field(default=0.0, description="Temperature for LLMs.")
+    temperature: float = Field(
+        default=1.0,
+        description="Temperature for LLMs, default is 1 for compatibility with OpenAI's GPT-5.",
+    )
     batch_size: int = Field(default=1, description="Batch size for calling LLMs.")
     texts_index_mmr_lambda: float = Field(
         default=1.0, description="Lambda for MMR in text index."