Adds support for gpt-5-mini

juggler434 · juggler434 · commit 5e8378b90fee · 2025-09-10T11:22:06.000-07:00
diff --git a/express-server/src/pipeline/retryConfig.ts b/express-server/src/pipeline/retryConfig.ts
@@ -34,12 +34,12 @@ export const TEST_RETRY_OPTIONS = {
  */
 export const HTTP_TIMEOUTS = {
   // 2 minutes per request - LLM processing can take time
-  REQUEST_TIMEOUT: 120000,
-  HEADERS_TIMEOUT: 120000,
-  BODY_TIMEOUT: 120000,
-  KEEP_ALIVE_TIMEOUT: 30000,
+  REQUEST_TIMEOUT: 12000000,
+  HEADERS_TIMEOUT: 12000000,
+  BODY_TIMEOUT: 12000000,
+  KEEP_ALIVE_TIMEOUT: 3000000,
   // Total operation timeout to prevent indefinite hangs (8 minutes with retries)
-  OPERATION_TIMEOUT: 480000,
+  OPERATION_TIMEOUT: 48000000,
 } as const;
 
 /**
diff --git a/pyserver/config.py b/pyserver/config.py
@@ -18,7 +18,7 @@
     # or: input is $0.0025/1K tokens, output is $0.01/1K tokens
     "gpt-4o": {"in_per_1K": 0.0025, "out_per_1K": 0.01},
     # GPT-5-mini: Input is $0.250 / 1M tokens, Output is $2.00/1M tokens
-    "gpt-5-mini": {"in_per_1K": 0.00025, "out_per_1k": 0.002}
+    "gpt-5-mini": {"in_per_1K": 0.00025, "out_per_1K": 0.002}
 }
 
 # for web-app mode, require at least 3 words in order to extract meaningful claims
diff --git a/pyserver/test_pipeline.py b/pyserver/test_pipeline.py
@@ -53,7 +53,7 @@
 # NOTE: gpt-4o-mini is cheaper/better for basic tests, but it fails on some very basic deduplication
 API_KEY = os.getenv('OPENAI_API_KEY')
 base_llm = {
-  "model_name" : "gpt-4o-mini",
+  "model_name" : "gpt-5-mini",
   "system_prompt": config.SYSTEM_PROMPT,
   "api_key" : API_KEY
 }
diff --git a/pyserver/utils.py b/pyserver/utils.py
@@ -21,6 +21,7 @@ def token_cost(model_name:str, tok_in:int, tok_out:int):
   if model_name not in config.COST_BY_MODEL:
     print("model undefined!")
     return -1
+
   return 0.001 * (tok_in  *  config.COST_BY_MODEL[model_name]["in_per_1K"] + tok_out * config.COST_BY_MODEL[model_name]["out_per_1K"])
 
 def cute_print(json_obj):

Original file line number	Diff line number	Diff line change
`@@ -18,7 +18,7 @@`
`18`	`18`	`# or: input is $0.0025/1K tokens, output is $0.01/1K tokens`
`19`	`19`	`"gpt-4o": {"in_per_1K": 0.0025, "out_per_1K": 0.01},`
`20`	`20`	`# GPT-5-mini: Input is $0.250 / 1M tokens, Output is $2.00/1M tokens`
`21`		`- "gpt-5-mini": {"in_per_1K": 0.00025, "out_per_1k": 0.002}`
	`21`	`+ "gpt-5-mini": {"in_per_1K": 0.00025, "out_per_1K": 0.002}`
`22`	`22`	`}`
`23`	`23`
`24`	`24`	`# for web-app mode, require at least 3 words in order to extract meaningful claims`
Original file line number	Diff line number	Diff line change
`@@ -53,7 +53,7 @@`
`53`	`53`	`# NOTE: gpt-4o-mini is cheaper/better for basic tests, but it fails on some very basic deduplication`
`54`	`54`	`API_KEY = os.getenv('OPENAI_API_KEY')`
`55`	`55`	`base_llm = {`
`56`		`- "model_name" : "gpt-4o-mini",`
	`56`	`+ "model_name" : "gpt-5-mini",`
`57`	`57`	`"system_prompt": config.SYSTEM_PROMPT,`
`58`	`58`	`"api_key" : API_KEY`
`59`	`59`	`}`