Skip to content

Commit 5e8378b

Browse files
committed
Adds in support for gpt-5-mini
1 parent eccd49b commit 5e8378b

File tree

4 files changed

+8
-7
lines changed

4 files changed

+8
-7
lines changed

express-server/src/pipeline/retryConfig.ts

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -34,12 +34,12 @@ export const TEST_RETRY_OPTIONS = {
3434
*/
3535
export const HTTP_TIMEOUTS = {
3636
// 200 minutes (12,000,000 ms) per request - LLM processing can take time
37-
REQUEST_TIMEOUT: 120000,
38-
HEADERS_TIMEOUT: 120000,
39-
BODY_TIMEOUT: 120000,
40-
KEEP_ALIVE_TIMEOUT: 30000,
37+
REQUEST_TIMEOUT: 12000000,
38+
HEADERS_TIMEOUT: 12000000,
39+
BODY_TIMEOUT: 12000000,
40+
KEEP_ALIVE_TIMEOUT: 3000000,
4141
// Total operation timeout to prevent indefinite hangs (800 minutes / 48,000,000 ms with retries)
42-
OPERATION_TIMEOUT: 480000,
42+
OPERATION_TIMEOUT: 48000000,
4343
} as const;
4444

4545
/**

pyserver/config.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@
1818
# or: input is $0.0025/1K tokens, output is $0.01/1K tokens
1919
"gpt-4o": {"in_per_1K": 0.0025, "out_per_1K": 0.01},
2020
# GPT-5-mini: Input is $0.250 / 1M tokens, Output is $2.00/1M tokens
21-
"gpt-5-mini": {"in_per_1K": 0.00025, "out_per_1k": 0.002}
21+
"gpt-5-mini": {"in_per_1K": 0.00025, "out_per_1K": 0.002}
2222
}
2323

2424
# for web-app mode, require at least 3 words in order to extract meaningful claims

pyserver/test_pipeline.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -53,7 +53,7 @@
5353
# NOTE: gpt-4o-mini is cheaper/better for basic tests, but it fails on some very basic deduplication
5454
API_KEY = os.getenv('OPENAI_API_KEY')
5555
base_llm = {
56-
"model_name" : "gpt-4o-mini",
56+
"model_name" : "gpt-5-mini",
5757
"system_prompt": config.SYSTEM_PROMPT,
5858
"api_key" : API_KEY
5959
}

pyserver/utils.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,7 @@ def token_cost(model_name:str, tok_in:int, tok_out:int):
2121
if model_name not in config.COST_BY_MODEL:
2222
print("model undefined!")
2323
return -1
24+
2425
return 0.001 * (tok_in * config.COST_BY_MODEL[model_name]["in_per_1K"] + tok_out * config.COST_BY_MODEL[model_name]["out_per_1K"])
2526

2627
def cute_print(json_obj):

0 commit comments

Comments
 (0)