-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathrun_mcs_selection.sh
More file actions
59 lines (51 loc) · 1.63 KB
/
run_mcs_selection.sh
File metadata and controls
59 lines (51 loc) · 1.63 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
#!/bin/bash
# Launcher settings for the Multi-Choice Selection (MCS) baseline.
#
# Every variable below may be overridden from the environment. A variable
# that is unset or empty falls back to the default assigned here:
#   PYTHON_BIN       .venv/bin/python if that file is executable relative to
#                    the current directory, otherwise python3
#   ARTIFACT_ROOT    artifacts
#   DATASET_TYPE     bird
#   DATA_PATH        data/bird/dev/mini_dev.json
#   DB_ROOT_PATH     data/bird/dev/dev_databases
#   CANDIDATES_PATH  ${ARTIFACT_ROOT}/candidates/Qwen2.5-Coder-7B-Instruct_BIRD_Mini_Dev.json
#   OUTPUT_PATH      ${ARTIFACT_ROOT}/temp/Qwen2.5-Coder-7B-Instruct_BIRD_Mini_Dev_MCS.json
#   MODEL_NAME       qwen2.5-coder-7b-instruct
#   API_KEY          (empty)
#   BASE_URL         (empty)
#   TEMPERATURE      0.7
#   MAX_TOKENS       4096
#   TIMEOUT          30
#   NUM_WORKERS      8

# Strict mode: stop on an unhandled command failure, on expansion of an unset
# variable, and when any stage of a pipeline fails. Without it a misspelled
# variable name would silently expand to an empty argument.
set -euo pipefail

# --- Configuration ---
# ${PYTHON_BIN:-} keeps the test safe under `set -u` when the caller has not
# exported PYTHON_BIN.
if [[ -z "${PYTHON_BIN:-}" ]]; then
  if [[ -x ".venv/bin/python" ]]; then
    PYTHON_BIN=".venv/bin/python"
  else
    PYTHON_BIN="python3"
  fi
fi

ARTIFACT_ROOT=${ARTIFACT_ROOT:-"artifacts"}
DATASET_TYPE=${DATASET_TYPE:-"bird"}
DATA_PATH=${DATA_PATH:-"data/bird/dev/mini_dev.json"}
DB_ROOT_PATH=${DB_ROOT_PATH:-"data/bird/dev/dev_databases"}
# Both artifact paths are derived from ARTIFACT_ROOT unless set explicitly.
CANDIDATES_PATH=${CANDIDATES_PATH:-"${ARTIFACT_ROOT}/candidates/Qwen2.5-Coder-7B-Instruct_BIRD_Mini_Dev.json"}
OUTPUT_PATH=${OUTPUT_PATH:-"${ARTIFACT_ROOT}/temp/Qwen2.5-Coder-7B-Instruct_BIRD_Mini_Dev_MCS.json"}

# --- LLM Configuration ---
MODEL_NAME=${MODEL_NAME:-"qwen2.5-coder-7b-instruct"}
# API_KEY and BASE_URL default to the empty string so they are always defined;
# the rest of the script only forwards them when they are non-empty.
API_KEY=${API_KEY:-""}
BASE_URL=${BASE_URL:-""}
TEMPERATURE=${TEMPERATURE:-0.7}
MAX_TOKENS=${MAX_TOKENS:-4096}

# --- Execution Configuration ---
TIMEOUT=${TIMEOUT:-30}
NUM_WORKERS=${NUM_WORKERS:-8}
# Print a start-up banner followed by the key settings of this run, one per
# line, on stdout.
printf '%s\n' \
  "Starting Multi-Choice Selection (MCS) Baseline..." \
  "Input: $CANDIDATES_PATH" \
  "Output: $OUTPUT_PATH" \
  "Model: $MODEL_NAME" \
  "Workers: $NUM_WORKERS"
# Assemble the argument vector for the Python entry point. An array is used so
# that each value stays a single argument even if it contains whitespace.
CMD_ARGS=()

# Dataset and file locations.
CMD_ARGS+=(--dataset_type "$DATASET_TYPE" --data_path "$DATA_PATH")
CMD_ARGS+=(--db_root_path "$DB_ROOT_PATH")
CMD_ARGS+=(--pred_path "$CANDIDATES_PATH" --output_path "$OUTPUT_PATH")

# Model and sampling settings.
CMD_ARGS+=(--model_name "$MODEL_NAME")
CMD_ARGS+=(--temperature "$TEMPERATURE" --max_tokens "$MAX_TOKENS")

# Execution settings.
CMD_ARGS+=(--timeout "$TIMEOUT" --num_workers "$NUM_WORKERS")

# --api_key and --base_url are appended only when a non-empty value is set;
# otherwise the flag is left out entirely.
[[ -z "$API_KEY" ]] || CMD_ARGS+=(--api_key "$API_KEY")
[[ -z "$BASE_URL" ]] || CMD_ARGS+=(--base_url "$BASE_URL")
# Run the script.
# `exec` replaces this shell with the interpreter instead of keeping bash
# around as a parent process. Signals sent to the launcher's PID (for example
# SIGTERM from a job scheduler or `timeout`) then reach the Python process
# directly rather than killing only the wrapper, and the interpreter's exit
# status becomes the launcher's exit status.
exec "$PYTHON_BIN" baseline/run_mcs_selection.py "${CMD_ARGS[@]}"