int/eval.sh at main · intervention-training/int · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
#!/bin/bash
# Slurm batch script that runs ~/int/sample_rollouts.py on one 30-example
# slice of the CMU-AIRe/InT-test-set "test" split.
#
# Usage (presumably): sbatch eval.sh BATCH_NUMBER
#   BATCH_NUMBER  read from $1; slice covers dataset indices
#                 [BATCH_NUMBER*30, (BATCH_NUMBER+1)*30).
#
# Resource request below: 1 node, 1 task, 16 CPUs per task, 1 GPU,
# 100g of memory, 12-hour time limit, partition "ghx4".
# NOTE(review): --account=ACCOUNT looks like a placeholder to be replaced
# with a real allocation name before submitting — confirm.
#SBATCH --mem=100g
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --ntasks-per-socket=1
#SBATCH --cpus-per-task=16
#SBATCH --partition=ghx4
#SBATCH --time=12:00:00
#SBATCH --account=ACCOUNT
#SBATCH --gpus-per-node=1
#SBATCH --gpu-bind=verbose,closest


# Per-user cache directories under /tmp for Triton, vLLM, torch.compile /
# TorchInductor and Hugging Face.
# NOTE(review): presumably chosen to keep caches off shared storage — confirm.
cache_root="/tmp/$USER"

mkdir -p -- \
    "$cache_root/triton_cache" \
    "$cache_root/vllm_cache" \
    "$cache_root/torch_cache" \
    "$cache_root/hf_cache"

export TRITON_CACHE_DIR="$cache_root/triton_cache"
export VLLM_CACHE_ROOT="$cache_root/vllm_cache"
# Both torch variables intentionally share the same directory.
export TORCH_COMPILE_CACHE_DIR="$cache_root/torch_cache"
export TORCHINDUCTOR_CACHE_DIR="$cache_root/torch_cache"
export HF_HOME="$cache_root/hf_cache"

# First positional argument: index of the 30-example dataset slice to evaluate.
batch_number=$1

# NOTE(review): the three values below look like placeholders that must be
# replaced with real paths before the job is submitted — confirm.
model_path=MODEL_PATH
logs_path=LOGS_PATH
output_path=OUTPUT_PATH

# Quoted so that real paths containing spaces or glob characters stay intact.
mkdir -p -- "$logs_path" "$output_path"

# Record where logs go and which model is evaluated (one value per line).
printf '%s\n' "$logs_path" "$model_path"

# Refuse to run without a valid batch number: an empty value would silently
# evaluate to 0 in shell arithmetic and re-run slice 0, logging to "eval_.log".
if ! [[ $batch_number =~ ^[0-9]+$ ]]; then
    printf 'error: batch number (first argument) must be a non-negative integer, got: %q\n' \
        "$batch_number" >&2
    exit 2
fi

# Number of dataset examples handled by one job; slice is [start, end).
samples_per_batch=30
# 10# forces base 10 so a zero-padded value such as "08" is not parsed as octal.
dataset_start=$(( 10#$batch_number * samples_per_batch ))
dataset_end=$(( (10#$batch_number + 1) * samples_per_batch ))

# Activate the "vllm" conda environment; abort rather than run the job with
# whatever python happens to be on PATH.
source /user/miniconda3/bin/activate vllm || {
    printf 'error: failed to activate conda environment "vllm"\n' >&2
    exit 1
}

# Sample 128 rollouts (-K) per example for this slice. stdout and stderr both
# go to the per-batch log file; PYTHONUNBUFFERED keeps that log up to date.
# This stays the last command so the script exits with python's status.
PYTHONUNBUFFERED=1 python ~/int/sample_rollouts.py \
    --input_dataset_name CMU-AIRe/InT-test-set \
    --dataset_split test \
    --dataset_start "$dataset_start" \
    --dataset_end "$dataset_end" \
    --output_path "$output_path" \
    -K 128 \
    --model "$model_path" \
    --temperature 0.7 \
    --top_p 0.8 \
    --top_k 20 \
    --max_tokens 16384 \
    --tensor_parallel_size 1 \
    --batch_size 15 > "$logs_path/eval_${batch_number}.log" 2>&1