-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy patheval.sh
More file actions
51 lines (43 loc) · 1.28 KB
/
eval.sh
File metadata and controls
51 lines (43 loc) · 1.28 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
#!/bin/bash
#SBATCH --mem=100g
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --ntasks-per-socket=1
#SBATCH --cpus-per-task=16
#SBATCH --partition=ghx4
#SBATCH --time=12:00:00
#SBATCH --account=ACCOUNT
#SBATCH --gpus-per-node=1
#SBATCH --gpu-bind=verbose,closest
# Point the Triton, vLLM, PyTorch and Hugging Face cache locations at
# per-user directories under /tmp.
#
# USER is not guaranteed to be exported in every environment; without a
# fallback the paths would collapse to /tmp//<name>_cache and be shared by
# every account on the machine. Fall back to the login name, then the uid.
cache_root="/tmp/${USER:-$(id -un 2>/dev/null || id -u)}"

# Best effort: a failure here is reported but does not abort the job, which
# matches the original behaviour of carrying on regardless.
mkdir -p -- \
  "${cache_root}/triton_cache" \
  "${cache_root}/vllm_cache" \
  "${cache_root}/torch_cache" \
  "${cache_root}/hf_cache" \
  || printf 'warning: could not create cache directories under %s\n' "${cache_root}" >&2

export TRITON_CACHE_DIR="${cache_root}/triton_cache"
export VLLM_CACHE_ROOT="${cache_root}/vllm_cache"
# Both torch variables deliberately share a single directory.
export TORCH_COMPILE_CACHE_DIR="${cache_root}/torch_cache"
export TORCHINDUCTOR_CACHE_DIR="${cache_root}/torch_cache"
export HF_HOME="${cache_root}/hf_cache"
# First positional argument: which batch of the dataset this job handles.
batch_number="${1-}"

# NOTE(review): these look like template placeholders that are meant to be
# replaced with real locations before the job is submitted — confirm.
model_path=MODEL_PATH
logs_path=LOGS_PATH
output_path=OUTPUT_PATH

# The log directory is the target of the final output redirect and the output
# directory is handed to the sampler, so stop early with a clear message
# instead of failing later on the redirect.
mkdir -p -- "$logs_path" "$output_path" || {
  printf 'error: cannot create %s or %s\n' "$logs_path" "$output_path" >&2
  exit 1
}

# Record the resolved locations in the job's stdout.
printf '%s\n' "$logs_path"
printf '%s\n' "$model_path"
# Run sample_rollouts.py on one 30-index slice of the test split and capture
# all of its output in a per-batch log file.
#
# Reads: batch_number, model_path, output_path, logs_path (set earlier in
# this script). The script's exit status is that of the python process.

# Reject a missing or non-numeric batch index. Without this an empty value is
# silently treated as batch 0 (and logs to "eval_.log"), and arbitrary text
# would be evaluated as an arithmetic expression.
if ! [[ "$batch_number" =~ ^[0-9]+$ ]]; then
  printf 'usage: %s <batch_number>  (non-negative integer, got "%s")\n' \
    "${0##*/}" "$batch_number" >&2
  exit 2
fi

# Number of dataset indices handled per job (distinct from --batch_size below).
indices_per_job=30
# 10# forces base 10 so that values such as "08" are not parsed as octal.
dataset_start=$(( 10#$batch_number * indices_per_job ))
# Equivalent to (batch_number + 1) * 30.
# NOTE(review): presumably --dataset_end is exclusive — confirm in sample_rollouts.py.
dataset_end=$(( dataset_start + indices_per_job ))

# Activate the "vllm" environment; stop rather than run whatever python
# happens to be on PATH when activation fails.
source /user/miniconda3/bin/activate vllm || {
  printf 'error: failed to activate environment "vllm"\n' >&2
  exit 1
}

# PYTHONUNBUFFERED=1 keeps the log file up to date while the job is running.
PYTHONUNBUFFERED=1 python ~/int/sample_rollouts.py \
  --input_dataset_name CMU-AIRe/InT-test-set \
  --dataset_split test \
  --dataset_start "$dataset_start" \
  --dataset_end "$dataset_end" \
  --output_path "$output_path" \
  -K 128 \
  --model "$model_path" \
  --temperature 0.7 \
  --top_p 0.8 \
  --top_k 20 \
  --max_tokens 16384 \
  --tensor_parallel_size 1 \
  --batch_size 15 > "${logs_path}/eval_${batch_number}.log" 2>&1