File size: 1,675 Bytes
81a794d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
# Shared settings used by every evaluation run in this script.
# HF_HUB_OFFLINE=1 is the Hugging Face Hub switch for offline mode
# (presumably so the eval script only uses locally cached assets -- confirm).
HF_HUB_OFFLINE=1
# Directory holding the dataset; the runs below read test.jsonl from it.
DATASET_ROOT="./evaluate/dataset/C_C++_Java_Python"
# Per-model result directories are created underneath this path.
RESULT_ROOT="./evaluate/result"
# Python entry point invoked for each run.
EVAL_SCRIPT="./dataset_eval.py"
# Export everything so child processes (python) see the values too.
export HF_HUB_OFFLINE DATASET_ROOT RESULT_ROOT EVAL_SCRIPT

# GPT-3.5-turbo
# The section label must be a comment; as a bare word the shell would try to
# execute it as a command.
# KEY is empty in this file -- presumably the API key has to be filled in
# before running (confirm).
export KEY=""
export URL="https://api.chatanywhere.tech/v1/"
export MODEL="gpt-3.5-turbo"

mkdir -p "$RESULT_ROOT/$MODEL"
# All expansions are quoted: an unquoted empty $KEY disappears after word
# splitting, leaving "-k" immediately followed by "-o" and no key argument.
# Run 1: INCLUDE_MSG=no -> nomsg.jsonl / nomsg.log
# (INCLUDE_MSG is only exported here; presumably the eval script reads it.)
export INCLUDE_MSG=no
python "$EVAL_SCRIPT" -d "$DATASET_ROOT/test.jsonl" -t online -m "$MODEL" -u "$URL" -k "$KEY" -o "$RESULT_ROOT/$MODEL/nomsg.jsonl" 2>&1 | tee "$RESULT_ROOT/$MODEL/nomsg.log"
# Run 2: INCLUDE_MSG=yes -> msg.jsonl / msg.log
export INCLUDE_MSG=yes
python "$EVAL_SCRIPT" -d "$DATASET_ROOT/test.jsonl" -t online -m "$MODEL" -u "$URL" -k "$KEY" -o "$RESULT_ROOT/$MODEL/msg.jsonl" 2>&1 | tee "$RESULT_ROOT/$MODEL/msg.log"

# DeepSeek-V3
# KEY is empty in this file -- presumably the API key has to be filled in
# before running (confirm).
export KEY=""
export URL="https://api.deepseek.com/v1"
export MODEL="deepseek-chat"

mkdir -p "$RESULT_ROOT/$MODEL"
# All expansions are quoted: an unquoted empty $KEY disappears after word
# splitting, leaving "-k" immediately followed by "-o" and no key argument.
# Run 1: INCLUDE_MSG=no -> nomsg.jsonl / nomsg.log
# (INCLUDE_MSG is only exported here; presumably the eval script reads it.)
export INCLUDE_MSG=no
python "$EVAL_SCRIPT" -d "$DATASET_ROOT/test.jsonl" -t online -m "$MODEL" -u "$URL" -k "$KEY" -o "$RESULT_ROOT/$MODEL/nomsg.jsonl" 2>&1 | tee "$RESULT_ROOT/$MODEL/nomsg.log"
# Run 2: INCLUDE_MSG=yes -> msg.jsonl / msg.log
export INCLUDE_MSG=yes
python "$EVAL_SCRIPT" -d "$DATASET_ROOT/test.jsonl" -t online -m "$MODEL" -u "$URL" -k "$KEY" -o "$RESULT_ROOT/$MODEL/msg.jsonl" 2>&1 | tee "$RESULT_ROOT/$MODEL/msg.log"

# qwen-coder-plus
# The section label must be a comment; as a bare word the shell would try to
# execute it as a command.
# KEY is empty in this file -- presumably the API key has to be filled in
# before running (confirm).
export KEY=""
export URL="https://dashscope.aliyuncs.com/compatible-mode/v1"
export MODEL="qwen-coder-plus"

mkdir -p "$RESULT_ROOT/$MODEL"
# All expansions are quoted: an unquoted empty $KEY disappears after word
# splitting, leaving "-k" immediately followed by "-o" and no key argument.
# Run 1: INCLUDE_MSG=no -> nomsg.jsonl / nomsg.log
# (INCLUDE_MSG is only exported here; presumably the eval script reads it.)
export INCLUDE_MSG=no
python "$EVAL_SCRIPT" -d "$DATASET_ROOT/test.jsonl" -t online -m "$MODEL" -u "$URL" -k "$KEY" -o "$RESULT_ROOT/$MODEL/nomsg.jsonl" 2>&1 | tee "$RESULT_ROOT/$MODEL/nomsg.log"
# Run 2: INCLUDE_MSG=yes -> msg.jsonl / msg.log
export INCLUDE_MSG=yes
python "$EVAL_SCRIPT" -d "$DATASET_ROOT/test.jsonl" -t online -m "$MODEL" -u "$URL" -k "$KEY" -o "$RESULT_ROOT/$MODEL/msg.jsonl" 2>&1 | tee "$RESULT_ROOT/$MODEL/msg.log"