PreMode / scripts /DMS.subset.prepare.yaml.sh
gzhong's picture
Upload folder using huggingface_hub
7718235 verified
#!/bin/bash
# Prepare the YAML config files for the subset tasks.
#
# Usage: DMS.subset.prepare.yaml.sh <scripts_dir>
#   $1  name of the scripts folder. It is expected to already contain
#       <gene>/<gene>.seed.<seed>.yaml for the genes and seeds listed below.
#
# For every gene, subset and seed the script copies
#   $1/<gene>/<gene>.seed.<seed>.yaml
# to
#   $1/<gene>.subsets/subset.<subset>/seed.<seed>.yaml
# and rewrites, inside the copy only:
#   training.csv  ->  /training.<subset>.<seed>.csv     (training dataset)
#   TL.<gene>     ->  TL.<gene>.subset.<subset>         (output log)
#
# Notes carried over from the original header:
#   - pretrain.seed.0.yaml: main file, the pretrain model.
#   - First select the best model for TL based on the validation dataset
#     in pretrain, then run this script.
#
# Exit status: 0 on success, 2 on usage error, 1 if the scripts folder is
# missing or any source YAML could not be found (remaining files are still
# processed). Requires GNU sed (in-place editing via `sed -i`).
set -euo pipefail

if [[ $# -lt 1 || -z "${1:-}" ]]; then
  printf 'Usage: %s <scripts_dir>\n' "${0##*/}" >&2
  exit 2
fi

scripts_dir=$1
if [[ ! -d "$scripts_dir" ]]; then
  printf 'error: scripts folder not found: %s\n' "$scripts_dir" >&2
  exit 1
fi

genes=(PTEN PTEN.bin CCR5 CXCR4 NUDT15 SNCA CYP2C9 GCK ASPA fluorescence)
subsets=(1 2 4 6)
seeds=(0 1 2 3 4)

status=0
for gene in "${genes[@]}"; do
  # Gene names such as "PTEN.bin" contain dots; escape them so sed matches
  # a literal '.' rather than any character.
  gene_re=${gene//./\\.}

  for subset in "${subsets[@]}"; do
    out_dir="${scripts_dir}/${gene}.subsets/subset.${subset}"
    # -p: create the parent <gene>.subsets/ too and stay quiet on re-runs.
    mkdir -p -- "$out_dir"

    for seed in "${seeds[@]}"; do
      src="${scripts_dir}/${gene}/${gene}.seed.${seed}.yaml"
      dst="${out_dir}/seed.${seed}.yaml"

      if [[ ! -f "$src" ]]; then
        # Keep going so one missing config does not block the others,
        # but remember the failure for the final exit status.
        printf 'warning: missing source config, skipped: %s\n' "$src" >&2
        status=1
        continue
      fi

      cp -- "$src" "$dst"

      # First expression: change training dataset.
      # Second expression: change output log.
      # '|' is the delimiter because the replacement contains '/'.
      sed -i \
        -e "s|training\.csv|/training.${subset}.${seed}.csv|g" \
        -e "s|TL\.${gene_re}|TL.${gene}.subset.${subset}|g" \
        -- "$dst"
    done
  done
done

if (( status != 0 )); then
  exit "$status"
fi