-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathrun_SPRINT_custom.sh
executable file
·44 lines (40 loc) · 2.22 KB
/
run_SPRINT_custom.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
#!/bin/bash
#Reproduce what I did
# first: download pre_computed_HSP and Uniprot_human_protein_sequences.fasta files from https://www.csd.uwo.ca/~ilie/SPRINT/
# then: try to reproduce results:
#Biogrid C1 dataset:
# bin/predict_interactions -p data/Uniprot_human_protein_sequences.fasta -h HSP/pre_computed_HSP -tr PPI_dataset/Biogrid/train.pos.1.txt -pos PPI_dataset/Biogrid/test.pos.c1.1.txt -neg PPI_dataset/Biogrid/test.neg.c1.1.txt -o results/result_Biogrid_C1_1.txt
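#HPRD C3 dataset:
# NOTE(review): the command below reads the test.*.c1.1.txt files but writes result_HPRD_C3_1.txt - confirm whether the c3 test files were intended.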
# bin/predict_interactions -p data/Uniprot_human_protein_sequences.fasta -h HSP/pre_computed_HSP -tr PPI_dataset/HPRD/train.pos.1.txt -pos PPI_dataset/HPRD/test.pos.c1.1.txt -neg PPI_dataset/HPRD/test.neg.c1.1.txt -o results/result_HPRD_C3_1.txt
# Run the partitioned datasets: du and guo (yeast inputs) first, then huang, richoux, pan and dscript (human inputs).
# Train on both, test on 0. Train on both, test on 1. Train on 0, test on 1:
for DATASET in du guo
do
for TRAIN in "both" "0"
do
for TEST in "0" "1"
do
if [ "$TRAIN" = "0" ] && [ "$TEST" = "0" ]
then
continue
fi
echo dataset ${DATASET}, training on ${TRAIN}, testing on ${TEST}
{ time bin/predict_interactions -p ../../Datasets_PPIs/SwissProt/yeast_swissprot_oneliner.fasta -h HSP/pre_computed_yeast_HSP -tr data/partitions/${DATASET}_partition_${TRAIN}_pos.txt -pos data/partitions/${DATASET}_partition_${TEST}_pos.txt -neg data/partitions/${DATASET}_partition_${TEST}_neg.txt -o results/partitions/${DATASET}_train_${TRAIN}_test_${TEST}.txt ; } 2> results/partitions/${DATASET}_train_${TRAIN}_test_${TEST}_time.txt
done
done
done
for DATASET in huang richoux pan dscript
do
for TRAIN in "both" "0"
do
for TEST in "0" "1"
do
if [ "$TRAIN" = "0" ] && [ "$TEST" = "0" ]
then
continue
fi
echo dataset ${DATASET}, training on ${TRAIN}, testing on ${TEST}
{ time bin/predict_interactions -p data/Uniprot_human_protein_sequences.fasta -h HSP/pre_computed_HSP -tr data/partitions/${DATASET}_partition_${TRAIN}_pos.txt -pos data/partitions/${DATASET}_partition_${TEST}_pos.txt -neg data/partitions/${DATASET}_partition_${TEST}_neg.txt -o results/partitions/${DATASET}_train_${TRAIN}_test_${TEST}.txt ; } 2> results/partitions/${DATASET}_train_${TRAIN}_test_${TEST}_time.txt
done
done
done