Skip to content

Commit 0ef25a8

Browse files
committedMay 18, 2022
some notes on how to run things
1 parent dff3c12 commit 0ef25a8

File tree

2 files changed

+60
-0
lines changed

2 files changed

+60
-0
lines changed
 

‎notes/HOWTO

+28
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,28 @@
1+
export RUNMODE=maker
2+
./annocomba -t slurm -c data/cluster_config-vsc4.yaml.template --dry -s "--until cegma"
3+
4+
for d in $(cat to_remove); do rm -rf .snakemake/shadow/$d; done
5+
6+
./annocomba -t slurm -c data/cluster_config-vsc4.yaml.template --dry -s "-pr --until iprscan" --dry
7+
8+
#merge xml
9+
head -n 1 results/GthyKa/FUNANNOTATE/GthyKa_preds/annotate_misc/iprscan_xmls/0001.xml > test.xml
10+
for f in $(ls -1 results/GthyKa/FUNANNOTATE/GthyKa_preds/annotate_misc/iprscan_xmls/*.xml); do cat $f | tail -n +2 | head -n -1; done >> test.xml
11+
tail -n 1 results/GthyKa/FUNANNOTATE/GthyKa_preds/annotate_misc/iprscan_xmls/0001.xml >> test.xml
12+
13+
#manually merge phobius results
14+
echo -e "ID\tTM\tSP\tPrediction" > results/EsKje/FUNANNOTATE/EsKje_preds/annotate_misc/phobius.results.txt
15+
for f in $(ls -1 results/EsKje/FUNANNOTATE/phobius_58560202-d387-4d26-a178-990e3bbb3db5/*.phobius); do cat $f | tail -n +2 | awk '{print $1"\t"$2"\t"$3"\t"$4}'; done >> results/EsKje/FUNANNOTATE/EsKje_preds/annotate_misc/phobius.results.txt
16+
17+
#relevant gene in Schistosoma mansoni - https://www.sciencedirect.com/science/article/pii/S2211320720300026 and also the paper suggested by Haakon
18+
Smp_246790 - Sm.TRPMPZQ
19+
20+
#change dependency so that only a third of rMP1 jobs are running at a time - note that 1920462 in this case is iMP1, so all need to wait for this one
21+
bash <(squeue -u $USER | grep "rMP1" | awk '{print $1}' | perl -ne 'chomp; $f=$_; $s=<>; chomp $s; $t=<>; chomp $t; print "scontrol update JobId=$s Dependency=afterok:1920462,afterok:$f\nscontrol update JobId=$t Dependency=afterok:1920462,afterok:$s\n"' | head -n -2)
22+
23+
24+
./annocomba -t slurm -c data/cluster_config-vsc4.yaml.template --dry -s "-pr --until annotate"
25+
26+
./annocomba -t serial -c data/cluster_config-vsc4.yaml.template -s "-pr --until annotate"
27+
28+
./annocomba -t serial -c data/cluster_config-vsc4.yaml.template -s "-pr --forcerun predict --until predict"

‎notes/HOWTO.setup

+32
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,32 @@
1+
#Download genemark from here: http://topaz.gatech.edu/GeneMark/license_download.cgi
2+
#select GeneMark-ES/ET/EP ver 4.68_lic - Linux 64
3+
#use 64 bit version (software and key)
4+
#this will get you a tarball: gmes_linux_64.tar.gz
5+
wget http://topaz.gatech.edu/GeneMark/tmp/GMtool_dQnST/gmes_linux_64.tar.gz -O data/external/gmes_linux_64.tar.gz
6+
tar xvfz data/external/gmes_linux_64.tar.gz -C data/external/
7+
#key comes with this
8+
#decompress the key
9+
#gunzip gm_key_64.gz
10+
11+
#mv key into gmes_linux_64 directory
12+
#mv gm_key_64 gmes_linux_64/
13+
14+
#################
15+
16+
#get maker from https://www.yandell-lab.org/software/maker.html
17+
#we have tested annocomba with maker-2.31.10.tgz
18+
19+
###############
20+
#Repbase (optional)
21+
#put at data/external/RepBaseRepeatMaskerEdition-20181026.tar.gz
22+
23+
#######################
24+
25+
#adjust your config file: data/config.yaml
26+
27+
./annocomba --setup
28+
29+
## get interproscan script
30+
rsync -avpuzP hahnc@vsc4.vsc.ac.at:/gpfs/data/fs71312/reslp/databases/interproscan-5.48-83.0 data/external/
31+
#then specify position of interproscan.sh script in config file
32+
#

0 commit comments

Comments
 (0)