-
Notifications
You must be signed in to change notification settings - Fork 1
/
augustus_run_sp2_training_sp2.sh
56 lines (36 loc) · 1.67 KB
/
augustus_run_sp2_training_sp2.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
#PBS -S /bin/bash
#PBS -l nodes=1:ppn=8:bigmem,mem=30gb
#PBS -e /pandata/bguinet/LEPIWASP/ACG-sp2_Augustus/LOGS/augustus_training_sp2.error
#PBS -o /pandata/bguinet/LEPIWASP/ACG-sp2_Augustus/LOGS/augustus_training_sp2.out
#PBS -q q1day
#PBS -N augustus_sp2_training_sp2
# Prediction of genes in the genome of species 2 using its own training.
# This script is used to run the Augustus program that will predict genes by an Ab initio approach.
# With Busco run, training files are available to better predict genes.
# Note that this retraining file (myspecie) must be added to the species file of the Augustus program.
# Usual Busco retraining file path: sp2_busco / run_sp2_BUSCO_v2 / augustus_output / retraining_parameters
# The usual path of the file where to transfer the retraining file: / augustus / config / species / myspecie
# Required files:
# - Genome Assembled Fasta Format (assembly)
# - Training file for species 2 (retraining)
# Be sure to define variable names and file paths before issuing commands.
echo debut:
date #debut
hostname
uname -a
#
#
#Declarations des variables
SAMP=sp2
PATH=bguinet@pbil-deb
# GENOME (sequence file)
ASSEMBLY=/pandata/varaldi/LEPIWASP/OUT/$SAMP/scaffold.fa
# augustus config path (where the retraining file from busco should be added in the specie file)
PATH=/panhome/bguinet/TOOLS/augustus/config/
#retraining file's name (not a path)
RETRAINING=retraining_sp2
#Augustus programme path
AUGUSTUS=/panhome/bguinet/TOOLS/augustus/bin/augustus
# outputfile's path and name
OUTPUT=/pandata/bguinet/LEPIWASP/ACG-sp2_Augustus/LOGS/run_augustus_sp2_training_sp2.out
$AUGUSTUS --species=$RETRAINING --AUGUSTUS_CONFIG_PATH=$PATH $ASSEMBLY > $OUTPUT