forked from BenjaminGuinet/HGT-finder-between-2-species
-
Notifications
You must be signed in to change notification settings - Fork 0
/
augustus_run_sp1_training_sp1.sh
58 lines (36 loc) · 1.67 KB
/
augustus_run_sp1_training_sp1.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#PBS -S /bin/bash
#PBS -l nodes=1:ppn=8:bigmem,mem=30gb
#PBS -e /pandata/bguinet/LEPIWASP/ACG-sp1_Augustus/LOGS/augustus_training_sp1.error
#PBS -o /pandata/bguinet/LEPIWASP/ACG-sp1_Augustus/LOGS/augustus_training_sp1.out
#PBS -q q1day
#PBS -N augustus_sp1_training_sp1
# Prediction of genes in the genome of species 1 using its own training.
# This script runs the Augustus program, which predicts genes with an ab initio approach.
# A prior BUSCO run provides retraining files that improve gene prediction.
# Note that this retraining file (myspecie) must be added to the species directory of the Augustus configuration.
# Usual BUSCO retraining file path: sp2_busco/run_sp2_BUSCO_v2/augustus_output/retraining_parameters
# Usual destination for the retraining file: augustus/config/species/myspecie
# Required files:
# - Genome Assembled Fasta Format (assembly)
# - Training file for species 1 (retraining)
# Be sure to define variable names and file paths before issuing commands.
# Job body: log the execution context, declare the inputs, then run Augustus
# on the species-1 assembly using the species-1 retraining parameters.
echo debut:
date # start timestamp
hostname
uname -a
#
#
# Variable declarations
SAMP=sp1
# NOTE: earlier versions of this script assigned "bguinet@pbil-deb" and then
# the Augustus config directory to PATH. PATH is the shell's command search
# path, so overwriting it breaks lookup of every external command for this
# script and for the processes it starts. The config directory now lives in
# CONFIG_PATH; the "bguinet@pbil-deb" value was never read and is kept only
# in this note.
# GENOME (sequence file)
ASSEMBLY="/pandata/varaldi/LEPIWASP/OUT/${SAMP}/scaffold.fa"
# Augustus config directory (the BUSCO retraining files must be added under
# its species directory)
CONFIG_PATH=/panhome/bguinet/TOOLS/augustus/config/
# Name of the retraining species (a name, not a path)
RETRAINING=retraining_sp1
# Path to the Augustus executable
AUGUSTUS=/panhome/bguinet/TOOLS/augustus/bin/augustus
# Path and name of the output file
OUTPUT=/pandata/bguinet/LEPIWASP/ACG-sp1_Augustus/LOGS/run_augustus_sp1_training_sp1.out
# Kept as the last command so that its exit status is the job's exit status.
# Standard output of the run is captured in $OUTPUT.
"$AUGUSTUS" --species="$RETRAINING" --AUGUSTUS_CONFIG_PATH="$CONFIG_PATH" "$ASSEMBLY" > "$OUTPUT"