-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy path189225.sh
More file actions
68 lines (36 loc) · 3.17 KB
/
189225.sh
File metadata and controls
68 lines (36 loc) · 3.17 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
#PBS -S /bin/bash
#PBS -N 189225
#PBS -q batch
#PBS -l nodes=1:ppn=12
#PBS -l walltime=48:00:00
#PBS -l mem=32gb
##before running this script be sure to cat together all forward/reverse reads
##for each bulk into a single forward read and single reverse read file per
##bulk, and download your reference genome.
BASEDIR=/scratch/lfa81121/189225
BULKHIGH1=/home/lfa81121/SRR8751599_1.fastq
BULKHIGH2=/home/lfa81121/SRR8751599_2.fastq
REFGENOME=/work/cemlab/reference_genomes/97103_v2.fa
mkdir $BASEDIR
cd $BASEDIR
module load SAMtools/1.6-foss-2016b
time samtools faidx $REFGENOME
module load BWA/0.7.15-foss-2016b
time bwa mem -t 8 $REFGENOME $BULKHIGH1 $BULKHIGH2 > Hbulk_aligned.sam
time samtools view -@ 8 -S -b Hbulk_aligned.sam > H_aligned.bam
time samtools sort -@ 8 -m 3G H_aligned.bam -o H_sorted.bam
time samtools index H_sorted.bam
module load picard/2.16.0-Java-1.8.0_144
time java -Xmx20g -classpath "/usr/local/apps/eb/picard/2.16.0-Java-1.8.0_144" -jar /usr/local/apps/eb/picard/2.16.0-Java-1.8.0_144/picard.jar AddOrReplaceReadGroups INPUT=H_sorted.bam OUTPUT=H_sorted.rg.bam RGID=high_bulk RGSM=high_bulk RGLB=high_bulk RGPL=ILLUMINA RGPU=ignore
time java -Xmx20g -classpath "/usr/local/apps/eb/picard/2.16.0-Java-1.8.0_144" -jar /usr/local/apps/eb/picard/2.16.0-Java-1.8.0_144/picard.jar MarkDuplicates INPUT= H_sorted.rg.bam OUTPUT=H_sorted_mkdupl_rg.bam METRICS_FILE=H_sorted_mkduplMetrics.txt
time java -Xmx20g -classpath "/usr/local/apps/eb/picard/2.16.0-Java-1.8.0_144" -jar /usr/local/apps/eb/picard/2.16.0-Java-1.8.0_144/picard.jar BuildBamIndex INPUT=H_sorted_mkdupl_rg.bam
time java -Xmx20g -classpath "/usr/local/apps/eb/picard/2.16.0-Java-1.8.0_144" -jar /usr/local/apps/eb/picard/2.16.0-Java-1.8.0_144/picard.jar CreateSequenceDictionary REFERENCE=$REFGENOME OUTPUT="$REFGENOME".dict
module load GATK/3.8-1-Java-1.8.0_144
java -jar $EBROOTGATK/GenomeAnalysisTK.jar -T RealignerTargetCreator -R $REFGENOME -I H_sorted_mkdupl_rg.bam -o H_intervals.list
java -jar $EBROOTGATK/GenomeAnalysisTK.jar -T IndelRealigner -R $REFGENOME -I H_sorted_mkdupl_rg.bam -targetIntervals H_intervals.list -o H_realigned.bam
java -jar $EBROOTGATK/GenomeAnalysisTK.jar -T HaplotypeCaller -nct 8 -R $REFGENOME -I H_realigned.bam --emitRefConfidence GVCF --variant_index_type LINEAR --variant_index_parameter 128000 -o H_realigned_reads_raw_variants_gvcf.vcf
java -jar $EBROOTGATK/GenomeAnalysisTK.jar -T GenotypeGVCFs -R $REFGENOME --variant H_realigned_reads_raw_variants_gvcf.vcf -nt 8 -o HL_raw_snps_and_indels.vcf
java -jar $EBROOTGATK/GenomeAnalysisTK.jar -T VariantFiltration -R $REFGENOME -V HL_raw_snps_and_indels.vcf --filterExpression "QD < 2.0 || FS > 60.0 || MQ < 40.0 || MQRankSum < -12.5 || ReadPosRankSum < -8.0" --filterName "Default_recommended" -o HL_filtered_snps.vcf
module load VCFtools/0.1.15-foss-2016b-Perl-5.24.1
time /usr/local/apps/eb/VCFtools/0.1.15-foss-2016b-Perl-5.24.1/bin/vcftools --vcf HL_filtered_snps.vcf --remove-filtered-all --recode --max-missing 1 -c > HL_pass_nomiss_snps.vcf
java -jar $EBROOTGATK/GenomeAnalysisTK.jar -T VariantsToTable -R $REFGENOME -V HL_pass_nomiss_snps.vcf -F CHROM -F POS -F REF -F ALT -GF AD -GF DP -GF GQ -GF PL -o HL_SNPs_R.table