NGS-related files for testing
# Replace the placeholder with an absolute path: later steps run `cd ${workspace}`
# from inside subdirectories, which only works when the path is absolute.
workspace="path/to/workspace" && cd "${workspace}"
git clone https://github.com/yh549848/ngsfiles.git
For your reference: generation procedure
Download and subsample FASTQ
# Fetch every URL listed in scripts/uri_fastq.txt into tmp/.
wget --input-file=scripts/uri_fastq.txt --directory-prefix=tmp
# Pass all downloaded FASTQ paths to the subsampling script as arguments.
find tmp/*.fastq.gz -print | xargs scripts/subsample_fastq.sh
# Delete the four SRR896743 / SRR896663 read files from tmp/
# (presumably the unsubsampled downloads -- confirm against subsample_fastq.sh).
rm tmp/SRR896{743,663}_{1,2}.fastq.gz
# Move the remaining files that carry an extra dot-separated name field.
mv tmp/*.*.fastq.gz assets/FASTQ
Download and subsample GTF
# Fetch the GENCODE release 32 basic annotation into tmp/ and decompress it.
wget ftp://ftp.ebi.ac.uk/pub/databases/gencode/Gencode_human/release_32/gencode.v32.basic.annotation.gtf.gz -P tmp
gunzip tmp/gencode.v32.basic.annotation.gtf.gz
# Run the GTF subsampling script, then move the tmp/*.chr*.gtf files
# (presumably its per-chromosome output) into assets/GTF.
./scripts/subsample_gtf.sh tmp/gencode.v32.basic.annotation.gtf
mv tmp/*.chr*.gtf assets/GTF
# Convert each GTF under assets/GTF with gffread, writing a sibling .gff file.
# NUL-delimited find output keeps paths intact, and ${f%.gtf} swaps only the
# trailing extension rather than the first ".gtf" found anywhere in the path.
find assets/GTF -name "*.gtf" -print0 |
  while IFS= read -r -d '' f; do
    gffread "${f}" -o "${f%.gtf}.gff"
  done
mv assets/GTF/*.gff assets/GFF
Align to the reference and extract records located on the specified chromosome
# Fetch the GRCh38 primary assembly (GENCODE release 32) into tmp/ and decompress it.
wget ftp://ftp.ebi.ac.uk/pub/databases/gencode/Gencode_human/release_32/GRCh38.primary_assembly.genome.fa.gz -P tmp
gunzip tmp/GRCh38.primary_assembly.genome.fa.gz
# Submit scripts/build_idx_star.sh with the genome FASTA as its argument.
# NOTE(review): qsub presumably returns as soon as the job is queued -- confirm
# each submitted job has finished before running the step that uses its output.
qsub -V scripts/build_idx_star.sh tmp/GRCh38.primary_assembly.genome.fa
# Submit scripts/align_star_pe.sh as an array job (-t 1-4:2), passing the
# sorted FASTQ paths as arguments.
find assets/FASTQ/*.fastq.gz | sort | xargs qsub -V -t 1-4:2 scripts/align_star_pe.sh
# Copy the BAM files from tmp/ into assets/BAM, keeping their parent directory
# names (--parents). The subshell confines the directory change, so a failed
# copy can no longer leave the session stranded inside tmp/.
(cd tmp && cp --parents */*bam ../assets/BAM)
# Index the full alignments, run the BAM subsampling script on each of them,
# then index again with the wider out*.bam glob so any additional
# Aligned.sortedByCoord.out*.bam files are indexed as well.
find assets/BAM/*/Aligned.sortedByCoord.out.bam | sort | xargs -I {} samtools index {}
find assets/BAM/*/Aligned.sortedByCoord.out.bam | sort | xargs -I {} scripts/subsample_bam.sh {}
find assets/BAM/*/Aligned.sortedByCoord.out*.bam | sort | xargs -I {} samtools index {}
# Write transcript sequences (-w) for the annotation GTF, using the genome FASTA given by -g.
gffread -w tmp/gencode.v32.basic.transcripts_with_attr.fa -g tmp/GRCh38.primary_assembly.genome.fa tmp/gencode.v32.basic.annotation.gtf
# Run the attribute-stripping script on that FASTA and save its stdout as the transcript FASTA used below.
./scripts/strip_attributes_fasta.py tmp/gencode.v32.basic.transcripts_with_attr.fa > tmp/gencode.v32.basic.transcripts.fa
# Submit the RSEM index build script with the stripped transcript FASTA as its argument.
qsub -V scripts/build_idx_rsem_with_ebseq_ngvector.sh tmp/gencode.v32.basic.transcripts.fa
# Submit the RSEM quantification script as an array job (-t 1-2); the sorted full-BAM paths are passed as arguments.
find assets/BAM/*/Aligned.sortedByCoord.out.bam | sort | xargs qsub -V -t 1-2 scripts/quant_rsem.sh
# Same BAM list, submitted to the StringTie quantification script.
find assets/BAM/*/Aligned.sortedByCoord.out.bam | sort | xargs qsub -V -t 1-2 scripts/quant_stringtie.sh
# Compress each GTF found under assets/StringTie/*/ (one gzip call per file).
# NOTE(review): presumably these are outputs of the StringTie jobs above -- run only after those jobs finish.
find assets/StringTie/*/*.gtf | xargs -I {} gzip {}
# Submit the kallisto quantification script as an array job (-t 1-4:2); the sorted FASTQ paths are passed as arguments.
find assets/FASTQ/*.fastq.gz | sort | xargs qsub -V -t 1-4:2 scripts/quant_kallisto.sh
# Same BAM list as above, submitted to the HTSeq quantification script.
find assets/BAM/*/Aligned.sortedByCoord.out.bam | sort | xargs qsub -V -t 1-2 scripts/quant_htseq.sh
# Convert every BAM under assets/BAM to BED, writing each .bed next to its .bam.
# NUL-delimited find output keeps paths intact, and ${f%.bam} swaps only the
# trailing extension rather than the first ".bam" found anywhere in the path.
find assets/BAM -name "*.bam" -print0 |
  while IFS= read -r -d '' f; do
    bedtools bamtobed -i "${f}" > "${f%.bam}.bed"
  done
# Copy the BED files into assets/BED, keeping their parent directory names,
# and delete the originals only if the copy succeeded. Everything is chained
# with && inside a subshell: a failed cd can no longer let cp/rm run in the
# wrong directory, and the caller's working directory is left unchanged.
(cd assets/BAM && cp --parents */*.bed ../BED/ && rm */*.bed)