Alignment-based method
STAR alignment
$ cd /home/USER/SSAPs
$ mkdir star
$ declare -a runname=("ERR2675454" "ERR2675455" "ERR2675458" "ERR2675459" "ERR2675460" "ERR2675461" "ERR2675464" "ERR2675465" "ERR2675468" "ERR2675469" "ERR2675472" "ERR2675473" "ERR2675476" "ERR2675477" "ERR2675478" "ERR2675479" "ERR2675480" "ERR2675481" "ERR2675484" "ERR2675485")
# Modified from ENCODE-DCC/rna-seq-pipeline; https://github.com/ENCODE-DCC/rna-seq-pipeline
for id in ${runname[@]}; do
trim1=trimmed/${id}_1.fastq.gz
trim2=trimmed/${id}_2.fastq.gz
out=star/${id}_
STAR --genomeDir /home/USER/db/refanno/gencode.v33_star-2.7.3a \
--readFilesIn $trim1 $trim2 \
--outFileNamePrefix $out \
--readFilesCommand zcat \
--runThreadN 6 \
--genomeLoad NoSharedMemory \
--twopassMode Basic \
--sjdbGTFfile /home/USER/db/refanno/gencode.v33.annotation.gtf \
--sjdbScore 2 \
--sjdbOverhang 150 \
--limitSjdbInsertNsj 1000000 \
--outFilterMultimapNmax 20 \
--alignSJoverhangMin 8 \
--alignSJDBoverhangMin 1 \
--outFilterMismatchNmax 999 \
--outFilterMismatchNoverReadLmax 0.04 \
--alignIntronMin 20 \
--alignIntronMax 1000000 \
--alignMatesGapMax 1000000 \
--outSAMunmapped Within \
--outFilterType BySJout \
--outSAMattributes NH HI AS NM MD \
--outSAMtype BAM SortedByCoordinate \
--quantMode TranscriptomeSAM GeneCounts \
--quantTranscriptomeBan IndelSoftclipSingleend \
--limitBAMsortRAM 32000000000
done
rm -R star/*_STARgenome star/*_STARpass1STAR-Salmon Quantification (alignment-based mode)
STAR-RSEM Quantification
Last updated