!/bin/sh
An task for serial job.
DO NOT RUN THIS SCRIPT DIRECTLY,
PLEASE RUN THIS SCRIPT WITH qsub: qsub serial_job.pbs
#
PBS -N download_data
PBS -o download_data.log
PBS -e download_data.err
PBS -q middle
PBS -l walltime=48:00:00
PBS -l nodes=1:ppn=2
cd $YOUR_WORKDIR
cd /home/sysbio/SA20008161/PBSorder
#首先下载raw data
module load sratoolkit
#prefetch SRR8467686
#prefetch SRR8467687
#prefetch SRR8467688
#prefetch SRR8467689
#prefetch SRR8467690
#prefetch SRR8467691
#prefetch SRR8467692
#prefetch SRR8467693
#利用fast-dump命令转换sra文件为fastq文件,gzip用于解压缩
#fastq-dump.2.8.2 -O /home/sysbio/SA2000816/RNA-seq/example/from_NCBI --gzip /home/sysbio/SA20008161/ncbi/public/sra/SRR8467686.sra
#fastq-dump.2.8.2 -O /home/sysbio/SA2000816/RNA-seq/example/from_NCBI --gzip /home/sysbio/SA20008161/ncbi/public/sra/SRR8467687.sra
#fastq-dump.2.8.2 -O /home/sysbio/SA2000816/RNA-seq/example/from_NCBI --gzip /home/sysbio/SA20008161/ncbi/public/sra/SRR8467688.sra
#fastq-dump.2.8.2 -O /home/sysbio/SA2000816/RNA-seq/example/from_NCBI --gzip /home/sysbio/SA20008161/ncbi/public/sra/SRR8467689.sra
#fastq-dump.2.8.2 -O /home/sysbio/SA2000816/RNA-seq/example/from_NCBI --gzip /home/sysbio/SA20008161/ncbi/public/sra/SRR8467690.sra
#fastq-dump.2.8.2 -O /home/sysbio/SA20008161/RNA-seq/example/from_NCBI --gzip /home/sysbio/SA20008161/ncbi/public/sra/SRR8467691.sra
#fastq-dump.2.8.2 -O /home/sysbio/SA20008161/RNA-seq/example/from_NCBI --gzip /home/sysbio/SA20008161/ncbi/public/sra/SRR8467692.sra
#fastq-dump.2.8.2 -O /home/sysbio/SA20008161/RNA-seq/example/from_NCBI --gzip /home/sysbio/SA20008161/ncbi/public/sra/SRR8467693.sra
#####
!/bin/sh
An task for serial job.
DO NOT RUN THIS SCRIPT DIRECTLY,
PLEASE RUN THIS SCRIPT WITH qsub: qsub serial_job.pbs
#
PBS -N job_name
PBS -o job_human.log
PBS -e job_human.err
PBS -q middle
PBS -l walltime=48:00:00
PBS -l nodes=1:ppn=2
cd $YOUR_WORKDIR
cd /home/sysbio/SA20008161/PBSorder
fastqc-o/home/sysbio/SA20008161/RNA-seq/example/from_NCBI/-t6/home/sysbio/SA20008161/RNA-seq/example/from_NCBI/*fastq.gz
#!/bin/sh
#An task for serial job.
#DO NOT RUN THIS SCRIPT DIRECTLY,
#PLEASE RUN THIS SCRIPT WITH qsub: qsub serial_job.pbs
#
#PBS -N download refgenome and annotation
#PBS -o download refgenome and annotation.log
#PBS -e download refgenome and annotation.err
#PBS -q middle
#PBS -l walltime=48:00:00
#PBS -l nodes=1:ppn=2
#cd $YOUR_WORKDIR
cd /home/sysbio/SA20008161/PBSorder
#下载参考基因组并解压缩
wget-Phome/sysbio/SA20008161/mappingftp://ftp.ebi.ac.uk/pub/databases/gencode/Gencode_human/release_36/gencode.v36.transcripts.fa.gz
gzip -d home/sysbio/SA20008161/mapping/gencode.v36.transcripts.fa.gz
#下载gff注释文件并解压缩
wget-Phome/sysbio/SA20008161/mapping ftp://ftp.ebi.ac.uk/pub/databases/gencode/Gencode_human/release_36/gencode.v36.annotation.gtf.gz
gzip -d home/sysbio/SA20008161/mapping/gencode.v36.annotation.gtf.gz
#!/bin/sh
#An example for serial job.
#DO NOT RUN THIS SCRIPT DIRECTLY,
#PLEASE RUN THIS SCRIPT WITH qsub: qsub serial_job.pbs
#
#PBS -N lovemapping
#PBS -o lovemapping.log
#PBS -e lovemapping.err
#PBS -q middle
#PBS -l walltime=48:00:00
#PBS -l nodes=1:ppn=4
#cd $YOUR_WORKDIR
cd /home/sysbio/SA20008161/PBSorder
module load STAR
fastq_path=/home/sysbio/SA20008161/RNA-seq/example/from_NCBI
output_path=/home/sysbio/SA20008161/mapping/STAR_result2
#Step 1 - Build a genome index构建索引
module load STAR
STAR
--runThreadN 4
--runMode genomeGenerate
--genomeDir /home/sysbio/SA20008161/mapping/hg38_star_index
--genomeFastaFiles/home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.dna.primary_assembly.fa
--sjdbGTFfile /home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.102.gtf
#Step 2 - Align RNA-Seq Reads to the genome with 用STAR比对
STAR --runThreadN 4 --genomeDir /home/sysbio/SA20008161/mapping/hg38_star_index --readFilesIn $fastq_path/SRR8467686.fastq.gz --outFileNamePrefix $output_path/SRR8467686 --outSAMtype BAM SortedByCoordinate --quantMode TranscriptomeSAM --readFilesCommand gunzip -c
STAR --runThreadN 4 --genomeDir /home/sysbio/SA20008161/mapping/hg38_star_index --readFilesIn $fastq_path/SRR8467687.fastq.gz --outFileNamePrefix $output_path/SRR8467687 --outSAMtype BAM SortedByCoordinate --quantMode TranscriptomeSAM --readFilesCommand gunzip -c
STAR --runThreadN 4 --genomeDir /home/sysbio/SA20008161/mapping/hg38_star_index --readFilesIn $fastq_path/SRR8467688.fastq.gz --outFileNamePrefix $output_path/SRR8467688 --outSAMtype BAM SortedByCoordinate --quantMode TranscriptomeSAM --readFilesCommand gunzip -c
STAR --runThreadN 4 --genomeDir /home/sysbio/SA20008161/mapping/hg38_star_index --readFilesIn $fastq_path/SRR8467689.fastq.gz --outFileNamePrefix $output_path/SRR8467689 --outSAMtype BAM SortedByCoordinate --quantMode TranscriptomeSAM --readFilesCommand gunzip -c
STAR --runThreadN 4 --genomeDir /home/sysbio/SA20008161/mapping/hg38_star_index --readFilesIn $fastq_path/SRR8467690.fastq.gz --outFileNamePrefix $output_path/SRR8467690 --outSAMtype BAM SortedByCoordinate --quantMode TranscriptomeSAM --readFilesCommand gunzip -c
STAR --runThreadN 4 --genomeDir /home/sysbio/SA20008161/mapping/hg38_star_index --readFilesIn $fastq_path/SRR8467691.fastq.gz --outFileNamePrefix $output_path/SRR8467691 --outSAMtype BAM SortedByCoordinate --quantMode TranscriptomeSAM --readFilesCommand gunzip -c
STAR --runThreadN 4 --genomeDir /home/sysbio/SA20008161/mapping/hg38_star_index --readFilesIn $fastq_path/SRR8467692.fastq.gz --outFileNamePrefix $output_path/SRR8467692 --outSAMtype BAM SortedByCoordinate --quantMode TranscriptomeSAM --readFilesCommand gunzip -c
STAR --runThreadN 4 --genomeDir /home/sysbio/SA20008161/mapping/hg38_star_index --readFilesIn $fastq_path/SRR8467693.fastq.gz --outFileNamePrefix $output_path/SRR8467693 --outSAMtype BAM SortedByCoordinate --quantMode TranscriptomeSAM --readFilesCommand gunzip -c
#!/bin/sh
#An example for serial job.
#DO NOT RUN THIS SCRIPT DIRECTLY,
#PLEASE RUN THIS SCRIPT WITH qsub: qsub serial_job.pbs
#
#PBS -N BAMtoBW
#PBS -o BAMtoBW_human.log
#PBS -e BAMtoBW_human.err
#PBS -q middle
#PBS -l walltime=48:00:00
#PBS -l nodes=1:ppn=4
#cd $YOUR_WORKDIR
cd /home/sysbio/SA20008161/PBSorder
source /home/sysbio/SA20008161/miniconda3/etc/profile.d/conda.sh
#
conda activate RNA
#创建bai索引
bedtools genomecov -ibam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467687Aligned.sortedByCoord.out.bam -bg > SRR8467686.bedgraph
bedtools genomecov -ibam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467687Aligned.sortedByCoord.out.bam -bg > SRR8467687.bedgraph
bedtools genomecov -ibam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467688Aligned.sortedByCoord.out.bam -bg > SRR8467688.bedgraph
bedtools genomecov -ibam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467689Aligned.sortedByCoord.out.bam -bg > SRR8467689.bedgraph
bedtools genomecov -ibam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467690Aligned.sortedByCoord.out.bam -bg > SRR8467690.bedgraph
bedtools genomecov -ibam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467691Aligned.sortedByCoord.out.bam -bg > SRR8467691.bedgraph
bedtools genomecov -ibam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467692Aligned.sortedByCoord.out.bam -bg > SRR8467692.bedgraph
bedtools genomecov -ibam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467693Aligned.sortedByCoord.out.bam -bg > SRR8467693.bedgraph
samtools index -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467686Aligned.sortedByCoord.out.bam
samtools index -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467687Aligned.sortedByCoord.out.bam
samtools index -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467688Aligned.sortedByCoord.out.bam
samtools index -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467689Aligned.sortedByCoord.out.bam
samtools index -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467690Aligned.sortedByCoord.out.bam
samtools index -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467691Aligned.sortedByCoord.out.bam
samtools index -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467692Aligned.sortedByCoord.out.bam
samtools index -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467693Aligned.sortedByCoord.out.bam
#批量处理BAMtoBW
bamCoverage -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467686Aligned.sortedByCoord.out.bam -o /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467686.bw
bamCoverage -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467687Aligned.sortedByCoord.out.bam -o /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467687.bw
bamCoverage -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467688Aligned.sortedByCoord.out.bam -o /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467688.bw
bamCoverage -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467689Aligned.sortedByCoord.out.bam -o /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467689.bw
bamCoverage -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467690Aligned.sortedByCoord.out.bam -o /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467690.bw
bamCoverage -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467691Aligned.sortedByCoord.out.bam -o /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467691.bw
bamCoverage -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467692Aligned.sortedByCoord.out.bam -o /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467692.bw
bamCoverage -b /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467693Aligned.sortedByCoord.out.bam -o /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467693.bw
#!/bin/sh
#An example for serial job.
#DO NOT RUN THIS SCRIPT DIRECTLY,
#PLEASE RUN THIS SCRIPT WITH qsub: qsub serial_job.pbs
#
#PBS -N je3_name
#PBS -o ec3.log
#PBS -e ec3.err
#PBS -q middle
#PBS -l walltime=48:00:00
#PBS -l nodes=1:ppn=4
#cd $YOUR_WORKDIR
cd /home/sysbio/SA20008161/PBSorder
source /home/sysbio/SA20008161/miniconda3/etc/profile.d/conda.sh
#Build RSEM index and compute expression
# rsem prepare reference 从参考基因组中提取原始准备文件
module load STAR
rsem-prepare-reference --gtf /home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.102.gtf \
--star \
--star-path /public/software/bio/STAR \
-p 4 \
/home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.dna.primary_assembly.fa \
/home/sysbio/SA20008161/software_code/RSEM_example/hg38_ref/hg38
#转录组数据计算表达定量;再顺便改个名
rsem-calculate-expression -p 4 --bam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467686Aligned.toTranscriptome.out.bam /home/sysbio/SA20008161/software_code/software_code/RSEM_example/hg38_ref/hg38 KD1-1
rsem-calculate-expression -p 4 --bam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467687Aligned.toTranscriptome.out.bam /home/sysbio/SA20008161/software_code/software_code/RSEM_example/hg38_ref/hg38 KD1-2
rsem-calculate-expression -p 4 --bam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467688Aligned.toTranscriptome.out.bam /home/sysbio/SA20008161/software_code/software_code/RSEM_example/hg38_ref/hg38 KD2-1
rsem-calculate-expression -p 4 --bam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467689Aligned.toTranscriptome.out.bam /home/sysbio/SA20008161/software_code/software_code/RSEM_example/hg38_ref/hg38 KD2-2
rsem-calculate-expression -p 4 --bam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467690Aligned.toTranscriptome.out.bam /home/sysbio/SA20008161/software_code/software_code/RSEM_example/hg38_ref/hg38 C1-1
rsem-calculate-expression -p 4 --bam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467691Aligned.toTranscriptome.out.bam /home/sysbio/SA20008161/software_code/software_code/RSEM_example/hg38_ref/hg38 C1-2
rsem-calculate-expression -p 4 --bam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467692Aligned.toTranscriptome.out.bam /home/sysbio/SA20008161/software_code/software_code/RSEM_example/hg38_ref/hg38 C2-1
rsem-calculate-expression -p 4 --bam /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467693Aligned.toTranscriptome.out.bam /home/sysbio/SA20008161/software_code/software_code/RSEM_example/hg38_ref/hg38 C2-2
#Htseq计算表达量
conda activate RNA
#htseq-count -i gene_id /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467686.sorted.bam /home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.102.gtff > /home/sysbio/SA20008161/mapping/result/KD1-1.txt
#htseq-count -i gene_id /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467687Aligned.sortedByCoord.out.bam /home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.102.gtff > /home/sysbio/SA20008161/mapping/result/KD1-2.txt
#htseq-count -i gene_id /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467688Aligned.sortedByCoord.out.bam /home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.102.gtff > /home/sysbio/SA20008161/mapping/result/KD2-1.txt
#htseq-count -i gene_id /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467689Aligned.sortedByCoord.out.bam /home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.102.gtff > /home/sysbio/SA20008161/mapping/result/KD2-2.txt
#htseq-count -i gene_id /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467690Aligned.sortedByCoord.out.bam /home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.102.gtff > /home/sysbio/SA20008161/mapping/result/C1-1.txt
#htseq-count -i gene_id /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467691Aligned.sortedByCoord.out.bam /home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.102.gtff > /home/sysbio/SA20008161/mapping/result/C1-2.txt
#htseq-count -i gene_id /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467692Aligned.sortedByCoord.out.bam /home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.102.gtff > /home/sysbio/SA20008161/mapping/result/C2-1.txt
#htseq-count -i gene_id /home/sysbio/SA20008161/mapping/STAR_result2/SRR8467693Aligned.sortedByCoord.out.bam /home/sysbio/SA20008161/mapping/Homo_sapiens.GRCh38.102.gtff > /home/sysbio/SA20008161/mapping/result/C2-2.txt
近期会对这篇文章进行大幅度修改,主要是利用循环简化语句,以及加入后续的可视化分析