pipeline/other/test.sh

45 lines
2.5 KiB
Bash
Raw Normal View History

2023-08-25 10:06:31 +08:00
#!/bin/bash
#
# Preprocessing of sample PQSK-20230803 (UMI library):
#   1. seqkit rewrites the "/1" and "/2" markers in the read headers to
#      " 1" / " 2" and writes uncompressed intermediate FASTQ files.
#   2. fastp extracts the UMIs, trims adapters and writes the cleaned reads
#      plus JSON/HTML reports.
#   3. UMI_Project.py is run on the raw-data directory for this sample.
#   4. The intermediate "changehead" FASTQ files are removed.
#
# Abort on the first failing command, on use of an unset variable, and on a
# failure anywhere in a pipeline, so that later steps never run on missing or
# truncated intermediates. On failure the intermediates are left in place
# for inspection.
set -euo pipefail

sample=PQSK-20230803
raw_dir=/dataseq/T7/result/OutputFq/upload/E100076595/L01
out_dir=/home/jm001/project/pancancer_controlsample/624/Blood/${sample}
qc_dir=${out_dir}/qc
changehead_r1=${qc_dir}/${sample}_changehead_R1.fq
changehead_r2=${qc_dir}/${sample}_changehead_R2.fq

# Resolve the raw FASTQ globs up front so that a missing input is reported
# clearly instead of handing an unexpanded pattern to seqkit.
raw_r1=("${raw_dir}"/*_"${sample}"_*1.fq.gz)
raw_r2=("${raw_dir}"/*_"${sample}"_*2.fq.gz)
if (( ${#raw_r1[@]} == 0 || ${#raw_r2[@]} == 0 )) \
  || [[ ! -e "${raw_r1[0]}" || ! -e "${raw_r2[0]}" ]]; then
  printf 'error: no raw FASTQ files for %s found in %s\n' \
    "${sample}" "${raw_dir}" >&2
  exit 1
fi
if (( ${#raw_r1[@]} != ${#raw_r2[@]} )); then
  printf 'error: %d R1 file(s) but %d R2 file(s) for %s in %s\n' \
    "${#raw_r1[@]}" "${#raw_r2[@]}" "${sample}" "${raw_dir}" >&2
  exit 1
fi

mkdir -p -- "${qc_dir}"

# Rewrite the mate markers in the read headers.
# NOTE(review): the patterns are unanchored regular expressions, so every
# "/1" (or "/2") occurring in a header is rewritten - confirm the read names
# contain it only as the trailing mate suffix.
seqkit replace -p "/1" -r " 1" -j 10 "${raw_r1[@]}" -o "${changehead_r1}"
seqkit replace -p "/2" -r " 2" -j 10 "${raw_r2[@]}" -o "${changehead_r2}"

# UMI extraction and adapter trimming.
fastp_args=(
  -i "${changehead_r1}"
  -o "${qc_dir}/${sample}_clean_R1.fq.gz"
  -I "${changehead_r2}"
  -O "${qc_dir}/${sample}_clean_R2.fq.gz"
  -w 10
  # UMI handling: a 4 bp UMI is taken from each read, tagged with the
  # prefix "UMI", and 3 further bases after the UMI are skipped.
  -U --umi_loc=per_read --umi_len=4 --umi_prefix=UMI --umi_skip=3
  --disable_trim_poly_g
  --disable_quality_filtering
  --adapter_sequence AGATCGGAAGAGCACACGTCTGAACTCCAGTCA
  --adapter_sequence_r2 AGATCGGAAGAGCGTCGTGTAGGGAAAGAGTGT
  # Overlap-based base correction, requiring at least 10 overlapping bases.
  --correction
  --overlap_len_require 10
  -j "${qc_dir}/${sample}.json"
  -h "${qc_dir}/${sample}.html"
  --report_title "${sample}"
)
fastp "${fastp_args[@]}"

# UMI
python3 /dataseq/jmdna/codes/624/UMI_Project.py \
  -i "${raw_dir}" \
  -o "${out_dir}" \
  -t "${sample}"

# The uncompressed header-rewritten FASTQ files are only intermediates.
rm -- "${changehead_r1}" "${changehead_r2}"
# Control sample: adapter trimming and quality filtering of the paired
# control reads (PQSK-20230803-B) with fastp, straight from the raw FASTQ
# files; no UMI options are passed for this sample.
ctrl_sample=PQSK-20230803-B
ctrl_raw_dir=/dataseq/T7/result/OutputFq/upload/E100076595/L01
ctrl_qc_dir=/home/jm001/project/pancancer_controlsample/624/Blood/PQSK-20230803/qc

# fastp takes exactly one file for -i and one for -I, so each glob must
# resolve to a single existing file; anything else would either pass an
# unexpanded pattern or inject stray positional arguments.
ctrl_r1=("${ctrl_raw_dir}"/*_"${ctrl_sample}"_*1.fq.gz)
ctrl_r2=("${ctrl_raw_dir}"/*_"${ctrl_sample}"_*2.fq.gz)
if (( ${#ctrl_r1[@]} != 1 || ${#ctrl_r2[@]} != 1 )) \
  || [[ ! -e "${ctrl_r1[0]}" || ! -e "${ctrl_r2[0]}" ]]; then
  printf 'error: expected exactly one R1 and one R2 FASTQ for %s in %s\n' \
    "${ctrl_sample}" "${ctrl_raw_dir}" >&2
  exit 1
fi

ctrl_fastp_args=(
  -i "${ctrl_r1[0]}"
  -o "${ctrl_qc_dir}/${ctrl_sample}_clean_R1.fq.gz"
  -I "${ctrl_r2[0]}"
  -O "${ctrl_qc_dir}/${ctrl_sample}_clean_R2.fq.gz"
  -w 10
  # Overlap-based base correction, requiring at least 20 overlapping bases.
  --correction
  --overlap_len_require 20
  --adapter_sequence AGATCGGAAGAGCACACGTCTGAACTCCAGTCA
  --adapter_sequence_r2 AGATCGGAAGAGCGTCGTGTAGGGAAAGAGTGT
  -j "${ctrl_qc_dir}/${ctrl_sample}.json"
  -h "${ctrl_qc_dir}/${ctrl_sample}.html"
  --report_title "${ctrl_sample}"
  # Discard reads whose average quality is below 20.
  -e 20
)
fastp "${ctrl_fastp_args[@]}"