Skip to content
Snippets Groups Projects
Commit cd2052dd authored by CJHerrmann's avatar CJHerrmann
Browse files

Started working on subpipelines

parent 52c1de75
No related branches found
No related tags found
1 merge request!4Subpipelines
......@@ -110,29 +110,7 @@ rule generate_segemehl_index_other_RNAs:
### Index genome STAR
#################################################################################
rule index_genome_STAR:
input:
genome = os.path.join(config["output_dir"], "genome.fa"),
annotation = os.path.join(config["output_dir"], "annotation.gtf")
output:
output = os.path.join(config["output_dir"], "STAR_index")
params:
outputdir = os.path.join(config["output_dir"],"STAR_index"),
sjdbOverhang = config["sjdbOverhang"]
threads: 8
singularity:
"docker://zavolab/star:2.6.0a"
log:
os.path.join(config["local_log"],"index_genome_STAR.log")
shell:
"mkdir -p {output.output}; \
chmod -R 777 {output.output}; \
(STAR --runMode genomeGenerate \
--sjdbOverhang {params.sjdbOverhang} \
--genomeDir {params.outputdir} \
--genomeFastaFiles {input.genome} \
--runThreadN {threads} \
--sjdbGTFfile {input.annotation}) &> {log}"
##################################################################################
### Filter protein coding and lncRNA transcripts
......
import pandas as pd
configfile: "config.yaml"
samples = pd.read_table(config['samples_table'], header=0, index_col=0, comment='#', engine='python')
samples['out_name'] = samples['Sample_name'] + samples['Library_Type']
localrules: finish
#################################################################################
......@@ -8,10 +19,22 @@ localrules: finish
rule finish:
input:
fastqc = expand(os.path.join(config["output_dir"], "{sample}", "fastqc"), sample=config["sample"]),
htseq_qa = expand(os.path.join(config["output_dir"], "{sample}", "htseq_qa", "htseq_quality.pdf"), sample=config["sample"]),
gn_estimates = expand(os.path.join(config["output_dir"], "{sample}", "salmon_quant", "quant.genes.sf"), sample=config["sample"]),
bam = expand(os.path.join(config["output_dir"], "{sample}", "STAR_Aligned.out.bam"), sample=config["sample"])
final_sample = expand(os.path.join(config["output_dir"], "{sample}", "fastqc"), sample=samples['out_name'].values),
#fastqc = expand(os.path.join(config["output_dir"], "{sample}", "fastqc"), sample=config["sample"]),
#htseq_qa = expand(os.path.join(config["output_dir"], "{sample}", "htseq_qa", "htseq_quality.pdf"), sample=config["sample"]),
#gn_estimates = expand(os.path.join(config["output_dir"], "{sample}", "salmon_quant", "quant.genes.sf"), sample=config["sample"]),
#bam = expand(os.path.join(config["output_dir"], "{sample}", "STAR_Aligned.out.bam"), sample=config["sample"])
##################################################################################
# Execution dependend on sequencing mode
##################################################################################
include: 'paired_end.snakefile'
include: 'single_end.snakefile'
##################################################################################
### Fastqc
......
......@@ -2,6 +2,7 @@
##############################################################################
### Annotation
##############################################################################
organism: "Homo_sapiens"
annotation: "../prepare_annotation/results/annotation.gtf"
genome: "../prepare_annotation/results/genome.fa"
annotation_filtered: "../prepare_annotation/results/filtered_transcripts.gtf"
......@@ -12,6 +13,8 @@
##############################################################################
### Output and log directories
##############################################################################
database_path: "/scicore/home/zavolan/GROUP/Rna_Seq_pipeline/Blabla"
STAR_idx_folder: "STAR_indices"
output_dir: "results"
local_log: "logs/local_log"
cluster_log: "logs/cluster_log"
......
rule index_genome_STAR:
'''
Create Star index
'''
input:
genome = os.path.join(config["output_dir"], "genome.fa"),
annotation = os.path.join(config["output_dir"], "annotation.gtf")
output:
output = os.path.join(config["database_path"], config['organism'], config['STAR_idx_folder], "STAR_index" + {sjdb})
params:
outputdir = os.path.join(config["output_dir"],"STAR_index"),
sjdb = lambda wildcards: samples.loc['sjdb']
threads: 8
singularity:
"docker://zavolab/star:2.6.0a"
log:
os.path.join(config["local_log"],"index_genome_STAR.log")
shell:
"mkdir -p {output.output}; \
chmod -R 777 {output.output}; \
(STAR --runMode genomeGenerate \
--sjdbOverhang {params.sjdbOverhang} \
--genomeDir {params.outputdir} \
--genomeFastaFiles {input.genome} \
--runThreadN {threads} \
--sjdbGTFfile {input.annotation}) &> {log}"
\ No newline at end of file
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment