.. _`bio/bwa/samxe`: BWA SAM(SE/PE) ============== .. image:: https://img.shields.io/github/issues-pr/snakemake/snakemake-wrappers/bio/bwa/samxe?label=version%20update%20pull%20requests :target: https://github.com/snakemake/snakemake-wrappers/pulls?q=is%3Apr+is%3Aopen+label%3Abio/bwa/samxe Map paired-end reads with either bwa samse or sampe. Example ------- This wrapper can be used in the following way: .. code-block:: python rule bwa_sam_pe: input: fastq=["reads/{sample}.1.fastq", "reads/{sample}.2.fastq"], sai=["sai/{sample}.1.sai", "sai/{sample}.2.sai"], idx=multiext("genome", ".amb", ".ann", ".bwt", ".pac", ".sa"), output: "mapped/{sample}.pe.sam", params: extra=r"-r '@RG\tID:{sample}\tSM:{sample}'", # optional: Extra parameters for bwa. sort="none", log: "logs/bwa_sam_pe/{sample}.log", wrapper: "v3.0.1/bio/bwa/samxe" rule bwa_sam_se: input: fastq="reads/{sample}.1.fastq", sai="sai/{sample}.1.sai", idx=multiext("genome", ".amb", ".ann", ".bwt", ".pac", ".sa"), output: "mapped/{sample}.se.sam", params: extra=r"-r '@RG\tID:{sample}\tSM:{sample}'", # optional: Extra parameters for bwa. sort="none", log: "logs/bwa_sam_se/{sample}.log", wrapper: "v3.0.1/bio/bwa/samxe" rule bwa_bam_pe: input: fastq=["reads/{sample}.1.fastq", "reads/{sample}.2.fastq"], sai=["sai/{sample}.1.sai", "sai/{sample}.2.sai"], idx=multiext("genome", ".amb", ".ann", ".bwt", ".pac", ".sa"), output: "mapped/{sample}.pe.bam", params: extra=r"-r '@RG\tID:{sample}\tSM:{sample}'", # optional: Extra parameters for bwa. sort="none", log: "logs/bwa_bam_pe/{sample}.log", wrapper: "v3.0.1/bio/bwa/samxe" rule bwa_bam_se: input: fastq="reads/{sample}.1.fastq", sai="sai/{sample}.1.sai", idx=multiext("genome", ".amb", ".ann", ".bwt", ".pac", ".sa"), output: "mapped/{sample}.se.bam", params: extra=r"-r '@RG\tID:{sample}\tSM:{sample}'", # optional: Extra parameters for bwa. sort="none", log: "logs/bwa_bam_se/{sample}.log", wrapper: "v3.0.1/bio/bwa/samxe" Note that input, output and log file paths can be chosen freely. When running with .. code-block:: bash snakemake --use-conda the software dependencies will be automatically deployed into an isolated environment before execution. Notes ----- * The `extra` param allows for additional program arguments. * For more information see, http://bio-bwa.sourceforge.net/bwa.shtml Software dependencies --------------------- * ``bwa=0.7.17`` * ``samtools=1.18`` * ``picard-slim=3.1.1`` Input/Output ------------ **Input:** * ``fastq``: FASTQ file(s) * ``sai``: SAI file(s) * ``idx``: BWA reference genome index **Output:** * SAM/BAM alignment file Authors ------- * Filipe G. Vieira Code ---- .. code-block:: python """Snakemake wrapper for both bwa samse and sampe.""" __author__ = "Filipe G. Vieira" __copyright__ = "Copyright 2020, Filipe G. Vieira" __license__ = "MIT" from os import path from snakemake.shell import shell index = snakemake.input.get("idx", "") if isinstance(index, str): index = path.splitext(snakemake.input.idx)[0] else: index = path.splitext(snakemake.input.idx[0])[0] # Check inputs. fastq = ( snakemake.input.fastq if isinstance(snakemake.input.fastq, list) else [snakemake.input.fastq] ) sai = ( snakemake.input.sai if isinstance(snakemake.input.sai, list) else [snakemake.input.sai] ) if len(fastq) == 1 and len(sai) == 1: alg = "samse" elif len(fastq) == 2 and len(sai) == 2: alg = "sampe" else: raise ValueError("input.fastq and input.sai must have 1 or 2 elements each") # Extract output format out_name, out_ext = path.splitext(snakemake.output[0]) out_ext = out_ext[1:].upper() # Extract arguments. extra = snakemake.params.get("extra", "") sort = snakemake.params.get("sort", "none") sort_order = snakemake.params.get("sort_order", "coordinate") sort_extra = snakemake.params.get("sort_extra", "") log = snakemake.log_fmt_shell(stdout=False, stderr=True) # Determine which pipe command to use for converting to bam or sorting. if sort == "none": # Simply convert to output format using samtools view. pipe_cmd = ( "samtools view -h --output-fmt " + out_ext + " -o {snakemake.output[0]} -" ) elif sort == "samtools": # Sort alignments using samtools sort. pipe_cmd = "samtools sort {sort_extra} -o {snakemake.output[0]} -" # Add name flag if needed. if sort_order == "queryname": sort_extra += " -n" # Use prefix for temp. prefix = path.splitext(snakemake.output[0])[0] sort_extra += " -T " + prefix + ".tmp" # Define output format sort_extra += " --output-fmt {}".format(out_ext) elif sort == "picard": # Sort alignments using picard SortSam. pipe_cmd = ( "picard SortSam {sort_extra} INPUT=/dev/stdin" " OUTPUT={snakemake.output[0]} SORT_ORDER={sort_order}" ) else: raise ValueError("Unexpected value for params.sort ({})".format(sort)) # Run command. shell( "(bwa {alg}" " {extra}" " {index}" " {snakemake.input.sai}" " {snakemake.input.fastq}" " | " + pipe_cmd + ") {log}" ) .. |nl| raw:: html