[
    {
        "id": "gstacks_denovo",
        "name": "gstacks_denovo",
        "article": "10.1111\/mec.15253",
        "website": "http:\/\/catchenlab.life.illinois.edu\/stacks\/comp\/gstacks.php",
        "git": "",
        "description": "gstacks builds loci from single and\/or paired-end reads before calling SNPs",
        "version": "2.64",
        "documentation": "http:\/\/catchenlab.life.illinois.edu\/stacks\/comp\/gstacks.php",
        "multiqc": "custom",
        "commands": [
            {
                "name": "gstacks_denovo",
                "cname": "gstacks_denovo",
                "command": "gstacks",
                "category": "stacks",
                "output_dir": "gstacks_denovo",
                "inputs": [
                    {
                        "name": "tsv2bam_done",
                        "type": "tsv2bam_done"
                    },
                    {
                        "name": "popmap",
                        "type": "popmap"
                    }
                ],
                "outputs": [
                    {
                        "name": "catalog_calls",
                        "type": "stacks_calls",
                        "file": "catalog.calls",
                        "description": "Custom file that contains genotyping data"
                    },
                    {
                        "name": "catalog_fa",
                        "type": "fa.gz",
                        "file": "catalog.fa.gz",
                        "description": "Consensus sequence for each assembled locus in the data"
                    },
                    {
                        "name": "stats",
                        "type": "distribs",
                        "file": "gstacks.log.distribs",
                        "description": "Distribution statistics (BAM stats, coverage and phasing rates per sample)"
                    }
                ],
                "options": [
                    {
                        "name": "gstacks_denovo_threads",
                        "prefix": "-t",
                        "type": "numeric",
                        "value": 4,
                        "min": 1,
                        "max": "NA",
                        "step": 1,
                        "label": "Number of threads to use"
                    },
                    {
                        "name": "gstacks_denovo_model",
                        "prefix": "--model",
                        "type": "select",
                        "value": "marukilow",
                        "choices": [
                            {
                                "marukilow": "marukilow"
                            },
                            {
                                "marukihigh": "marukihigh"
                            },
                            {
                                "snp": "snp"
                            }
                        ],
                        "label": "Model to use to call variants and genotypes"
                    },
                    {
                        "name": "gstacks_denovo_var_alpha",
                        "prefix": "--var-alpha",
                        "type": "numeric",
                        "value": 0.05,
                        "min": 0,
                        "max": "NA",
                        "step": "NA",
                        "label": "Alpha threshold for discovering SNPs"
                    },
                    {
                        "name": "gstacks_denovo_gt_alpha",
                        "prefix": "--gt-alpha",
                        "type": "numeric",
                        "value": 0.05,
                        "min": 0,
                        "max": "NA",
                        "step": "NA",
                        "label": "Alpha threshold for calling genotypes"
                    },
                    {
                        "name": "gstacks_denovo_min_mapq",
                        "prefix": "--min-mapq",
                        "type": "numeric",
                        "value": 20,
                        "min": 0,
                        "max": "NA",
                        "step": 1,
                        "label": "Minimum PHRED-scaled mapping quality to consider a read"
                    },
                    {
                        "name": "gstacks_denovo_max_clipped",
                        "prefix": "--max-clipped",
                        "type": "numeric",
                        "value": 0.2,
                        "min": 0,
                        "max": "NA",
                        "step": "NA",
                        "label": "Maximum soft-clipping level, in fraction of read length"
                    }
                ]
            }
        ],
        "prepare_report_script": "gstacks_denovo.prepare.report.R",
        "prepare_report_outputs": [
            "effective_coverages_per_sample_mqc.tsv",
            "phasing_rates_per_sample_mqc.tsv"
        ],
        "install": [],
        "citations": {
            "stacks": [
                "Rochette, NC, Rivera\u2010Col\u00f3n, AG, Catchen, JM. Stacks 2: Analytical methods for paired\u2010end sequencing improve RADseq\u2010based population genomics. Mol Ecol. 2019; 28: 4737-4754. https:\/\/doi.org\/10.1111\/mec.15253"
            ]
        },
        "yaml": "{\n  id: gstacks_denovo,\n  name: gstacks_denovo,\n  article: 10.1111\/mec.15253,\n  website: \"http:\/\/catchenlab.life.illinois.edu\/stacks\/comp\/gstacks.php\",\n  git: \"\",\n  description: \"gstacks build loci from the single and\/or paired-end reads before calling SNPs\",\n  version: \"2.64\",\n  documentation: \"http:\/\/catchenlab.life.illinois.edu\/stacks\/comp\/gstacks.php\",\n  multiqc: \"custom\",\n  commands:\n    [\n      {\n        name: gstacks_denovo,\n        cname: \"gstacks_denovo\",\n        command: gstacks,\n        category: \"stacks\",\n        output_dir: gstacks_denovo,\n        inputs: [{ name: tsv2bam_done, type: \"tsv2bam_done\" }, #all bams must be in the same tsv2bam dir \n                 { name: popmap, type: \"popmap\" }\n                 ],\n        outputs:\n          [\n            { name: catalog_calls, type: \"stacks_calls\", file: \"catalog.calls\", description: \"Consensus sequence for each assembled locus in the data\" },\n            { name: catalog_fa, type: \"fa.gz\", file: \"catalog.fa.gz\", description: \"Custom file that contains genotyping data\" },\n            { name: stats, type: \"distribs\", file: \"gstacks.log.distribs\", description: \"Distributions statistics (bam stats, coverage and phasing_rates per sample)\" },\n          ],\n        options:\n          [\n            {\n              name: gstacks_denovo_threads,\n              prefix: -t,\n              type: numeric,\n              value: 4,\n              min: 1,\n              max: NA,\n              step: 1,\n              label: \"Number of threads to use\",\n            },\n            {\n              name: gstacks_denovo_model,\n              prefix: --model,\n              type: select,\n              value: marukilow,\n              choices: [marukilow: marukilow, marukihigh: marukihigh, snp: snp],\n              label: \"Model to use to call variants and genotypes\",\n            },\n            {\n              name: 
gstacks_denovo_var_alpha,\n              prefix: --var-alpha,\n              type: numeric,\n              value: 0.05,\n              min: 0,\n              max: NA,\n              step: NA,\n              label: \"Alpha threshold for discovering SNPs\",\n            },\n            {\n              name: gstacks_denovo_gt_alpha,\n              prefix: --gt-alpha,\n              type: numeric,\n              value: 0.05,\n              min: 0,\n              max: NA,\n              step: NA,\n              label: \"Alpha threshold for calling genotypes\",\n            },\n            {\n              name: gstacks_denovo_min_mapq,\n              prefix: --min-mapq,\n              type: numeric,\n              value: 20,\n              min: 0,\n              max: NA,\n              step: 1,\n              label: \"Minimum PHRED-scaled mapping quality to consider a read\",\n            },\n            {\n              name: gstacks_denovo_max_clipped,\n              prefix: --max-clipped,\n              type: numeric,\n              value: 0.20,\n              min: 0,\n              max: NA,\n              step: NA,\n              label: \"Maximum soft-clipping level, in fraction of read length\",\n            }\n          ],\n      },\n    ],\n  prepare_report_script:  gstacks_denovo.prepare.report.R,\n  prepare_report_outputs: [\n     effective_coverages_per_sample_mqc.tsv,\n     phasing_rates_per_sample_mqc.tsv\n  ],  \n  install:\n    {\n      # stacks: [\n      #   \"cd \/opt\/biotools\",\n      #   \"wget http:\/\/catchenlab.life.illinois.edu\/stacks\/source\/stacks-2.61.tar.gz\",\n      #   \"tar -zxvf stacks-2.61.tar.gz\",\n      #   \"cd stacks-2.61\/\",\n      #   \".\/configure\",\n      #   \"make -j 10\",\n      #   \"make install\",\n      #   \"mv -t ..\/bin sstacks kmer_filter gstacks tsv2bam process_shortreads populations ustacks phasedstacks cstacks process_radtags\",\n      #   \"cd .. 
&& rm -r stacks-2.61 stacks-2.61.tar.gz\"\n      # ]\n    },\n  citations:  {\n    stacks: [\n      \" Rochette, NC, Rivera\u2010Col\u00f3n, AG, Catchen, JM. Stacks 2: Analytical methods for paired\u2010end sequencing improve RADseq\u2010based population genomics. Mol Ecol. 2019; 28: 4737- 4754. https:\/\/doi.org\/10.1111\/mec.15253\"\n    ]\n  }\n}\n"
    }
]