From a193eb7e4a4550c289b83821a7f4ece0a4888fa5 Mon Sep 17 00:00:00 2001 From: Chengxin Dai <37200167+daichengxin@users.noreply.github.com> Date: Mon, 26 Feb 2024 11:16:54 +0800 Subject: [PATCH] Update nextflow_schema.json --- nextflow_schema.json | 151 ++++++++----------------------------------- 1 file changed, 27 insertions(+), 124 deletions(-) diff --git a/nextflow_schema.json b/nextflow_schema.json index 05ab141c..e682d1c4 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -10,10 +10,7 @@ "type": "object", "fa_icon": "fas fa-terminal", "description": "Define where the pipeline should find input data and save output data.", - "required": [ - "input", - "outdir" - ], + "required": ["input", "outdir"], "properties": { "input": { "type": "string", @@ -28,7 +25,7 @@ "outdir": { "type": "string", "description": "The output directory where the results will be saved.", - "default": null, + "default": "./results", "fa_icon": "fas fa-folder-open" }, "email": { @@ -59,10 +56,7 @@ "acquisition_method": { "type": "string", "description": "Proteomics data acquisition method", - "enum": [ - "dda", - "dia" - ], + "enum": ["dda", "dia"], "fa_icon": "far fa-list-ol" }, "id_only": { @@ -115,9 +109,7 @@ "default": "reverse", "fa_icon": "fas fa-list-ol", "enum": [ - "reverse", - "shuffle" - ] + "reverse", "shuffle"] }, "shuffle_max_attempts": { "type": "integer", @@ -140,9 +132,7 @@ } }, "fa_icon": "fas fa-database", - "required": [ - "database" - ] + "required": ["database"] }, "spectrum_preprocessing": { "title": "Spectrum preprocessing", @@ -217,11 +207,7 @@ "help_text": "Warning: not supported by sage yet.", "default": "fully", "fa_icon": "fas fa-list-ol", - "enum": [ - "fully", - "semi", - "none" - ] + "enum": ["fully", "semi", "none"] }, "allowed_missed_cleavages": { "type": "integer", @@ -240,10 +226,7 @@ "description": "Precursor mass tolerance unit used for database search. Possible values are 'ppm' (default) and 'Da'.", "default": "ppm", "fa_icon": "fas fa-sliders-h", - "enum": [ - "Da", - "ppm" - ] + "enum": ["Da", "ppm"] }, "fragment_mass_tolerance": { "type": "number", @@ -258,10 +241,7 @@ "default": "Da", "fa_icon": "fas fa-list-ol", "help_text": "Caution: for Comet we are estimating the `fragment_bin_tolerance` parameter based on this automatically.", - "enum": [ - "Da", - "ppm" - ] + "enum": ["Da", "ppm"] }, "fixed_mods": { "type": "string", @@ -426,11 +406,7 @@ "description": "What to do when peptides are found that do not follow a unified set of rules (since search engines sometimes differ in their interpretation of them). ", "default": "warn", "fa_icon": "far fa-check-square", - "enum": [ - "warn", - "error", - "remove" - ] + "enum": ["warn", "error", "remove"] }, "IL_equivalent": { "type": "boolean", @@ -452,10 +428,7 @@ "description": "How to calculate posterior probabilities for PSMs:\n\n* 'percolator' = Re-score based on PSM-feature-based SVM and transform distance\n to hyperplane for posteriors\n* 'fit_distributions' = Fit positive and negative distributions to scores\n (similar to PeptideProphet)", "fa_icon": "fas fa-list-ol", "default": "percolator", - "enum": [ - "percolator", - "fit_distributions" - ] + "enum": ["percolator", "fit_distributions"] }, "run_fdr_cutoff": { "type": "number", @@ -498,10 +471,7 @@ "description": "Calculate FDR on PSM ('psm-level-fdrs') or peptide level ('peptide-level-fdrs')?", "default": "peptide-level-fdrs", "fa_icon": "fas fa-list-ol", - "enum": [ - "peptide-level-fdrs", - "psm-level-fdrs" - ] + "enum": ["peptide-level-fdrs", "psm-level-fdrs"] }, "train_FDR": { "type": "number", @@ -554,12 +524,7 @@ "description": "How to handle outliers during fitting:\n\n* ignore_iqr_outliers (default): ignore outliers outside of `3*IQR` from Q1/Q3 for fitting\n* set_iqr_to_closest_valid: set IQR-based outliers to the last valid value for fitting\n* ignore_extreme_percentiles: ignore everything outside 99th and 1st percentile (also removes equal values like potential censored max values in XTandem)\n* none: do nothing", "default": "none", "fa_icon": "fas fa-list-ol", - "enum": [ - "none", - "ignore_iqr_outliers", - "set_iqr_to_closest_valid", - "ignore_extreme_percentiles" - ] + "enum": ["none", "ignore_iqr_outliers", "set_iqr_to_closest_valid", "ignore_extreme_percentiles"] }, "idpep_debug": { "type": "integer", @@ -583,11 +548,7 @@ "default": "best", "fa_icon": "fas fa-list-ol", "help_text": "Specifies how search engine results are combined: ConsensusID offers several algorithms that can aggregate results from multiple peptide identification engines ('search engines') into consensus identifications - typically one per MS2 spectrum. This works especially well for search engines that provide more than one peptide hit per spectrum, i.e. that report not just the best hit, but also a list of runner-up candidates with corresponding scores.\n\nThe available algorithms are:\n\n* PEPMatrix: Scoring based on posterior error probabilities (PEPs) and peptide sequence similarities. This algorithm uses a substitution matrix to score the similarity of sequences not listed by all search engines. It requires PEPs as the scores for all peptide hits.\n* PEPIons: Scoring based on posterior error probabilities (PEPs) and fragment ion similarities ('shared peak count'). This algorithm, too, requires PEPs as scores.\n* best: For each peptide ID, this uses the best score of any search engine as the consensus score.\n* worst: For each peptide ID, this uses the worst score of any search engine as the consensus score.\n* average: For each peptide ID, this uses the average score of all search engines as the consensus score.\n* ranks: Calculates a consensus score based on the ranks of peptide IDs in the results of different search engines. The final score is in the range (0, 1], with 1 being the best score.\n\nTo make scores comparable, for best, worst and average, PEPs are used as well. Peptide IDs are only considered the same if they map to exactly the same sequence (including modifications and their localization). Also isobaric aminoacids are (for now) only considered equal with the PEPMatrix/PEPIons algorithms.", - "enum": [ - "best", - "PEPMatrix", - "PEPIons" - ] + "enum": ["best", "PEPMatrix", "PEPIons"] }, "consensusid_considered_top_hits": { "type": "integer", @@ -621,12 +582,7 @@ "type": "string", "description": "Operate only on MSn scans where any of its precursors features a certain activation method. Set to empty to disable.", "fa_icon": "fas fa-font", - "enum": [ - "HCD", - "CID", - "ETD", - "ECD" - ] + "enum": ["HCD", "CID", "ETD", "ECD"] }, "reporter_mass_shift": { "type": "number", @@ -715,20 +671,13 @@ "default": "aggregation", "fa_icon": "fas fa-list-ol", "help_text": "Infer proteins through:\n\n* 'aggregation' = aggregates all peptide scores across a protein (by calculating the maximum) (default)\n* 'bayesian' = compute a posterior probability for every protein based on a Bayesian network (i.e. using Epifany)\n* ('percolator' not yet supported)\n\n**Note:** If protein grouping is performed also depends on the `protein_quant` parameter (i.e. if peptides have to be unique or unique to a group only)", - "enum": [ - "aggregation", - "bayesian" - ] + "enum": ["aggregation", "bayesian"] }, "protein_score": { "type": "string", "description": "[Ignored in Bayesian] How to aggregate scores of peptides matching to the same protein", "default": "best", - "enum": [ - "best", - "product", - "sum" - ], + "enum": ["best", "product", "sum"], "fa_icon": "fas fa-list-ol" }, "use_shared_peptides": { @@ -817,12 +766,7 @@ "type": "string", "description": "Averaging method used to compute protein abundances from peptide abundances.", "default": "median", - "enum": [ - "median", - "mean", - "weighted_mean", - "sum" - ], + "enum": ["median", "mean", "weighted_mean", "sum"], "fa_icon": "fas fa-list-ol" }, "best_charge_and_fraction": { @@ -858,11 +802,7 @@ "type": "string", "description": "Quantify proteins based on:\n\n* 'unique_peptides' = use peptides mapping to single proteins or a group of indistinguishable proteins (according to the set of experimentally identified peptides)\n* 'strictly_unique_peptides' (only LFQ) = use peptides mapping to a unique single protein only\n* 'shared_peptides' = use shared peptides, too, but only greedily for its best group (by inference score and nr. of peptides)", "default": "unique_peptides", - "enum": [ - "unique_peptides", - "strictly_unique_peptides", - "shared_peptides" - ], + "enum": ["unique_peptides", "strictly_unique_peptides", "shared_peptides"], "fa_icon": "fas fa-list-ol" }, "export_mztab": { @@ -884,10 +824,7 @@ "type": "string", "description": "Choose between feature-based quantification based on integrated MS1 signals ('feature_intensity'; default) or spectral counting of PSMs ('spectral_counting'). **WARNING:** 'spectral_counting' is not compatible with our MSstats step yet. MSstats will therefore be disabled automatically with that choice.", "default": "feature_intensity", - "enum": [ - "feature_intensity", - "spectral_counting" - ], + "enum": ["feature_intensity", "spectral_counting"], "fa_icon": "fas fa-list-ol" }, "mass_recalibration": { @@ -926,10 +863,7 @@ "type": "string", "description": "The order in which maps are aligned. Star = all vs. the reference with most IDs (default). TreeGuided = an alignment tree is calculated first based on similarity measures of the IDs in the maps.", "default": "star", - "enum": [ - "star", - "treeguided" - ], + "enum": ["star", "treeguided"], "fa_icon": "far fa-list-ol" }, "quantify_decoys": { @@ -995,11 +929,7 @@ "type": "number", "description": "Controls the protein inference mode", "fa_icon": "fas fa-list-ol", - "enum": [ - 0, - 1, - 2 - ], + "enum": [0, 1, 2], "default": 2 }, "species_genes": { @@ -1034,13 +964,7 @@ "description": "Debug level", "default": 3, "fa_icon": "fas fa-bug", - "enum": [ - 0, - 1, - 2, - 3, - 4 - ], + "enum": [0, 1, 2, 3, 4], "hidden": true }, "diann_normalize": { @@ -1103,20 +1027,14 @@ "description": "Which features to use for quantification per protein: 'top3' or 'highQuality' which removes outliers only", "fa_icon": "far fa-list-ol", "default": "top3", - "enum": [ - "top3", - "highQuality" - ] + "enum": ["top3", "highQuality"] }, "msstatslfq_quant_summary_method": { "type": "string", "description": "which summary method to use: 'TMP' (Tukey's median polish) or 'linear' (linear mixed model)", "fa_icon": "far fa-list-ol", "default": "TMP", - "enum": [ - "TMP", - "linear" - ] + "enum": ["TMP", "linear"] }, "msstats_remove_one_feat_prot": { "type": "boolean", @@ -1147,22 +1065,14 @@ "description": "select the feature with the largest summmation or maximal value", "fa_icon": "far fa-list-ol", "default": "sum", - "enum": [ - "sum", - "max" - ] + "enum": ["sum", "max"] }, "msstatsiso_summarization_method": { "type": "string", "description": "summarization methods to protein-level can be perfomed", "fa_icon": "far fa-list-ol", "default": "msstats", - "enum": [ - "msstats", - "MedianPolish", - "Median", - "LogSum" - ] + "enum": ["msstats", "MedianPolish", "Median", "LogSum"] }, "msstatsiso_global_norm": { "type": "boolean", @@ -1318,14 +1228,7 @@ "description": "Method used to save pipeline results to output directory.", "help_text": "The Nextflow `publishDir` option specifies which intermediate files should be saved to the output directory. This option tells the pipeline what method should be used to move these files. See [Nextflow docs](https://www.nextflow.io/docs/latest/process.html#publishdir) for details.", "fa_icon": "fas fa-copy", - "enum": [ - "symlink", - "rellink", - "link", - "copy", - "copyNoFollow", - "move" - ], + "enum": ["symlink", "rellink", "link", "copy", "copyNoFollow", "move"], "hidden": true }, "email_on_fail": {