Skip to content

Commit

Permalink
Update nextflow_schema.json
Browse files Browse the repository at this point in the history
  • Loading branch information
daichengxin committed Feb 26, 2024
1 parent d2ccd5f commit a193eb7
Showing 1 changed file with 27 additions and 124 deletions.
151 changes: 27 additions & 124 deletions nextflow_schema.json
Original file line number Diff line number Diff line change
Expand Up @@ -10,10 +10,7 @@
"type": "object",
"fa_icon": "fas fa-terminal",
"description": "Define where the pipeline should find input data and save output data.",
"required": [
"input",
"outdir"
],
"required": ["input", "outdir"],
"properties": {
"input": {
"type": "string",
Expand All @@ -28,7 +25,7 @@
"outdir": {
"type": "string",
"description": "The output directory where the results will be saved.",
"default": null,
"default": "./results",
"fa_icon": "fas fa-folder-open"
},
"email": {
Expand Down Expand Up @@ -59,10 +56,7 @@
"acquisition_method": {
"type": "string",
"description": "Proteomics data acquisition method",
"enum": [
"dda",
"dia"
],
"enum": ["dda", "dia"],
"fa_icon": "far fa-list-ol"
},
"id_only": {
Expand Down Expand Up @@ -115,9 +109,7 @@
"default": "reverse",
"fa_icon": "fas fa-list-ol",
"enum": [
"reverse",
"shuffle"
]
"reverse", "shuffle"]
},
"shuffle_max_attempts": {
"type": "integer",
Expand All @@ -140,9 +132,7 @@
}
},
"fa_icon": "fas fa-database",
"required": [
"database"
]
"required": ["database"]
},
"spectrum_preprocessing": {
"title": "Spectrum preprocessing",
Expand Down Expand Up @@ -217,11 +207,7 @@
"help_text": "Warning: not supported by sage yet.",
"default": "fully",
"fa_icon": "fas fa-list-ol",
"enum": [
"fully",
"semi",
"none"
]
"enum": ["fully", "semi", "none"]
},
"allowed_missed_cleavages": {
"type": "integer",
Expand All @@ -240,10 +226,7 @@
"description": "Precursor mass tolerance unit used for database search. Possible values are 'ppm' (default) and 'Da'.",
"default": "ppm",
"fa_icon": "fas fa-sliders-h",
"enum": [
"Da",
"ppm"
]
"enum": ["Da", "ppm"]
},
"fragment_mass_tolerance": {
"type": "number",
Expand All @@ -258,10 +241,7 @@
"default": "Da",
"fa_icon": "fas fa-list-ol",
"help_text": "Caution: for Comet we are estimating the `fragment_bin_tolerance` parameter based on this automatically.",
"enum": [
"Da",
"ppm"
]
"enum": ["Da", "ppm"]
},
"fixed_mods": {
"type": "string",
Expand Down Expand Up @@ -426,11 +406,7 @@
"description": "What to do when peptides are found that do not follow a unified set of rules (since search engines sometimes differ in their interpretation of them). ",
"default": "warn",
"fa_icon": "far fa-check-square",
"enum": [
"warn",
"error",
"remove"
]
"enum": ["warn", "error", "remove"]
},
"IL_equivalent": {
"type": "boolean",
Expand All @@ -452,10 +428,7 @@
"description": "How to calculate posterior probabilities for PSMs:\n\n* 'percolator' = Re-score based on PSM-feature-based SVM and transform distance\n to hyperplane for posteriors\n* 'fit_distributions' = Fit positive and negative distributions to scores\n (similar to PeptideProphet)",
"fa_icon": "fas fa-list-ol",
"default": "percolator",
"enum": [
"percolator",
"fit_distributions"
]
"enum": ["percolator", "fit_distributions"]
},
"run_fdr_cutoff": {
"type": "number",
Expand Down Expand Up @@ -498,10 +471,7 @@
"description": "Calculate FDR on PSM ('psm-level-fdrs') or peptide level ('peptide-level-fdrs')?",
"default": "peptide-level-fdrs",
"fa_icon": "fas fa-list-ol",
"enum": [
"peptide-level-fdrs",
"psm-level-fdrs"
]
"enum": ["peptide-level-fdrs", "psm-level-fdrs"]
},
"train_FDR": {
"type": "number",
Expand Down Expand Up @@ -554,12 +524,7 @@
"description": "How to handle outliers during fitting:\n\n* ignore_iqr_outliers (default): ignore outliers outside of `3*IQR` from Q1/Q3 for fitting\n* set_iqr_to_closest_valid: set IQR-based outliers to the last valid value for fitting\n* ignore_extreme_percentiles: ignore everything outside 99th and 1st percentile (also removes equal values like potential censored max values in XTandem)\n* none: do nothing",
"default": "none",
"fa_icon": "fas fa-list-ol",
"enum": [
"none",
"ignore_iqr_outliers",
"set_iqr_to_closest_valid",
"ignore_extreme_percentiles"
]
"enum": ["none", "ignore_iqr_outliers", "set_iqr_to_closest_valid", "ignore_extreme_percentiles"]
},
"idpep_debug": {
"type": "integer",
Expand All @@ -583,11 +548,7 @@
"default": "best",
"fa_icon": "fas fa-list-ol",
"help_text": "Specifies how search engine results are combined: ConsensusID offers several algorithms that can aggregate results from multiple peptide identification engines ('search engines') into consensus identifications - typically one per MS2 spectrum. This works especially well for search engines that provide more than one peptide hit per spectrum, i.e. that report not just the best hit, but also a list of runner-up candidates with corresponding scores.\n\nThe available algorithms are:\n\n* PEPMatrix: Scoring based on posterior error probabilities (PEPs) and peptide sequence similarities. This algorithm uses a substitution matrix to score the similarity of sequences not listed by all search engines. It requires PEPs as the scores for all peptide hits.\n* PEPIons: Scoring based on posterior error probabilities (PEPs) and fragment ion similarities ('shared peak count'). This algorithm, too, requires PEPs as scores.\n* best: For each peptide ID, this uses the best score of any search engine as the consensus score.\n* worst: For each peptide ID, this uses the worst score of any search engine as the consensus score.\n* average: For each peptide ID, this uses the average score of all search engines as the consensus score.\n* ranks: Calculates a consensus score based on the ranks of peptide IDs in the results of different search engines. The final score is in the range (0, 1], with 1 being the best score.\n\nTo make scores comparable, for best, worst and average, PEPs are used as well. Peptide IDs are only considered the same if they map to exactly the same sequence (including modifications and their localization). Also isobaric aminoacids are (for now) only considered equal with the PEPMatrix/PEPIons algorithms.",
"enum": [
"best",
"PEPMatrix",
"PEPIons"
]
"enum": ["best", "PEPMatrix", "PEPIons"]
},
"consensusid_considered_top_hits": {
"type": "integer",
Expand Down Expand Up @@ -621,12 +582,7 @@
"type": "string",
"description": "Operate only on MSn scans where any of its precursors features a certain activation method. Set to empty to disable.",
"fa_icon": "fas fa-font",
"enum": [
"HCD",
"CID",
"ETD",
"ECD"
]
"enum": ["HCD", "CID", "ETD", "ECD"]
},
"reporter_mass_shift": {
"type": "number",
Expand Down Expand Up @@ -715,20 +671,13 @@
"default": "aggregation",
"fa_icon": "fas fa-list-ol",
"help_text": "Infer proteins through:\n\n* 'aggregation' = aggregates all peptide scores across a protein (by calculating the maximum) (default)\n* 'bayesian' = compute a posterior probability for every protein based on a Bayesian network (i.e. using Epifany)\n* ('percolator' not yet supported)\n\n**Note:** If protein grouping is performed also depends on the `protein_quant` parameter (i.e. if peptides have to be unique or unique to a group only)",
"enum": [
"aggregation",
"bayesian"
]
"enum": ["aggregation", "bayesian"]
},
"protein_score": {
"type": "string",
"description": "[Ignored in Bayesian] How to aggregate scores of peptides matching to the same protein",
"default": "best",
"enum": [
"best",
"product",
"sum"
],
"enum": ["best", "product", "sum"],
"fa_icon": "fas fa-list-ol"
},
"use_shared_peptides": {
Expand Down Expand Up @@ -817,12 +766,7 @@
"type": "string",
"description": "Averaging method used to compute protein abundances from peptide abundances.",
"default": "median",
"enum": [
"median",
"mean",
"weighted_mean",
"sum"
],
"enum": ["median", "mean", "weighted_mean", "sum"],
"fa_icon": "fas fa-list-ol"
},
"best_charge_and_fraction": {
Expand Down Expand Up @@ -858,11 +802,7 @@
"type": "string",
"description": "Quantify proteins based on:\n\n* 'unique_peptides' = use peptides mapping to single proteins or a group of indistinguishable proteins (according to the set of experimentally identified peptides)\n* 'strictly_unique_peptides' (only LFQ) = use peptides mapping to a unique single protein only\n* 'shared_peptides' = use shared peptides, too, but only greedily for its best group (by inference score and nr. of peptides)",
"default": "unique_peptides",
"enum": [
"unique_peptides",
"strictly_unique_peptides",
"shared_peptides"
],
"enum": ["unique_peptides", "strictly_unique_peptides", "shared_peptides"],
"fa_icon": "fas fa-list-ol"
},
"export_mztab": {
Expand All @@ -884,10 +824,7 @@
"type": "string",
"description": "Choose between feature-based quantification based on integrated MS1 signals ('feature_intensity'; default) or spectral counting of PSMs ('spectral_counting'). **WARNING:** 'spectral_counting' is not compatible with our MSstats step yet. MSstats will therefore be disabled automatically with that choice.",
"default": "feature_intensity",
"enum": [
"feature_intensity",
"spectral_counting"
],
"enum": ["feature_intensity", "spectral_counting"],
"fa_icon": "fas fa-list-ol"
},
"mass_recalibration": {
Expand Down Expand Up @@ -926,10 +863,7 @@
"type": "string",
"description": "The order in which maps are aligned. Star = all vs. the reference with most IDs (default). TreeGuided = an alignment tree is calculated first based on similarity measures of the IDs in the maps.",
"default": "star",
"enum": [
"star",
"treeguided"
],
"enum": ["star", "treeguided"],
"fa_icon": "far fa-list-ol"
},
"quantify_decoys": {
Expand Down Expand Up @@ -995,11 +929,7 @@
"type": "number",
"description": "Controls the protein inference mode",
"fa_icon": "fas fa-list-ol",
"enum": [
0,
1,
2
],
"enum": [0, 1, 2],
"default": 2
},
"species_genes": {
Expand Down Expand Up @@ -1034,13 +964,7 @@
"description": "Debug level",
"default": 3,
"fa_icon": "fas fa-bug",
"enum": [
0,
1,
2,
3,
4
],
"enum": [0, 1, 2, 3, 4],
"hidden": true
},
"diann_normalize": {
Expand Down Expand Up @@ -1103,20 +1027,14 @@
"description": "Which features to use for quantification per protein: 'top3' or 'highQuality' which removes outliers only",
"fa_icon": "far fa-list-ol",
"default": "top3",
"enum": [
"top3",
"highQuality"
]
"enum": ["top3", "highQuality"]
},
"msstatslfq_quant_summary_method": {
"type": "string",
"description": "which summary method to use: 'TMP' (Tukey's median polish) or 'linear' (linear mixed model)",
"fa_icon": "far fa-list-ol",
"default": "TMP",
"enum": [
"TMP",
"linear"
]
"enum": ["TMP", "linear"]
},
"msstats_remove_one_feat_prot": {
"type": "boolean",
Expand Down Expand Up @@ -1147,22 +1065,14 @@
"description": "select the feature with the largest summmation or maximal value",
"fa_icon": "far fa-list-ol",
"default": "sum",
"enum": [
"sum",
"max"
]
"enum": ["sum", "max"]
},
"msstatsiso_summarization_method": {
"type": "string",
"description": "summarization methods to protein-level can be perfomed",
"fa_icon": "far fa-list-ol",
"default": "msstats",
"enum": [
"msstats",
"MedianPolish",
"Median",
"LogSum"
]
"enum": ["msstats", "MedianPolish", "Median", "LogSum"]
},
"msstatsiso_global_norm": {
"type": "boolean",
Expand Down Expand Up @@ -1318,14 +1228,7 @@
"description": "Method used to save pipeline results to output directory.",
"help_text": "The Nextflow `publishDir` option specifies which intermediate files should be saved to the output directory. This option tells the pipeline what method should be used to move these files. See [Nextflow docs](https://www.nextflow.io/docs/latest/process.html#publishdir) for details.",
"fa_icon": "fas fa-copy",
"enum": [
"symlink",
"rellink",
"link",
"copy",
"copyNoFollow",
"move"
],
"enum": ["symlink", "rellink", "link", "copy", "copyNoFollow", "move"],
"hidden": true
},
"email_on_fail": {
Expand Down

0 comments on commit a193eb7

Please sign in to comment.