|
9 | 9 | "title": "Input options", |
10 | 10 | "type": "object", |
11 | 11 | "description": "Define where the pipeline should find input data ", |
12 | | - "required": ["input_folder", "species_tree"], |
| 12 | + "required": ["input", "species_tree"], |
13 | 13 | "properties": { |
14 | | - "input_folder": { |
| 14 | + "input": { |
15 | 15 | "type": "string", |
16 | | - "format": "directory-path", |
17 | | - "description": "Path to input directory containing proteomes and species tree", |
18 | | - "fa_icon": "fas fa-folder-open" |
| 16 | + "description": "Input data source: local directory, archive file, or remote URL", |
| 17 | + "help": "Can be: (1) Path to a local directory containing proteome/ subfolder and species_tree.nwk file, (2) Path to a local archive file (.tar.gz, .tgz, .zip), or (3) HTTP/HTTPS URL to download an archive. Archives will be automatically extracted and cached.", |
| 18 | + "fa_icon": "fas fa-folder-open", |
| 19 | + "examples": [ |
| 20 | + "/path/to/dataset/", |
| 21 | + "/path/to/dataset.tar.gz", |
| 22 | + "https://zenodo.org/records/12345/files/dataset.tar.gz" |
| 23 | + ] |
19 | 24 | }, |
20 | 25 | "proteome_folder": { |
21 | 26 | "type": "string", |
22 | 27 | "format": "directory-path", |
23 | 28 | "description": "Path to input directory containing the proteome files in fasta format", |
24 | | - "help": "If not provided, the proteomes are asumed to be in the input_folder/proteomes directory.", |
| 29 | + "help": "Override the default proteome folder location. Only used when input is a local directory. If not specified, defaults to input/proteome/.", |
25 | 30 | "fa_icon": "fas fa-folder-open" |
26 | 31 | }, |
27 | 32 | "hogmap_in": { |
|
34 | 39 | "species_tree": { |
35 | 40 | "type": "string", |
36 | 41 | "format": "file-path", |
37 | | - "description": "Path to species tree file", |
| 42 | + "description": "Path to species tree file in Newick format", |
38 | 43 | "fa_icon": "fas fa-tree", |
39 | 44 | "pattern": "^\\S+\\.(nhx|nh|nwk)", |
40 | | - "help": "The species tree should be in Newick or NHX format. By default, the pipeline looks for a file named species_tree.nwk in the input_folder." |
| 45 | + "help": "Override the default species tree location. Only used when input is a local directory. If not specified, defaults to input/species_tree.nwk." |
41 | 46 | }, |
42 | 47 | "splice_folder": { |
43 | 48 | "type": "string", |
44 | 49 | "format": "directory-path", |
45 | 50 | "description": "Path to input directory containing the splice files", |
46 | 51 | "fa_icon": "fas fa-folder-open", |
47 | | - "help": "If provided, FastOMA will use the splice files to identify and handle alternative splicing isoforms in the proteomes and select the best representative isoform for each gene." |
| 52 | + "help": "If provided, FastOMA will use splice variant information to select representative isoforms for each gene. Only used when input is a local directory." |
48 | 53 | }, |
49 | 54 | "omamer_db": { |
50 | 55 | "type": "string", |
|
53 | 58 | "fa_icon": "fas fa-database", |
54 | 59 | "help": "If not provided, the default OMAmer database (LUCA) will be used.", |
55 | 60 | "default": "https://omabrowser.org/All/LUCA.h5" |
| 61 | + }, |
| 62 | + "test_data_cache": { |
| 63 | + "type": "string", |
| 64 | + "format": "directory-path", |
| 65 | + "description": "Path where (remote) input archives will be stored and permanently cached", |
| 66 | + "fa_ison": "fas fa-folder-open" |
| 67 | + }, |
| 68 | + "input_folder": { |
| 69 | + "type": "string", |
| 70 | + "hidden": true, |
| 71 | + "format": "directory-path", |
| 72 | + "description": "DEPRECATED: Use --input instead", |
| 73 | + "help_text": "This parameter has been renamed to --input. Please update your command line or configuration files." |
56 | 74 | } |
57 | 75 | } |
58 | 76 | }, |
|
0 commit comments