|
13 | 13 | "errorMessage": "Sample name must be provided and cannot contain spaces", |
14 | 14 | "meta": ["id"] |
15 | 15 | }, |
16 | | - "fastq_1": { |
| 16 | + "fasta": { |
17 | 17 | "type": "string", |
18 | 18 | "format": "file-path", |
19 | 19 | "exists": true, |
20 | 20 | "pattern": "^([\\S\\s]*\\/)?[^\\s\\/]+\\.f(ast)?q\\.gz$", |
21 | | - "errorMessage": "FastQ file for reads 1 must be provided, cannot contain spaces and must have extension '.fq.gz' or '.fastq.gz'" |
| 21 | + "errorMessage": "FASTA file for sequences 1 must be provided, cannot contain spaces and must have extension '.fa.gz' or '.fasta.gz'", |
| 22 | + "description": "MAG/bin sequence file" |
22 | 23 | }, |
23 | | - "fastq_2": { |
| 24 | + "accession": { |
24 | 25 | "type": "string", |
25 | | - "format": "file-path", |
26 | | - "exists": true, |
27 | | - "pattern": "^([\\S\\s]*\\/)?[^\\s\\/]+\\.f(ast)?q\\.gz$", |
28 | | - "errorMessage": "FastQ file for reads 2 cannot contain spaces and must have extension '.fq.gz' or '.fastq.gz'" |
| 26 | + "description": "Run or assembly ENA accession" |
| 27 | + }, |
| 28 | + "assembly_software": { |
| 29 | + "type": "string", |
| 30 | + "description": "Tool name and version that was used to assemble data" |
| 31 | + }, |
| 32 | + "binning_software": { |
| 33 | + "type": "string", |
| 34 | + "description": "Tool name and version that was used to bin data" |
| 35 | + }, |
| 36 | + "binning_parameters": { |
| 37 | + "type": "string", |
| 38 | + "description": "Arguments used to bin data different from default" |
| 39 | + }, |
| 40 | + "stats_generation_software": { |
| 41 | + "type": "string", |
| 42 | + "description": "Tool(s) used to estimate completeness and contamination" |
| 43 | + }, |
| 44 | + "completeness": { |
| 45 | + "type": "number", |
| 46 | + "description": "MAG/bin completeness value" |
| 47 | + }, |
| 48 | + "contamination": { |
| 49 | + "type": "number", |
| 50 | + "description": "MAG/bin contamination value" |
| 51 | + }, |
| 52 | + "genome_coverage": { |
| 53 | + "type": "number", |
| 54 | + "description": "MAG/bin coverage value" |
| 55 | + }, |
| 56 | + "metagenome": { |
| 57 | + "type": "string", |
| 58 | + "description": "ENA accepted metagenome name" |
| 59 | + }, |
| 60 | + "co-assembly": { |
| 61 | + "type": "boolean", |
| 62 | + "description": "True if data was co-assembled, False otherwise" |
| 63 | + }, |
| 64 | + "broad_environment": { |
| 65 | + "type": "string", |
| 66 | + "description": "broad ecological context of a sample" |
| 67 | + }, |
| 68 | + "local_environment": { |
| 69 | + "type": "string", |
| 70 | + "description": "local ecological context" |
| 71 | + }, |
| 72 | + "environmental_medium": { |
| 73 | + "type": "string", |
| 74 | + "description": "material displaced by the sample" |
| 75 | + }, |
| 76 | + "rRNA_presence": { |
| 77 | + "type": "boolean", |
| 78 | + "description": "True/False if rRNA genes detected" |
| 79 | + }, |
| 80 | + "NCBI_lineage": { |
| 81 | + "type": "string", |
| 82 | + "description": "full NCBI lineage - format: x;y;z" |
29 | 83 | } |
30 | 84 | }, |
31 | 85 | "required": ["sample", "fastq_1"] |
|
0 commit comments