-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathschema_input.json
executable file
·140 lines (140 loc) · 5.1 KB
/
schema_input.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
{
"$schema": "http://json-schema.org/draft-07/schema",
"$id": "https://raw.githubusercontent.com/sanger-tol/treeval/master/assets/schema_input.json",
"title": "sanger-tol/treeval pipeline - params.input schema",
"description": "Schema for the file provided with params.input",
"type": "array",
"items": {
"type": "object",
"properties": {
"assembly": {
"type": "object",
"properties": {
"sample_id": {
"type": "string",
"errorMessage": "Sample name must be provided and cannot contain spaces"
},
"latin_name": {
"type": "string",
"errorMessage": "The scientific name for the assembly"
},
"classT": {
"type": "string",
"errorMessage": "The Clade of the assembly. Used as the syntenic group and to complete the gene_alignment data dir."
},
"TicketType": {
"type": "string",
"errorMessage": "Not currently in use. Single word description of associated project."
}
}
},
"reference_file": {
"type": "string",
"pattern": "^\\S+\\.f(ast)a$",
"errorMessage": "Assembly input file, decompressed"
},
"assem_reads": {
"type": "object",
"properties": {
"pacbio": {
"type": "string",
"errorMessage": "Path to folder containing fasta.gz files"
},
"hic": {
"type": "string",
"errorMessage": "Path to folder containing .cram and .crai files"
},
"supplementary": {
"type": "string",
"errorMessage": "Not currently in use. Placeholder for future use"
}
}
},
"alignment": {
"type": "object",
"properties": {
"data_dir": {
"type": "string",
"errorMessage": "Gene Alignment data directory"
},
"common_name": {
"type": "string",
"errorMessage": "Not currently in use. Common identifier for group (adding bee, wasp, ant as sub division for clade)"
},
"geneset": {
"type": "string",
"errorMessage": "A csv list of organisms to run against."
}
}
},
"self_comp": {
"type": "object",
"properties": {
"motif_len": {
"type": "integer",
"errorMessage": "Length of motif to be used in self comp search"
},
"mummer_chunk": {
"type": "integer",
"errorMessage": "Size of chunks to be used my Mummer"
}
}
},
"synteny": {
"type": "object",
"properties": {
"synteny_genome_path": {
"type": "string",
"errorMessage": "Syntenic Genome Directory Path"
}
}
},
"outdir": {
"type": "string",
"errorMessage": "Out directory path, can be changed via cli"
},
"intron": {
"type": "object",
"properties": {
"size": {
"type": "string",
"errorMessage": "Base pair size of introns, defaults to 50k"
}
}
},
"telomere": {
"type": "object",
"properties": {
"teloseq": {
"type": "string",
"errorMessage": "Expected telomeric motif"
}
}
},
"busco": {
"type": "object",
"properties": {
"lineage_path": {
"type": "string",
"errorMessage": "Path to directory containing lineages folder"
},
"lineage": {
"type": "string",
"errorMessage": "busco lineage to run"
}
}
}
},
"required": [
"busco",
"telomere",
"intron",
"synteny",
"self_comp",
"alignment",
"assem_reads",
"reference_file",
"assembly"
]
}
}