-
Notifications
You must be signed in to change notification settings - Fork 18
Expand file tree
/
Copy pathRAST_SDK.spec
More file actions
280 lines (240 loc) · 8.79 KB
/
RAST_SDK.spec
File metadata and controls
280 lines (240 loc) · 8.79 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
/*
The SDK version of the KBaase Genome Annotation Service.
This wraps genome_annotation which is based off of the SEED annotations.
*/
module RAST_SDK {
/*
A binary boolean
*/
typedef int bool;
/*
A string representing a genome id.
*/
typedef string genome_id;
/*
A string representing a ContigSet id.
*/
typedef string contigset_id;
/*
A string representing a workspace name.
*/
typedef string workspace_name;
/* Parameters for the annotate_genome method.
ncbi_taxon_id - the numeric ID of the NCBI taxon to which this genome belongs. If this
is included scientific_name is ignored.
relation_engine_timestamp_ms - the timestamp to send to the Relation Engine when looking
up taxon information in milliseconds since the epoch.
scientific_name - the scientific name of the genome. Overridden by ncbi_taxon_id.
TODO: document remainder of parameters.
*/
typedef structure {
string workspace;
genome_id input_genome;
contigset_id input_contigset;
int genetic_code;
string domain;
int ncbi_taxon_id;
int relation_engine_timestamp_ms;
string scientific_name;
string output_genome;
bool call_features_rRNA_SEED;
bool call_features_tRNA_trnascan;
bool call_selenoproteins;
bool call_pyrrolysoproteins;
bool call_features_repeat_region_SEED;
bool call_features_insertion_sequences;
bool call_features_strep_suis_repeat;
bool call_features_strep_pneumo_repeat;
bool call_features_crispr;
bool call_features_CDS_glimmer3;
bool call_features_CDS_prodigal;
bool call_features_CDS_genemark;
bool annotate_proteins_kmer_v2;
bool kmer_v1_parameters;
bool annotate_proteins_similarity;
bool resolve_overlapping_features;
bool call_features_prophage_phispy;
bool retain_old_anno_for_hypotheticals;
} AnnotateGenomeParams;
typedef structure {
workspace_name workspace;
string id;
string report_name;
string report_ref;
} AnnotateGenomeResults;
/*
annotate genome
params - a param hash that includes the workspace id and options
*/
funcdef annotate_genome(AnnotateGenomeParams params) returns (AnnotateGenomeResults) authentication required;
typedef structure {
contigset_id input_contigset;
genome_id input_genome;
genome_id output_genome;
int genetic_code;
string domain;
string scientific_name;
} GenomeParams;
/* Parameters for the annotate_genomes method.
ncbi_taxon_id - the numeric ID of the NCBI taxon to which this genome belongs. If this
is included scientific_name is ignored.
relation_engine_timestamp_ms - the timestamp to send to the Relation Engine when looking
up taxon information in milliseconds since the epoch.
scientific_name - the scientific name of the genome. Overridden by ncbi_taxon_id.
TODO: document remainder of parameters.
*/
typedef structure {
string workspace;
list<GenomeParams> input_genomes;
int genetic_code;
string domain;
int ncbi_taxon_id;
int relation_engine_timestamp_ms;
string scientific_name;
string genome_text;
string output_genome;
bool call_features_rRNA_SEED;
bool call_features_tRNA_trnascan;
bool call_selenoproteins;
bool call_pyrrolysoproteins;
bool call_features_repeat_region_SEED;
bool call_features_insertion_sequences;
bool call_features_strep_suis_repeat;
bool call_features_strep_pneumo_repeat;
bool call_features_crispr;
bool call_features_CDS_glimmer3;
bool call_features_CDS_prodigal;
bool call_features_CDS_genemark;
bool annotate_proteins_kmer_v2;
bool kmer_v1_parameters;
bool annotate_proteins_similarity;
bool resolve_overlapping_features;
bool call_features_prophage_phispy;
bool retain_old_anno_for_hypotheticals;
} AnnotateGenomesParams;
typedef structure {
workspace_name workspace;
string report_name;
string report_ref;
} AnnotateGenomesResults;
/*
annotate genomes
params - a param hash that includes the workspace id and options
*/
funcdef annotate_genomes(AnnotateGenomesParams params) returns (AnnotateGenomesResults) authentication required;
typedef structure {
list<string> proteins;
} AnnotateProteinParams;
typedef structure {
list<list<string> > functions;
} AnnotateProteinResults;
/*
annotate proteins - returns a list of the RAST annotations for the input protein sequences
*/
funcdef annotate_proteins(AnnotateProteinParams params) returns (AnnotateProteinResults);
/*
For RAST annotating metagenomes (borrowed and simplied from ProkkaAnnotation moduel)
Reference to an Assembly or Genome object in the workspace
@id ws KBaseGenomeAnnotations.Assembly
@id ws KBaseGenomes.Genome
@id ws KBaseMetagenomes.AnnotatedMetagenomeAssembly
*/
typedef string data_obj_ref;
/*
Reference to a Annotated Metagenome Assembly object in the workspace
@id ws KBaseMetagenomes.AnnotatedMetagenomeAssembly
*/
typedef string metagenome_ref;
/*
Required parameters:
object_ref - reference to Assembly or Genome object,
output_workspace - output workspace name,
output_metagenome_name - output object name,
*/
typedef structure {
data_obj_ref object_ref;
string output_workspace;
string output_metagenome_name;
bool create_report;
} MetagenomeAnnotateParams;
typedef structure {
metagenome_ref output_metagenome_ref;
string output_workspace;
string report_name;
string report_ref;
} MetagenomeAnnotateOutput;
funcdef annotate_metagenome(MetagenomeAnnotateParams params)
returns (MetagenomeAnnotateOutput output) authentication required;
typedef structure {
list<data_obj_ref> input_AMAs;
list<data_obj_ref> input_assemblies;
string input_text;
string output_workspace;
string output_AMASet_name;
bool create_report;
} BulkAnnotateMetagenomesParams;
typedef structure {
data_obj_ref output_AMASet_ref;
string output_workspace;
} BulkMetagenomesAnnotateOutput;
funcdef annotate_metagenomes(BulkAnnotateMetagenomesParams params)
returns (BulkMetagenomesAnnotateOutput output) authentication required;
/*
Required parameters for rast_genome_assembly:
object_ref - reference to a Genome or Assembly object,
output_workspace - output workspace name,
output_genome_name - output object name
Optional parameters for rast_genome_assembly:
ncbi_taxon_id - the numeric ID of the NCBI taxon to which this genome belongs. If this
is included scientific_name is ignored.
relation_engine_timestamp_ms - the timestamp to send to the Relation Engine when looking
up taxon information in milliseconds since the epoch.
scientific_name - the scientific name of the genome. Overridden by ncbi_taxon_id.
*/
typedef structure {
data_obj_ref object_ref;
string output_workspace;
int genetic_code;
string domain;
int ncbi_taxon_id;
int relation_engine_timestamp_ms;
string scientific_name;
string output_genome_name;
bool create_report;
} RastGenomeAssemblyParams;
typedef structure {
genome_id output_genome_ref;
string output_workspace;
string report_name;
string report_ref;
} RastGenomeAssemblyOutput;
funcdef rast_genome_assembly(RastGenomeAssemblyParams params)
returns (RastGenomeAssemblyOutput output) authentication required;
/*
For RAST annotating genomes/assemblies
Reference to a set of annotated Genome and/or Assembly objects in the workspace
@id ws KBaseSearch.GenomeSet
*/
typedef string genomeSet_ref;
typedef structure {
list<data_obj_ref> input_genomes;
list<data_obj_ref> input_assemblies;
genomeSet_ref input_genomeset;
string input_text;
string scientific_name;
int genetic_code;
string domain;
int ncbi_taxon_id;
int relation_engine_timestamp_ms;
string output_workspace;
string output_GenomeSet_name;
} BulkRastGenomesAssembliesParams;
typedef structure {
genomeSet_ref output_GenomeSet_ref;
string output_workspace;
string report_name;
string report_ref;
} BulkRastGenomesAssembliesOutput;
funcdef rast_genomes_assemblies(BulkRastGenomesAssembliesParams params)
returns (BulkRastGenomesAssembliesOutput output) authentication required;
};