1 | // ============================================================ // |
---|
2 | // // |
---|
3 | // File : gb_aci.cxx // |
---|
4 | // Purpose : ARB command interpreter (ACI) // |
---|
5 | // // |
---|
6 | // http://www.arb-home.de/ // |
---|
7 | // // |
---|
8 | // ============================================================ // |
---|
9 | |
---|
10 | #include "gb_aci.h" |
---|
11 | #include "gb_aci_impl.h" |
---|
12 | |
---|
13 | #include <arb_strbuf.h> |
---|
14 | #include <arb_match.h> |
---|
15 | |
---|
16 | using namespace GBL_IMPL; |
---|
17 | |
---|
18 | GBL_command_lookup_table::GBL_command_lookup_table(const GBL_command_definition *table, unsigned size) { |
---|
19 | /*! create table to lookup ACI commands |
---|
20 | * @param table command-table (has to exist as long as GBL_command_lookup_table exists; needs sentinel) |
---|
21 | * @param size number of commands in 'table' ( = size of 'table' - 1) |
---|
22 | */ |
---|
23 | |
---|
24 | for (unsigned i = 0; i<size; ++i) { |
---|
25 | const GBL_command_definition& cmd = table[i]; |
---|
26 | gb_assert(cmd.is_defined()); |
---|
27 | |
---|
28 | defined[cmd.identifier] = cmd.function; |
---|
29 | } |
---|
30 | gb_assert(table[size].is_sentinel()); |
---|
31 | } |
---|
32 | |
---|
33 | namespace GBL_IMPL { |
---|
34 | static const char *search_matching_dquote(const char *str) { |
---|
35 | int c; |
---|
36 | for (; (c=*str); str++) { |
---|
37 | if (c=='\\') { // escaped characters |
---|
38 | str++; |
---|
39 | if (!(c=*str)) return NULp; |
---|
40 | continue; |
---|
41 | } |
---|
42 | if (c=='"') return (char *)str; |
---|
43 | } |
---|
44 | return NULp; |
---|
45 | } |
---|
46 | inline char *search_matching_dquote(char *str) { |
---|
47 | return const_cast<char*>(search_matching_dquote(const_cast<const char*>(str))); |
---|
48 | } |
---|
49 | const char *search_matching_parenthesis(const char *source) { |
---|
50 | int c; |
---|
51 | int deep = 0; |
---|
52 | if (*source != '(') deep --; // first bracket |
---|
53 | for (; (c=*source); source++) { |
---|
54 | if (c=='\\') { // escaped characters |
---|
55 | source++; |
---|
56 | if (!*source) break; |
---|
57 | continue; |
---|
58 | } |
---|
59 | if (c=='(') deep--; |
---|
60 | else if (c==')') deep++; |
---|
61 | if (!deep) return (char *)source; |
---|
62 | if (c=='"') { // search the second " |
---|
63 | source = search_matching_dquote(source); |
---|
64 | if (!source) return NULp; |
---|
65 | } |
---|
66 | } |
---|
67 | if (!c) return NULp; |
---|
68 | return source; |
---|
69 | } |
---|
70 | static const char *search_next_separator(const char *source, const char *seps) { |
---|
71 | // search the next separator |
---|
72 | static char tab[256]; |
---|
73 | static bool init = false; |
---|
74 | |
---|
75 | if (!init) { |
---|
76 | memset(tab, 0, 256); |
---|
77 | init = true; |
---|
78 | } |
---|
79 | |
---|
80 | for (const char *p = seps; *p; ++p) tab[safeCharIndex(*p)] = 1; |
---|
81 | |
---|
82 | tab['('] = 2; // exclude () pairs |
---|
83 | tab['"'] = 2; // exclude " pairs |
---|
84 | tab['\\'] = 2; // exclude \-escaped chars |
---|
85 | |
---|
86 | for (; *source; ++source) { |
---|
87 | const char chType = tab[safeCharIndex(*source)]; |
---|
88 | if (chType == 0) continue; // accept char |
---|
89 | if (chType == 1) break; // found separator |
---|
90 | |
---|
91 | if (*source == '\\') { |
---|
92 | ++source; // -> skip over next char |
---|
93 | if (!source[0]) break; // abort if end of string seen |
---|
94 | } |
---|
95 | else if (*source == '(') { |
---|
96 | source = search_matching_parenthesis(source); |
---|
97 | if (!source) break; |
---|
98 | } |
---|
99 | else if (*source == '\"') { |
---|
100 | source = search_matching_dquote(source+1); |
---|
101 | if (!source) break; |
---|
102 | } |
---|
103 | } |
---|
104 | for (const char *p = seps; *p; ++p) tab[safeCharIndex(*p)] = 0; // clear tab |
---|
105 | return source && source[0] ? source : NULp; |
---|
106 | } |
---|
107 | inline char *search_next_separator(char *source, const char *seps) { |
---|
108 | return const_cast<char*>(search_next_separator(const_cast<const char*>(source), seps)); |
---|
109 | } |
---|
110 | }; |
---|
111 | |
---|
112 | static void dumpStreams(const char *name, const GBL_streams& streams) { |
---|
113 | if (streams.empty()) { |
---|
114 | print_trace(GBS_global_string("%s [none]\n", name)); |
---|
115 | } |
---|
116 | else { |
---|
117 | int count = streams.size(); |
---|
118 | char *header = GBS_global_string_copy("%s", name); |
---|
119 | |
---|
120 | print_trace(GBS_global_string("%s [0]='%s'", header, streams.get(0))); |
---|
121 | if (count>1) { |
---|
122 | LocallyModify<int> inc(traceIndent, traceIndent+strlen(header)+1); |
---|
123 | for (int c = 1; c<count; c++) { |
---|
124 | if (c == 10 || c == 100 || c == 1000) --traceIndent; // dec indentation |
---|
125 | print_trace(GBS_global_string("[%i]='%s'\n", c, streams.get(c))); |
---|
126 | } |
---|
127 | } |
---|
128 | free(header); |
---|
129 | } |
---|
130 | } |
---|
131 | |
---|
132 | static const char *shortenLongString(const char *str, size_t wanted_len) { |
---|
133 | // shortens the string 'str' to 'wanted_len' (appends '[..]' if string was shortened) |
---|
134 | |
---|
135 | const char *result; |
---|
136 | size_t len = strlen(str); |
---|
137 | |
---|
138 | gb_assert(wanted_len>4); |
---|
139 | |
---|
140 | if (len>wanted_len) { |
---|
141 | static char *shortened_str; |
---|
142 | static size_t short_len = 0; |
---|
143 | |
---|
144 | if (short_len >= wanted_len) { |
---|
145 | memcpy(shortened_str, str, wanted_len-4); |
---|
146 | } |
---|
147 | else { |
---|
148 | freeset(shortened_str, ARB_strpartdup(str, str+wanted_len)); |
---|
149 | short_len = wanted_len; |
---|
150 | } |
---|
151 | strcpy(shortened_str+wanted_len-4, "[..]"); |
---|
152 | result = shortened_str; |
---|
153 | } |
---|
154 | else { |
---|
155 | result = str; |
---|
156 | } |
---|
157 | return result; |
---|
158 | } |
---|
159 | |
---|
160 | static char *apply_ACI(const char *str, const char *commands, const GBL_call_env& callEnv) { |
---|
161 | char *buffer = ARB_strdup(commands); |
---|
162 | |
---|
163 | // ********************** remove all spaces and tabs ******************* |
---|
164 | { |
---|
165 | const char *s1; |
---|
166 | char *s2; |
---|
167 | s1 = commands; |
---|
168 | s2 = buffer; |
---|
169 | { |
---|
170 | int c; |
---|
171 | for (; (c = *s1); s1++) { |
---|
172 | if (c=='\\') { |
---|
173 | *(s2++) = c; |
---|
174 | if (!(c=*++s1)) { break; } |
---|
175 | *(s2++) = c; |
---|
176 | continue; |
---|
177 | } |
---|
178 | |
---|
179 | if (c=='"') { // search the second " |
---|
180 | const char *hp = search_matching_dquote(s1+1); |
---|
181 | if (!hp) { |
---|
182 | GB_export_errorf("unbalanced '\"' in '%s'", commands); |
---|
183 | free(buffer); |
---|
184 | return NULp; |
---|
185 | } |
---|
186 | while (s1 <= hp) *(s2++) = *(s1++); // LOOP_VECTORIZED |
---|
187 | s1--; |
---|
188 | continue; |
---|
189 | } |
---|
190 | if (c!=' ' && c!='\t') *(s2++) = c; |
---|
191 | } |
---|
192 | } |
---|
193 | *s2 = 0; |
---|
194 | } |
---|
195 | |
---|
196 | GBL_streams orig; |
---|
197 | |
---|
198 | orig.insert(ARB_strdup(str)); |
---|
199 | |
---|
200 | GB_ERROR error = NULp; |
---|
201 | GBL_streams out; |
---|
202 | { |
---|
203 | char *s1, *s2; |
---|
204 | s1 = buffer; |
---|
205 | if (*s1 == '|') s1++; |
---|
206 | |
---|
207 | // ** loop over all commands ** |
---|
208 | for (; s1; s1 = s2) { |
---|
209 | int separator; |
---|
210 | GBL_COMMAND command; |
---|
211 | s2 = search_next_separator(s1, "|;,"); |
---|
212 | if (s2) { |
---|
213 | separator = *(s2); |
---|
214 | *(s2++) = 0; |
---|
215 | } |
---|
216 | else { |
---|
217 | separator = 0; |
---|
218 | } |
---|
219 | // collect the parameters |
---|
220 | GBL_streams argStreams; |
---|
221 | if (*s1 == '"') { // copy "text" to out |
---|
222 | char *end = search_matching_dquote(s1+1); |
---|
223 | if (!end) { |
---|
224 | UNCOVERED(); // seems unreachable (balancing is already ensured by search_next_separator) |
---|
225 | error = "Missing second '\"'"; |
---|
226 | break; |
---|
227 | } |
---|
228 | *end = 0; |
---|
229 | |
---|
230 | TRACE_ACI(GBS_global_string("copy '%s'\n", s1+1)); |
---|
231 | out.insert(ARB_strdup(s1+1)); |
---|
232 | } |
---|
233 | else { |
---|
234 | char *bracket = strchr(s1, '('); |
---|
235 | if (bracket) { // I got the parameter list |
---|
236 | *(bracket++) = 0; |
---|
237 | int slen = strlen(bracket); |
---|
238 | if (slen<1 || bracket[slen-1] != ')') { |
---|
239 | error = "Missing ')'"; |
---|
240 | } |
---|
241 | else if (slen == 1) { |
---|
242 | error = "Invalid empty parameter list '()'. To pass an empty argument use '(\"\")'"; |
---|
243 | } |
---|
244 | else { |
---|
245 | // go through the parameters |
---|
246 | char *p1, *p2; |
---|
247 | bracket[slen-1] = 0; |
---|
248 | for (p1 = bracket; p1; p1 = p2) { |
---|
249 | p2 = search_next_separator(p1, ";,"); |
---|
250 | if (p2) { |
---|
251 | *(p2++) = 0; |
---|
252 | } |
---|
253 | if (p1[0] == '"') { // remove "" pairs |
---|
254 | int len2; |
---|
255 | p1++; |
---|
256 | len2 = strlen(p1)-1; |
---|
257 | |
---|
258 | if (p1[len2] != '\"') { |
---|
259 | error = GBS_global_string("Invalid parameter syntax for '%s' (needs '\"' at begin AND end of parameter)", p1-1); |
---|
260 | } |
---|
261 | else { |
---|
262 | p1[len2] = 0; |
---|
263 | } |
---|
264 | } |
---|
265 | argStreams.insert(ARB_strdup(p1)); |
---|
266 | } |
---|
267 | } |
---|
268 | } |
---|
269 | if (!error && (bracket || *s1)) { |
---|
270 | command = callEnv.get_env().lookup_command(s1); |
---|
271 | if (!command) { |
---|
272 | error = GBS_global_string("Unknown command '%s'", s1); |
---|
273 | } |
---|
274 | else { |
---|
275 | GBL_command_arguments args(callEnv, s1, orig, argStreams, out); |
---|
276 | |
---|
277 | TRACE_ACI(GBS_global_string("execute '%s':\n", args.get_cmdName())); |
---|
278 | { |
---|
279 | LocallyModify<int> inc(traceIndent, traceIndent+1); |
---|
280 | if (traceACI) { |
---|
281 | dumpStreams("ArgStreams", args.get_param_streams()); |
---|
282 | dumpStreams("InpStreams", args.input); |
---|
283 | } |
---|
284 | |
---|
285 | error = command(&args); // execute the command |
---|
286 | |
---|
287 | if (!error && traceACI) dumpStreams("OutStreams", args.output); |
---|
288 | } |
---|
289 | |
---|
290 | if (error) { |
---|
291 | char *dup_error = ARB_strdup(error); |
---|
292 | |
---|
293 | #define MAX_PRINT_LEN 200 |
---|
294 | |
---|
295 | char *paramlist = NULp; |
---|
296 | for (int j = 0; j<args.param_count(); ++j) { |
---|
297 | const char *param = args.get_param(j); |
---|
298 | const char *param_short = shortenLongString(param, MAX_PRINT_LEN); |
---|
299 | |
---|
300 | if (!paramlist) paramlist = ARB_strdup(param_short); |
---|
301 | else freeset(paramlist, GBS_global_string_copy("%s,%s", paramlist, param_short)); |
---|
302 | } |
---|
303 | char *inputstreams = NULp; |
---|
304 | for (int j = 0; j<args.input.size(); ++j) { |
---|
305 | const char *input = args.input.get(j); |
---|
306 | const char *input_short = shortenLongString(input, MAX_PRINT_LEN); |
---|
307 | |
---|
308 | if (!inputstreams) inputstreams = ARB_strdup(input_short); |
---|
309 | else freeset(inputstreams, GBS_global_string_copy("%s;%s", inputstreams, input_short)); |
---|
310 | } |
---|
311 | #undef MAX_PRINT_LEN |
---|
312 | if (paramlist) { |
---|
313 | error = GBS_global_string("while applying '%s(%s)'\nto '%s':\n%s", s1, paramlist, inputstreams, dup_error); |
---|
314 | } |
---|
315 | else { |
---|
316 | error = GBS_global_string("while applying '%s'\nto '%s':\n%s", s1, inputstreams, dup_error); |
---|
317 | } |
---|
318 | |
---|
319 | free(inputstreams); |
---|
320 | free(paramlist); |
---|
321 | free(dup_error); |
---|
322 | } |
---|
323 | } |
---|
324 | } |
---|
325 | } |
---|
326 | |
---|
327 | if (error) break; |
---|
328 | |
---|
329 | if (separator == '|') { // out -> in pipe; clear in |
---|
330 | out.swap(orig); |
---|
331 | out.erase(); |
---|
332 | } |
---|
333 | } |
---|
334 | } |
---|
335 | |
---|
336 | { |
---|
337 | char *s1 = out.concatenated(); |
---|
338 | free(buffer); |
---|
339 | if (!error) return s1; |
---|
340 | free(s1); |
---|
341 | } |
---|
342 | |
---|
343 | GB_export_errorf("Command '%s' failed:\nReason: %s", commands, error); |
---|
344 | return NULp; |
---|
345 | } |
---|
346 | // -------------------------------------------------------------------------------- |
---|
347 | |
---|
348 | char *GBL_streams::concatenated() const { |
---|
349 | int count = size(); |
---|
350 | if (!count) return ARB_strdup(""); |
---|
351 | if (count == 1) return ARB_strdup(get(0)); |
---|
352 | |
---|
353 | GBS_strstruct buf(1000); |
---|
354 | for (int i=0; i<count; i++) { |
---|
355 | const char *s = get(i); |
---|
356 | if (s) buf.cat(s); |
---|
357 | } |
---|
358 | return buf.release_memfriendly(); |
---|
359 | } |
---|
360 | |
---|
361 | NOT4PERL char *GB_command_interpreter_in_env(const char *str, const char *commands, const GBL_call_env& callEnv) { |
---|
362 | /* simple command interpreter returns NULp on error (which should be exported in that case) |
---|
363 | * if first character is == ':' run string parser |
---|
364 | * if first character is == '/' run regexpr |
---|
365 | * else run ACI |
---|
366 | */ |
---|
367 | |
---|
368 | // @@@ most code here and code in apply_ACI could be moved into GBL_call_env::interpret_subcommand |
---|
369 | |
---|
370 | LocallyModify<int> localT(traceACI); // localize effect of command 'trace' |
---|
371 | SmartMallocPtr(char) heapstr; |
---|
372 | |
---|
373 | if (!str) { |
---|
374 | if (!callEnv.get_item_ref()) { |
---|
375 | GB_export_error("ACI: no input streams found"); |
---|
376 | return NULp; |
---|
377 | } |
---|
378 | |
---|
379 | if (GB_read_type(callEnv.get_item_ref()) == GB_STRING) { |
---|
380 | str = GB_read_char_pntr(callEnv.get_item_ref()); |
---|
381 | } |
---|
382 | else { |
---|
383 | char *asstr = GB_read_as_string(callEnv.get_item_ref()); |
---|
384 | if (!asstr) { |
---|
385 | GB_export_error("Can't read this DB entry as string"); |
---|
386 | return NULp; |
---|
387 | } |
---|
388 | |
---|
389 | heapstr = asstr; |
---|
390 | str = &*heapstr; |
---|
391 | } |
---|
392 | } |
---|
393 | |
---|
394 | if (traceACI) { |
---|
395 | print_trace(GBS_global_string("CI: command '%s' apply to '%s'\n", commands, str)); |
---|
396 | } |
---|
397 | modify_trace_indent(+1); |
---|
398 | |
---|
399 | char *result = NULp; |
---|
400 | |
---|
401 | if (!commands || !commands[0]) { // empty command -> do not modify string |
---|
402 | result = ARB_strdup(str); |
---|
403 | } |
---|
404 | else if (commands[0] == ':') { // ':' -> string parser |
---|
405 | result = GBS_string_eval_in_env(str, commands+1, callEnv); |
---|
406 | } |
---|
407 | else if (commands[0] == '/') { // regular expression |
---|
408 | GB_ERROR err = NULp; |
---|
409 | result = GBS_regreplace(str, commands, &err); |
---|
410 | |
---|
411 | if (!result) { |
---|
412 | if (strcmp(err, "Missing '/' between search and replace string") == 0) { |
---|
413 | // if GBS_regreplace didn't find a third '/' -> silently use GBS_regmatch: |
---|
414 | size_t matchlen; |
---|
415 | err = NULp; |
---|
416 | |
---|
417 | const char *matched = GBS_regmatch(str, commands, &matchlen, &err); |
---|
418 | |
---|
419 | if (matched) result = ARB_strndup(matched, matchlen); |
---|
420 | else if (!err) result = ARB_strdup(""); |
---|
421 | } |
---|
422 | |
---|
423 | if (!result && err) GB_export_error(err); |
---|
424 | } |
---|
425 | } |
---|
426 | else { |
---|
427 | result = apply_ACI(str, commands, callEnv); |
---|
428 | } |
---|
429 | |
---|
430 | modify_trace_indent(-1); |
---|
431 | if (traceACI) { |
---|
432 | GBS_strstruct final_msg(1000); |
---|
433 | if (result) { |
---|
434 | final_msg.cat("CI: result ='"); |
---|
435 | final_msg.cat(result); |
---|
436 | } |
---|
437 | else { |
---|
438 | final_msg.cat("CI: no result. error ='"); |
---|
439 | final_msg.cat(GB_get_error()); |
---|
440 | } |
---|
441 | final_msg.put('\''); |
---|
442 | final_msg.put('\n'); |
---|
443 | final_msg.nput('-', final_msg.get_position()-1); |
---|
444 | final_msg.put('\n'); |
---|
445 | |
---|
446 | print_trace(final_msg.get_data()); |
---|
447 | } |
---|
448 | |
---|
449 | gb_assert(contradicted(result, GB_have_error())); |
---|
450 | return result; |
---|
451 | } |
---|
452 | |
---|
453 | char *GB_command_interpreter(const char *str, const char *commands, GBDATA *gb_main) { |
---|
454 | //! @see GB_command_interpreter_in_env - this flavor runs in dummy environment |
---|
455 | GBL_env env(gb_main, NULp); |
---|
456 | GBL_call_env callEnv(NULp, env); |
---|
457 | |
---|
458 | return GB_command_interpreter_in_env(str, commands, callEnv); |
---|
459 | } |
---|
460 | |
---|
461 | void GBL_custom_command_lookup_table::warn_about_overwritten_commands(const GBL_command_definition *custom_table, unsigned custom_size) const { |
---|
462 | int errcount = 0; |
---|
463 | for (unsigned i = 0; i<custom_size; ++i) { |
---|
464 | const GBL_command_definition& cdef = custom_table[i]; |
---|
465 | gb_assert(cdef.is_defined()); |
---|
466 | |
---|
467 | const char *cmd = cdef.identifier; |
---|
468 | if (base_table.lookup(cmd)) { |
---|
469 | fprintf(stderr, "Warning: ACI-command '%s' is substituted w/o permission\n", cmd); |
---|
470 | ++errcount; |
---|
471 | } |
---|
472 | } |
---|
473 | if (errcount>0) { |
---|
474 | fprintf(stderr, "Warning: Detected probably unwanted substitution of %i ACI-commands\n", errcount); |
---|
475 | gb_assert(0); // either use PERMIT_SUBSTITUTION or fix command names |
---|
476 | } |
---|
477 | } |
---|
478 | |
---|
479 | // -------------------------------------------------------------------------------- |
---|
480 | |
---|
481 | #ifdef UNIT_TESTS |
---|
482 | #include <test_unit.h> |
---|
483 | |
---|
484 | #include <arb_defs.h> |
---|
485 | |
---|
// Run 'cmd' on 'input' in 'callEnv' (expecting a result and no exported error),
// then check the result using 'TEST_RESULT(result, expected, got)'.
#define TEST_CI__INTERNAL(input,cmd,expected,got,TEST_RESULT,callEnv) do { \
        char *result; \
        TEST_EXPECT_RESULT__NOERROREXPORTED(result = GB_command_interpreter_in_env(input, cmd, callEnv)); \
        TEST_RESULT(result,expected,got); \
        free(result); \
    } while(0)

// Flavors of TEST_CI__INTERNAL (all but TEST_CI_WITH_ENV use a variable named 'callEnv' from the calling scope):
#define TEST_CI(input,cmd,expected) TEST_CI__INTERNAL(input, cmd, expected, narg, TEST_EXPECT_EQUAL__IGNARG, callEnv)
#define TEST_CI_WITH_ENV(input,env,cmd,expected) TEST_CI__INTERNAL(input, cmd, expected, narg, TEST_EXPECT_EQUAL__IGNARG, env)
#define TEST_CI__BROKEN(input,cmd,expected,regr) TEST_CI__INTERNAL(input, cmd, expected, regr, TEST_EXPECT_EQUAL__BROKEN, callEnv)
#define TEST_CI_NOOP(inandout,cmd) TEST_CI__INTERNAL(inandout, cmd, inandout, narg, TEST_EXPECT_EQUAL__IGNARG, callEnv)
#define TEST_CI_NOOP__BROKEN(inandout,regr,cmd) TEST_CI__INTERNAL(inandout, cmd, inandout, regr, TEST_EXPECT_EQUAL__BROKEN, callEnv)

// Expect 'cmd' to convert 'in' into 'out' and 'inv_cmd' to convert 'out' back into 'in'.
#define TEST_CI_INVERSE(in,cmd,inv_cmd,out) do { \
        TEST_CI(in, cmd, out); \
        TEST_CI(out, inv_cmd, in); \
    } while(0)

// @@@ rename errorpart_expected -> expected_errorpart

// Expect 'cmd' to fail on 'input' and to export an error containing 'errorpart_expected'.
#define TEST_CI_ERROR_CONTAINS(input,cmd,errorpart_expected) \
    TEST_EXPECT_NORESULT__ERROREXPORTED_CONTAINS(GB_command_interpreter_in_env(input, cmd, callEnv), errorpart_expected)

// Broken flavor of the above: documents the 'unexpected_result' currently delivered instead of the error.
#define TEST_CI_ERROR_CONTAINS__BROKEN(input,cmd,errorpart_expected,unexpected_result) do{ \
        char *result; \
        TEST_EXPECT_NORESULT__ERROREXPORTED_CONTAINS__BROKEN(result = GB_command_interpreter_in_env(input, cmd, callEnv), errorpart_expected); \
        TEST_EXPECT_EQUAL(result, unexpected_result); \
        free(result); \
    }while(0)
---|
516 | static GBDATA *RCI_gb_main = NULp; |
---|
517 | static const char *RCI_input = NULp; |
---|
518 | static const char *RCI_cmd = NULp; |
---|
519 | static GBDATA *RCI_gbd = NULp; |
---|
520 | |
---|
521 | inline void run_ci() { |
---|
522 | GBL_env env(RCI_gb_main, NULp); |
---|
523 | GBL_call_env callEnv(RCI_gbd, env); |
---|
524 | GB_command_interpreter_in_env(RCI_input, RCI_cmd, callEnv); |
---|
525 | } |
---|
526 | |
---|
// Expect a segfault when running 'cmd' on 'input'
// (uses the variables 'gb_main' and 'gb_data' from the calling scope).
#define TEST_CI_SEGFAULTS(input,cmd) do{ \
        RCI_gb_main = gb_main; \
        RCI_input = input; \
        RCI_cmd = cmd; \
        RCI_gbd = gb_data; \
        TEST_EXPECT_SEGFAULT(run_ci); \
    }while(0)

// Same setup as TEST_CI_SEGFAULTS, but checked with TEST_EXPECT_SEGFAULT__UNWANTED.
#define TEST_CI_SEGFAULTS__UNWANTED(input,cmd) do{ \
        RCI_gb_main = gb_main; \
        RCI_input = input; \
        RCI_cmd = cmd; \
        RCI_gbd = gb_data; \
        TEST_EXPECT_SEGFAULT__UNWANTED(run_ci); \
    }while(0)

// WITH_SPLITTED(aci): split input at ',', apply 'aci', then merge the results using ','
#define ACI_SPLIT "|split(\",\",0)"
#define ACI_MERGE "|merge(\",\")"
#define WITH_SPLITTED(aci) ACI_SPLIT aci ACI_MERGE
---|
546 | |
---|
547 | static GB_ERROR gbx_custom(GBL_command_arguments *args) { |
---|
548 | EXPECT_NO_PARAM(args); |
---|
549 | for (int i=0; i<args->input.size(); ++i) { |
---|
550 | args->output.insert(strdup("4711")); |
---|
551 | } |
---|
552 | return NULp; |
---|
553 | } |
---|
554 | |
---|
555 | class ACI_test_env : virtual Noncopyable { |
---|
556 | GB_shell shell; |
---|
557 | GBDATA *gb_main; |
---|
558 | LocallyModify<int> traceMode; |
---|
559 | GB_transaction ta; |
---|
560 | GBDATA *gb_species; |
---|
561 | public: |
---|
562 | ACI_test_env() : |
---|
563 | gb_main(GB_open("TEST_aci.arb", "rw")), |
---|
564 | traceMode(traceACI, 0), // set to 1 to trace all ACI tests |
---|
565 | ta(gb_main) |
---|
566 | { |
---|
567 | gb_assert(gb_main); |
---|
568 | gb_species = GBT_find_species(gb_main, "LcbReu40"); // ../UNIT_TESTER/run/TEST_aci.arb@LcbReu40 |
---|
569 | } |
---|
570 | ~ACI_test_env() { |
---|
571 | TEST_EXPECT_NO_ERROR(ta.close(NULp)); |
---|
572 | GB_close(gb_main); |
---|
573 | } |
---|
574 | |
---|
575 | GBDATA *gbmain() const { return gb_main; } |
---|
576 | GBDATA *gbspecies() const { return gb_species; } |
---|
577 | }; |
---|
578 | |
---|
579 | __ATTR__REDUCED_OPTIMIZE__NO_GCSE void TEST_GB_command_interpreter_1a() { |
---|
580 | ACI_test_env E; |
---|
581 | GBL_env base_env(E.gbmain(), NULp); |
---|
582 | |
---|
583 | // execute ACI on species container (=GB_DB) in this section ------------------------------ |
---|
584 | GBDATA * const gb_data = E.gbspecies(); |
---|
585 | GBL_call_env callEnv(gb_data, base_env); |
---|
586 | |
---|
587 | TEST_CI_NOOP("bla", ""); |
---|
588 | |
---|
589 | TEST_CI("bla", ":a=u", "blu"); // simple SRT |
---|
590 | |
---|
591 | // GBS_REGREPLACE_TESTS: |
---|
592 | TEST_CI("bla", "/a/u/", "blu"); // simple regExp replace |
---|
593 | |
---|
594 | TEST_CI("test", "/_[0-9]+//", "test"); // simple regExp replace (failing, ie. no match -> no replace) |
---|
595 | |
---|
596 | TEST_CI("blabla", "/l.*b/", "lab"); // simple regExp match |
---|
597 | TEST_CI("blabla", "/b.b/", ""); // simple regExp match (failing) |
---|
598 | |
---|
599 | TEST_CI("tx_01_2", "/_[0-9]+//", "tx"); // simple regExp replace (replace all occurrences) |
---|
600 | TEST_CI("tx_01_2", "/_[0-9]+$//", "tx_01"); // simple regExp replace (replace one occurrence) |
---|
601 | |
---|
602 | TEST_CI_ERROR_CONTAINS("xx_____", "/_*//", "regular expression '_*' matched an empty string"); // caused a deadlock until [16326] |
---|
603 | TEST_CI("xx_____", "/_//", "xx"); // working removal of multiple '_' |
---|
604 | TEST_CI("xx_____yy", "/(_+)([^_]|$)/-=-\\2/", "xx-=-yy"); // replace multiple consecutive '_' |
---|
605 | TEST_CI("xx_____", "/(_+)([^_]|$)/-=-\\2/", "xx-=-"); // replace multiple consecutive '_' |
---|
606 | |
---|
607 | TEST_CI("xx_____", "/_*$//", "xx"); // removal of multiple '_' from end of sequence |
---|
608 | TEST_CI("xx", "/_*$//", "xx"); // removal of no '_' from end of sequence |
---|
609 | TEST_CI("_____yy", "/^_*//", "yy"); // removal of multiple '_' from start of sequence |
---|
610 | TEST_CI("yy", "/^_*//", "yy"); // removal of no '_' from start of sequence |
---|
611 | |
---|
612 | TEST_CI("", "/^$/ABC/", "ABC"); // replacing a complete empty string should be possible |
---|
613 | TEST_CI("XXX", "/^XXX$//", ""); // erase whole known text |
---|
614 | |
---|
615 | TEST_CI("xx/yy/zz", "/\\//-/", "xx-yy-zz"); // search expression with an escaped slash |
---|
616 | TEST_CI("xx-yy-zz", "/-/\\//", "xx/yy/zz"); // reverse (escaped slash in replace expression) |
---|
617 | |
---|
618 | TEST_CI_ERROR_CONTAINS("xx", "\\///", "Unknown command"); |
---|
619 | TEST_CI ("x/x", "/\\//", "/"); |
---|
620 | TEST_CI_ERROR_CONTAINS("xx", "//\\/", "railing backslash"); // [Tt]railing (lib dependent?) |
---|
621 | |
---|
622 | // escape / quote |
---|
623 | TEST_CI_INVERSE("ac", "|quote", "|unquote", "\"ac\""); |
---|
624 | TEST_CI_INVERSE("ac", "|escape", "|unescape", "ac"); |
---|
625 | TEST_CI_INVERSE("ac", "|escape|quote", "|unquote|unescape", "\"ac\""); |
---|
626 | TEST_CI_INVERSE("ac", "|quote|escape", "|unescape|unquote", "\\\"ac\\\""); |
---|
627 | |
---|
628 | TEST_CI_INVERSE("a\"b\\c", "|quote", "|unquote", "\"a\"b\\c\""); |
---|
629 | TEST_CI_INVERSE("a\"b\\c", "|escape", "|unescape", "a\\\"b\\\\c"); |
---|
630 | TEST_CI_INVERSE("a\"b\\c", "|escape|quote", "|unquote|unescape", "\"a\\\"b\\\\c\""); |
---|
631 | TEST_CI_INVERSE("a\"b\\c", "|quote|escape", "|unescape|unquote", "\\\"a\\\"b\\\\c\\\""); |
---|
632 | |
---|
633 | TEST_CI_NOOP("ac", "|unquote"); |
---|
634 | TEST_CI_NOOP("\"ac", "|unquote"); |
---|
635 | TEST_CI_NOOP("ac\"", "|unquote"); |
---|
636 | |
---|
637 | TEST_CI ("blabla", "|coUNT(ab)", "4"); // simple ACI |
---|
638 | TEST_CI ("l", "|\"b\";dd;\"a\"|dd", "bla"); // ACI with muliple streams |
---|
639 | TEST_CI_ERROR_CONTAINS("bla", "|count()", "Invalid empty parameter list"); // no longer interpret '()' as "1 empty arg" (force use of explicit form; see next line) |
---|
640 | TEST_CI ("bla", "|count(\"\")", "0"); // explicitly empty parameter (still strange, counts 0-byte before string-terminator; always 0) |
---|
641 | TEST_CI ("b a", "|count(\" \")", "1"); // space in quotes |
---|
642 | TEST_CI ("b\\a", "|count(\\a)", "2"); // count '\\' and 'a' (ok) |
---|
643 | TEST_CI__BROKEN ("b\\a", "|count(\"\\a\")", "1", "2"); // should only count 'a' (which is escaped in param) |
---|
644 | TEST_CI ("b\\a", "|count(\"\a\")", "0"); // does not contain '\a' |
---|
645 | TEST_CI ("b\a", "|count(\"\a\")", "1"); // counts '\a' |
---|
646 | |
---|
647 | // escaping (behavior is unexpected or weird and not documented very well) |
---|
648 | TEST_CI("b\\a\a", "|count(\\a)", "2"); // counts '\\' and 'a' (but not '\a') |
---|
649 | TEST_CI("b\\a", "|contains(\"\\\\\")", "0"); // searches for 2 backslashes (not in input) |
---|
650 | TEST_CI("b\\a", "|contains(\"\")", "0"); // search for empty string never succeeds |
---|
651 | TEST_CI("b\\a", "|contains(\\)", "2"); // finds backslash at position 1 |
---|
652 | TEST_CI("b\\\\a", "|contains(\"\\\\\")", "2"); // finds two backslashes at position 2 |
---|
653 | |
---|
654 | TEST_CI_ERROR_CONTAINS("b\\a", "|contains(\"\\\")", "ARB ERROR: unbalanced '\"' in '|contains(\"\\\")'"); // FIX: raises error (should search for 1 backslash) |
---|
655 | |
---|
656 | // test binary ops |
---|
657 | { |
---|
658 | // LocallyModify<int> traceHere(traceACI, 1); |
---|
659 | TEST_CI("", "\"5\";\"7\"|minus", "-2"); |
---|
660 | TEST_CI("", "\"5\"|minus(\"7\")", "-2"); |
---|
661 | // TEST_CI("", "minus(5,7)", "-2"); // @@@ this fails (stating command '5' fails). fix how? |
---|
662 | TEST_CI("", "minus(\"\"5\"\",\"\"7\"\")", "-2"); // @@@ syntax needed here 'minus(""5"", ""7"")' should be documented more in-depth |
---|
663 | TEST_CI("", "minus(\"\"5\";\"2\"|mult\",\"\"7\"\")", "3"); // (5*2)-7 |
---|
664 | TEST_CI("", "minus(\"\"5\";\"2\\,\"|mult\",\"\"7\"\")", "3"); // comma has to be escaped |
---|
665 | |
---|
666 | TEST_CI_ERROR_CONTAINS("", "minus(\"\"5\";\"2,\"|mult\",\"\"7\"\")", "Invalid parameter syntax for '\"\"5\";\"2'"); |
---|
667 | } |
---|
668 | |
---|
669 | TEST_CI_NOOP("ab,bcb,abac", WITH_SPLITTED("")); |
---|
670 | TEST_CI ("ab,bcb,abac", WITH_SPLITTED("|len"), "2,3,4"); |
---|
671 | TEST_CI ("ab,bcb,abac", WITH_SPLITTED("|count(a)"), "1,0,2"); |
---|
672 | TEST_CI ("ab,bcb,abac", WITH_SPLITTED("|minus(len,count(a))"), "1,3,2"); |
---|
673 | TEST_CI ("ab,bcb,abac", WITH_SPLITTED("|minus(\"\"5\"\",count(a))"), "4,5,3"); |
---|
674 | |
---|
675 | // test other recursive uses of GB_command_interpreter |
---|
676 | TEST_CI("one", "|dd;\"two\";dd|command(\"dd;\"_\";dd;\"-\"\")", "one_one-two_two-one_one-"); |
---|
677 | TEST_CI("", "|sequence|command(\"/^([\\\\.-]*)[A-Z].*/\\\\1/\")|len", "9"); // count gaps at start of sequence |
---|
678 | TEST_CI("one", "|dd;dd|eval(\"\"up\";\"per\"|merge\")", "ONEONE"); |
---|
679 | TEST_CI("1,2,3", WITH_SPLITTED("|select(\"\", \"\"one\"\", \"\"two\"\", \"\"three\"\")"), "one,two,three"); |
---|
680 | TEST_CI_ERROR_CONTAINS("1,4", WITH_SPLITTED("|select(\"\", \"\"one\"\", \"\"two\"\", \"\"three\"\")"), "Illegal param number '4' (allowed [0..3])"); |
---|
681 | |
---|
682 | // test define and do |
---|
683 | TEST_CI("ignored", "define(d4, \"dd;dd;dd;dd\")", ""); |
---|
684 | TEST_CI("ignored", "define(d16, \"do(d4)|do(d4)\")", ""); |
---|
685 | TEST_CI("ignored", "define(d64, \"do(d4)|do(d16)\")", ""); |
---|
686 | TEST_CI("ignored", "define(d4096, \"do(d64)|do(d64)\")", ""); |
---|
687 | |
---|
688 | TEST_CI("x", "do(d4)", "xxxx"); |
---|
689 | TEST_CI("xy", "do(d4)", "xyxyxyxy"); |
---|
690 | TEST_CI("x", "do(d16)", "xxxxxxxxxxxxxxxx"); |
---|
691 | TEST_CI("x", "do(d64)|len", "64"); |
---|
692 | TEST_CI("xy", "do(d4)|len", "8"); |
---|
693 | TEST_CI("xy", "do(d4)|len(\"\")", "8"); |
---|
694 | TEST_CI("xy", "do(d4)|len(x)", "4"); |
---|
695 | TEST_CI("x", "do(d4096)|len", "4096"); |
---|
696 | |
---|
697 | // create 4096 streams (disable trace; logs to much): |
---|
698 | TEST_CI("x", "trace(0)|dd;dd|dd;dd|dd;dd|dd;dd|dd;dd|dd;dd|dd;dd|dd;dd|dd;dd|dd;dd|dd;dd|dd;dd|streams", "4096"); |
---|
699 | } |
---|
700 | |
---|
701 | __ATTR__REDUCED_OPTIMIZE__NO_GCSE void TEST_GB_command_interpreter_1b() { /* unit test (part 1b): sets up a call environment on the species container and checks stream counting, format + format_sequence, remove + keep, string comparison commands, translate, echo and case conversion. TEST_CI arguments appear to be (input, ACI expression, expected result); the macro is defined outside this section -- confirm there */ |
---|
702 | ACI_test_env E; |
---|
703 | GBL_env base_env(E.gbmain(), NULp); |
---|
704 | |
---|
705 | // execute ACI on species container (=GB_DB) in this section ------------------------------ |
---|
706 | GBDATA * const gb_data = E.gbspecies(); |
---|
707 | GBL_call_env callEnv(gb_data, base_env); |
---|
708 | |
---|
709 | // streams (each piped 'dd;dd' stage doubles the stream count: 2, 4, 8) |
---|
710 | TEST_CI("x", "dd;dd|streams", "2"); |
---|
711 | TEST_CI("x", "dd;dd|dd;dd|streams", "4"); |
---|
712 | TEST_CI("x", "dd;dd|dd;dd|dd;dd|streams", "8"); |
---|
713 | TEST_CI("x", "do(d4)|streams", "1"); // stream is merged when do() returns |
---|
714 | |
---|
715 | TEST_CI("", "ali_name", "ali_16s"); // ask for default-alignment name |
---|
716 | TEST_CI("", "sequence_type", "rna"); // ask for sequence_type of default-alignment |
---|
717 | |
---|
718 | // format |
---|
719 | TEST_CI("acgt", "format", " acgt"); |
---|
720 | TEST_CI("acgt", "format(firsttab=1)", " acgt"); |
---|
721 | TEST_CI("acgt", "format(firsttab=1, width=2)", |
---|
722 | " ac\n" |
---|
723 | " gt"); |
---|
724 | TEST_CI("acgt", "format(firsttab=1,tab=1,width=2)", |
---|
725 | " ac\n" |
---|
726 | " gt"); |
---|
727 | TEST_CI("acgt", "format(firsttab=0,tab=0,width=2)", |
---|
728 | "ac\n" |
---|
729 | "gt"); |
---|
730 | TEST_CI("acgt", "format(firsttab=0,tab=0,width=1)", |
---|
731 | "a\n" |
---|
732 | "c\n" |
---|
733 | "g\n" |
---|
734 | "t"); |
---|
735 | |
---|
736 | TEST_CI_ERROR_CONTAINS("acgt", "format(gap=0)", "Unknown Parameter 'gap=0' in command 'format'"); |
---|
737 | TEST_CI_ERROR_CONTAINS("acgt", "format(numleft)", "Unknown Parameter 'numleft' in command 'format'"); |
---|
738 | |
---|
739 | // format_sequence (accepts 'gap', 'numleft' and 'numright', which plain 'format' rejects above) |
---|
740 | TEST_CI_ERROR_CONTAINS("acgt", "format_sequence(numright=5, numleft)", "You may only specify 'numleft' OR 'numright', not both"); |
---|
741 | |
---|
742 | TEST_CI("acgtacgtacgtacg", "format_sequence(firsttab=5,tab=5,width=4,numleft=1)", |
---|
743 | "1 acgt\n" |
---|
744 | "5 acgt\n" |
---|
745 | "9 acgt\n" |
---|
746 | "13 acg"); |
---|
747 | |
---|
748 | TEST_CI("acgtacgtacgtacg", "format_sequence(firsttab=5,tab=5,width=4,numright=9)", // test EMBL sequence formatting |
---|
749 | " acgt 4\n" |
---|
750 | " acgt 8\n" |
---|
751 | " acgt 12\n" |
---|
752 | " acg 15"); |
---|
753 | |
---|
754 | TEST_CI("acgtacgtacgtac", "format_sequence(firsttab=5,tab=5,width=4,gap=2,numright=-1)", // autodetect width for 'numright' |
---|
755 | " ac gt 4\n" |
---|
756 | " ac gt 8\n" |
---|
757 | " ac gt 12\n" |
---|
758 | " ac 14"); |
---|
759 | |
---|
760 | TEST_CI("acgt", "format_sequence(firsttab=0,tab=0,width=2,gap=1)", |
---|
761 | "a c\n" |
---|
762 | "g t"); |
---|
763 | TEST_CI("acgt", "format_sequence(firsttab=0,tab=0,width=4,gap=1)", "a c g t"); |
---|
764 | TEST_CI("acgt", "format_sequence(firsttab=0,tab=0,width=4,gap=2)", "ac gt"); |
---|
765 | TEST_CI("acgtacgt", "format_sequence(firsttab=0,width=10,gap=4)", "acgt acgt"); |
---|
766 | TEST_CI("acgtacgt", "format_sequence(firsttab=1,width=10,gap=4)", " acgt acgt"); |
---|
767 | |
---|
768 | TEST_CI("acgt", "format_sequence(firsttab=0,tab=0,gap=0)", "acgt"); |
---|
769 | TEST_CI("acgt", "format_sequence(firsttab=0,tab=0,gap=-1)", "acgt"); // no big alloc |
---|
770 | TEST_CI("acgt", "format_sequence(firsttab=0,tab=-1,gap=-1)", "acgt"); // no big alloc |
---|
771 | TEST_CI("acgt", "format(firsttab=0,tab=0,width=-1)", "acgt"); // no big alloc for(!)format |
---|
772 | |
---|
773 | TEST_CI("acgt", "format(firsttab=-1,tab=0)", "acgt"); // did a 4Gb-alloc! |
---|
774 | TEST_CI("acgt", "format(firsttab=-1,tab=-1)", "acgt"); // did a 4Gb-alloc! |
---|
775 | TEST_CI("acgt", "format(firsttab=-1,tab=-1,width=-1)", "acgt"); // did a 4Gb-alloc! |
---|
776 | |
---|
777 | TEST_CI("acgt", "format_sequence(firsttab=0,tab=0,gap=0,width=-1)", "acgt"); // did a 4Gb-alloc! |
---|
778 | TEST_CI("acgt", "format_sequence(firsttab=-1,tab=0,gap=-1)", "acgt"); // did a 4Gb-alloc! |
---|
779 | TEST_CI("acgt", "format_sequence(firsttab=-1,tab=-1,gap=-1)", "acgt"); // did a 4Gb-alloc! |
---|
780 | TEST_CI("acgt", "format_sequence(firsttab=-1,tab=-1,gap=-1,width=-1)", "acgt"); // did a 4Gb-alloc! |
---|
781 | |
---|
782 | TEST_CI_ERROR_CONTAINS("acgt", "format_sequence(nl=c)", "Unknown Parameter 'nl=c' in command 'format_sequence'"); |
---|
783 | TEST_CI_ERROR_CONTAINS("acgt", "format_sequence(forcenl=)", "Unknown Parameter 'forcenl=' in command 'format_sequence'"); |
---|
784 | |
---|
785 | TEST_CI_ERROR_CONTAINS("acgt", "format(width=0)", "Illegal zero width"); |
---|
786 | TEST_CI_ERROR_CONTAINS("acgt", "format_sequence(width=0)", "Illegal zero width"); |
---|
787 | |
---|
788 | // remove + keep (remove deletes the listed characters; keep deletes all other characters) |
---|
789 | TEST_CI_NOOP("acgtacgt", "remove(-.)"); |
---|
790 | TEST_CI ("..acg--ta-cgt...", "remove(-.)", "acgtacgt"); |
---|
791 | TEST_CI ("..acg--ta-cgt...", "remove(acgt)", "..---..."); |
---|
792 | |
---|
793 | TEST_CI_NOOP("acgtacgt", "keep(acgt)"); |
---|
794 | TEST_CI ("..acg--ta-cgt...", "keep(-.)", "..---..."); |
---|
795 | TEST_CI ("..acg--ta-cgt...", "keep(acgt)", "acgtacgt"); |
---|
796 | |
---|
797 | // compare + icompare (w/o parameter the input streams are compared pairwise; icompare ignores case) |
---|
798 | TEST_CI("x,z,y,y,z,x,x,Z,y,Y,Z,x", WITH_SPLITTED("|compare"), "-1,0,1,1,1,-1"); |
---|
799 | TEST_CI("x,z,y,y,z,x,x,Z,y,Y,Z,x", WITH_SPLITTED("|icompare"), "-1,0,1,-1,0,1"); |
---|
800 | |
---|
801 | TEST_CI("x,y,z", WITH_SPLITTED("|compare(\"y\")"), "-1,0,1"); |
---|
802 | |
---|
803 | // equals + iequals (pairwise on input streams; iequals ignores case) |
---|
804 | TEST_CI("a,b,a,a,a,A", WITH_SPLITTED("|equals"), "0,1,0"); |
---|
805 | TEST_CI("a,b,a,a,a,A", WITH_SPLITTED("|iequals"), "0,1,1"); |
---|
806 | |
---|
807 | // contains + icontains (result is the 1-based match position, 0 if not found; icontains ignores case) |
---|
808 | TEST_CI("abc,bcd,BCD", WITH_SPLITTED("|contains(\"bc\")"), "2,1,0"); |
---|
809 | TEST_CI("abc,bcd,BCD", WITH_SPLITTED("|icontains(\"bc\")"), "2,1,1"); |
---|
810 | TEST_CI("abc,bcd,BCD", WITH_SPLITTED("|icontains(\"d\")"), "0,3,3"); |
---|
811 | |
---|
812 | // partof + ipartof (result is the 1-based position of the stream content inside the parameter, 0 if not contained) |
---|
813 | TEST_CI("abc,BCD,def,deg", WITH_SPLITTED("|partof(\"abcdefg\")"), "1,0,4,0"); |
---|
814 | TEST_CI("abc,BCD,def,deg", WITH_SPLITTED("|ipartof(\"abcdefg\")"), "1,2,4,0"); |
---|
815 | |
---|
816 | TEST_CI(", , ,x", WITH_SPLITTED("|isempty"), "1,0,0,0"); |
---|
817 | TEST_CI(", , ,x", WITH_SPLITTED("|crop(\" \")|isempty"), "1,1,1,0"); |
---|
818 | |
---|
819 | // translate (optional 3rd parameter replaces every character not listed in the 1st) |
---|
820 | TEST_CI("abcdefgh", "translate(abc,cba)", "cbadefgh"); |
---|
821 | TEST_CI("abcdefgh", "translate(cba,abc)", "cbadefgh"); |
---|
822 | TEST_CI("abcdefgh", "translate(hcba,abch,-)", "hcb----a"); |
---|
823 | TEST_CI("abcdefgh", "translate(aceg,aceg,-)", "a-c-e-g-"); |
---|
824 | TEST_CI("abbaabba", "translate(ab,ba,-)", "baabbaab"); |
---|
825 | TEST_CI("abbaabba", "translate(a,x,-)", "x--xx--x"); |
---|
826 | TEST_CI("abbaabba", "translate(,,-)", "--------"); |
---|
827 | |
---|
828 | // echo (each parameter becomes one output stream) |
---|
829 | TEST_CI("", "echo", ""); |
---|
830 | TEST_CI("", "echo(x,y,z)", "xyz"); |
---|
831 | TEST_CI("", "echo(x;y,z)", "xyz"); // check ';' as param-separator |
---|
832 | TEST_CI("", "echo(x;y;z)", "xyz"); |
---|
833 | TEST_CI("", "echo(x,y,z)|streams", "3"); |
---|
834 | |
---|
835 | // upper, lower + caps |
---|
836 | TEST_CI("the QUICK brOwn Fox", "lower", "the quick brown fox"); |
---|
837 | TEST_CI("the QUICK brOwn Fox", "upper", "THE QUICK BROWN FOX"); |
---|
838 | TEST_CI("the QUICK brOwn FoX", "caps", "The Quick Brown Fox"); |
---|
839 | } |
---|
840 | |
---|
841 | __ATTR__REDUCED_OPTIMIZE__NO_GCSE void TEST_GB_command_interpreter_2a() { /* unit test (part 2a): sets up a call environment on the species container and checks split + merge, head/tail/mid, tab + pretab, crop, stream selection and reordering (cut, drop, swap, toback, tofront), extract_words + extract_sequence, checksums, SRT, regular expressions and command queues vs. pipes. TEST_CI arguments appear to be (input, ACI expression, expected result); the macro is defined outside this section -- confirm there */ |
---|
842 | ACI_test_env E; |
---|
843 | GBL_env base_env(E.gbmain(), NULp); |
---|
844 | |
---|
845 | // execute ACI on species container (=GB_DB) in this section ------------------------------ |
---|
846 | GBDATA * const gb_data = E.gbspecies(); |
---|
847 | GBL_call_env callEnv(gb_data, base_env); |
---|
848 | |
---|
849 | TEST_CI_ERROR_CONTAINS("a;b;c", "split(;)|merge(-)", "Invalid separator (cannot be empty"); |
---|
850 | TEST_CI ("a;b;c", "split(\";\")|merge(-)", "a-b-c"); |
---|
851 | |
---|
852 | // head, tail + mid/mid0 (mid counts positions from 1, mid0 counts from 0) |
---|
853 | TEST_CI ("1234567890", "head(3)", "123"); |
---|
854 | TEST_CI ("1234567890", "head(9)", "123456789"); |
---|
855 | TEST_CI_NOOP("1234567890", "head(10)"); |
---|
856 | TEST_CI_NOOP("1234567890", "head(20)"); |
---|
857 | |
---|
858 | TEST_CI ("1234567890", "tail(4)", "7890"); |
---|
859 | TEST_CI ("1234567890", "tail(9)", "234567890"); |
---|
860 | TEST_CI_NOOP("1234567890", "tail(10)"); |
---|
861 | TEST_CI_NOOP("1234567890", "tail(20)"); |
---|
862 | |
---|
863 | TEST_CI("1234567890", "tail(0)", ""); |
---|
864 | TEST_CI("1234567890", "head(0)", ""); |
---|
865 | TEST_CI("1234567890", "tail(-2)", ""); |
---|
866 | TEST_CI("1234567890", "head(-2)", ""); |
---|
867 | |
---|
868 | TEST_CI("1234567890", "mid(3,5)", "345"); |
---|
869 | TEST_CI("1234567890", "mid(2,2)", "2"); |
---|
870 | |
---|
871 | TEST_CI("1234567890", "mid0(3,5)", "456"); |
---|
872 | |
---|
873 | TEST_CI("1234567890", "mid(9,20)", "90"); |
---|
874 | TEST_CI("1234567890", "mid(20,20)", ""); |
---|
875 | |
---|
876 | TEST_CI("1234567890", "tail(3)", "890"); // example from ../HELP_SOURCE/source/aci.hlp@mid0 |
---|
877 | TEST_CI("1234567890", "mid(-2,0)", "890"); |
---|
878 | TEST_CI("1234567890", "mid0(-3,-1)", "890"); |
---|
879 | |
---|
880 | // tab + pretab (tab appends padding, pretab prepends it; longer content is left unchanged) |
---|
881 | TEST_CI("x,xx,xxx", WITH_SPLITTED("|tab(2)"), "x ,xx,xxx"); |
---|
882 | TEST_CI("x,xx,xxx", WITH_SPLITTED("|tab(3)"), "x ,xx ,xxx"); |
---|
883 | TEST_CI("x,xx,xxx", WITH_SPLITTED("|tab(4)"), "x ,xx ,xxx "); |
---|
884 | TEST_CI("x,xx,xxx", WITH_SPLITTED("|pretab(2)"), " x,xx,xxx"); |
---|
885 | TEST_CI("x,xx,xxx", WITH_SPLITTED("|pretab(3)"), " x, xx,xxx"); |
---|
886 | TEST_CI("x,xx,xxx", WITH_SPLITTED("|pretab(4)"), " x, xx, xxx"); |
---|
887 | |
---|
888 | // crop (removes the listed characters from both ends only) |
---|
889 | TEST_CI(" x x ", "crop(\" \")", "x x"); |
---|
890 | TEST_CI("\n \t x x \n \t", "crop(\"\t\n \")", "x x"); |
---|
891 | |
---|
892 | // cut, drop, dropempty and dropzero (cut keeps the listed streams, drop removes them) |
---|
893 | TEST_CI("one,two,three,four,five,six", WITH_SPLITTED("|cut(2,3,5)"), "two,three,five"); |
---|
894 | TEST_CI("one,two,three,four,five,six", WITH_SPLITTED("|drop(2,3,5)"), "one,four,six"); |
---|
895 | |
---|
896 | TEST_CI_ERROR_CONTAINS("a", "drop(2)", "Illegal stream number '2' (allowed [1..1])"); |
---|
897 | TEST_CI_ERROR_CONTAINS("a", "drop(0)", "Illegal stream number '0' (allowed [1..1])"); |
---|
898 | TEST_CI_ERROR_CONTAINS("a", "drop", "syntax: drop(streamnumber[,streamnumber]+)"); |
---|
899 | TEST_CI_ERROR_CONTAINS("a", "cut(2)", "Illegal stream number '2' (allowed [1..1])"); |
---|
900 | TEST_CI_ERROR_CONTAINS("a", "cut(0)", "Illegal stream number '0' (allowed [1..1])"); |
---|
901 | TEST_CI_ERROR_CONTAINS("a", "cut", "syntax: cut(streamnumber[,streamnumber]+)"); |
---|
902 | TEST_CI_ERROR_CONTAINS("a", "cut()", "Invalid empty parameter list '()'"); |
---|
903 | TEST_CI_ERROR_CONTAINS("a", "cut(\"\")", "Illegal stream number '0' (allowed [1..1])"); // still strange (atoi("")->0) |
---|
904 | |
---|
905 | TEST_CI("one,two,three,four,five,six", WITH_SPLITTED("|dropempty|streams"), "6"); |
---|
906 | TEST_CI("one,two,,,five,six", WITH_SPLITTED("|dropempty|streams"), "4"); |
---|
907 | TEST_CI(",,,,,", WITH_SPLITTED("|dropempty"), ""); |
---|
908 | TEST_CI(",,,,,", WITH_SPLITTED("|dropempty|streams"), "0"); |
---|
909 | |
---|
910 | TEST_CI("1,0,0,2,3,0", WITH_SPLITTED("|dropzero"), "1,2,3"); |
---|
911 | TEST_CI("0,0,0,0,0,0", WITH_SPLITTED("|dropzero"), ""); |
---|
912 | TEST_CI("0,0,0,0,0,0", WITH_SPLITTED("|dropzero|streams"), "0"); |
---|
913 | |
---|
914 | TEST_CI("12345", "|colsplit|streams", "5"); |
---|
915 | TEST_CI("12345", "|colsplit" ACI_MERGE, "1,2,3,4,5"); |
---|
916 | TEST_CI("12345", "|colsplit(3)" ACI_MERGE, "123,45"); |
---|
917 | TEST_CI("12345,678,90", WITH_SPLITTED("|colsplit(2)"), "12,34,5,67,8,90"); |
---|
918 | TEST_CI_NOOP("12345,678,90", WITH_SPLITTED("|colsplit(5)")); |
---|
919 | |
---|
920 | // swap (w/o parameters the last two streams are swapped) |
---|
921 | TEST_CI("1,2,3,four,five,six", WITH_SPLITTED("|swap"), "1,2,3,four,six,five"); |
---|
922 | TEST_CI("1,2,3,four,five,six", WITH_SPLITTED("|swap(2,3)"), "1,3,2,four,five,six"); |
---|
923 | TEST_CI("1,2,3,four,five,six", WITH_SPLITTED("|swap(2,3)|swap(4,3)"), "1,3,four,2,five,six"); |
---|
924 | TEST_CI_NOOP("1,2,3,four,five,six", WITH_SPLITTED("|swap(3,3)")); |
---|
925 | TEST_CI_NOOP("1,2,3,four,five,six", WITH_SPLITTED("|swap(3,2)|swap(2,3)")); |
---|
926 | TEST_CI_NOOP("1,2,3,four,five,six", WITH_SPLITTED("|swap(3,2)|swap(3,1)|swap(2,1)|swap(1,3)")); |
---|
927 | |
---|
928 | TEST_CI_ERROR_CONTAINS("a", "swap", "need at least two input streams"); |
---|
929 | TEST_CI_ERROR_CONTAINS("a,b", WITH_SPLITTED("|swap(2,3)"), "Illegal stream number '3' (allowed [1..2])"); |
---|
930 | TEST_CI_ERROR_CONTAINS("a,b", WITH_SPLITTED("|swap(3,2)"), "Illegal stream number '3' (allowed [1..2])"); |
---|
931 | TEST_CI_ERROR_CONTAINS("a,b", WITH_SPLITTED("|swap(1)"), "syntax: swap[(streamnumber,streamnumber)]"); |
---|
932 | TEST_CI_ERROR_CONTAINS("a,b", WITH_SPLITTED("|swap(1,2,3)"), "syntax: swap[(streamnumber,streamnumber)]"); |
---|
933 | |
---|
934 | // toback + tofront (move the stream with the given number to the end / to the start) |
---|
935 | TEST_CI ("front,mid,back", WITH_SPLITTED("|toback(2)"), "front,back,mid"); |
---|
936 | TEST_CI ("front,mid,back", WITH_SPLITTED("|tofront(2)"), "mid,front,back"); |
---|
937 | TEST_CI_NOOP("front,mid,back", WITH_SPLITTED("|toback(3)")); |
---|
938 | TEST_CI_NOOP("front,mid,back", WITH_SPLITTED("|tofront(1)")); |
---|
939 | TEST_CI_NOOP("a", WITH_SPLITTED("|tofront(1)")); |
---|
940 | TEST_CI_NOOP("a", WITH_SPLITTED("|toback(1)")); |
---|
941 | |
---|
942 | TEST_CI_ERROR_CONTAINS("a,b", WITH_SPLITTED("|tofront(3)"), "Illegal stream number '3' (allowed [1..2])"); |
---|
943 | TEST_CI_ERROR_CONTAINS("a,b", WITH_SPLITTED("|toback(3)"), "Illegal stream number '3' (allowed [1..2])"); |
---|
944 | TEST_CI_ERROR_CONTAINS("a,b", WITH_SPLITTED("|tofront"), "syntax: tofront(streamnumber)"); |
---|
945 | TEST_CI_ERROR_CONTAINS("a,b", WITH_SPLITTED("|toback(1,2)"), "syntax: toback(streamnumber)"); |
---|
946 | TEST_CI_ERROR_CONTAINS("a,b", WITH_SPLITTED("|merge(1,2)"), "syntax: merge[(\"separator\")]"); |
---|
947 | |
---|
948 | // split (w/o parameters splits at linefeed; mode 0 drops the separator, mode 1 keeps it at the start of the next part, mode 2 at the end of the previous part) |
---|
949 | TEST_CI ("a\nb", "|split" ACI_MERGE, "a,b"); |
---|
950 | TEST_CI ("a-b", "|split(-)" ACI_MERGE, "a,b"); |
---|
951 | TEST_CI ("a-b", "|split(-,0)" ACI_MERGE, "a,b"); |
---|
952 | TEST_CI ("a-b", "|split(-,1)" ACI_MERGE, "a,-b"); |
---|
953 | TEST_CI ("a-b", "|split(-,2)" ACI_MERGE, "a-,b"); |
---|
954 | TEST_CI_ERROR_CONTAINS("a-b", "|split(-,3)" ACI_MERGE, "Illegal split mode '3' (valid: 0..2)"); |
---|
955 | TEST_CI_ERROR_CONTAINS("a\nb", "|split(1,2,3)" ACI_MERGE, "syntax: split[(\"separator\"[,mode])]"); |
---|
956 | |
---|
957 | #define C0_9 "0123456789" |
---|
958 | #define CA_Z "ABCDEFGHIJKLMNOPQRSTUVWXYZ" |
---|
959 | #define Ca_z "abcdefghijklmnopqrstuvwxyz" |
---|
960 | |
---|
961 | // extract_words + extract_sequence (the character-set macros above are pasted into the quoted 1st parameter) |
---|
962 | TEST_CI("1,2,3,four,five,six", "extract_words(\"" C0_9 "\",1)", "1 2 3"); |
---|
963 | TEST_CI("1,2,3,four,five,six", "extract_words(\"" Ca_z "\", 3)", "five four six"); |
---|
964 | TEST_CI("1,2,3,four,five,six", "extract_words(\"" CA_Z "\", 3)", ""); // extract words works case sensitive |
---|
965 | TEST_CI("1,2,3,four,five,six", "extract_words(\"" Ca_z "\", 4)", "five four"); |
---|
966 | TEST_CI("1,2,3,four,five,six", "extract_words(\"" Ca_z "\", 5)", ""); |
---|
967 | TEST_CI("7 3b 12A 1 767 111 1 77", "extract_words(\"" C0_9 CA_Z Ca_z "\", 1)", "1 1 111 12A 3b 7 767 77"); // does sort a list of helix numbers |
---|
968 | |
---|
969 | TEST_CI ("1,2,3,four,five,six", "extract_sequence(\"acgtu\", 1.0)", ""); |
---|
970 | TEST_CI ("1,2,3,four,five,six", "extract_sequence(\"acgtu\", 0.5)", ""); |
---|
971 | TEST_CI ("1,2,3,four,five,six", "extract_sequence(\"acgtu\", 0.0)", "four five six"); |
---|
972 | TEST_CI ("..acg--ta-cgt...", "extract_sequence(\"acgtu\", 1.0)", ""); |
---|
973 | TEST_CI_NOOP("..acg--ta-cgt...", "extract_sequence(\"acgtu-.\", 1.0)"); |
---|
974 | TEST_CI_NOOP("..acg--ta-ygt...", "extract_sequence(\"acgtu-.\", 0.7)"); |
---|
975 | TEST_CI ("70 ..acg--ta-cgt... 70", "extract_sequence(\"acgtu-.\", 1.0)", "..acg--ta-cgt..."); |
---|
976 | |
---|
977 | // checksum + gcgchecksum (calculated for the sequence of the test species) |
---|
978 | TEST_CI("", "sequence|checksum", "4C549A5F"); |
---|
979 | TEST_CI("", "sequence | gcgchecksum", "4308"); |
---|
980 | |
---|
981 | // SRT |
---|
982 | TEST_CI("The quick brown fox", "srt(\"quick=lazy:brown fox=dog\")", "The lazy dog"); // no need to escape spaces in quoted ACI parameter |
---|
983 | TEST_CI("The quick brown fox", "srt(quick=lazy:brown\\ fox=dog)", "The lazy dog"); // spaces need to be escaped in unquoted ACI parameter |
---|
984 | TEST_CI_ERROR_CONTAINS("x", "srt(x=y,z)", "SRT ERROR: no '=' found in command"); |
---|
985 | TEST_CI_ERROR_CONTAINS("x", "srt", "syntax: srt(expr[,expr]+)"); |
---|
986 | |
---|
987 | // REG-replace and -match |
---|
988 | TEST_CI("stars*to*stripes", "/\\*/--/", "stars--to--stripes"); |
---|
989 | |
---|
990 | TEST_CI_ERROR_CONTAINS("xxx", "//--", "Regular expression format is '/expr/' or '/expr/i', not '//--'"); |
---|
991 | TEST_CI_ERROR_CONTAINS("xxx", "/*/bla/", |
---|
992 | #if defined(DARWIN) |
---|
993 | // @@@ RESULT_MODIFIED_OSX: this test depends on library version |
---|
994 | // should either test for one-of-several results or just test for any error |
---|
995 | "repetition-operator operand invalid" |
---|
996 | #else // !DARWIN |
---|
997 | "Invalid preceding regular expression" |
---|
998 | #endif |
---|
999 | ); |
---|
1000 | |
---|
1001 | TEST_CI("sImILaRWIllBE,GonEEASIly", WITH_SPLITTED("|command(/[A-Z]//)"), "small,only"); |
---|
1002 | TEST_CI("sthBIGinside,FATnotCAP", WITH_SPLITTED("|command(/([A-Z])+/)"), "BIG,FAT"); // does only do match |
---|
1003 | |
---|
1004 | // command-queue vs. command-pipe (vs. both as sub-commands) |
---|
1005 | TEST_CI("a,bb,ccc", WITH_SPLITTED("|\"[\";len;\"]\""), "[,1,2,3,]"); // queue |
---|
1006 | TEST_CI("a,bb,ccc", WITH_SPLITTED("|command(\"\"[\";len;\"]\"\")"), "[1],[2],[3]"); // queue as sub-command |
---|
1007 | |
---|
1008 | TEST_CI("a,bb,ccc", WITH_SPLITTED("|len|minus(1)"), "0,1,2"); // pipe |
---|
1009 | TEST_CI("a,bb,ccc", WITH_SPLITTED("|command(\"len|minus(1)\")"), "0,1,2"); // pipe as sub-command |
---|
1010 | |
---|
1011 | TEST_CI( "a,bb,ccc,dd", WITH_SPLITTED("|len|minus"), "-1,1"); // pipe |
---|
1012 | TEST_CI_ERROR_CONTAINS("a,bb,ccc,dd", WITH_SPLITTED("|command(\"len|minus\")"), "Expect an even number of input streams"); // pipe as sub-command FAILS |
---|
1013 | } |
---|
1014 | |
---|
1015 | __ATTR__REDUCED_OPTIMIZE__NO_GCSE void TEST_GB_command_interpreter_2b() { /* unit test (part 2b): sets up a call environment on the species container and checks calculator commands, rounding, numeric comparison, boolean operators, readdb and taxonomy. TEST_CI arguments appear to be (input, ACI expression, expected result); the macro is defined outside this section -- confirm there */ |
---|
1016 | ACI_test_env E; |
---|
1017 | GBL_env base_env(E.gbmain(), NULp); |
---|
1018 | |
---|
1019 | // execute ACI on species container (=GB_DB) in this section ------------------------------ |
---|
1020 | GBDATA * const gb_data = E.gbspecies(); |
---|
1021 | GBL_call_env callEnv(gb_data, base_env); |
---|
1022 | |
---|
1023 | // calculator (plain commands calculate with integers, 'f'-prefixed commands with floats) |
---|
1024 | TEST_CI("", "echo(9.9,3.9) |plus;fplus" ACI_MERGE, "12,13.8"); |
---|
1025 | TEST_CI("", "echo(9.1,3.9) |minus;fminus" ACI_MERGE, "6,5.2"); |
---|
1026 | TEST_CI("", "echo(9,3.5) |mult;fmult" ACI_MERGE, "27,31.5"); |
---|
1027 | TEST_CI("", "echo(9,0.1) |mult;fmult" ACI_MERGE, "0,0.9"); |
---|
1028 | TEST_CI("", "echo(9,3) |div;fdiv" ACI_MERGE, "3,3"); |
---|
1029 | TEST_CI("", "echo(10,3) |div;fdiv" ACI_MERGE, "3,3.33333"); |
---|
1030 | |
---|
1031 | TEST_CI("", "echo(9,3)|rest", "0"); |
---|
1032 | TEST_CI("", "echo(9,5)|rest", "4"); |
---|
1033 | |
---|
1034 | TEST_CI("", "echo(9,3) |per_cent;fper_cent" ACI_MERGE, "300,300"); |
---|
1035 | TEST_CI("", "echo(3,9) |per_cent;fper_cent" ACI_MERGE, "33,33.3333"); |
---|
1036 | TEST_CI("", "echo(1,8) |per_cent;fper_cent" ACI_MERGE, "12,12.5"); |
---|
1037 | TEST_CI("", "echo(15,16)|per_cent;fper_cent" ACI_MERGE, "93,93.75"); |
---|
1038 | TEST_CI("", "echo(1,8) |fper_cent|round(0)", "13"); |
---|
1039 | TEST_CI("", "echo(15,16)|fper_cent|round(0);round(1)" ACI_MERGE, "94,93.8"); |
---|
1040 | |
---|
1041 | TEST_CI("", "echo(1,2,3)|plus(1)" ACI_MERGE, "2,3,4"); |
---|
1042 | TEST_CI("", "echo(1,2,3)|minus(2)" ACI_MERGE, "-1,0,1"); |
---|
1043 | TEST_CI("", "echo(1,2,3)|mult(42)" ACI_MERGE, "42,84,126"); |
---|
1044 | TEST_CI("", "echo(1,2,3)|div(2)" ACI_MERGE, "0,1,1"); |
---|
1045 | TEST_CI("", "echo(1,2,3)|rest(2)" ACI_MERGE, "1,0,1"); |
---|
1046 | TEST_CI("", "echo(1,2,3)|per_cent(3)" ACI_MERGE, "33,66,100"); |
---|
1047 | |
---|
1048 | // rounding (parameter = number of decimal digits; negative values round left of the decimal point) |
---|
1049 | #define ROUND_FLOATS(dig) "echo(0.3826,0.50849,12.58,77.2,700.099,0.9472e-4,0.175e+7)|round(" #dig ")" ACI_MERGE |
---|
1050 | |
---|
1051 | TEST_CI("", ROUND_FLOATS(4), "0.3826,0.5085,12.58,77.2,700.099,0.0001,1.75e+06"); |
---|
1052 | TEST_CI("", ROUND_FLOATS(3), "0.383,0.508,12.58,77.2,700.099,0,1.75e+06"); |
---|
1053 | TEST_CI("", ROUND_FLOATS(2), "0.38,0.51,12.58,77.2,700.1,0,1.75e+06"); |
---|
1054 | TEST_CI("", ROUND_FLOATS(1), "0.4,0.5,12.6,77.2,700.1,0,1.75e+06"); |
---|
1055 | TEST_CI("", ROUND_FLOATS(0), "0,1,13,77,700,0,1.75e+06"); |
---|
1056 | TEST_CI("", ROUND_FLOATS(-1), "0,0,10,80,700,0,1.75e+06"); |
---|
1057 | TEST_CI("", ROUND_FLOATS(-2), "0,0,0,100,700,0,1.75e+06"); |
---|
1058 | TEST_CI("", ROUND_FLOATS(-3), "0,0,0,0,1000,0,1.75e+06"); |
---|
1059 | TEST_CI("", ROUND_FLOATS(-5), "0,0,0,0,0,0,1.8e+06"); |
---|
1060 | TEST_CI("", ROUND_FLOATS(-6), "0,0,0,0,0,0,2e+06"); |
---|
1061 | |
---|
1062 | |
---|
1063 | // compare (integers) |
---|
1064 | TEST_CI("", "echo(9,3)|isBelow;isAbove;isEqual", "010"); |
---|
1065 | TEST_CI("", "echo(3,9)|isBelow;isAbove;isEqual", "100"); |
---|
1066 | TEST_CI("", "echo(5,5)|isBelow;isAbove;isEqual", "001"); |
---|
1067 | |
---|
1068 | TEST_CI("", "echo(1,2,3)|isBelow(2)", "100"); |
---|
1069 | TEST_CI("", "echo(1,2,3)|isAbove(2)", "001"); |
---|
1070 | TEST_CI("", "echo(1,2,3)|isEqual(2)", "010"); |
---|
1071 | |
---|
1072 | TEST_CI("", "echo(1,2,3,4,5)|inRange(2,4)", "01110"); |
---|
1073 | TEST_CI("", "echo(-1,-2,-3,-4,-5)|inRange(-2,-4)", "00000"); // empty range |
---|
1074 | TEST_CI("", "echo(-1,-2,-3,-4,-5)|inRange(-4,-2)", "01110"); |
---|
1075 | |
---|
1076 | // compare (floats) |
---|
1077 | TEST_CI("", "echo(1.7,1.4) |isBelow;isAbove;isEqual", "010"); |
---|
1078 | TEST_CI("", "echo(-0.7,0.1) |isBelow;isAbove;isEqual", "100"); |
---|
1079 | TEST_CI("", "echo(5.10,5.1) |isBelow;isAbove;isEqual", "001"); |
---|
1080 | TEST_CI("", "echo(0.10,.11) |isBelow;isAbove;isEqual", "100"); |
---|
1081 | TEST_CI("", "echo(-7.1,-6.9)|isBelow;isAbove;isEqual", "100"); |
---|
1082 | TEST_CI("", "echo(1e+5,1e+6)|isBelow;isAbove;isEqual", "100"); |
---|
1083 | TEST_CI("", "echo(2e+5,1e+6)|isBelow;isAbove;isEqual", "100"); |
---|
1084 | TEST_CI("", "echo(2e+5,1e-6)|isBelow;isAbove;isEqual", "010"); |
---|
1085 | TEST_CI("", "echo(2e-5,1e+6)|isBelow;isAbove;isEqual", "100"); |
---|
1086 | |
---|
1087 | TEST_CI("", "echo(.1,.2,.3,.4,.5) |inRange(.2,.4)", "01110"); |
---|
1088 | TEST_CI("", "echo(.8,.9,1.0,1.1,1.2)|inRange(.9,1.1)", "01110"); |
---|
1089 | TEST_CI("", "echo(-.2,-.1,0.0,.1,.2)|inRange(-.1,.1)", "01110"); |
---|
1090 | |
---|
1091 | // boolean operators (empty and non-numeric input count as false for 'Not') |
---|
1092 | TEST_CI("0", "Not", "1"); |
---|
1093 | TEST_CI("1", "Not", "0"); |
---|
1094 | |
---|
1095 | TEST_CI("", "Not", "1"); |
---|
1096 | TEST_CI("text", "Not", "1"); |
---|
1097 | |
---|
1098 | TEST_CI("", "echo(0,1)|Not", "10"); |
---|
1099 | TEST_CI("", "echo(0,0)|Or;And", "00"); |
---|
1100 | TEST_CI("", "echo(0,1)|Or;And", "10"); |
---|
1101 | TEST_CI("", "echo(1,0)|Or;And", "10"); |
---|
1102 | TEST_CI("", "echo(1,1)|Or;And", "11"); |
---|
1103 | |
---|
1104 | TEST_CI("", "command(echo(1\\,0)|Or);command(echo(0\\,1)|Or)|And", "1"); |
---|
1105 | |
---|
1106 | // readdb (reads the named fields of the test species; multiple fields are concatenated) |
---|
1107 | TEST_CI("", "readdb(name)", "LcbReu40"); |
---|
1108 | TEST_CI("", "readdb(acc)", "X76328"); |
---|
1109 | TEST_CI("", "readdb(acc,name)", "X76328LcbReu40"); |
---|
1110 | |
---|
1111 | TEST_CI_ERROR_CONTAINS("", "readdb()", "Invalid empty parameter list '()'"); |
---|
1112 | TEST_CI_ERROR_CONTAINS("", "readdb", "syntax: readdb(fieldname[,fieldname]+)"); |
---|
1113 | TEST_CI ("", "readdb(\"\")", ""); // still weird (want field error?) |
---|
1114 | |
---|
1115 | // taxonomy (base_env was created w/o tree name, so the tree has to be passed explicitly) |
---|
1116 | TEST_CI("", "taxonomy(1)", "No default tree"); |
---|
1117 | TEST_CI("", "taxonomy(tree_nuc, 1)", "group1"); |
---|
1118 | TEST_CI("", "taxonomy(tree_nuc, 5)", "lower-red/group1"); |
---|
1119 | } |
---|
1120 | |
---|
1121 | __ATTR__REDUCED_OPTIMIZE__NO_GCSE void TEST_GB_command_interpreter_2c() { /* unit test (part 2c): sets up two call environments on the species container (one w/o tree name, one bound to "tree_nuc") and checks taxonomy, diff + filter + change, forwarding of DB item, tree name and DB root into sub-expressions, exec, error cases and SRT sub-expressions. TEST_CI arguments appear to be (input, ACI expression, expected result); the macros are defined outside this section -- confirm there */ |
---|
1122 | ACI_test_env E; |
---|
1123 | GBL_env base_env(E.gbmain(), NULp); |
---|
1124 | |
---|
1125 | GBDATA * const gb_data = E.gbspecies(); |
---|
1126 | GBL_call_env callEnv(gb_data, base_env); |
---|
1127 | |
---|
1128 | GBL_env env_tree_nuc(E.gbmain(), "tree_nuc"); |
---|
1129 | GBL_call_env callEnv_tree_nuc(gb_data, env_tree_nuc); |
---|
1130 | |
---|
1131 | TEST_CI_ERROR_CONTAINS("", "taxonomy", "syntax: taxonomy([tree_name,]count)"); |
---|
1132 | TEST_CI_ERROR_CONTAINS("", "taxonomy(1,2,3)", "syntax: taxonomy([tree_name,]count)"); |
---|
1133 | TEST_CI_WITH_ENV("", callEnv_tree_nuc, "taxonomy(1)", "group1"); |
---|
1134 | |
---|
1135 | // diff, filter + change |
---|
1136 | TEST_CI("..acg--ta-cgt..." "," |
---|
1137 | "..acg--ta-cgt...", WITH_SPLITTED("|diff(pairwise=1)"), |
---|
1138 | "................"); |
---|
1139 | TEST_CI("..acg--ta-cgt..." "," |
---|
1140 | "..cgt--ta-acg...", WITH_SPLITTED("|diff(pairwise=1,equal==)"), |
---|
1141 | "==cgt=====acg==="); |
---|
1142 | TEST_CI("..acg--ta-cgt..." "," |
---|
1143 | "..cgt--ta-acg...", WITH_SPLITTED("|diff(pairwise=1,differ=X)"), |
---|
1144 | "..XXX.....XXX..."); |
---|
1145 | TEST_CI("", "sequence|diff(species=LcbFruct)|checksum", "645E3107"); |
---|
1146 | |
---|
1147 | TEST_CI("..XXX.....XXX..." "," |
---|
1148 | "..acg--ta-cgt...", WITH_SPLITTED("|filter(pairwise=1,exclude=X)"), |
---|
1149 | "..--ta-..."); |
---|
1150 | TEST_CI("..XXX.....XXX..." "," |
---|
1151 | "..acg--ta-cgt...", WITH_SPLITTED("|filter(pairwise=1,include=X)"), |
---|
1152 | "acgcgt"); |
---|
1153 | TEST_CI("", "sequence|filter(species=LcbFruct,include=.-)", "-----------T----T-------G----------C-----T----T..."); |
---|
1154 | |
---|
1155 | TEST_CI("...XXX....XXX..." "," |
---|
1156 | "..acg--ta-cgt...", WITH_SPLITTED("|change(pairwise=1,include=X,to=C,change=100)"), |
---|
1157 | "..aCC--ta-CCC..."); |
---|
1158 | TEST_CI("...XXXXXXXXX...." "," |
---|
1159 | "..acg--ta-cgt...", WITH_SPLITTED("|change(pairwise=1,include=X,to=-,change=100)"), |
---|
1160 | "..a---------t..."); |
---|
1161 | |
---|
1162 | // test environment forwarding |
---|
1163 | TEST_CI("x", ":*=*,*(acc)", "x,X76328"); // test DB-item is forwarded to direct SRT-command |
---|
1164 | TEST_CI("x", "srt(\"*=*,*(acc)\")", "x,X76328"); // test DB-item is forwarded to ACI-command 'srt' |
---|
1165 | TEST_CI("x", ":*=*,*(acc|dd;\",\";readdb(name))", "x,X76328,LcbReu40"); // test DB-item is forwarded to ACI-subexpression inside SRT-command |
---|
1166 | TEST_CI("x", "srt(\"*=*,*(acc|dd;\"\\,\";readdb(name))\")", "x,X76328,LcbReu40"); // test DB-item is forwarded to ACI-subexpression inside ACI-command 'srt' |
---|
1167 | TEST_CI("x", "command(\"dd;\\\",\\\";readdb(name)\")", "x,LcbReu40"); // test DB-item is forwarded to ACI-subexpression inside ACI-command 'command' |
---|
1168 | |
---|
1169 | // test treename is forwarded to sub-expressions |
---|
1170 | TEST_CI_WITH_ENV("x", callEnv_tree_nuc, ":*=*,*(acc|dd;\\\",\\\";taxonomy(1))", "x,X76328,group1"); |
---|
1171 | TEST_CI_WITH_ENV("", callEnv_tree_nuc, "taxonomy(5)|srt(*=*\\,*(acc|dd;\\\",\\\";taxonomy(1)))", "lower-red/group1,X76328,group1"); |
---|
1172 | TEST_CI_WITH_ENV("", callEnv_tree_nuc, "taxonomy(5)|command(\"dd;\\\",\\\";taxonomy(1)\")", "lower-red/group1,group1"); |
---|
1173 | |
---|
1174 | // test database root is forwarded to sub-expressions (used by commands 'ali_name', 'sequence_type', ...) |
---|
1175 | TEST_CI("x", ":*=*,*(acc|dd;\\\",\\\";ali_name;\\\",\\\";sequence_type)", "x,X76328,ali_16s,rna"); |
---|
1176 | TEST_CI("x", "srt(\"*=*,*(acc|dd;\\\",\\\";ali_name;\\\",\\\";sequence_type)\")", "x,X76328,ali_16s,rna"); |
---|
1177 | TEST_CI("x", "command(\"dd;\\\",\\\";ali_name;\\\",\\\";sequence_type\")", "x,ali_16s,rna"); |
---|
1178 | |
---|
1179 | // exec (pipes the input streams through an external program; these tests rely on 'sort', 'uniq' and 'perl' being available) |
---|
1180 | TEST_CI("c,b,c,b,a,a", WITH_SPLITTED("|exec(\"(sort|uniq)\")|split|dropempty"), "a,b,c"); |
---|
1181 | TEST_CI("a,aba,cac", WITH_SPLITTED("|exec(\"perl\",-pe,s/([bc])/$1$1/g)|split|dropempty"), "a,abba,ccacc"); |
---|
1182 | |
---|
1183 | // error cases |
---|
1184 | TEST_CI_ERROR_CONTAINS("", "nocmd", "Unknown command 'nocmd'"); |
---|
1185 | TEST_CI_ERROR_CONTAINS("", "|nocmd", "Unknown command 'nocmd'"); |
---|
1186 | TEST_CI_ERROR_CONTAINS("", "caps(x)", "syntax: caps (no parameters)"); |
---|
1187 | TEST_CI_ERROR_CONTAINS("", "trace", "syntax: trace(0|1)"); |
---|
1188 | TEST_CI_ERROR_CONTAINS("", "count", "syntax: count(\"characters to count\")"); |
---|
1189 | TEST_CI_ERROR_CONTAINS("", "count(a,b)", "syntax: count(\"characters to count\")"); |
---|
1190 | TEST_CI_ERROR_CONTAINS("", "len(a,b)", "syntax: len[(\"characters not to count\")]"); |
---|
1191 | TEST_CI_ERROR_CONTAINS("", "plus(a,b,c)", "syntax: plus[(Expr1[,Expr2])]"); |
---|
1192 | TEST_CI_ERROR_CONTAINS("", "count(a,b", "Reason: Missing ')'"); |
---|
1193 | TEST_CI_ERROR_CONTAINS("", "count(a,\"b)", "unbalanced '\"' in 'count(a,\"b)'"); |
---|
1194 | TEST_CI_ERROR_CONTAINS("", "count(a,\"b)\"", "Reason: Missing ')'"); |
---|
1195 | TEST_CI_ERROR_CONTAINS("", "dd;dd|count", "syntax: count(\"characters to count\")"); |
---|
1196 | TEST_CI_ERROR_CONTAINS("", "|count(\"a\"x)", "Invalid parameter syntax for '\"a\"x'"); |
---|
1197 | TEST_CI_ERROR_CONTAINS("", "|count(\"a\"x\")", "unbalanced '\"' in '|count(\"a\"x\")'"); |
---|
1198 | TEST_CI_ERROR_CONTAINS("", "|count(\"a)", "unbalanced '\"' in '|count(\"a)'"); |
---|
1199 | |
---|
1200 | TEST_CI_ERROR_CONTAINS__BROKEN("", "|\"xx\"bla", "bla", "xx"); // @@@ should report some error referring to unseparated + unknown command 'bla' |
---|
1201 | |
---|
1202 | TEST_CI_ERROR_CONTAINS("", "translate(a)", "syntax: translate(old,new[,other])"); |
---|
1203 | TEST_CI_ERROR_CONTAINS("", "translate(a,b,c,d)", "syntax: translate(old,new[,other])"); |
---|
1204 | TEST_CI_ERROR_CONTAINS("", "translate(a,b,xx)", "has to be one character"); |
---|
1205 | TEST_CI_ERROR_CONTAINS("", "translate(a,b,)", "has to be one character"); |
---|
1206 | |
---|
1207 | TEST_CI_ERROR_CONTAINS(NULp, "whatever", "ARB ERROR: Can't read this DB entry as string"); // here gb_data is the species container |
---|
1208 | |
---|
1209 | TEST_CI("hello", ":??""=(?-?)", "(h-e)(l-l)o"); |
---|
1210 | TEST_CI("hello", ":??""=(?-?)?", "(h-e)?(l-l)?o"); |
---|
1211 | TEST_CI("hello", ":??""=(?-?0)?", "(h-e0)?(l-l0)?o"); |
---|
1212 | TEST_CI("hello", ":??""=(?-?3)?", "(h-?)e(l-?)lo"); |
---|
1213 | |
---|
1214 | // show linefeed is handled identically for encoded and escaped linefeeds: |
---|
1215 | TEST_CI("abc", ":?=?\\n", "a\nb\nc\n"); |
---|
1216 | TEST_CI("abc", ":?=?\n", "a\nb\nc\n"); |
---|
1217 | |
---|
1218 | // same for string-terminator: |
---|
1219 | TEST_CI("abc", ":?=?.\\0 ignored:b=d", "a.b.c."); |
---|
1220 | TEST_CI("abc", ":?=?.\0 ignored:b=d", "a.b.c."); |
---|
1221 | |
---|
1222 | TEST_CI("", ":*=X*Y*(full_name|len)", "XY21"); |
---|
1223 | TEST_CI("", ":*=*(full_name\\:reuteri=xxx)", "Lactobacillus xxx"); |
---|
1224 | TEST_CI("", ":*=*(abc\\:a=A)", ""); // non-existing field -> empty input -> empty output |
---|
1225 | TEST_CI("hello world", ":* =*(\\:*=hi)-", "hi-world"); // srt subexpressions also work w/o key |
---|
1226 | TEST_CI_ERROR_CONTAINS("", ":*=*(full_name\\:reuteri)", "no '=' found"); // test handling of errors from invalid srt-subexpression |
---|
1227 | |
---|
1228 | TEST_CI("", ":*=*(acc#have no acc)", "X76328"); |
---|
1229 | TEST_CI("", ":*=*(abc#have no abc)", "have no abc"); |
---|
1230 | TEST_CI("", ":*=*(#no field)", "no field"); |
---|
1231 | |
---|
1232 | TEST_CI_ERROR_CONTAINS("", ":*=*(unbalanced", "Unbalanced parenthesis in '(unbalanced'"); |
---|
1233 | TEST_CI_ERROR_CONTAINS("", ":*=*(unba(lan)ced", "Unbalanced parenthesis in '(unba(lan)ced'"); |
---|
1234 | TEST_CI_ERROR_CONTAINS("", ":*=*(unba(lan)c)ed)", "Invalid char '(' in key 'unba(lan)c'"); // invalid key name |
---|
1235 | TEST_CI ("", ":*=*(unbalanc)ed)", "ed)"); |
---|
1236 | } |
---|
1237 | |
---|
1238 | __ATTR__REDUCED_OPTIMIZE void TEST_GB_command_interpreter_3() { |
---|
1239 | ACI_test_env E; |
---|
1240 | GBL_env base_env(E.gbmain(), NULp); |
---|
1241 | |
---|
1242 | { |
---|
1243 | // execute ACI on 'full_name' (=GB_STRING) in this section ------------------------------ |
---|
1244 | GBDATA * const gb_data = GB_entry(E.gbspecies(), "full_name"); |
---|
1245 | GBL_call_env callEnv(gb_data, base_env); |
---|
1246 | |
---|
1247 | TEST_CI(NULp, "", "Lactobacillus reuteri"); // noop |
---|
1248 | TEST_CI(NULp, "|len", "21"); |
---|
1249 | TEST_CI(NULp, ":tobac=", "Lacillus reuteri"); |
---|
1250 | TEST_CI(NULp, "/ba.*us/B/", "LactoB reuteri"); |
---|
1251 | TEST_CI(NULp, ":::*=hello:::hell=heaven:::", "heaveno"); // test superfluous ':'s |
---|
1252 | TEST_CI(NULp, ":* *=;*2,*1;", ";reuteri,Lactobacillus;"); // tests multiple successful matches of '*' |
---|
1253 | TEST_CI(NULp, ":* ??*=;?2,?1,*2,*1;", ";e,r,uteri,Lactobacillus;"); // tests multiple successful matches of '*' and '?' (also tests working multi-wildcards "??" and "?*") |
---|
1254 | TEST_CI(NULp, ":Lacto*eutei=*1", "Lactobacillus reuteri"); // test match failing after '*' (=> skips replace) |
---|
1255 | TEST_CI(NULp, ":Lact?bac?lls=?1?2", "Lactobacillus reuteri"); // test match failing after 2nd '?' (=> skips replace) |
---|
1256 | TEST_CI(NULp, ":*reuteri?=?1", "Lactobacillus reuteri"); // test match failing on '?' behind EOS (=> skips replace) |
---|
1257 | |
---|
1258 | // tests for (unwanted) multi-wildcards: |
---|
1259 | TEST_CI__BROKEN(NULp, ":Lacto*?lus=(*1,?1)", "(baci,l)", "Lactobacillus reuteri"); // @@@ diffcult to achieve (alternative: forbid "*?" and report error) |
---|
1260 | TEST_CI__BROKEN("Lactobaci\4lus reuteri", ":Lacto*?lus=(*1,?1)", "<want error instead>", "(baci,?) reuteri"); // @@@ pathological case forcing a match for above situation (ASCII 4 is code for '?' wildcard) |
---|
1261 | TEST_CI_ERROR_CONTAINS__BROKEN(NULp, ":Lacto**lus=(*1,*2)", "invalid", "Lactobacillus reuteri"); // @@@ impossible: (forbid "**" and report error) |
---|
1262 | TEST_CI_ERROR_CONTAINS__BROKEN("Lactobac\3lus reuteri", ":Lacto**lus=(*1,*2)", "invalid", "(bac,*) reuteri"); // @@@ pathological case forcing a match for above situation (ASCII 3 is code for '*' wildcard) |
---|
1263 | |
---|
1264 | TEST_CI_ERROR_CONTAINS(NULp, ":*=*(|wot)", "Unknown command 'wot'"); // provoke error in gbs_build_replace_string [coverage] |
---|
1265 | TEST_CI_ERROR_CONTAINS("", ":*=X*Y*(|wot)", "Unknown command 'wot'"); // dito (other caller) |
---|
1266 | |
---|
1267 | TEST_CI_ERROR_CONTAINS("", ":*=X*Y*(full_name|len)", "can't read key 'full_name' (DB item is no container)"); |
---|
1268 | TEST_CI ("", ":*=X*Y*(../full_name|len)", "XY21"); // searches entry via parent-entry (from non-container) |
---|
1269 | |
---|
1270 | TEST_CI(NULp, "|taxonomy(1)", "No default tree"); |
---|
1271 | TEST_CI_ERROR_CONTAINS(NULp, "|taxonomy(tree_nuc,2)", "Container has neither 'name' nor 'group_name' entry - can't detect container type"); |
---|
1272 | } |
---|
1273 | { |
---|
1274 | // execute ACI on 'ARB_color' (=GB_INT) in this section ------------------------------ |
---|
1275 | GBDATA * const gb_data = GB_entry(E.gbspecies(), "ARB_color"); |
---|
1276 | GBL_call_env callEnv(gb_data, base_env); |
---|
1277 | |
---|
1278 | TEST_CI(NULp, "", "1"); // noop |
---|
1279 | TEST_CI("", "ali_name;\",\";sequence_type", "ali_16s,rna"); // test global database access works when specific database element is specified |
---|
1280 | } |
---|
1281 | { |
---|
1282 | // execute ACI without database element in this section ------------------------------ |
---|
1283 | GBDATA * const gb_data = NULp; |
---|
1284 | GBL_call_env callEnv(gb_data, base_env); |
---|
1285 | |
---|
1286 | TEST_CI_ERROR_CONTAINS(NULp, "", "no input streams found"); |
---|
1287 | TEST_CI("", ":*=\\tA*1Z\t", "\tAZ\t"); // special case (match empty input using '*'); test TAB conversion |
---|
1288 | |
---|
1289 | TEST_CI_ERROR_CONTAINS("", ":*=X*Y*(|wot)", "Unknown command 'wot'"); |
---|
1290 | TEST_CI_ERROR_CONTAINS("", ":*=X*Y*(nokey|len)", "can't read key 'nokey' (called w/o database item)"); |
---|
1291 | TEST_CI_ERROR_CONTAINS("", ":*=X*Y*(nokey)", "can't read key 'nokey' (called w/o database item)"); |
---|
1292 | |
---|
1293 | // test global database access also works w/o specific database element |
---|
1294 | TEST_CI("", "ali_name;\",\";sequence_type", "ali_16s,rna"); |
---|
1295 | TEST_CI("", "command(\"ali_name;\\\",\\\";sequence_type\")", "ali_16s,rna"); |
---|
1296 | |
---|
1297 | // empty+NULp commands: |
---|
1298 | TEST_CI("in", NULp, "in"); |
---|
1299 | TEST_CI("in", "", "in"); |
---|
1300 | TEST_CI("in", ":", "in"); |
---|
1301 | TEST_CI("in", "::", "in"); |
---|
1302 | |
---|
1303 | // empty+NULp commands: |
---|
1304 | TEST_CI("in", NULp, "in"); |
---|
1305 | TEST_CI("in", "", "in"); |
---|
1306 | TEST_CI("in", ":", "in"); |
---|
1307 | TEST_CI("in", "::", "in"); |
---|
1308 | } |
---|
1309 | |
---|
1310 | // register custom ACI commands |
---|
1311 | { |
---|
1312 | const GBL_command_lookup_table& stdCmds = ACI_get_standard_commands(); |
---|
1313 | |
---|
1314 | GBL_command_definition custom_cmds[] = { |
---|
1315 | { "custom", gbx_custom }, // new command 'custom' |
---|
1316 | { "upper", stdCmds.lookup("lower") }, // change meaning of lower .. |
---|
1317 | { "lower", stdCmds.lookup("upper") }, // .. and upper |
---|
1318 | |
---|
1319 | {NULp, NULp} |
---|
1320 | }; |
---|
1321 | |
---|
1322 | GBL_custom_command_lookup_table custom(custom_cmds, ARRAY_ELEMS(custom_cmds)-1, stdCmds, PERMIT_SUBSTITUTION); |
---|
1323 | |
---|
1324 | GBDATA * const gb_data = E.gbspecies(); |
---|
1325 | |
---|
1326 | GBL_env custom_env(E.gbmain(), NULp, custom); |
---|
1327 | GBL_call_env customCallEnv(gb_data, custom_env); |
---|
1328 | GBL_call_env callEnv(gb_data, base_env); |
---|
1329 | |
---|
1330 | // lookup overwritten commands: |
---|
1331 | TEST_EXPECT(custom.lookup("upper") == stdCmds.lookup("lower")); |
---|
1332 | TEST_EXPECT(custom.lookup("lower") == stdCmds.lookup("upper")); |
---|
1333 | |
---|
1334 | // test new commands: |
---|
1335 | TEST_CI_WITH_ENV ("abc", customCallEnv, "dd;custom;dd", "abc4711abc"); |
---|
1336 | TEST_CI_ERROR_CONTAINS("abc", "dd;custom;dd", "Unknown command 'custom'"); // unknown in standard environment |
---|
1337 | |
---|
1338 | // test overwritten commands: |
---|
1339 | TEST_CI_WITH_ENV("abcDEF,", customCallEnv, "dd;lower;upper", "abcDEF,ABCDEF,abcdef,"); |
---|
1340 | TEST_CI ("abcDEF,", "dd;lower;upper", "abcDEF,abcdef,ABCDEF,"); |
---|
1341 | } |
---|
1342 | } |
---|
1343 | |
---|
1344 | void TEST_GB_command_interpreter_4() { |
---|
1345 | ACI_test_env E; |
---|
1346 | GBL_env base_env(E.gbmain(), NULp); |
---|
1347 | |
---|
1348 | // execute ACI on species container (=GB_DB) in this section ------------------------------ |
---|
1349 | GBDATA * const gb_data = E.gbspecies(); |
---|
1350 | GBL_call_env callEnv(gb_data, base_env); |
---|
1351 | |
---|
1352 | TEST_CI("LcbReu40", "findspec(\"readdb (acc)\")", "X76328"); |
---|
1353 | TEST_CI("LcbFruct", "findspec(\"readdb (acc)\")", "X76330"); |
---|
1354 | TEST_CI("", "readdb(name)|findspec(\"readdb(acc)\")", "X76328"); |
---|
1355 | |
---|
1356 | TEST_CI("LcbReu40;lcbfruct", "split(\";\")|findspec(\"readdb(acc)\")|merge(\";\")", "X76328;X76330"); // usecase ("bring next-relatives info into name-independent format") |
---|
1357 | TEST_CI("X76328;x76330", "split(\";\")|findacc(\"readdb(name)\")|merge(\";\")", "LcbReu40;LcbFruct"); // perform opposite (tests 'findacc') |
---|
1358 | |
---|
1359 | TEST_CI ("", "findspec(\"invalid\")", ""); // does not execute command for unnamed item |
---|
1360 | TEST_CI_ERROR_CONTAINS("LcbReu40", "findspec(\"invalid\")", "Unknown command 'invalid'"); |
---|
1361 | TEST_CI_ERROR_CONTAINS("unknown", "findspec(\"invalid\")", "No species with name 'unknown' found"); |
---|
1362 | TEST_CI_ERROR_CONTAINS("unknown", "findacc(\"invalid\")", "No species with acc 'unknown' found"); |
---|
1363 | } |
---|
1364 | |
---|
1365 | #endif // UNIT_TESTS |
---|
1366 | |
---|