1 | // =============================================================== // |
---|
2 | // // |
---|
3 | // File : PARS_dtree.cxx // |
---|
4 | // Purpose : // |
---|
5 | // // |
---|
6 | // Institute of Microbiology (Technical University Munich) // |
---|
7 | // http://www.arb-home.de/ // |
---|
8 | // // |
---|
9 | // =============================================================== // |
---|
10 | |
---|
11 | #include "pars_dtree.hxx" |
---|
12 | #include "pars_main.hxx" |
---|
13 | #include "pars_debug.hxx" |
---|
14 | #include "ap_tree_nlen.hxx" |
---|
15 | #include "ap_main.hxx" |
---|
16 | |
---|
17 | #include <AP_seq_dna.hxx> |
---|
18 | #include <AP_seq_protein.hxx> |
---|
19 | #include <AP_filter.hxx> |
---|
20 | |
---|
21 | #include <ColumnStat.hxx> |
---|
22 | #include <awt_sel_boxes.hxx> |
---|
23 | #include <awt_filter.hxx> |
---|
24 | |
---|
25 | #include <gui_aliview.hxx> |
---|
26 | |
---|
27 | #include <aw_preset.hxx> |
---|
28 | #include <aw_awar.hxx> |
---|
29 | #include <aw_msg.hxx> |
---|
30 | #include <arb_progress.h> |
---|
31 | #include <aw_root.hxx> |
---|
32 | #include <aw_question.hxx> |
---|
33 | |
---|
34 | static void AWT_graphic_parsimony_root_changed(void *cd, AP_tree *old, AP_tree *newroot) { |
---|
35 | AWT_graphic_tree *agt = (AWT_graphic_tree*)cd; // @@@ dynacast? |
---|
36 | UNCOVERED(); |
---|
37 | |
---|
38 | if (old == agt->displayed_root) agt->displayed_root = newroot; |
---|
39 | } |
---|
40 | |
---|
41 | static AliView *pars_generate_aliview(WeightedFilter *pars_weighted_filter) { |
---|
42 | GBDATA *gb_main = pars_weighted_filter->get_gb_main(); |
---|
43 | char *ali_name; |
---|
44 | { |
---|
45 | GB_transaction ta(gb_main); |
---|
46 | ali_name = GBT_read_string(gb_main, AWAR_ALIGNMENT); |
---|
47 | } |
---|
48 | GB_ERROR error = NULL; |
---|
49 | AliView *aliview = pars_weighted_filter->create_aliview(ali_name, error); |
---|
50 | if (!aliview) aw_popup_exit(error); |
---|
51 | free(ali_name); |
---|
52 | return aliview; |
---|
53 | } |
---|
54 | |
---|
55 | void PARS_tree_init(AWT_graphic_parsimony *agt) { |
---|
56 | ap_assert(agt->get_root_node()); |
---|
57 | ap_assert(agt == ap_main->get_graphic_tree()); |
---|
58 | |
---|
59 | GBDATA *gb_main = ap_main->get_gb_main(); |
---|
60 | GB_transaction ta(gb_main); |
---|
61 | |
---|
62 | const char *use = ap_main->get_aliname(); |
---|
63 | long ali_len = GBT_get_alignment_len(gb_main, use); |
---|
64 | if (ali_len <= 1) { |
---|
65 | aw_popup_exit("No valid alignment selected! Try again"); |
---|
66 | } |
---|
67 | |
---|
68 | agt->get_tree_root()->set_root_changed_callback(AWT_graphic_parsimony_root_changed, agt); |
---|
69 | } |
---|
70 | |
---|
// Evaluates the quadratic polynomial  y = a*x^2 + b*x + c.
//
// wert       : x
// param_list : coefficients { a, b, c }
// param_anz  : number of entries in param_list; has to be 3
//
// Returns y. With a wrong parameter count the function asserts and returns 0.
static double funktion_quadratisch(double wert, double *param_list, int param_anz) {
    if (param_anz == 3) {
        const double a = param_list[0];
        const double b = param_list[1];
        const double c = param_list[2];

        return wert * wert * a + wert * b + c;
    }

    ap_assert(0); // wrong number of parameters
    return 0;
}
---|
78 | |
---|
79 | |
---|
80 | void ArbParsimony::kernighan_optimize_tree(AP_tree *at) { |
---|
81 | GBDATA *gb_main = ap_main->get_gb_main(); |
---|
82 | GB_push_transaction(gb_main); |
---|
83 | |
---|
84 | long prevCombineCount = AP_sequence::combine_count(); |
---|
85 | |
---|
86 | AP_FLOAT pars_start = get_root_node()->costs(); |
---|
87 | const AP_FLOAT pars_org = pars_start; |
---|
88 | |
---|
89 | int rek_deep_max = *GBT_read_int(gb_main, "genetic/kh/maxdepth"); |
---|
90 | |
---|
91 | AP_KL_FLAG funktype = (AP_KL_FLAG)*GBT_read_int(gb_main, "genetic/kh/function_type"); |
---|
92 | |
---|
93 | int param_anz; |
---|
94 | double param_list[3]; |
---|
95 | |
---|
96 | double f_max_deep = (double)rek_deep_max; |
---|
97 | double f_startx = (double)*GBT_read_int(gb_main, "genetic/kh/dynamic/start"); |
---|
98 | double f_maxy = (double)*GBT_read_int(gb_main, "genetic/kh/dynamic/maxy"); |
---|
99 | double f_maxx = (double)*GBT_read_int(gb_main, "genetic/kh/dynamic/maxx"); |
---|
100 | |
---|
101 | double (*funktion)(double wert, double *param_list, int param_anz); |
---|
102 | switch (funktype) { |
---|
103 | default: |
---|
104 | case AP_QUADRAT_START: |
---|
105 | funktion = funktion_quadratisch; |
---|
106 | param_anz = 3; |
---|
107 | param_list[2] = f_startx; |
---|
108 | param_list[0] = (f_startx - f_maxy) / (f_maxx * f_maxx); |
---|
109 | param_list[1] = -2.0 * param_list[0] * f_maxx; |
---|
110 | break; |
---|
111 | case AP_QUADRAT_MAX: // parameter liste fuer quadratische gleichung (y =ax^2 +bx +c) |
---|
112 | funktion = funktion_quadratisch; |
---|
113 | param_anz = 3; |
---|
114 | param_list[0] = - f_maxy / ((f_max_deep - f_maxx) * (f_max_deep - f_maxx)); |
---|
115 | param_list[1] = -2.0 * param_list[0] * f_maxx; |
---|
116 | param_list[2] = f_maxy + param_list[0] * f_maxx * f_maxx; |
---|
117 | break; |
---|
118 | } |
---|
119 | |
---|
120 | |
---|
121 | AP_KL_FLAG searchflag=(AP_KL_FLAG)0; |
---|
122 | if (*GBT_read_int(gb_main, "genetic/kh/dynamic/enable")) { |
---|
123 | searchflag = AP_DYNAMIK; |
---|
124 | } |
---|
125 | if (*GBT_read_int(gb_main, "genetic/kh/static/enable")) { |
---|
126 | searchflag = (AP_KL_FLAG)(searchflag|AP_STATIC); |
---|
127 | } |
---|
128 | |
---|
129 | int rek_breite[8]; |
---|
130 | rek_breite[0] = *GBT_read_int(gb_main, "genetic/kh/static/depth0"); |
---|
131 | rek_breite[1] = *GBT_read_int(gb_main, "genetic/kh/static/depth1"); |
---|
132 | rek_breite[2] = *GBT_read_int(gb_main, "genetic/kh/static/depth2"); |
---|
133 | rek_breite[3] = *GBT_read_int(gb_main, "genetic/kh/static/depth3"); |
---|
134 | rek_breite[4] = *GBT_read_int(gb_main, "genetic/kh/static/depth4"); |
---|
135 | int rek_breite_anz = 5; |
---|
136 | |
---|
137 | int anzahl = (int)(*GBT_read_float(gb_main, "genetic/kh/nodes")*at->count_leafs()); |
---|
138 | AP_tree **list = at->getRandomNodes(anzahl); |
---|
139 | |
---|
140 | arb_progress progress(anzahl); |
---|
141 | |
---|
142 | progress.subtitle(GBS_global_string("Old Parsimony: %.1f", pars_start)); |
---|
143 | |
---|
144 | GB_pop_transaction(gb_main); |
---|
145 | |
---|
146 | for (int i=0; i<anzahl && !progress.aborted(); i++) { |
---|
147 | AP_tree_nlen *tree_elem = DOWNCAST(AP_tree_nlen*, list[i]); // @@@ pass 'at' as AP_tree_nlen |
---|
148 | |
---|
149 | bool in_folded_group = tree_elem->gr.hidden || |
---|
150 | (tree_elem->father && tree_elem->get_father()->gr.hidden); |
---|
151 | |
---|
152 | if (!in_folded_group) { |
---|
153 | bool better_tree_found = false; |
---|
154 | ap_main->remember(); |
---|
155 | display_clear(funktion, param_list, param_anz, (int)pars_start, (int)rek_deep_max); |
---|
156 | |
---|
157 | tree_elem->kernighan_rek(0, |
---|
158 | rek_breite, rek_breite_anz, rek_deep_max, |
---|
159 | funktion, param_list, param_anz, |
---|
160 | pars_start, pars_start, pars_org, |
---|
161 | searchflag, &better_tree_found); |
---|
162 | |
---|
163 | if (better_tree_found) { |
---|
164 | ap_main->accept(); |
---|
165 | pars_start = get_root_node()->costs(); |
---|
166 | progress.subtitle(GBS_global_string("New parsimony: %.1f (gain: %.1f)", pars_start, pars_org-pars_start)); |
---|
167 | } |
---|
168 | else { |
---|
169 | ap_main->revert(); |
---|
170 | } |
---|
171 | } |
---|
172 | progress.inc(); |
---|
173 | } |
---|
174 | delete [] list; |
---|
175 | printf("Combines: %li\n", AP_sequence::combine_count()-prevCombineCount); |
---|
176 | } |
---|
177 | |
---|
178 | |
---|
179 | |
---|
180 | void ArbParsimony::optimize_tree(AP_tree *at, arb_progress& progress) { |
---|
181 | AP_tree *oldrootleft = get_root_node()->get_leftson(); |
---|
182 | AP_tree *oldrootright = get_root_node()->get_rightson(); |
---|
183 | const AP_FLOAT org_pars = get_root_node()->costs(); |
---|
184 | AP_FLOAT prev_pars = org_pars; |
---|
185 | |
---|
186 | progress.subtitle(GBS_global_string("Old parsimony: %.1f", org_pars)); |
---|
187 | |
---|
188 | while (!progress.aborted()) { |
---|
189 | AP_FLOAT nni_pars = DOWNCAST(AP_tree_nlen*, at)->nn_interchange_rek(-1, AP_BL_NNI_ONLY, false); |
---|
190 | |
---|
191 | if (nni_pars == prev_pars) { // NNI did not reduce costs -> kern-lin |
---|
192 | kernighan_optimize_tree(at); |
---|
193 | AP_FLOAT ker_pars = get_root_node()->costs(); |
---|
194 | if (ker_pars == prev_pars) break; // kern-lin did not improve tree -> done |
---|
195 | prev_pars = ker_pars; |
---|
196 | } |
---|
197 | else { |
---|
198 | prev_pars = nni_pars; |
---|
199 | } |
---|
200 | progress.subtitle(GBS_global_string("New parsimony: %.1f (gain: %.1f)", prev_pars, org_pars-prev_pars)); |
---|
201 | } |
---|
202 | |
---|
203 | if (oldrootleft->father == oldrootright) oldrootleft->set_root(); |
---|
204 | else oldrootright->set_root(); |
---|
205 | |
---|
206 | get_root_node()->costs(); |
---|
207 | } |
---|
208 | |
---|
209 | AWT_graphic_parsimony::AWT_graphic_parsimony(ArbParsimony& parsimony_, GBDATA *gb_main_, AD_map_viewer_cb map_viewer_cb_) |
---|
210 | : AWT_graphic_tree(AW_root::SINGLETON, gb_main_, map_viewer_cb_), |
---|
211 | parsimony(parsimony_) |
---|
212 | {} |
---|
213 | |
---|
214 | AP_tree_root *AWT_graphic_parsimony::create_tree_root(RootedTreeNodeFactory *nodeMaker_, AliView *aliview, AP_sequence *seq_prototype, bool insert_delete_cbs) { |
---|
215 | return new AP_pars_root(aliview, nodeMaker_, seq_prototype, insert_delete_cbs); |
---|
216 | } |
---|
217 | |
---|
218 | |
---|
219 | void ArbParsimony::generate_tree(WeightedFilter *pars_weighted_filter) { |
---|
220 | AliView *aliview = pars_generate_aliview(pars_weighted_filter); |
---|
221 | AP_sequence *seq_templ = 0; |
---|
222 | |
---|
223 | GBDATA *gb_main = aliview->get_gb_main(); |
---|
224 | { |
---|
225 | GB_transaction ta(gb_main); |
---|
226 | bool is_aa = GBT_is_alignment_protein(gb_main, aliview->get_aliname()); |
---|
227 | |
---|
228 | if (is_aa) seq_templ = new AP_sequence_protein(aliview); |
---|
229 | else seq_templ = new AP_sequence_parsimony(aliview); |
---|
230 | } |
---|
231 | |
---|
232 | AWT_graphic_parsimony *new_tree = new AWT_graphic_parsimony(*this, aliview->get_gb_main(), PARS_map_viewer); |
---|
233 | new_tree->init(new AP_TreeNlenNodeFactory, aliview, seq_templ, true, false); |
---|
234 | set_tree(new_tree); |
---|
235 | } |
---|
236 | |
---|
237 | AW_gc_manager AWT_graphic_parsimony::init_devices(AW_window *aww, AW_device *device, AWT_canvas* ntw) { |
---|
238 | AW_init_color_group_defaults("arb_pars"); |
---|
239 | |
---|
240 | AW_gc_manager gc_manager = |
---|
241 | AW_manage_GC(aww, |
---|
242 | ntw->get_gc_base_name(), |
---|
243 | device, AWT_GC_CURSOR, AWT_GC_MAX, /* AWT_GC_CURSOR+7, */ AW_GCM_DATA_AREA, |
---|
244 | makeWindowCallback(AWT_resize_cb, ntw), |
---|
245 | true, // uses color groups |
---|
246 | "#AAAA55", |
---|
247 | |
---|
248 | // Important note : |
---|
249 | // Many gc indices are shared between ABR_NTREE and ARB_PARSIMONY |
---|
250 | // e.g. the tree drawing routines use same gc's for drawing both trees |
---|
251 | // (check AWT_dtree.cxx AWT_graphic_tree::init_devices) |
---|
252 | |
---|
253 | "Cursor$#FFFFFF", |
---|
254 | "Branch remarks$#DBE994", |
---|
255 | "+-Bootstrap$#DBE994", "-B.(limited)$white", |
---|
256 | "--unused$#ff0000", |
---|
257 | "Marked$#FFFF00", |
---|
258 | "Some marked$#eeee88", |
---|
259 | "Not marked$black", |
---|
260 | "Zombies etc.$#cc5924", |
---|
261 | |
---|
262 | "--unused", "--unused", // these reserve the numbers which are used for probe colors in ARB_NTREE |
---|
263 | "--unused", "--unused", // (this is necessary because ARB_PARS and ARB_NTREE use the same tree painting routines) |
---|
264 | "--unused", "--unused", |
---|
265 | "--unused", "--unused", |
---|
266 | |
---|
267 | NULL); |
---|
268 | return gc_manager; |
---|
269 | } |
---|
270 | |
---|
271 | void AWT_graphic_parsimony::show(AW_device *device) { |
---|
272 | AP_tree_nlen *root_node = parsimony.get_root_node(); |
---|
273 | AW_awar *awar_pars = aw_root->awar(AWAR_PARSIMONY); |
---|
274 | AW_awar *awar_best = aw_root->awar(AWAR_BEST_PARSIMONY); |
---|
275 | |
---|
276 | long parsval = root_node ? root_node->costs() : 0; |
---|
277 | awar_pars->write_int(parsval); |
---|
278 | |
---|
279 | long best_pars = awar_best->read_int(); |
---|
280 | if (parsval < best_pars || 0==best_pars) awar_best->write_int(parsval); |
---|
281 | |
---|
282 | AWT_graphic_tree::show(device); |
---|
283 | } |
---|
284 | |
---|
285 | void AWT_graphic_parsimony::handle_command(AW_device *device, AWT_graphic_event& event) { |
---|
286 | ClickedTarget clicked(this, event.best_click()); |
---|
287 | bool recalc_branchlengths_on_structure_change = true; |
---|
288 | |
---|
289 | switch (event.cmd()) { |
---|
290 | // @@@ something is designed completely wrong here! |
---|
291 | // why do all commands close TA and reopen when done? |
---|
292 | |
---|
293 | case AWT_MODE_NNI: |
---|
294 | if (event.type()==AW_Mouse_Press) { |
---|
295 | GB_pop_transaction(gb_main); |
---|
296 | switch (event.button()) { |
---|
297 | case AW_BUTTON_LEFT: { |
---|
298 | if (clicked.node()) { |
---|
299 | arb_progress progress("NNI optimize subtree"); |
---|
300 | AP_tree_nlen *atn = DOWNCAST(AP_tree_nlen*, clicked.node()); |
---|
301 | atn->nn_interchange_rek(-1, AP_BL_NNI_ONLY, false); |
---|
302 | exports.save = 1; |
---|
303 | ASSERT_VALID_TREE(get_root_node()); |
---|
304 | } |
---|
305 | break; |
---|
306 | } |
---|
307 | case AW_BUTTON_RIGHT: { |
---|
308 | arb_progress progress("NNI optimize tree"); |
---|
309 | long prevCombineCount = AP_sequence::combine_count(); |
---|
310 | |
---|
311 | AP_tree_nlen *atn = DOWNCAST(AP_tree_nlen*, get_root_node()); |
---|
312 | atn->nn_interchange_rek(-1, AP_BL_NNI_ONLY, false); |
---|
313 | printf("Combines: %li\n", AP_sequence::combine_count()-prevCombineCount); |
---|
314 | |
---|
315 | exports.save = 1; |
---|
316 | ASSERT_VALID_TREE(get_root_node()); |
---|
317 | break; |
---|
318 | } |
---|
319 | |
---|
320 | default: break; |
---|
321 | } |
---|
322 | GB_begin_transaction(gb_main); |
---|
323 | } |
---|
324 | break; |
---|
325 | case AWT_MODE_KERNINGHAN: |
---|
326 | if (event.type()==AW_Mouse_Press) { |
---|
327 | GB_pop_transaction(gb_main); |
---|
328 | switch (event.button()) { |
---|
329 | case AW_BUTTON_LEFT: |
---|
330 | if (clicked.node()) { |
---|
331 | arb_progress progress("Kernighan-Lin optimize subtree"); |
---|
332 | parsimony.kernighan_optimize_tree(clicked.node()); |
---|
333 | this->exports.save = 1; |
---|
334 | ASSERT_VALID_TREE(get_root_node()); |
---|
335 | } |
---|
336 | break; |
---|
337 | case AW_BUTTON_RIGHT: { |
---|
338 | arb_progress progress("Kernighan-Lin optimize tree"); |
---|
339 | parsimony.kernighan_optimize_tree(get_root_node()); |
---|
340 | this->exports.save = 1; |
---|
341 | ASSERT_VALID_TREE(get_root_node()); |
---|
342 | break; |
---|
343 | } |
---|
344 | default: break; |
---|
345 | } |
---|
346 | GB_begin_transaction(gb_main); |
---|
347 | } |
---|
348 | break; |
---|
349 | case AWT_MODE_OPTIMIZE: |
---|
350 | if (event.type()==AW_Mouse_Press) { |
---|
351 | GB_pop_transaction(gb_main); |
---|
352 | switch (event.button()) { |
---|
353 | case AW_BUTTON_LEFT: |
---|
354 | if (clicked.node()) { |
---|
355 | arb_progress progress("Optimizing subtree"); |
---|
356 | parsimony.optimize_tree(clicked.node(), progress); |
---|
357 | this->exports.save = 1; |
---|
358 | ASSERT_VALID_TREE(get_root_node()); |
---|
359 | } |
---|
360 | break; |
---|
361 | case AW_BUTTON_RIGHT: { |
---|
362 | arb_progress progress("Optimizing tree"); |
---|
363 | |
---|
364 | parsimony.optimize_tree(get_root_node(), progress); |
---|
365 | this->exports.save = 1; |
---|
366 | ASSERT_VALID_TREE(get_root_node()); |
---|
367 | break; |
---|
368 | } |
---|
369 | default: break; |
---|
370 | } |
---|
371 | GB_begin_transaction(gb_main); |
---|
372 | } |
---|
373 | break; |
---|
374 | |
---|
375 | default: |
---|
376 | recalc_branchlengths_on_structure_change = false; |
---|
377 | // fall-through (modes listed below trigger branchlength calculation) |
---|
378 | case AWT_MODE_MOVE: |
---|
379 | AWT_graphic_tree::handle_command(device, event); |
---|
380 | break; |
---|
381 | } |
---|
382 | |
---|
383 | if (exports.save == 1 && recalc_branchlengths_on_structure_change) { |
---|
384 | arb_progress progress("Recalculating branch lengths"); |
---|
385 | rootEdge()->calc_branchlengths(); |
---|
386 | reorder_tree(BIG_BRANCHES_TO_TOP); // beautify after recalc_branch_lengths |
---|
387 | } |
---|
388 | } |
---|
389 | |
---|
390 | |
---|
391 | // -------------------------------------------------------------------------------- |
---|
392 | |
---|
393 | #ifdef UNIT_TESTS |
---|
394 | #include <arb_diff.h> |
---|
395 | #include <test_unit.h> |
---|
396 | #include "test_env.h" |
---|
397 | |
---|
398 | template<typename SEQTYPE> |
---|
399 | PARSIMONY_testenv<SEQTYPE>::PARSIMONY_testenv(const char *dbname, const char *aliName) |
---|
400 | : parsimony() |
---|
401 | { |
---|
402 | common_init(dbname); |
---|
403 | GBDATA *gb_main = ap_main->get_gb_main(); |
---|
404 | GB_transaction ta(gb_main); |
---|
405 | size_t aliLength = GBT_get_alignment_len(gb_main, aliName); |
---|
406 | |
---|
407 | AP_filter filter(aliLength); |
---|
408 | if (!filter.is_invalid()) { |
---|
409 | AP_weights weights(&filter); |
---|
410 | agt->init(new AliView(gb_main, filter, weights, aliName)); |
---|
411 | } |
---|
412 | } |
---|
413 | |
---|
414 | template PARSIMONY_testenv<AP_sequence_protein>::PARSIMONY_testenv(const char *dbname, const char *aliName); // explicit instanciation (otherwise link error in unittest) |
---|
415 | |
---|
416 | |
---|
417 | void TEST_basic_tree_modifications() { |
---|
418 | PARSIMONY_testenv<AP_sequence_parsimony> env("TEST_trees.arb"); |
---|
419 | TEST_EXPECT_NO_ERROR(env.load_tree("tree_test")); |
---|
420 | |
---|
421 | { |
---|
422 | AP_tree_nlen *root = env.root_node(); |
---|
423 | root->compute_tree(); |
---|
424 | |
---|
425 | // first check initial state: |
---|
426 | { |
---|
427 | AP_tree_members& root_info = root->gr; |
---|
428 | |
---|
429 | TEST_EXPECT_EQUAL(root_info.grouped, 0); |
---|
430 | TEST_EXPECT_EQUAL(root_info.hidden, 0); |
---|
431 | TEST_EXPECT_EQUAL(root_info.has_marked_children, 1); |
---|
432 | TEST_EXPECT_EQUAL(root_info.leaf_sum, 15); |
---|
433 | |
---|
434 | TEST_EXPECT_SIMILAR(root_info.max_tree_depth, 1.624975, 0.000001); |
---|
435 | TEST_EXPECT_SIMILAR(root_info.min_tree_depth, 0.341681, 0.000001); |
---|
436 | |
---|
437 | GB_transaction ta(env.gbmain()); |
---|
438 | GBT_mark_all(env.gbmain(), 0); // unmark all species |
---|
439 | root->compute_tree(); |
---|
440 | TEST_EXPECT_EQUAL(root_info.has_marked_children, 0); |
---|
441 | } |
---|
442 | |
---|
443 | |
---|
444 | #define B1_TOP "(((((CloTyro3:1.046,CloTyro4:0.061):0.026,CloTyro2:0.017):0.017,CloTyrob:0.009):0.274,CloInnoc:0.371):0.057,CloBifer:0.388):0.124" |
---|
445 | #define B1_BOT "(CloBifer:0.388,(CloInnoc:0.371,(CloTyrob:0.009,(CloTyro2:0.017,(CloTyro3:1.046,CloTyro4:0.061):0.026):0.017):0.274):0.057):0.124" |
---|
446 | #define B2_TOP "(((CloButy2:0.009,CloButyr:0.000):0.564,CloCarni:0.120):0.010,CloPaste:0.179):0.131" |
---|
447 | #define B2_BOT "(CloPaste:0.179,(CloCarni:0.120,(CloButy2:0.009,CloButyr:0.000):0.564):0.010):0.131" |
---|
448 | |
---|
449 | |
---|
450 | #define B3_LEFT_TOP_SONS "(((CorAquat:0.084,CurCitre:0.058):0.103,CorGluta:0.522):0.053,CelBiazo:0.059)" |
---|
451 | #define B3_TOP_SONS B3_LEFT_TOP_SONS ":0.207,CytAquat:0.711" |
---|
452 | #define B3_TOP_SONS_CCR "((CorAquat:0.187,CorGluta:0.522):0.053,CelBiazo:0.059):0.207,CytAquat:0.711" // CCR = CurCitre removed |
---|
453 | #define B3_TOP "(" B3_TOP_SONS "):0.081" |
---|
454 | #define B3_BOT "(CytAquat:0.711,(CelBiazo:0.059,(CorGluta:0.522,(CorAquat:0.084,CurCitre:0.058):0.103):0.053):0.207):0.081" |
---|
455 | |
---|
456 | |
---|
457 | const char *top_topo = "((" B1_TOP "," B2_TOP "):0.081," B3_TOP ");"; |
---|
458 | const char *edge_topo = "((" B1_TOP "," B2_BOT "):0.081," B3_BOT ");"; |
---|
459 | const char *bottom_topo = "(" B3_BOT ",(" B2_BOT "," B1_BOT "):0.081);"; |
---|
460 | |
---|
461 | const char *radial_topo = |
---|
462 | "(((CloPaste:0.179,((CloButy2:0.009,CloButyr:0.000):0.564,CloCarni:0.120):0.010):0.131," |
---|
463 | "((CloInnoc:0.371,((CloTyro2:0.017,(CloTyro3:1.046,CloTyro4:0.061):0.026):0.017,CloTyrob:0.009):0.274):0.057,CloBifer:0.388):0.124):0.081," |
---|
464 | "((CelBiazo:0.059,((CorAquat:0.084,CurCitre:0.058):0.103,CorGluta:0.522):0.053):0.207,CytAquat:0.711):0.081);"; |
---|
465 | const char *radial_topo2 = |
---|
466 | "(((CloBifer:0.388,(CloInnoc:0.371,(((CloTyro3:1.046,CloTyro4:0.061):0.026,CloTyro2:0.017):0.017,CloTyrob:0.009):0.274):0.057):0.124," B2_TOP "):0.081," |
---|
467 | "(CytAquat:0.711," B3_LEFT_TOP_SONS ":0.207):0.081);"; |
---|
468 | |
---|
469 | // expect that no mode reproduces another mode: |
---|
470 | TEST_EXPECT_DIFFERENT(top_topo, edge_topo); |
---|
471 | TEST_EXPECT_DIFFERENT(top_topo, bottom_topo); |
---|
472 | TEST_EXPECT_DIFFERENT(top_topo, radial_topo); |
---|
473 | TEST_EXPECT_DIFFERENT(top_topo, radial_topo2); |
---|
474 | TEST_EXPECT_DIFFERENT(edge_topo, bottom_topo); |
---|
475 | TEST_EXPECT_DIFFERENT(edge_topo, radial_topo); |
---|
476 | TEST_EXPECT_DIFFERENT(edge_topo, radial_topo2); |
---|
477 | TEST_EXPECT_DIFFERENT(bottom_topo, radial_topo); |
---|
478 | TEST_EXPECT_DIFFERENT(bottom_topo, radial_topo2); |
---|
479 | TEST_EXPECT_DIFFERENT(radial_topo, radial_topo2); |
---|
480 | |
---|
481 | env.push(); // 1st stack level (=top_topo) |
---|
482 | |
---|
483 | TEST_ASSERT_VALID_TREE(root); |
---|
484 | |
---|
485 | TEST_EXPECT_NEWICK(nLENGTH, root, top_topo); |
---|
486 | // test reorder_tree: |
---|
487 | root->reorder_tree(BIG_BRANCHES_TO_EDGE); TEST_EXPECT_NEWICK(nLENGTH, root, edge_topo); env.push(); // 2nd stack level (=edge_topo) |
---|
488 | root->reorder_tree(BIG_BRANCHES_TO_BOTTOM); TEST_EXPECT_NEWICK(nLENGTH, root, bottom_topo); env.push(); // 3rd stack level (=bottom_topo) |
---|
489 | root->reorder_tree(BIG_BRANCHES_TO_CENTER); TEST_EXPECT_NEWICK(nLENGTH, root, radial_topo); |
---|
490 | root->reorder_tree(BIG_BRANCHES_ALTERNATING); TEST_EXPECT_NEWICK(nLENGTH, root, radial_topo2); |
---|
491 | root->reorder_tree(BIG_BRANCHES_TO_TOP); TEST_EXPECT_NEWICK(nLENGTH, root, top_topo); |
---|
492 | |
---|
493 | TEST_ASSERT_VALID_TREE(root); |
---|
494 | |
---|
495 | // test set root: |
---|
496 | AP_tree_nlen *CloTyrob = root->findLeafNamed("CloTyrob"); |
---|
497 | TEST_REJECT_NULL(CloTyrob); |
---|
498 | |
---|
499 | ARB_edge rootEdge(root->get_leftson(), root->get_rightson()); |
---|
500 | CloTyrob->set_root(); |
---|
501 | |
---|
502 | TEST_ASSERT_VALID_TREE(root); |
---|
503 | |
---|
504 | const char *rootAtCloTyrob_topo = |
---|
505 | "(CloTyrob:0.004," |
---|
506 | "(((CloTyro3:1.046,CloTyro4:0.061):0.026,CloTyro2:0.017):0.017," |
---|
507 | "((((" B3_TOP_SONS "):0.162," B2_TOP "):0.124,CloBifer:0.388):0.057,CloInnoc:0.371):0.274):0.004);"; |
---|
508 | |
---|
509 | TEST_EXPECT_NEWICK(nLENGTH, root, rootAtCloTyrob_topo); |
---|
510 | env.push(); // 4th stack level (=rootAtCloTyrob_topo) |
---|
511 | |
---|
512 | TEST_ASSERT_VALID_TREE(root); |
---|
513 | |
---|
514 | AP_tree_nlen *CelBiazoFather = root->findLeafNamed("CelBiazo")->get_father(); |
---|
515 | TEST_REJECT_NULL(CelBiazoFather); |
---|
516 | CelBiazoFather->set_root(); |
---|
517 | |
---|
518 | const char *rootAtCelBiazoFather_topo = "(" B3_LEFT_TOP_SONS ":0.104,((" B1_TOP "," B2_TOP "):0.162,CytAquat:0.711):0.104);"; |
---|
519 | TEST_EXPECT_NEWICK(nLENGTH, root, rootAtCelBiazoFather_topo); |
---|
520 | |
---|
521 | TEST_ASSERT_VALID_TREE(root); |
---|
522 | |
---|
523 | ARB_edge oldRootEdge(rootEdge.source(), rootEdge.dest()); |
---|
524 | DOWNCAST(AP_tree_nlen*,oldRootEdge.son())->set_root(); |
---|
525 | |
---|
526 | const char *rootSetBack_topo = top_topo; |
---|
527 | TEST_EXPECT_NEWICK(nLENGTH, root, rootSetBack_topo); |
---|
528 | env.push(); // 5th stack level (=rootSetBack_topo) |
---|
529 | |
---|
530 | TEST_ASSERT_VALID_TREE(root); |
---|
531 | |
---|
532 | // test remove: |
---|
533 | AP_tree_nlen *CurCitre = root->findLeafNamed("CurCitre"); |
---|
534 | TEST_REJECT_NULL(CurCitre); |
---|
535 | TEST_REJECT_NULL(CurCitre->get_father()); |
---|
536 | |
---|
537 | CurCitre->remove(); |
---|
538 | const char *CurCitre_removed_topo = "((" B1_TOP "," B2_TOP "):0.081,(" B3_TOP_SONS_CCR "):0.081);"; |
---|
539 | // ------------------------------------------------------------------- ^^^ = B3_TOP_SONS minus CurCitre |
---|
540 | TEST_EXPECT_NEWICK(nLENGTH, root, CurCitre_removed_topo); |
---|
541 | |
---|
542 | TEST_ASSERT_VALID_TREE(root); |
---|
543 | TEST_ASSERT_VALID_TREE(CurCitre); |
---|
544 | |
---|
545 | TEST_EXPECT_EQUAL(root->gr.leaf_sum, 15); // out of date |
---|
546 | root->compute_tree(); |
---|
547 | TEST_EXPECT_EQUAL(root->gr.leaf_sum, 14); |
---|
548 | |
---|
549 | env.push(); // 6th stack level (=CurCitre_removed_topo) |
---|
550 | |
---|
551 | TEST_ASSERT_VALID_TREE(root); |
---|
552 | |
---|
553 | // test insert: |
---|
554 | AP_tree_nlen *CloCarni = root->findLeafNamed("CloCarni"); |
---|
555 | TEST_REJECT_NULL(CloCarni); |
---|
556 | CurCitre->insert(CloCarni); // this creates two extra edges (not destroyed by destroy() below) and one extra node |
---|
557 | |
---|
558 | const char *CurCitre_inserted_topo = "((" B1_TOP ",(((CloButy2:0.009,CloButyr:0.000):0.564,(CurCitre:0.060,CloCarni:0.060):0.060):0.010,CloPaste:0.179):0.131):0.081,(" B3_TOP_SONS_CCR "):0.081);"; |
---|
559 | TEST_EXPECT_NEWICK(nLENGTH, root, CurCitre_inserted_topo); |
---|
560 | |
---|
561 | AP_tree_nlen *node_del_manually = CurCitre->get_father(); |
---|
562 | AP_tree_edge *edge1_del_manually = CurCitre->edgeTo(node_del_manually); |
---|
563 | AP_tree_edge *edge2_del_manually = CurCitre->get_brother()->edgeTo(node_del_manually); |
---|
564 | |
---|
565 | TEST_ASSERT_VALID_TREE(root); |
---|
566 | |
---|
567 | // now check pops: |
---|
568 | env.pop(); TEST_EXPECT_NEWICK(nLENGTH, root, CurCitre_removed_topo); |
---|
569 | env.pop(); TEST_EXPECT_NEWICK(nLENGTH, root, rootSetBack_topo); |
---|
570 | env.pop(); TEST_EXPECT_NEWICK(nLENGTH, root, rootAtCloTyrob_topo); |
---|
571 | env.pop(); TEST_EXPECT_NEWICK(nLENGTH, root, bottom_topo); |
---|
572 | env.pop(); TEST_EXPECT_NEWICK(nLENGTH, root, edge_topo); |
---|
573 | env.pop(); TEST_EXPECT_NEWICK(nLENGTH, root, top_topo); |
---|
574 | |
---|
575 | TEST_ASSERT_VALID_TREE(root); |
---|
576 | |
---|
577 | // delete memory allocated by insert() above and lost due to pop()s |
---|
578 | delete edge1_del_manually; |
---|
579 | delete edge2_del_manually; |
---|
580 | |
---|
581 | node_del_manually->forget_origin(); |
---|
582 | node_del_manually->father = NULL; |
---|
583 | node_del_manually->leftson = NULL; |
---|
584 | node_del_manually->rightson = NULL; |
---|
585 | delete node_del_manually; |
---|
586 | } |
---|
587 | } |
---|
588 | |
---|
589 | // @@@ Tests wanted: |
---|
590 | // - NNI |
---|
591 | // - tree optimize |
---|
592 | // - ... |
---|
593 | |
---|
594 | void TEST_calc_bootstraps() { |
---|
595 | PARSIMONY_testenv<AP_sequence_parsimony> env("TEST_trees.arb", "ali_5s"); |
---|
596 | TEST_EXPECT_NO_ERROR(env.load_tree("tree_test")); |
---|
597 | |
---|
598 | const char *bs_origi_topo = "(((((((CloTyro3,CloTyro4)'40%',CloTyro2)'0%',CloTyrob)'97%',CloInnoc)'0%',CloBifer)'53%',(((CloButy2,CloButyr)'100%',CloCarni)'33%',CloPaste)'97%')'100%',((((CorAquat,CurCitre)'100%',CorGluta)'17%',CelBiazo)'40%',CytAquat)'100%');"; |
---|
599 | const char *bs_limit_topo = "(((((((CloTyro3,CloTyro4)'87%',CloTyro2)'0%',CloTyrob)'100%',CloInnoc)'87%',CloBifer)'83%',(((CloButy2,CloButyr)'99%',CloCarni)'17%',CloPaste)'56%')'61%',((((CorAquat,CurCitre)'78%',CorGluta)'0%',CelBiazo)'59%',CytAquat)'61%');"; |
---|
600 | const char *bs_estim_topo = "(((((((CloTyro3,CloTyro4)'75%',CloTyro2)'0%',CloTyrob)'100%',CloInnoc)'75%',CloBifer)'78%',(((CloButy2,CloButyr)'99%',CloCarni)'13%',CloPaste)'32%')'53%',((((CorAquat,CurCitre)'74%',CorGluta)'0%',CelBiazo)'56%',CytAquat)'53%');"; |
---|
601 | |
---|
602 | { |
---|
603 | AP_tree_nlen *root = env.root_node(); |
---|
604 | AP_tree_edge *root_edge = rootEdge(); |
---|
605 | |
---|
606 | TEST_EXPECT(root && rootEdge); |
---|
607 | |
---|
608 | root->reorder_tree(BIG_BRANCHES_TO_TOP); TEST_EXPECT_NEWICK(nREMARK, root, bs_origi_topo); |
---|
609 | |
---|
610 | TEST_EXPECT_EQUAL(env.combines_performed(), 0); |
---|
611 | root_edge->nni_rek(-1, false, AP_BL_MODE(AP_BL_BL_ONLY|AP_BL_BOOTSTRAP_LIMIT), NULL); root->reorder_tree(BIG_BRANCHES_TO_TOP); TEST_EXPECT_NEWICK(nREMARK, root, bs_limit_topo); |
---|
612 | TEST_EXPECT_EQUAL(env.combines_performed(), 214); |
---|
613 | root_edge->nni_rek(-1, false, AP_BL_MODE(AP_BL_BL_ONLY|AP_BL_BOOTSTRAP_ESTIMATE), NULL); root->reorder_tree(BIG_BRANCHES_TO_TOP); TEST_EXPECT_NEWICK(nREMARK, root, bs_estim_topo); |
---|
614 | TEST_EXPECT_EQUAL(env.combines_performed(), 200); |
---|
615 | |
---|
616 | TEST_EXPECT_EQUAL(env.root_node(), root); |
---|
617 | } |
---|
618 | |
---|
619 | } |
---|
620 | |
---|
621 | void TEST_tree_remove_add_all() { |
---|
622 | // reproduces crash as described in #527 |
---|
623 | PARSIMONY_testenv<AP_sequence_parsimony> env("TEST_trees.arb", "ali_5s"); |
---|
624 | TEST_EXPECT_NO_ERROR(env.load_tree("tree_nj")); |
---|
625 | |
---|
626 | const int LEAFS = 6; |
---|
627 | AP_tree_nlen *leaf[LEAFS]; |
---|
628 | const char *name[LEAFS] = { |
---|
629 | "CloButy2", |
---|
630 | "CloButyr", |
---|
631 | "CytAquat", |
---|
632 | "CorAquat", |
---|
633 | "CurCitre", |
---|
634 | "CorGluta", |
---|
635 | }; |
---|
636 | |
---|
637 | AP_tree_nlen *root = env.root_node(); |
---|
638 | |
---|
639 | for (int i = 0; i<LEAFS; ++i) { |
---|
640 | leaf[i] = root->findLeafNamed(name[i]); |
---|
641 | TEST_REJECT_NULL(leaf[i]); |
---|
642 | } |
---|
643 | |
---|
644 | TEST_ASSERT_VALID_TREE(root); |
---|
645 | |
---|
646 | AP_pars_root *troot = leaf[0]->get_tree_root(); |
---|
647 | TEST_REJECT_NULL(troot); |
---|
648 | |
---|
649 | // Note: following loop leaks father nodes and edges |
---|
650 | // suppressed in valgrind via ../SOURCE_TOOLS/arb.supp@TEST_tree_remove_add_all |
---|
651 | for (int i = 0; i<LEAFS-1; ++i) { // removing the second to last leaf, "removes" both remaining leafs |
---|
652 | TEST_ASSERT_VALID_TREE(root); |
---|
653 | leaf[i]->remove(); |
---|
654 | TEST_ASSERT_VALID_TREE(leaf[i]); |
---|
655 | } |
---|
656 | leaf[LEAFS-1]->father = NULL; // correct final leaf (not removed regularily) |
---|
657 | |
---|
658 | leaf[0]->initial_insert(leaf[1], troot); |
---|
659 | for (int i = 2; i<LEAFS; ++i) { |
---|
660 | TEST_ASSERT_VALID_TREE(leaf[i-1]); |
---|
661 | TEST_ASSERT_VALID_TREE(leaf[i]); |
---|
662 | leaf[i]->insert(leaf[i-1]); |
---|
663 | } |
---|
664 | } |
---|
665 | |
---|
666 | #endif // UNIT_TESTS |
---|
667 | |
---|
668 | // -------------------------------------------------------------------------------- |
---|