1 /*
2 * Copyright 2008-2009 Katholieke Universiteit Leuven
3 * Copyright 2010 INRIA Saclay
4 * Copyright 2016-2017 Sven Verdoolaege
5 *
6 * Use of this software is governed by the MIT license
7 *
8 * Written by Sven Verdoolaege, K.U.Leuven, Departement
9 * Computerwetenschappen, Celestijnenlaan 200A, B-3001 Leuven, Belgium
10 * and INRIA Saclay - Ile-de-France, Parc Club Orsay Universite,
11 * ZAC des vignes, 4 rue Jacques Monod, 91893 Orsay, France
12 */
13
14 #include <isl_ctx_private.h>
15 #include "isl_map_private.h"
16 #include <isl_seq.h>
17 #include "isl_tab.h"
18 #include "isl_sample.h"
19 #include <isl_mat_private.h>
20 #include <isl_vec_private.h>
21 #include <isl_aff_private.h>
22 #include <isl_constraint_private.h>
23 #include <isl_options_private.h>
24 #include <isl_config.h>
25
26 #include <bset_to_bmap.c>
27
28 /*
29 * The implementation of parametric integer linear programming in this file
30 * was inspired by the paper "Parametric Integer Programming" and the
31 * report "Solving systems of affine (in)equalities" by Paul Feautrier
32 * (and others).
33 *
34 * The strategy used for obtaining a feasible solution is different
35 * from the one used in isl_tab.c. In particular, in isl_tab.c,
36 * upon finding a constraint that is not yet satisfied, we pivot
37 * in a row that increases the constant term of the row holding the
38 * constraint, making sure the sample solution remains feasible
39 * for all the constraints it already satisfied.
40 * Here, we always pivot in the row holding the constraint,
41 * choosing a column that induces the lexicographically smallest
42 * increment to the sample solution.
43 *
44 * By starting out from a sample value that is lexicographically
45 * smaller than any integer point in the problem space, the first
46 * feasible integer sample point we find will also be the lexicographically
47 * smallest. If all variables can be assumed to be non-negative,
48 * then the initial sample value may be chosen equal to zero.
49 * However, we will not make this assumption. Instead, we apply
50 * the "big parameter" trick. Any variable x is then not directly
51 * used in the tableau, but instead it is represented by another
52 * variable x' = M + x, where M is an arbitrarily large (positive)
53 * value. x' is therefore always non-negative, whatever the value of x.
54 * Taking as initial sample value x' = 0 corresponds to x = -M,
55 * which is always smaller than any possible value of x.
56 *
57 * The big parameter trick is used in the main tableau and
58 * also in the context tableau if isl_context_lex is used.
 * In this case, each tableau has its own big parameter.
60 * Before doing any real work, we check if all the parameters
61 * happen to be non-negative. If so, we drop the column corresponding
62 * to M from the initial context tableau.
63 * If isl_context_gbr is used, then the big parameter trick is only
64 * used in the main tableau.
65 */
66
struct isl_context;
/* Table of operations that a specific context representation provides.
 * Every operation takes the context it operates on as an argument,
 * except for "discard", which only takes a previously saved state.
 */
struct isl_context_op {
	/* detect nonnegative parameters in context and mark them in tab */
	struct isl_tab *(*detect_nonnegative_parameters)(
			struct isl_context *context, struct isl_tab *tab);
	/* return temporary reference to basic set representation of context */
	struct isl_basic_set *(*peek_basic_set)(struct isl_context *context);
	/* return temporary reference to tableau representation of context */
	struct isl_tab *(*peek_tab)(struct isl_context *context);
	/* add equality; check is 1 if eq may not be valid;
	 * update is 1 if we may want to call ineq_sign on context later.
	 */
	void (*add_eq)(struct isl_context *context, isl_int *eq,
			int check, int update);
	/* add inequality; check is 1 if ineq may not be valid;
	 * update is 1 if we may want to call ineq_sign on context later.
	 */
	void (*add_ineq)(struct isl_context *context, isl_int *ineq,
			int check, int update);
	/* check sign of ineq based on previous information.
	 * strict is 1 if saturation should be treated as a positive sign.
	 */
	enum isl_tab_row_sign (*ineq_sign)(struct isl_context *context,
			isl_int *ineq, int strict);
	/* check if inequality maintains feasibility */
	int (*test_ineq)(struct isl_context *context, isl_int *ineq);
	/* return index of a div that corresponds to "div" */
	int (*get_div)(struct isl_context *context, struct isl_tab *tab,
			struct isl_vec *div);
	/* insert div "div" to context at "pos" and return non-negativity */
	isl_bool (*insert_div)(struct isl_context *context, int pos,
			__isl_keep isl_vec *div);
	/* NOTE(review): undocumented in the original; presumably detects
	 * equalities implied by the context and reflects them in "tab".
	 * Confirm against the implementations.
	 */
	int (*detect_equalities)(struct isl_context *context,
			struct isl_tab *tab);
	/* return row index of "best" split */
	int (*best_split)(struct isl_context *context, struct isl_tab *tab);
	/* check if context has already been determined to be empty */
	int (*is_empty)(struct isl_context *context);
	/* check if context is still usable */
	int (*is_ok)(struct isl_context *context);
	/* save a copy/snapshot of context */
	void *(*save)(struct isl_context *context);
	/* restore saved context */
	void (*restore)(struct isl_context *context, void *);
	/* discard saved context */
	void (*discard)(void *);
	/* invalidate context */
	void (*invalidate)(struct isl_context *context);
	/* free context */
	__isl_null struct isl_context *(*free)(struct isl_context *context);
};
118
/* Shared parts of context representation.
 *
 * "op" points to the table of operations of the specific
 * context representation.
 * "n_unknown" is the number of final unknown integer divisions
 * in the input domain.
 */
struct isl_context {
	struct isl_context_op *op;
	int n_unknown;
};
128
/* Context representation consisting of the shared "context" part,
 * stored as first member, and a tableau "tab".
 * As explained at the top of this file, the context tableau
 * may use its own big parameter when isl_context_lex is used.
 */
struct isl_context_lex {
	struct isl_context context;
	struct isl_tab *tab;
};
133
/* A stack (linked list) of solutions of subtrees of the search space.
 *
 * "level" is the level of the isl_sol at the time the partial solution
 * was pushed (or last combined with another partial solution).
 * "ma" describes the solution as a function of "dom".
 * In particular, the domain space of "ma" is equal to the space of "dom".
 *
 * If "ma" is NULL, then there is no solution on "dom".
 *
 * "next" points to the next element on the stack, if any.
 */
struct isl_partial_sol {
	int level;
	struct isl_basic_set *dom;
	isl_multi_aff *ma;

	struct isl_partial_sol *next;
};
148
struct isl_sol;
/* A tableau callback extended with a pointer to the isl_sol
 * on which it operates.
 * "callback" is the first member because sol_dec_level_wrap casts
 * the isl_tab_callback pointer it receives back to
 * a pointer to struct isl_sol_callback.
 */
struct isl_sol_callback {
	struct isl_tab_callback callback;
	struct isl_sol *sol;
};
154
/* isl_sol is an interface for constructing a solution to
 * a parametric integer linear programming problem.
 * Every time the algorithm reaches a state where a solution
 * can be read off from the tableau, the function "add" is called
 * on the isl_sol passed to find_solutions_main.  In a state where
 * the tableau is empty, "add_empty" is called instead.
 * "free" is called to free the implementation specific fields, if any.
 *
 * "error" is set if some error has occurred.  This flag invalidates
 * the remainder of the data structure.
 * If "rational" is set, then a rational optimization is being performed.
 * "level" is the current level in the tree with nodes for each
 * split in the context.
 * If "max" is set, then a maximization problem is being solved, rather than
 * a minimization problem, which means that the variables in the
 * tableau have value "M - x" rather than "M + x".
 * "n_out" is the number of output dimensions in the input.
 * "space" is the space in which the solution (and also the input) lives.
 *
 * The context tableau is owned by isl_sol and is updated incrementally.
 *
 * "partial" is the stack of partial solutions that have been pushed
 * but not yet passed on to "add" or "add_empty".
 * "dec_level" is the callback that sol_inc_level pushes onto
 * the context tableau.
 *
 * There are currently two implementations of this interface,
 * isl_sol_map, which simply collects the solutions in an isl_map
 * and (optionally) the parts of the context where there is no solution
 * in an isl_set, and
 * isl_sol_pma, which collects an isl_pw_multi_aff instead.
 */
struct isl_sol {
	int error;
	int rational;
	int level;
	int max;
	isl_size n_out;
	isl_space *space;
	struct isl_context *context;
	struct isl_partial_sol *partial;
	void (*add)(struct isl_sol *sol,
		__isl_take isl_basic_set *dom, __isl_take isl_multi_aff *ma);
	void (*add_empty)(struct isl_sol *sol, struct isl_basic_set *bset);
	void (*free)(struct isl_sol *sol);
	struct isl_sol_callback dec_level;
};
197
sol_free(struct isl_sol * sol)198 static void sol_free(struct isl_sol *sol)
199 {
200 struct isl_partial_sol *partial, *next;
201 if (!sol)
202 return;
203 for (partial = sol->partial; partial; partial = next) {
204 next = partial->next;
205 isl_basic_set_free(partial->dom);
206 isl_multi_aff_free(partial->ma);
207 free(partial);
208 }
209 isl_space_free(sol->space);
210 if (sol->context)
211 sol->context->op->free(sol->context);
212 sol->free(sol);
213 free(sol);
214 }
215
216 /* Push a partial solution represented by a domain and function "ma"
217 * onto the stack of partial solutions.
218 * If "ma" is NULL, then "dom" represents a part of the domain
219 * with no solution.
220 */
sol_push_sol(struct isl_sol * sol,__isl_take isl_basic_set * dom,__isl_take isl_multi_aff * ma)221 static void sol_push_sol(struct isl_sol *sol,
222 __isl_take isl_basic_set *dom, __isl_take isl_multi_aff *ma)
223 {
224 struct isl_partial_sol *partial;
225
226 if (sol->error || !dom)
227 goto error;
228
229 partial = isl_alloc_type(dom->ctx, struct isl_partial_sol);
230 if (!partial)
231 goto error;
232
233 partial->level = sol->level;
234 partial->dom = dom;
235 partial->ma = ma;
236 partial->next = sol->partial;
237
238 sol->partial = partial;
239
240 return;
241 error:
242 isl_basic_set_free(dom);
243 isl_multi_aff_free(ma);
244 sol->error = 1;
245 }
246
247 /* Check that the final columns of "M", starting at "first", are zero.
248 */
check_final_columns_are_zero(__isl_keep isl_mat * M,unsigned first)249 static isl_stat check_final_columns_are_zero(__isl_keep isl_mat *M,
250 unsigned first)
251 {
252 int i;
253 isl_size rows, cols;
254 unsigned n;
255
256 rows = isl_mat_rows(M);
257 cols = isl_mat_cols(M);
258 if (rows < 0 || cols < 0)
259 return isl_stat_error;
260 n = cols - first;
261 for (i = 0; i < rows; ++i)
262 if (isl_seq_first_non_zero(M->row[i] + first, n) != -1)
263 isl_die(isl_mat_get_ctx(M), isl_error_internal,
264 "final columns should be zero",
265 return isl_stat_error);
266 return isl_stat_ok;
267 }
268
269 /* Set the affine expressions in "ma" according to the rows in "M", which
270 * are defined over the local space "ls".
271 * The matrix "M" may have extra (zero) columns beyond the number
272 * of variables in "ls".
273 */
set_from_affine_matrix(__isl_take isl_multi_aff * ma,__isl_take isl_local_space * ls,__isl_take isl_mat * M)274 static __isl_give isl_multi_aff *set_from_affine_matrix(
275 __isl_take isl_multi_aff *ma, __isl_take isl_local_space *ls,
276 __isl_take isl_mat *M)
277 {
278 int i;
279 isl_size dim;
280 isl_aff *aff;
281
282 dim = isl_local_space_dim(ls, isl_dim_all);
283 if (!ma || dim < 0 || !M)
284 goto error;
285
286 if (check_final_columns_are_zero(M, 1 + dim) < 0)
287 goto error;
288 for (i = 1; i < M->n_row; ++i) {
289 aff = isl_aff_alloc(isl_local_space_copy(ls));
290 if (aff) {
291 isl_int_set(aff->v->el[0], M->row[0][0]);
292 isl_seq_cpy(aff->v->el + 1, M->row[i], 1 + dim);
293 }
294 aff = isl_aff_normalize(aff);
295 ma = isl_multi_aff_set_aff(ma, i - 1, aff);
296 }
297 isl_local_space_free(ls);
298 isl_mat_free(M);
299
300 return ma;
301 error:
302 isl_local_space_free(ls);
303 isl_mat_free(M);
304 isl_multi_aff_free(ma);
305 return NULL;
306 }
307
308 /* Push a partial solution represented by a domain and mapping M
309 * onto the stack of partial solutions.
310 *
311 * The affine matrix "M" maps the dimensions of the context
312 * to the output variables. Convert it into an isl_multi_aff and
313 * then call sol_push_sol.
314 *
315 * Note that the description of the initial context may have involved
316 * existentially quantified variables, in which case they also appear
317 * in "dom". These need to be removed before creating the affine
318 * expression because an affine expression cannot be defined in terms
319 * of existentially quantified variables without a known representation.
320 * Since newly added integer divisions are inserted before these
321 * existentially quantified variables, they are still in the final
322 * positions and the corresponding final columns of "M" are zero
323 * because align_context_divs adds the existentially quantified
324 * variables of the context to the main tableau without any constraints and
325 * any equality constraints that are added later on can only serve
326 * to eliminate these existentially quantified variables.
327 */
sol_push_sol_mat(struct isl_sol * sol,__isl_take isl_basic_set * dom,__isl_take isl_mat * M)328 static void sol_push_sol_mat(struct isl_sol *sol,
329 __isl_take isl_basic_set *dom, __isl_take isl_mat *M)
330 {
331 isl_local_space *ls;
332 isl_multi_aff *ma;
333 isl_size n_div;
334 int n_known;
335
336 n_div = isl_basic_set_dim(dom, isl_dim_div);
337 if (n_div < 0)
338 goto error;
339 n_known = n_div - sol->context->n_unknown;
340
341 ma = isl_multi_aff_alloc(isl_space_copy(sol->space));
342 ls = isl_basic_set_get_local_space(dom);
343 ls = isl_local_space_drop_dims(ls, isl_dim_div,
344 n_known, n_div - n_known);
345 ma = set_from_affine_matrix(ma, ls, M);
346
347 if (!ma)
348 dom = isl_basic_set_free(dom);
349 sol_push_sol(sol, dom, ma);
350 return;
351 error:
352 isl_basic_set_free(dom);
353 isl_mat_free(M);
354 sol_push_sol(sol, NULL, NULL);
355 }
356
357 /* Pop one partial solution from the partial solution stack and
358 * pass it on to sol->add or sol->add_empty.
359 */
sol_pop_one(struct isl_sol * sol)360 static void sol_pop_one(struct isl_sol *sol)
361 {
362 struct isl_partial_sol *partial;
363
364 partial = sol->partial;
365 sol->partial = partial->next;
366
367 if (partial->ma)
368 sol->add(sol, partial->dom, partial->ma);
369 else
370 sol->add_empty(sol, partial->dom);
371 free(partial);
372 }
373
374 /* Return a fresh copy of the domain represented by the context tableau.
375 */
sol_domain(struct isl_sol * sol)376 static struct isl_basic_set *sol_domain(struct isl_sol *sol)
377 {
378 struct isl_basic_set *bset;
379
380 if (sol->error)
381 return NULL;
382
383 bset = isl_basic_set_dup(sol->context->op->peek_basic_set(sol->context));
384 bset = isl_basic_set_update_from_tab(bset,
385 sol->context->op->peek_tab(sol->context));
386
387 return bset;
388 }
389
390 /* Check whether two partial solutions have the same affine expressions.
391 */
same_solution(struct isl_partial_sol * s1,struct isl_partial_sol * s2)392 static isl_bool same_solution(struct isl_partial_sol *s1,
393 struct isl_partial_sol *s2)
394 {
395 if (!s1->ma != !s2->ma)
396 return isl_bool_false;
397 if (!s1->ma)
398 return isl_bool_true;
399
400 return isl_multi_aff_plain_is_equal(s1->ma, s2->ma);
401 }
402
403 /* Swap the initial two partial solutions in "sol".
404 *
405 * That is, go from
406 *
407 * sol->partial = p1; p1->next = p2; p2->next = p3
408 *
409 * to
410 *
411 * sol->partial = p2; p2->next = p1; p1->next = p3
412 */
swap_initial(struct isl_sol * sol)413 static void swap_initial(struct isl_sol *sol)
414 {
415 struct isl_partial_sol *partial;
416
417 partial = sol->partial;
418 sol->partial = partial->next;
419 partial->next = partial->next->next;
420 sol->partial->next = partial;
421 }
422
423 /* Combine the initial two partial solution of "sol" into
424 * a partial solution with the current context domain of "sol" and
425 * the function description of the second partial solution in the list.
426 * The level of the new partial solution is set to the current level.
427 *
428 * That is, the first two partial solutions (D1,M1) and (D2,M2) are
429 * replaced by (D,M2), where D is the domain of "sol", which is assumed
430 * to be the union of D1 and D2, while M1 is assumed to be equal to M2
431 * (at least on D1).
432 */
combine_initial_into_second(struct isl_sol * sol)433 static isl_stat combine_initial_into_second(struct isl_sol *sol)
434 {
435 struct isl_partial_sol *partial;
436 isl_basic_set *bset;
437
438 partial = sol->partial;
439
440 bset = sol_domain(sol);
441 isl_basic_set_free(partial->next->dom);
442 partial->next->dom = bset;
443 partial->next->level = sol->level;
444
445 if (!bset)
446 return isl_stat_error;
447
448 sol->partial = partial->next;
449 isl_basic_set_free(partial->dom);
450 isl_multi_aff_free(partial->ma);
451 free(partial);
452
453 return isl_stat_ok;
454 }
455
456 /* Are "ma1" and "ma2" equal to each other on "dom"?
457 *
458 * Combine "ma1" and "ma2" with "dom" and check if the results are the same.
459 * "dom" may have existentially quantified variables. Eliminate them first
460 * as otherwise they would have to be eliminated twice, in a more complicated
461 * context.
462 */
equal_on_domain(__isl_keep isl_multi_aff * ma1,__isl_keep isl_multi_aff * ma2,__isl_keep isl_basic_set * dom)463 static isl_bool equal_on_domain(__isl_keep isl_multi_aff *ma1,
464 __isl_keep isl_multi_aff *ma2, __isl_keep isl_basic_set *dom)
465 {
466 isl_set *set;
467 isl_pw_multi_aff *pma1, *pma2;
468 isl_bool equal;
469
470 set = isl_basic_set_compute_divs(isl_basic_set_copy(dom));
471 pma1 = isl_pw_multi_aff_alloc(isl_set_copy(set),
472 isl_multi_aff_copy(ma1));
473 pma2 = isl_pw_multi_aff_alloc(set, isl_multi_aff_copy(ma2));
474 equal = isl_pw_multi_aff_is_equal(pma1, pma2);
475 isl_pw_multi_aff_free(pma1);
476 isl_pw_multi_aff_free(pma2);
477
478 return equal;
479 }
480
481 /* The initial two partial solutions of "sol" are known to be at
482 * the same level.
483 * If they represent the same solution (on different parts of the domain),
484 * then combine them into a single solution at the current level.
485 * Otherwise, pop them both.
486 *
487 * Even if the two partial solution are not obviously the same,
488 * one may still be a simplification of the other over its own domain.
489 * Also check if the two sets of affine functions are equal when
490 * restricted to one of the domains. If so, combine the two
491 * using the set of affine functions on the other domain.
492 * That is, for two partial solutions (D1,M1) and (D2,M2),
493 * if M1 = M2 on D1, then the pair of partial solutions can
494 * be replaced by (D1+D2,M2) and similarly when M1 = M2 on D2.
495 */
combine_initial_if_equal(struct isl_sol * sol)496 static isl_stat combine_initial_if_equal(struct isl_sol *sol)
497 {
498 struct isl_partial_sol *partial;
499 isl_bool same;
500
501 partial = sol->partial;
502
503 same = same_solution(partial, partial->next);
504 if (same < 0)
505 return isl_stat_error;
506 if (same)
507 return combine_initial_into_second(sol);
508 if (partial->ma && partial->next->ma) {
509 same = equal_on_domain(partial->ma, partial->next->ma,
510 partial->dom);
511 if (same < 0)
512 return isl_stat_error;
513 if (same)
514 return combine_initial_into_second(sol);
515 same = equal_on_domain(partial->ma, partial->next->ma,
516 partial->next->dom);
517 if (same) {
518 swap_initial(sol);
519 return combine_initial_into_second(sol);
520 }
521 }
522
523 sol_pop_one(sol);
524 sol_pop_one(sol);
525
526 return isl_stat_ok;
527 }
528
529 /* Pop all solutions from the partial solution stack that were pushed onto
530 * the stack at levels that are deeper than the current level.
531 * If the two topmost elements on the stack have the same level
532 * and represent the same solution, then their domains are combined.
533 * This combined domain is the same as the current context domain
534 * as sol_pop is called each time we move back to a higher level.
535 * If the outer level (0) has been reached, then all partial solutions
536 * at the current level are also popped off.
537 */
sol_pop(struct isl_sol * sol)538 static void sol_pop(struct isl_sol *sol)
539 {
540 struct isl_partial_sol *partial;
541
542 if (sol->error)
543 return;
544
545 partial = sol->partial;
546 if (!partial)
547 return;
548
549 if (partial->level == 0 && sol->level == 0) {
550 for (partial = sol->partial; partial; partial = sol->partial)
551 sol_pop_one(sol);
552 return;
553 }
554
555 if (partial->level <= sol->level)
556 return;
557
558 if (partial->next && partial->next->level == partial->level) {
559 if (combine_initial_if_equal(sol) < 0)
560 goto error;
561 } else
562 sol_pop_one(sol);
563
564 if (sol->level == 0) {
565 for (partial = sol->partial; partial; partial = sol->partial)
566 sol_pop_one(sol);
567 return;
568 }
569
570 if (0)
571 error: sol->error = 1;
572 }
573
sol_dec_level(struct isl_sol * sol)574 static void sol_dec_level(struct isl_sol *sol)
575 {
576 if (sol->error)
577 return;
578
579 sol->level--;
580
581 sol_pop(sol);
582 }
583
sol_dec_level_wrap(struct isl_tab_callback * cb)584 static isl_stat sol_dec_level_wrap(struct isl_tab_callback *cb)
585 {
586 struct isl_sol_callback *callback = (struct isl_sol_callback *)cb;
587
588 sol_dec_level(callback->sol);
589
590 return callback->sol->error ? isl_stat_error : isl_stat_ok;
591 }
592
593 /* Move down to next level and push callback onto context tableau
594 * to decrease the level again when it gets rolled back across
595 * the current state. That is, dec_level will be called with
596 * the context tableau in the same state as it is when inc_level
597 * is called.
598 */
sol_inc_level(struct isl_sol * sol)599 static void sol_inc_level(struct isl_sol *sol)
600 {
601 struct isl_tab *tab;
602
603 if (sol->error)
604 return;
605
606 sol->level++;
607 tab = sol->context->op->peek_tab(sol->context);
608 if (isl_tab_push_callback(tab, &sol->dec_level.callback) < 0)
609 sol->error = 1;
610 }
611
/* Multiply all the entries in the first "n_row" rows of "mat" by "m".
 * Nothing needs to be done if "m" is equal to one.
 */
static void scale_rows(struct isl_mat *mat, isl_int m, int n_row)
{
	int r;

	if (!isl_int_is_one(m)) {
		for (r = 0; r < n_row; ++r)
			isl_seq_scale(mat->row[r], mat->row[r], m,
					mat->n_col);
	}
}
622
/* Add the solution identified by the tableau and the context tableau.
 *
 * The layout of the variables is as follows.
 *	tab->n_var is equal to the total number of variables in the input
 *			map (including divs that were copied from the context)
 *			+ the number of extra divs constructed
 *      Of these, the first tab->n_param and the last tab->n_div variables
 *	correspond to the variables in the context, i.e.,
 *		tab->n_param + tab->n_div = context_tab->n_var
 *	tab->n_param is equal to the number of parameters and input
 *			dimensions in the input map
 *	tab->n_div is equal to the number of divs in the context
 *
 * If there is no solution, then call add_empty with a basic set
 * that corresponds to the context tableau.  (If add_empty is NULL,
 * then do nothing).
 *
 * If there is a solution, then first construct a matrix that maps
 * all dimensions of the context to the output variables, i.e.,
 * the output dimensions in the input map.
 * The divs in the input map (if any) that do not correspond to any
 * div in the context do not appear in the solution.
 * The algorithm will make sure that they have an integer value,
 * but these values themselves are of no interest.
 * We have to be careful not to drop or rearrange any divs in the
 * context because that would change the meaning of the matrix.
 *
 * To extract the value of the output variables, it should be noted
 * that we always use a big parameter M in the main tableau and so
 * the variable stored in this tableau is not an output variable x itself, but
 *	x' = M + x (in case of minimization)
 * or
 *	x' = M - x (in case of maximization)
 * If x' appears in a column, then its optimal value is zero,
 * which means that the optimal value of x is an unbounded number
 * (-M for minimization and M for maximization).
 * We currently assume that the output dimensions in the original map
 * are bounded, so this cannot occur.
 * Similarly, when x' appears in a row, then the coefficient of M in that
 * row is necessarily 1.
 * If the row in the tableau represents
 *	d x' = c + d M + e(y)
 * then, in case of minimization, the corresponding row in the matrix
 * will be
 *	a c + a e(y)
 * with a d = m, the (updated) common denominator of the matrix.
 * In case of maximization, the row will be
 *	-a c - a e(y)
 *
 * Note that the solution is not passed on to sol->add or sol->add_empty
 * directly; it is pushed onto the stack of partial solutions instead.
 * On error, "sol" is marked as being in error.
 */
static void sol_add(struct isl_sol *sol, struct isl_tab *tab)
{
	struct isl_basic_set *bset = NULL;
	struct isl_mat *mat = NULL;
	unsigned off;
	int row;
	isl_int m;

	if (sol->error || !tab)
		goto error;

	/* Parts without solution are only recorded on request. */
	if (tab->empty && !sol->add_empty)
		return;
	/* There is nothing to record on an empty context. */
	if (sol->context->op->is_empty(sol->context))
		return;

	bset = sol_domain(sol);

	if (tab->empty) {
		sol_push_sol(sol, bset, NULL);
		return;
	}

	/* Offset added to a column index to obtain its position in a row:
	 * entry 0 is used as the denominator, entry 1 as the constant term
	 * and, if tab->M is set, entry 2 as the coefficient of M.
	 */
	off = 2 + tab->M;

	mat = isl_mat_alloc(tab->mat->ctx, 1 + sol->n_out,
					    1 + tab->n_param + tab->n_div);
	if (!mat)
		goto error;

	isl_int_init(m);

	/* Row 0 starts out as (1, 0, ..., 0); its first entry keeps track of
	 * the common denominator of the rows that follow.
	 */
	isl_seq_clr(mat->row[0] + 1, mat->n_col - 1);
	isl_int_set_si(mat->row[0][0], 1);
	for (row = 0; row < sol->n_out; ++row) {
		/* The output variables directly follow the first
		 * tab->n_param variables.
		 */
		int i = tab->n_param + row;
		int r, j;

		isl_seq_clr(mat->row[1 + row], mat->n_col);
		if (!tab->var[i].is_row) {
			/* x' sits in a column, i.e., x' = 0 */
			if (tab->M)
				isl_die(mat->ctx, isl_error_invalid,
					"unbounded optimum", goto error2);
			continue;
		}

		r = tab->var[i].index;
		/* The coefficient of M should be equal to the denominator. */
		if (tab->M &&
		    isl_int_ne(tab->mat->row[r][2], tab->mat->row[r][0]))
			isl_die(mat->ctx, isl_error_invalid,
				"unbounded optimum", goto error2);
		/* Scale row 0 and the rows filled in so far such that
		 * the common denominator becomes a multiple of
		 * the denominator d of the tableau row.
		 */
		isl_int_gcd(m, mat->row[0][0], tab->mat->row[r][0]);
		isl_int_divexact(m, tab->mat->row[r][0], m);
		scale_rows(mat, m, 1 + row);
		/* m now holds the factor "a" of the description above. */
		isl_int_divexact(m, mat->row[0][0], tab->mat->row[r][0]);
		isl_int_mul(mat->row[1 + row][0], m, tab->mat->row[r][1]);
		/* Only variables in column position contribute
		 * a coefficient; the entries of the others remain zero.
		 */
		for (j = 0; j < tab->n_param; ++j) {
			int col;
			if (tab->var[j].is_row)
				continue;
			col = tab->var[j].index;
			isl_int_mul(mat->row[1 + row][1 + j], m,
				    tab->mat->row[r][off + col]);
		}
		for (j = 0; j < tab->n_div; ++j) {
			int col;
			if (tab->var[tab->n_var - tab->n_div+j].is_row)
				continue;
			col = tab->var[tab->n_var - tab->n_div+j].index;
			isl_int_mul(mat->row[1 + row][1 + tab->n_param + j], m,
				    tab->mat->row[r][off + col]);
		}
		if (sol->max)
			isl_seq_neg(mat->row[1 + row], mat->row[1 + row],
				    mat->n_col);
	}

	isl_int_clear(m);

	sol_push_sol_mat(sol, bset, mat);
	return;
error2:
	/* Errors detected after "m" has been initialized end up here. */
	isl_int_clear(m);
error:
	isl_basic_set_free(bset);
	isl_mat_free(mat);
	sol->error = 1;
}
760
/* An isl_sol that collects the solutions in "map" and the parts
 * of the context where there is no solution in "empty".
 * "sol" is the first member because the functions below cast
 * a pointer to the isl_sol to a pointer to the isl_sol_map.
 */
struct isl_sol_map {
	struct isl_sol	sol;
	struct isl_map	*map;
	struct isl_set	*empty;
};
766
sol_map_free(struct isl_sol * sol)767 static void sol_map_free(struct isl_sol *sol)
768 {
769 struct isl_sol_map *sol_map = (struct isl_sol_map *) sol;
770 isl_map_free(sol_map->map);
771 isl_set_free(sol_map->empty);
772 }
773
774 /* This function is called for parts of the context where there is
775 * no solution, with "bset" corresponding to the context tableau.
776 * Simply add the basic set to the set "empty".
777 */
sol_map_add_empty(struct isl_sol_map * sol,struct isl_basic_set * bset)778 static void sol_map_add_empty(struct isl_sol_map *sol,
779 struct isl_basic_set *bset)
780 {
781 if (!bset || !sol->empty)
782 goto error;
783
784 sol->empty = isl_set_grow(sol->empty, 1);
785 bset = isl_basic_set_simplify(bset);
786 bset = isl_basic_set_finalize(bset);
787 sol->empty = isl_set_add_basic_set(sol->empty, isl_basic_set_copy(bset));
788 if (!sol->empty)
789 goto error;
790 isl_basic_set_free(bset);
791 return;
792 error:
793 isl_basic_set_free(bset);
794 sol->sol.error = 1;
795 }
796
/* Wrapper around sol_map_add_empty for use as
 * an isl_sol "add_empty" callback.
 */
static void sol_map_add_empty_wrap(struct isl_sol *sol,
	struct isl_basic_set *bset)
{
	struct isl_sol_map *sol_map = (struct isl_sol_map *) sol;

	sol_map_add_empty(sol_map, bset);
}
802
803 /* Given a basic set "dom" that represents the context and a tuple of
804 * affine expressions "ma" defined over this domain, construct a basic map
805 * that expresses this function on the domain.
806 */
sol_map_add(struct isl_sol_map * sol,__isl_take isl_basic_set * dom,__isl_take isl_multi_aff * ma)807 static void sol_map_add(struct isl_sol_map *sol,
808 __isl_take isl_basic_set *dom, __isl_take isl_multi_aff *ma)
809 {
810 isl_basic_map *bmap;
811
812 if (sol->sol.error || !dom || !ma)
813 goto error;
814
815 bmap = isl_basic_map_from_multi_aff2(ma, sol->sol.rational);
816 bmap = isl_basic_map_intersect_domain(bmap, dom);
817 sol->map = isl_map_grow(sol->map, 1);
818 sol->map = isl_map_add_basic_map(sol->map, bmap);
819 if (!sol->map)
820 sol->sol.error = 1;
821 return;
822 error:
823 isl_basic_set_free(dom);
824 isl_multi_aff_free(ma);
825 sol->sol.error = 1;
826 }
827
/* Wrapper around sol_map_add for use as an isl_sol "add" callback.
 */
static void sol_map_add_wrap(struct isl_sol *sol,
	__isl_take isl_basic_set *dom, __isl_take isl_multi_aff *ma)
{
	struct isl_sol_map *sol_map = (struct isl_sol_map *) sol;

	sol_map_add(sol_map, dom, ma);
}
833
834
835 /* Store the "parametric constant" of row "row" of tableau "tab" in "line",
836 * i.e., the constant term and the coefficients of all variables that
837 * appear in the context tableau.
838 * Note that the coefficient of the big parameter M is NOT copied.
839 * The context tableau may not have a big parameter and even when it
840 * does, it is a different big parameter.
841 */
get_row_parameter_line(struct isl_tab * tab,int row,isl_int * line)842 static void get_row_parameter_line(struct isl_tab *tab, int row, isl_int *line)
843 {
844 int i;
845 unsigned off = 2 + tab->M;
846
847 isl_int_set(line[0], tab->mat->row[row][1]);
848 for (i = 0; i < tab->n_param; ++i) {
849 if (tab->var[i].is_row)
850 isl_int_set_si(line[1 + i], 0);
851 else {
852 int col = tab->var[i].index;
853 isl_int_set(line[1 + i], tab->mat->row[row][off + col]);
854 }
855 }
856 for (i = 0; i < tab->n_div; ++i) {
857 if (tab->var[tab->n_var - tab->n_div + i].is_row)
858 isl_int_set_si(line[1 + tab->n_param + i], 0);
859 else {
860 int col = tab->var[tab->n_var - tab->n_div + i].index;
861 isl_int_set(line[1 + tab->n_param + i],
862 tab->mat->row[row][off + col]);
863 }
864 }
865 }
866
867 /* Check if rows "row1" and "row2" have identical "parametric constants",
868 * as explained above.
869 * In this case, we also insist that the coefficients of the big parameter
870 * be the same as the values of the constants will only be the same
871 * if these coefficients are also the same.
872 */
identical_parameter_line(struct isl_tab * tab,int row1,int row2)873 static int identical_parameter_line(struct isl_tab *tab, int row1, int row2)
874 {
875 int i;
876 unsigned off = 2 + tab->M;
877
878 if (isl_int_ne(tab->mat->row[row1][1], tab->mat->row[row2][1]))
879 return 0;
880
881 if (tab->M && isl_int_ne(tab->mat->row[row1][2],
882 tab->mat->row[row2][2]))
883 return 0;
884
885 for (i = 0; i < tab->n_param + tab->n_div; ++i) {
886 int pos = i < tab->n_param ? i :
887 tab->n_var - tab->n_div + i - tab->n_param;
888 int col;
889
890 if (tab->var[pos].is_row)
891 continue;
892 col = tab->var[pos].index;
893 if (isl_int_ne(tab->mat->row[row1][off + col],
894 tab->mat->row[row2][off + col]))
895 return 0;
896 }
897 return 1;
898 }
899
900 /* Return an inequality that expresses that the "parametric constant"
901 * should be non-negative.
902 * This function is only called when the coefficient of the big parameter
903 * is equal to zero.
904 */
get_row_parameter_ineq(struct isl_tab * tab,int row)905 static struct isl_vec *get_row_parameter_ineq(struct isl_tab *tab, int row)
906 {
907 struct isl_vec *ineq;
908
909 ineq = isl_vec_alloc(tab->mat->ctx, 1 + tab->n_param + tab->n_div);
910 if (!ineq)
911 return NULL;
912
913 get_row_parameter_line(tab, row, ineq->el);
914 if (ineq)
915 ineq = isl_vec_normalize(ineq);
916
917 return ineq;
918 }
919
920 /* Normalize a div expression of the form
921 *
922 * [(g*f(x) + c)/(g * m)]
923 *
924 * with c the constant term and f(x) the remaining coefficients, to
925 *
926 * [(f(x) + [c/g])/m]
927 */
normalize_div(__isl_keep isl_vec * div)928 static void normalize_div(__isl_keep isl_vec *div)
929 {
930 isl_ctx *ctx = isl_vec_get_ctx(div);
931 int len = div->size - 2;
932
933 isl_seq_gcd(div->el + 2, len, &ctx->normalize_gcd);
934 isl_int_gcd(ctx->normalize_gcd, ctx->normalize_gcd, div->el[0]);
935
936 if (isl_int_is_one(ctx->normalize_gcd))
937 return;
938
939 isl_int_divexact(div->el[0], div->el[0], ctx->normalize_gcd);
940 isl_int_fdiv_q(div->el[1], div->el[1], ctx->normalize_gcd);
941 isl_seq_scale_down(div->el + 2, div->el + 2, ctx->normalize_gcd, len);
942 }
943
944 /* Return an integer division for use in a parametric cut based
945 * on the given row.
946 * In particular, let the parametric constant of the row be
947 *
948 * \sum_i a_i y_i
949 *
950 * where y_0 = 1, but none of the y_i corresponds to the big parameter M.
951 * The div returned is equal to
952 *
953 * floor(\sum_i {-a_i} y_i) = floor((\sum_i (-a_i mod d) y_i)/d)
954 */
get_row_parameter_div(struct isl_tab * tab,int row)955 static struct isl_vec *get_row_parameter_div(struct isl_tab *tab, int row)
956 {
957 struct isl_vec *div;
958
959 div = isl_vec_alloc(tab->mat->ctx, 1 + 1 + tab->n_param + tab->n_div);
960 if (!div)
961 return NULL;
962
963 isl_int_set(div->el[0], tab->mat->row[row][0]);
964 get_row_parameter_line(tab, row, div->el + 1);
965 isl_seq_neg(div->el + 1, div->el + 1, div->size - 1);
966 normalize_div(div);
967 isl_seq_fdiv_r(div->el + 1, div->el + 1, div->el[0], div->size - 1);
968
969 return div;
970 }
971
972 /* Return an integer division for use in transferring an integrality constraint
973 * to the context.
974 * In particular, let the parametric constant of the row be
975 *
976 * \sum_i a_i y_i
977 *
978 * where y_0 = 1, but none of the y_i corresponds to the big parameter M.
979 * The the returned div is equal to
980 *
981 * floor(\sum_i {a_i} y_i) = floor((\sum_i (a_i mod d) y_i)/d)
982 */
get_row_split_div(struct isl_tab * tab,int row)983 static struct isl_vec *get_row_split_div(struct isl_tab *tab, int row)
984 {
985 struct isl_vec *div;
986
987 div = isl_vec_alloc(tab->mat->ctx, 1 + 1 + tab->n_param + tab->n_div);
988 if (!div)
989 return NULL;
990
991 isl_int_set(div->el[0], tab->mat->row[row][0]);
992 get_row_parameter_line(tab, row, div->el + 1);
993 normalize_div(div);
994 isl_seq_fdiv_r(div->el + 1, div->el + 1, div->el[0], div->size - 1);
995
996 return div;
997 }
998
999 /* Construct and return an inequality that expresses an upper bound
1000 * on the given div.
1001 * In particular, if the div is given by
1002 *
1003 * d = floor(e/m)
1004 *
1005 * then the inequality expresses
1006 *
1007 * m d <= e
1008 */
ineq_for_div(__isl_keep isl_basic_set * bset,unsigned div)1009 static __isl_give isl_vec *ineq_for_div(__isl_keep isl_basic_set *bset,
1010 unsigned div)
1011 {
1012 isl_size total;
1013 unsigned div_pos;
1014 struct isl_vec *ineq;
1015
1016 total = isl_basic_set_dim(bset, isl_dim_all);
1017 if (total < 0)
1018 return NULL;
1019
1020 div_pos = 1 + total - bset->n_div + div;
1021
1022 ineq = isl_vec_alloc(bset->ctx, 1 + total);
1023 if (!ineq)
1024 return NULL;
1025
1026 isl_seq_cpy(ineq->el, bset->div[div] + 1, 1 + total);
1027 isl_int_neg(ineq->el[div_pos], bset->div[div][0]);
1028 return ineq;
1029 }
1030
1031 /* Given a row in the tableau and a div that was created
1032 * using get_row_split_div and that has been constrained to equality, i.e.,
1033 *
1034 * d = floor(\sum_i {a_i} y_i) = \sum_i {a_i} y_i
1035 *
1036 * replace the expression "\sum_i {a_i} y_i" in the row by d,
1037 * i.e., we subtract "\sum_i {a_i} y_i" and add 1 d.
1038 * The coefficients of the non-parameters in the tableau have been
1039 * verified to be integral. We can therefore simply replace coefficient b
1040 * by floor(b). For the coefficients of the parameters we have
1041 * floor(a_i) = a_i - {a_i}, while for the other coefficients, we have
1042 * floor(b) = b.
1043 */
set_row_cst_to_div(struct isl_tab * tab,int row,int div)1044 static struct isl_tab *set_row_cst_to_div(struct isl_tab *tab, int row, int div)
1045 {
1046 isl_seq_fdiv_q(tab->mat->row[row] + 1, tab->mat->row[row] + 1,
1047 tab->mat->row[row][0], 1 + tab->M + tab->n_col);
1048
1049 isl_int_set_si(tab->mat->row[row][0], 1);
1050
1051 if (tab->var[tab->n_var - tab->n_div + div].is_row) {
1052 int drow = tab->var[tab->n_var - tab->n_div + div].index;
1053
1054 isl_assert(tab->mat->ctx,
1055 isl_int_is_one(tab->mat->row[drow][0]), goto error);
1056 isl_seq_combine(tab->mat->row[row] + 1,
1057 tab->mat->ctx->one, tab->mat->row[row] + 1,
1058 tab->mat->ctx->one, tab->mat->row[drow] + 1,
1059 1 + tab->M + tab->n_col);
1060 } else {
1061 int dcol = tab->var[tab->n_var - tab->n_div + div].index;
1062
1063 isl_int_add_ui(tab->mat->row[row][2 + tab->M + dcol],
1064 tab->mat->row[row][2 + tab->M + dcol], 1);
1065 }
1066
1067 return tab;
1068 error:
1069 isl_tab_free(tab);
1070 return NULL;
1071 }
1072
1073 /* Check if the (parametric) constant of the given row is obviously
1074 * negative, meaning that we don't need to consult the context tableau.
1075 * If there is a big parameter and its coefficient is non-zero,
1076 * then this coefficient determines the outcome.
1077 * Otherwise, we check whether the constant is negative and
1078 * all non-zero coefficients of parameters are negative and
1079 * belong to non-negative parameters.
1080 */
is_obviously_neg(struct isl_tab * tab,int row)1081 static int is_obviously_neg(struct isl_tab *tab, int row)
1082 {
1083 int i;
1084 int col;
1085 unsigned off = 2 + tab->M;
1086
1087 if (tab->M) {
1088 if (isl_int_is_pos(tab->mat->row[row][2]))
1089 return 0;
1090 if (isl_int_is_neg(tab->mat->row[row][2]))
1091 return 1;
1092 }
1093
1094 if (isl_int_is_nonneg(tab->mat->row[row][1]))
1095 return 0;
1096 for (i = 0; i < tab->n_param; ++i) {
1097 /* Eliminated parameter */
1098 if (tab->var[i].is_row)
1099 continue;
1100 col = tab->var[i].index;
1101 if (isl_int_is_zero(tab->mat->row[row][off + col]))
1102 continue;
1103 if (!tab->var[i].is_nonneg)
1104 return 0;
1105 if (isl_int_is_pos(tab->mat->row[row][off + col]))
1106 return 0;
1107 }
1108 for (i = 0; i < tab->n_div; ++i) {
1109 if (tab->var[tab->n_var - tab->n_div + i].is_row)
1110 continue;
1111 col = tab->var[tab->n_var - tab->n_div + i].index;
1112 if (isl_int_is_zero(tab->mat->row[row][off + col]))
1113 continue;
1114 if (!tab->var[tab->n_var - tab->n_div + i].is_nonneg)
1115 return 0;
1116 if (isl_int_is_pos(tab->mat->row[row][off + col]))
1117 return 0;
1118 }
1119 return 1;
1120 }
1121
1122 /* Check if the (parametric) constant of the given row is obviously
1123 * non-negative, meaning that we don't need to consult the context tableau.
1124 * If there is a big parameter and its coefficient is non-zero,
1125 * then this coefficient determines the outcome.
1126 * Otherwise, we check whether the constant is non-negative and
1127 * all non-zero coefficients of parameters are positive and
1128 * belong to non-negative parameters.
1129 */
is_obviously_nonneg(struct isl_tab * tab,int row)1130 static int is_obviously_nonneg(struct isl_tab *tab, int row)
1131 {
1132 int i;
1133 int col;
1134 unsigned off = 2 + tab->M;
1135
1136 if (tab->M) {
1137 if (isl_int_is_pos(tab->mat->row[row][2]))
1138 return 1;
1139 if (isl_int_is_neg(tab->mat->row[row][2]))
1140 return 0;
1141 }
1142
1143 if (isl_int_is_neg(tab->mat->row[row][1]))
1144 return 0;
1145 for (i = 0; i < tab->n_param; ++i) {
1146 /* Eliminated parameter */
1147 if (tab->var[i].is_row)
1148 continue;
1149 col = tab->var[i].index;
1150 if (isl_int_is_zero(tab->mat->row[row][off + col]))
1151 continue;
1152 if (!tab->var[i].is_nonneg)
1153 return 0;
1154 if (isl_int_is_neg(tab->mat->row[row][off + col]))
1155 return 0;
1156 }
1157 for (i = 0; i < tab->n_div; ++i) {
1158 if (tab->var[tab->n_var - tab->n_div + i].is_row)
1159 continue;
1160 col = tab->var[tab->n_var - tab->n_div + i].index;
1161 if (isl_int_is_zero(tab->mat->row[row][off + col]))
1162 continue;
1163 if (!tab->var[tab->n_var - tab->n_div + i].is_nonneg)
1164 return 0;
1165 if (isl_int_is_neg(tab->mat->row[row][off + col]))
1166 return 0;
1167 }
1168 return 1;
1169 }
1170
1171 /* Given a row r and two columns, return the column that would
1172 * lead to the lexicographically smallest increment in the sample
1173 * solution when leaving the basis in favor of the row.
1174 * Pivoting with column c will increment the sample value by a non-negative
1175 * constant times a_{V,c}/a_{r,c}, with a_{V,c} the elements of column c
1176 * corresponding to the non-parametric variables.
1177 * If variable v appears in a column c_v, then a_{v,c} = 1 iff c = c_v,
1178 * with all other entries in this virtual row equal to zero.
1179 * If variable v appears in a row, then a_{v,c} is the element in column c
1180 * of that row.
1181 *
1182 * Let v be the first variable with a_{v,c1}/a_{r,c1} != a_{v,c2}/a_{r,c2}.
1183 * Then if a_{v,c1}/a_{r,c1} < a_{v,c2}/a_{r,c2}, i.e.,
1184 * a_{v,c2} a_{r,c1} - a_{v,c1} a_{r,c2} > 0, c1 results in the minimal
1185 * increment. Otherwise, it's c2.
1186 */
lexmin_col_pair(struct isl_tab * tab,int row,int col1,int col2,isl_int tmp)1187 static int lexmin_col_pair(struct isl_tab *tab,
1188 int row, int col1, int col2, isl_int tmp)
1189 {
1190 int i;
1191 isl_int *tr;
1192
1193 tr = tab->mat->row[row] + 2 + tab->M;
1194
1195 for (i = tab->n_param; i < tab->n_var - tab->n_div; ++i) {
1196 int s1, s2;
1197 isl_int *r;
1198
1199 if (!tab->var[i].is_row) {
1200 if (tab->var[i].index == col1)
1201 return col2;
1202 if (tab->var[i].index == col2)
1203 return col1;
1204 continue;
1205 }
1206
1207 if (tab->var[i].index == row)
1208 continue;
1209
1210 r = tab->mat->row[tab->var[i].index] + 2 + tab->M;
1211 s1 = isl_int_sgn(r[col1]);
1212 s2 = isl_int_sgn(r[col2]);
1213 if (s1 == 0 && s2 == 0)
1214 continue;
1215 if (s1 < s2)
1216 return col1;
1217 if (s2 < s1)
1218 return col2;
1219
1220 isl_int_mul(tmp, r[col2], tr[col1]);
1221 isl_int_submul(tmp, r[col1], tr[col2]);
1222 if (isl_int_is_pos(tmp))
1223 return col1;
1224 if (isl_int_is_neg(tmp))
1225 return col2;
1226 }
1227 return -1;
1228 }
1229
1230 /* Does the index into the tab->var or tab->con array "index"
1231 * correspond to a variable in the context tableau?
1232 * In particular, it needs to be an index into the tab->var array and
1233 * it needs to refer to either one of the first tab->n_param variables or
1234 * one of the last tab->n_div variables.
1235 */
is_parameter_var(struct isl_tab * tab,int index)1236 static int is_parameter_var(struct isl_tab *tab, int index)
1237 {
1238 if (index < 0)
1239 return 0;
1240 if (index < tab->n_param)
1241 return 1;
1242 if (index >= tab->n_var - tab->n_div)
1243 return 1;
1244 return 0;
1245 }
1246
1247 /* Does column "col" of "tab" refer to a variable in the context tableau?
1248 */
col_is_parameter_var(struct isl_tab * tab,int col)1249 static int col_is_parameter_var(struct isl_tab *tab, int col)
1250 {
1251 return is_parameter_var(tab, tab->col_var[col]);
1252 }
1253
1254 /* Does row "row" of "tab" refer to a variable in the context tableau?
1255 */
row_is_parameter_var(struct isl_tab * tab,int row)1256 static int row_is_parameter_var(struct isl_tab *tab, int row)
1257 {
1258 return is_parameter_var(tab, tab->row_var[row]);
1259 }
1260
1261 /* Given a row in the tableau, find and return the column that would
1262 * result in the lexicographically smallest, but positive, increment
1263 * in the sample point.
1264 * If there is no such column, then return tab->n_col.
1265 * If anything goes wrong, return -1.
1266 */
lexmin_pivot_col(struct isl_tab * tab,int row)1267 static int lexmin_pivot_col(struct isl_tab *tab, int row)
1268 {
1269 int j;
1270 int col = tab->n_col;
1271 isl_int *tr;
1272 isl_int tmp;
1273
1274 tr = tab->mat->row[row] + 2 + tab->M;
1275
1276 isl_int_init(tmp);
1277
1278 for (j = tab->n_dead; j < tab->n_col; ++j) {
1279 if (col_is_parameter_var(tab, j))
1280 continue;
1281
1282 if (!isl_int_is_pos(tr[j]))
1283 continue;
1284
1285 if (col == tab->n_col)
1286 col = j;
1287 else
1288 col = lexmin_col_pair(tab, row, col, j, tmp);
1289 isl_assert(tab->mat->ctx, col >= 0, goto error);
1290 }
1291
1292 isl_int_clear(tmp);
1293 return col;
1294 error:
1295 isl_int_clear(tmp);
1296 return -1;
1297 }
1298
1299 /* Return the first known violated constraint, i.e., a non-negative
1300 * constraint that currently has an either obviously negative value
1301 * or a previously determined to be negative value.
1302 *
1303 * If any constraint has a negative coefficient for the big parameter,
1304 * if any, then we return one of these first.
1305 */
first_neg(struct isl_tab * tab)1306 static int first_neg(struct isl_tab *tab)
1307 {
1308 int row;
1309
1310 if (tab->M)
1311 for (row = tab->n_redundant; row < tab->n_row; ++row) {
1312 if (!isl_tab_var_from_row(tab, row)->is_nonneg)
1313 continue;
1314 if (!isl_int_is_neg(tab->mat->row[row][2]))
1315 continue;
1316 if (tab->row_sign)
1317 tab->row_sign[row] = isl_tab_row_neg;
1318 return row;
1319 }
1320 for (row = tab->n_redundant; row < tab->n_row; ++row) {
1321 if (!isl_tab_var_from_row(tab, row)->is_nonneg)
1322 continue;
1323 if (tab->row_sign) {
1324 if (tab->row_sign[row] == 0 &&
1325 is_obviously_neg(tab, row))
1326 tab->row_sign[row] = isl_tab_row_neg;
1327 if (tab->row_sign[row] != isl_tab_row_neg)
1328 continue;
1329 } else if (!is_obviously_neg(tab, row))
1330 continue;
1331 return row;
1332 }
1333 return -1;
1334 }
1335
1336 /* Check whether the invariant that all columns are lexico-positive
1337 * is satisfied. This function is not called from the current code
1338 * but is useful during debugging.
1339 */
1340 static void check_lexpos(struct isl_tab *tab) __attribute__ ((unused));
check_lexpos(struct isl_tab * tab)1341 static void check_lexpos(struct isl_tab *tab)
1342 {
1343 unsigned off = 2 + tab->M;
1344 int col;
1345 int var;
1346 int row;
1347
1348 for (col = tab->n_dead; col < tab->n_col; ++col) {
1349 if (col_is_parameter_var(tab, col))
1350 continue;
1351 for (var = tab->n_param; var < tab->n_var - tab->n_div; ++var) {
1352 if (!tab->var[var].is_row) {
1353 if (tab->var[var].index == col)
1354 break;
1355 else
1356 continue;
1357 }
1358 row = tab->var[var].index;
1359 if (isl_int_is_zero(tab->mat->row[row][off + col]))
1360 continue;
1361 if (isl_int_is_pos(tab->mat->row[row][off + col]))
1362 break;
1363 fprintf(stderr, "lexneg column %d (row %d)\n",
1364 col, row);
1365 }
1366 if (var >= tab->n_var - tab->n_div)
1367 fprintf(stderr, "zero column %d\n", col);
1368 }
1369 }
1370
1371 /* Report to the caller that the given constraint is part of an encountered
1372 * conflict.
1373 */
report_conflicting_constraint(struct isl_tab * tab,int con)1374 static int report_conflicting_constraint(struct isl_tab *tab, int con)
1375 {
1376 return tab->conflict(con, tab->conflict_user);
1377 }
1378
1379 /* Given a conflicting row in the tableau, report all constraints
1380 * involved in the row to the caller. That is, the row itself
1381 * (if it represents a constraint) and all constraint columns with
1382 * non-zero (and therefore negative) coefficients.
1383 */
report_conflict(struct isl_tab * tab,int row)1384 static int report_conflict(struct isl_tab *tab, int row)
1385 {
1386 int j;
1387 isl_int *tr;
1388
1389 if (!tab->conflict)
1390 return 0;
1391
1392 if (tab->row_var[row] < 0 &&
1393 report_conflicting_constraint(tab, ~tab->row_var[row]) < 0)
1394 return -1;
1395
1396 tr = tab->mat->row[row] + 2 + tab->M;
1397
1398 for (j = tab->n_dead; j < tab->n_col; ++j) {
1399 if (col_is_parameter_var(tab, j))
1400 continue;
1401
1402 if (!isl_int_is_neg(tr[j]))
1403 continue;
1404
1405 if (tab->col_var[j] < 0 &&
1406 report_conflicting_constraint(tab, ~tab->col_var[j]) < 0)
1407 return -1;
1408 }
1409
1410 return 0;
1411 }
1412
1413 /* Resolve all known or obviously violated constraints through pivoting.
1414 * In particular, as long as we can find any violated constraint, we
1415 * look for a pivoting column that would result in the lexicographically
1416 * smallest increment in the sample point. If there is no such column
1417 * then the tableau is infeasible.
1418 */
1419 static int restore_lexmin(struct isl_tab *tab) WARN_UNUSED;
restore_lexmin(struct isl_tab * tab)1420 static int restore_lexmin(struct isl_tab *tab)
1421 {
1422 int row, col;
1423
1424 if (!tab)
1425 return -1;
1426 if (tab->empty)
1427 return 0;
1428 while ((row = first_neg(tab)) != -1) {
1429 col = lexmin_pivot_col(tab, row);
1430 if (col >= tab->n_col) {
1431 if (report_conflict(tab, row) < 0)
1432 return -1;
1433 if (isl_tab_mark_empty(tab) < 0)
1434 return -1;
1435 return 0;
1436 }
1437 if (col < 0)
1438 return -1;
1439 if (isl_tab_pivot(tab, row, col) < 0)
1440 return -1;
1441 }
1442 return 0;
1443 }
1444
1445 /* Given a row that represents an equality, look for an appropriate
1446 * pivoting column.
1447 * In particular, if there are any non-zero coefficients among
1448 * the non-parameter variables, then we take the last of these
1449 * variables. Eliminating this variable in terms of the other
1450 * variables and/or parameters does not influence the property
1451 * that all column in the initial tableau are lexicographically
1452 * positive. The row corresponding to the eliminated variable
1453 * will only have non-zero entries below the diagonal of the
1454 * initial tableau. That is, we transform
1455 *
1456 * I I
1457 * 1 into a
1458 * I I
1459 *
1460 * If there is no such non-parameter variable, then we are dealing with
1461 * pure parameter equality and we pick any parameter with coefficient 1 or -1
1462 * for elimination. This will ensure that the eliminated parameter
1463 * always has an integer value whenever all the other parameters are integral.
1464 * If there is no such parameter then we return -1.
1465 */
last_var_col_or_int_par_col(struct isl_tab * tab,int row)1466 static int last_var_col_or_int_par_col(struct isl_tab *tab, int row)
1467 {
1468 unsigned off = 2 + tab->M;
1469 int i;
1470
1471 for (i = tab->n_var - tab->n_div - 1; i >= 0 && i >= tab->n_param; --i) {
1472 int col;
1473 if (tab->var[i].is_row)
1474 continue;
1475 col = tab->var[i].index;
1476 if (col <= tab->n_dead)
1477 continue;
1478 if (!isl_int_is_zero(tab->mat->row[row][off + col]))
1479 return col;
1480 }
1481 for (i = tab->n_dead; i < tab->n_col; ++i) {
1482 if (isl_int_is_one(tab->mat->row[row][off + i]))
1483 return i;
1484 if (isl_int_is_negone(tab->mat->row[row][off + i]))
1485 return i;
1486 }
1487 return -1;
1488 }
1489
1490 /* Add an equality that is known to be valid to the tableau.
1491 * We first check if we can eliminate a variable or a parameter.
1492 * If not, we add the equality as two inequalities.
1493 * In this case, the equality was a pure parameter equality and there
1494 * is no need to resolve any constraint violations.
1495 *
1496 * This function assumes that at least two more rows and at least
1497 * two more elements in the constraint array are available in the tableau.
1498 */
add_lexmin_valid_eq(struct isl_tab * tab,isl_int * eq)1499 static struct isl_tab *add_lexmin_valid_eq(struct isl_tab *tab, isl_int *eq)
1500 {
1501 int i;
1502 int r;
1503
1504 if (!tab)
1505 return NULL;
1506 r = isl_tab_add_row(tab, eq);
1507 if (r < 0)
1508 goto error;
1509
1510 r = tab->con[r].index;
1511 i = last_var_col_or_int_par_col(tab, r);
1512 if (i < 0) {
1513 tab->con[r].is_nonneg = 1;
1514 if (isl_tab_push_var(tab, isl_tab_undo_nonneg, &tab->con[r]) < 0)
1515 goto error;
1516 isl_seq_neg(eq, eq, 1 + tab->n_var);
1517 r = isl_tab_add_row(tab, eq);
1518 if (r < 0)
1519 goto error;
1520 tab->con[r].is_nonneg = 1;
1521 if (isl_tab_push_var(tab, isl_tab_undo_nonneg, &tab->con[r]) < 0)
1522 goto error;
1523 } else {
1524 if (isl_tab_pivot(tab, r, i) < 0)
1525 goto error;
1526 if (isl_tab_kill_col(tab, i) < 0)
1527 goto error;
1528 tab->n_eq++;
1529 }
1530
1531 return tab;
1532 error:
1533 isl_tab_free(tab);
1534 return NULL;
1535 }
1536
1537 /* Check if the given row is a pure constant.
1538 */
is_constant(struct isl_tab * tab,int row)1539 static int is_constant(struct isl_tab *tab, int row)
1540 {
1541 unsigned off = 2 + tab->M;
1542
1543 return isl_seq_first_non_zero(tab->mat->row[row] + off + tab->n_dead,
1544 tab->n_col - tab->n_dead) == -1;
1545 }
1546
1547 /* Is the given row a parametric constant?
1548 * That is, does it only involve variables that also appear in the context?
1549 */
is_parametric_constant(struct isl_tab * tab,int row)1550 static int is_parametric_constant(struct isl_tab *tab, int row)
1551 {
1552 unsigned off = 2 + tab->M;
1553 int col;
1554
1555 for (col = tab->n_dead; col < tab->n_col; ++col) {
1556 if (col_is_parameter_var(tab, col))
1557 continue;
1558 if (isl_int_is_zero(tab->mat->row[row][off + col]))
1559 continue;
1560 return 0;
1561 }
1562
1563 return 1;
1564 }
1565
/* Add an equality that may or may not be valid to the tableau.
 * If the resulting row is a pure constant, then it must be zero.
 * Otherwise, the resulting tableau is empty.
 * A zero constant row is removed again by rolling back the tableau.
 *
 * If the row is not a pure constant, then we add two inequalities,
 * each time checking that they can be satisfied.
 * In the end we try to use one of the two constraints to eliminate
 * a column.
 * If the tableau keeps track of a basic map, then the two inequalities
 * are also added to this basic map.
 *
 * This function assumes that at least two more rows and at least
 * two more elements in the constraint array are available in the tableau.
 *
 * Note that "eq" is negated in place before the second inequality
 * is added and that it is left in this negated state on return.
 *
 * Return 0 on success (including the case where the tableau
 * is found to be empty) and -1 on error.
 */
static int add_lexmin_eq(struct isl_tab *tab, isl_int *eq) WARN_UNUSED;
static int add_lexmin_eq(struct isl_tab *tab, isl_int *eq)
{
	int con1, con2;
	int row;
	struct isl_tab_undo *snap;

	if (!tab)
		return -1;

	snap = isl_tab_snap(tab);
	con1 = isl_tab_add_row(tab, eq);
	if (con1 < 0)
		return -1;
	tab->con[con1].is_nonneg = 1;
	if (isl_tab_push_var(tab, isl_tab_undo_nonneg, &tab->con[con1]) < 0)
		return -1;

	row = tab->con[con1].index;
	if (is_constant(tab, row)) {
		isl_int *line = tab->mat->row[row];
		int is_zero;

		is_zero = isl_int_is_zero(line[1]) &&
			(!tab->M || isl_int_is_zero(line[2]));
		if (!is_zero)
			return isl_tab_mark_empty(tab) < 0 ? -1 : 0;
		return isl_tab_rollback(tab, snap) < 0 ? -1 : 0;
	}

	/* First inequality: eq >= 0. */
	if (restore_lexmin(tab) < 0)
		return -1;
	if (tab->empty)
		return 0;

	/* Second inequality: -eq >= 0. */
	isl_seq_neg(eq, eq, 1 + tab->n_var);

	con2 = isl_tab_add_row(tab, eq);
	if (con2 < 0)
		return -1;
	tab->con[con2].is_nonneg = 1;
	if (isl_tab_push_var(tab, isl_tab_undo_nonneg, &tab->con[con2]) < 0)
		return -1;

	if (restore_lexmin(tab) < 0)
		return -1;
	if (tab->empty)
		return 0;

	/* Eliminate the column of one of the two constraints, if any. */
	if (!tab->con[con1].is_row) {
		if (isl_tab_kill_col(tab, tab->con[con1].index) < 0)
			return -1;
	} else if (!tab->con[con2].is_row) {
		if (isl_tab_kill_col(tab, tab->con[con2].index) < 0)
			return -1;
	}

	if (!tab->bmap)
		return 0;

	tab->bmap = isl_basic_map_add_ineq(tab->bmap, eq);
	if (isl_tab_push(tab, isl_tab_undo_bmap_ineq) < 0)
		return -1;
	isl_seq_neg(eq, eq, 1 + tab->n_var);
	tab->bmap = isl_basic_map_add_ineq(tab->bmap, eq);
	isl_seq_neg(eq, eq, 1 + tab->n_var);
	if (isl_tab_push(tab, isl_tab_undo_bmap_ineq) < 0)
		return -1;
	if (!tab->bmap)
		return -1;

	return 0;
}
1650
1651 /* Add an inequality to the tableau, resolving violations using
1652 * restore_lexmin.
1653 *
1654 * This function assumes that at least one more row and at least
1655 * one more element in the constraint array are available in the tableau.
1656 */
add_lexmin_ineq(struct isl_tab * tab,isl_int * ineq)1657 static struct isl_tab *add_lexmin_ineq(struct isl_tab *tab, isl_int *ineq)
1658 {
1659 int r;
1660
1661 if (!tab)
1662 return NULL;
1663 if (tab->bmap) {
1664 tab->bmap = isl_basic_map_add_ineq(tab->bmap, ineq);
1665 if (isl_tab_push(tab, isl_tab_undo_bmap_ineq) < 0)
1666 goto error;
1667 if (!tab->bmap)
1668 goto error;
1669 }
1670 r = isl_tab_add_row(tab, ineq);
1671 if (r < 0)
1672 goto error;
1673 tab->con[r].is_nonneg = 1;
1674 if (isl_tab_push_var(tab, isl_tab_undo_nonneg, &tab->con[r]) < 0)
1675 goto error;
1676 if (isl_tab_row_is_redundant(tab, tab->con[r].index)) {
1677 if (isl_tab_mark_redundant(tab, tab->con[r].index) < 0)
1678 goto error;
1679 return tab;
1680 }
1681
1682 if (restore_lexmin(tab) < 0)
1683 goto error;
1684 if (!tab->empty && tab->con[r].is_row &&
1685 isl_tab_row_is_redundant(tab, tab->con[r].index))
1686 if (isl_tab_mark_redundant(tab, tab->con[r].index) < 0)
1687 goto error;
1688 return tab;
1689 error:
1690 isl_tab_free(tab);
1691 return NULL;
1692 }
1693
1694 /* Check if the coefficients of the parameters are all integral.
1695 */
integer_parameter(struct isl_tab * tab,int row)1696 static int integer_parameter(struct isl_tab *tab, int row)
1697 {
1698 int i;
1699 int col;
1700 unsigned off = 2 + tab->M;
1701
1702 for (i = 0; i < tab->n_param; ++i) {
1703 /* Eliminated parameter */
1704 if (tab->var[i].is_row)
1705 continue;
1706 col = tab->var[i].index;
1707 if (!isl_int_is_divisible_by(tab->mat->row[row][off + col],
1708 tab->mat->row[row][0]))
1709 return 0;
1710 }
1711 for (i = 0; i < tab->n_div; ++i) {
1712 if (tab->var[tab->n_var - tab->n_div + i].is_row)
1713 continue;
1714 col = tab->var[tab->n_var - tab->n_div + i].index;
1715 if (!isl_int_is_divisible_by(tab->mat->row[row][off + col],
1716 tab->mat->row[row][0]))
1717 return 0;
1718 }
1719 return 1;
1720 }
1721
1722 /* Check if the coefficients of the non-parameter variables are all integral.
1723 */
integer_variable(struct isl_tab * tab,int row)1724 static int integer_variable(struct isl_tab *tab, int row)
1725 {
1726 int i;
1727 unsigned off = 2 + tab->M;
1728
1729 for (i = tab->n_dead; i < tab->n_col; ++i) {
1730 if (col_is_parameter_var(tab, i))
1731 continue;
1732 if (!isl_int_is_divisible_by(tab->mat->row[row][off + i],
1733 tab->mat->row[row][0]))
1734 return 0;
1735 }
1736 return 1;
1737 }
1738
1739 /* Check if the constant term is integral.
1740 */
integer_constant(struct isl_tab * tab,int row)1741 static int integer_constant(struct isl_tab *tab, int row)
1742 {
1743 return isl_int_is_divisible_by(tab->mat->row[row][1],
1744 tab->mat->row[row][0]);
1745 }
1746
/* Flags describing which parts of a tableau row are integral:
 * the constant term (I_CST), the coefficients of the parameters (I_PAR) and
 * the coefficients of the other variables (I_VAR).
 * The replacement lists are parenthesized such that the macros
 * expand to the intended value in any expression context.
 */
#define I_CST	(1 << 0)
#define I_PAR	(1 << 1)
#define I_VAR	(1 << 2)
1750
1751 /* Check for next (non-parameter) variable after "var" (first if var == -1)
1752 * that is non-integer and therefore requires a cut and return
1753 * the index of the variable.
1754 * For parametric tableaus, there are three parts in a row,
1755 * the constant, the coefficients of the parameters and the rest.
1756 * For each part, we check whether the coefficients in that part
1757 * are all integral and if so, set the corresponding flag in *f.
1758 * If the constant and the parameter part are integral, then the
1759 * current sample value is integral and no cut is required
1760 * (irrespective of whether the variable part is integral).
1761 */
next_non_integer_var(struct isl_tab * tab,int var,int * f)1762 static int next_non_integer_var(struct isl_tab *tab, int var, int *f)
1763 {
1764 var = var < 0 ? tab->n_param : var + 1;
1765
1766 for (; var < tab->n_var - tab->n_div; ++var) {
1767 int flags = 0;
1768 int row;
1769 if (!tab->var[var].is_row)
1770 continue;
1771 row = tab->var[var].index;
1772 if (integer_constant(tab, row))
1773 ISL_FL_SET(flags, I_CST);
1774 if (integer_parameter(tab, row))
1775 ISL_FL_SET(flags, I_PAR);
1776 if (ISL_FL_ISSET(flags, I_CST) && ISL_FL_ISSET(flags, I_PAR))
1777 continue;
1778 if (integer_variable(tab, row))
1779 ISL_FL_SET(flags, I_VAR);
1780 *f = flags;
1781 return var;
1782 }
1783 return -1;
1784 }
1785
1786 /* Check for first (non-parameter) variable that is non-integer and
1787 * therefore requires a cut and return the corresponding row.
1788 * For parametric tableaus, there are three parts in a row,
1789 * the constant, the coefficients of the parameters and the rest.
1790 * For each part, we check whether the coefficients in that part
1791 * are all integral and if so, set the corresponding flag in *f.
1792 * If the constant and the parameter part are integral, then the
1793 * current sample value is integral and no cut is required
1794 * (irrespective of whether the variable part is integral).
1795 */
first_non_integer_row(struct isl_tab * tab,int * f)1796 static int first_non_integer_row(struct isl_tab *tab, int *f)
1797 {
1798 int var = next_non_integer_var(tab, -1, f);
1799
1800 return var < 0 ? -1 : tab->var[var].index;
1801 }
1802
1803 /* Add a (non-parametric) cut to cut away the non-integral sample
1804 * value of the given row.
1805 *
1806 * If the row is given by
1807 *
1808 * m r = f + \sum_i a_i y_i
1809 *
1810 * then the cut is
1811 *
1812 * c = - {-f/m} + \sum_i {a_i/m} y_i >= 0
1813 *
1814 * The big parameter, if any, is ignored, since it is assumed to be big
1815 * enough to be divisible by any integer.
1816 * If the tableau is actually a parametric tableau, then this function
1817 * is only called when all coefficients of the parameters are integral.
1818 * The cut therefore has zero coefficients for the parameters.
1819 *
1820 * The current value is known to be negative, so row_sign, if it
1821 * exists, is set accordingly.
1822 *
1823 * Return the row of the cut or -1.
1824 */
add_cut(struct isl_tab * tab,int row)1825 static int add_cut(struct isl_tab *tab, int row)
1826 {
1827 int i;
1828 int r;
1829 isl_int *r_row;
1830 unsigned off = 2 + tab->M;
1831
1832 if (isl_tab_extend_cons(tab, 1) < 0)
1833 return -1;
1834 r = isl_tab_allocate_con(tab);
1835 if (r < 0)
1836 return -1;
1837
1838 r_row = tab->mat->row[tab->con[r].index];
1839 isl_int_set(r_row[0], tab->mat->row[row][0]);
1840 isl_int_neg(r_row[1], tab->mat->row[row][1]);
1841 isl_int_fdiv_r(r_row[1], r_row[1], tab->mat->row[row][0]);
1842 isl_int_neg(r_row[1], r_row[1]);
1843 if (tab->M)
1844 isl_int_set_si(r_row[2], 0);
1845 for (i = 0; i < tab->n_col; ++i)
1846 isl_int_fdiv_r(r_row[off + i],
1847 tab->mat->row[row][off + i], tab->mat->row[row][0]);
1848
1849 tab->con[r].is_nonneg = 1;
1850 if (isl_tab_push_var(tab, isl_tab_undo_nonneg, &tab->con[r]) < 0)
1851 return -1;
1852 if (tab->row_sign)
1853 tab->row_sign[tab->con[r].index] = isl_tab_row_neg;
1854
1855 return tab->con[r].index;
1856 }
1857
1858 #define CUT_ALL 1
1859 #define CUT_ONE 0
1860
1861 /* Given a non-parametric tableau, add cuts until an integer
1862 * sample point is obtained or until the tableau is determined
1863 * to be integer infeasible.
1864 * As long as there is any non-integer value in the sample point,
1865 * we add appropriate cuts, if possible, for each of these
1866 * non-integer values and then resolve the violated
1867 * cut constraints using restore_lexmin.
1868 * If one of the corresponding rows is equal to an integral
1869 * combination of variables/constraints plus a non-integral constant,
1870 * then there is no way to obtain an integer point and we return
1871 * a tableau that is marked empty.
1872 * The parameter cutting_strategy controls the strategy used when adding cuts
1873 * to remove non-integer points. CUT_ALL adds all possible cuts
1874 * before continuing the search. CUT_ONE adds only one cut at a time.
1875 */
cut_to_integer_lexmin(struct isl_tab * tab,int cutting_strategy)1876 static struct isl_tab *cut_to_integer_lexmin(struct isl_tab *tab,
1877 int cutting_strategy)
1878 {
1879 int var;
1880 int row;
1881 int flags;
1882
1883 if (!tab)
1884 return NULL;
1885 if (tab->empty)
1886 return tab;
1887
1888 while ((var = next_non_integer_var(tab, -1, &flags)) != -1) {
1889 do {
1890 if (ISL_FL_ISSET(flags, I_VAR)) {
1891 if (isl_tab_mark_empty(tab) < 0)
1892 goto error;
1893 return tab;
1894 }
1895 row = tab->var[var].index;
1896 row = add_cut(tab, row);
1897 if (row < 0)
1898 goto error;
1899 if (cutting_strategy == CUT_ONE)
1900 break;
1901 } while ((var = next_non_integer_var(tab, var, &flags)) != -1);
1902 if (restore_lexmin(tab) < 0)
1903 goto error;
1904 if (tab->empty)
1905 break;
1906 }
1907 return tab;
1908 error:
1909 isl_tab_free(tab);
1910 return NULL;
1911 }
1912
1913 /* Check whether all the currently active samples also satisfy the inequality
1914 * "ineq" (treated as an equality if eq is set).
1915 * Remove those samples that do not.
1916 */
check_samples(struct isl_tab * tab,isl_int * ineq,int eq)1917 static struct isl_tab *check_samples(struct isl_tab *tab, isl_int *ineq, int eq)
1918 {
1919 int i;
1920 isl_int v;
1921
1922 if (!tab)
1923 return NULL;
1924
1925 isl_assert(tab->mat->ctx, tab->bmap, goto error);
1926 isl_assert(tab->mat->ctx, tab->samples, goto error);
1927 isl_assert(tab->mat->ctx, tab->samples->n_col == 1 + tab->n_var, goto error);
1928
1929 isl_int_init(v);
1930 for (i = tab->n_outside; i < tab->n_sample; ++i) {
1931 int sgn;
1932 isl_seq_inner_product(ineq, tab->samples->row[i],
1933 1 + tab->n_var, &v);
1934 sgn = isl_int_sgn(v);
1935 if (eq ? (sgn == 0) : (sgn >= 0))
1936 continue;
1937 tab = isl_tab_drop_sample(tab, i);
1938 if (!tab)
1939 break;
1940 }
1941 isl_int_clear(v);
1942
1943 return tab;
1944 error:
1945 isl_tab_free(tab);
1946 return NULL;
1947 }
1948
1949 /* Check whether the sample value of the tableau is finite,
1950 * i.e., either the tableau does not use a big parameter, or
1951 * all values of the variables are equal to the big parameter plus
1952 * some constant. This constant is the actual sample value.
1953 */
sample_is_finite(struct isl_tab * tab)1954 static int sample_is_finite(struct isl_tab *tab)
1955 {
1956 int i;
1957
1958 if (!tab->M)
1959 return 1;
1960
1961 for (i = 0; i < tab->n_var; ++i) {
1962 int row;
1963 if (!tab->var[i].is_row)
1964 return 0;
1965 row = tab->var[i].index;
1966 if (isl_int_ne(tab->mat->row[row][0], tab->mat->row[row][2]))
1967 return 0;
1968 }
1969 return 1;
1970 }
1971
1972 /* Check if the context tableau of sol has any integer points.
1973 * Leave tab in empty state if no integer point can be found.
1974 * If an integer point can be found and if moreover it is finite,
1975 * then it is added to the list of sample values.
1976 *
1977 * This function is only called when none of the currently active sample
1978 * values satisfies the most recently added constraint.
1979 */
check_integer_feasible(struct isl_tab * tab)1980 static struct isl_tab *check_integer_feasible(struct isl_tab *tab)
1981 {
1982 struct isl_tab_undo *snap;
1983
1984 if (!tab)
1985 return NULL;
1986
1987 snap = isl_tab_snap(tab);
1988 if (isl_tab_push_basis(tab) < 0)
1989 goto error;
1990
1991 tab = cut_to_integer_lexmin(tab, CUT_ALL);
1992 if (!tab)
1993 goto error;
1994
1995 if (!tab->empty && sample_is_finite(tab)) {
1996 struct isl_vec *sample;
1997
1998 sample = isl_tab_get_sample_value(tab);
1999
2000 if (isl_tab_add_sample(tab, sample) < 0)
2001 goto error;
2002 }
2003
2004 if (!tab->empty && isl_tab_rollback(tab, snap) < 0)
2005 goto error;
2006
2007 return tab;
2008 error:
2009 isl_tab_free(tab);
2010 return NULL;
2011 }
2012
2013 /* Check if any of the currently active sample values satisfies
2014 * the inequality "ineq" (an equality if eq is set).
2015 */
tab_has_valid_sample(struct isl_tab * tab,isl_int * ineq,int eq)2016 static int tab_has_valid_sample(struct isl_tab *tab, isl_int *ineq, int eq)
2017 {
2018 int i;
2019 isl_int v;
2020
2021 if (!tab)
2022 return -1;
2023
2024 isl_assert(tab->mat->ctx, tab->bmap, return -1);
2025 isl_assert(tab->mat->ctx, tab->samples, return -1);
2026 isl_assert(tab->mat->ctx, tab->samples->n_col == 1 + tab->n_var, return -1);
2027
2028 isl_int_init(v);
2029 for (i = tab->n_outside; i < tab->n_sample; ++i) {
2030 int sgn;
2031 isl_seq_inner_product(ineq, tab->samples->row[i],
2032 1 + tab->n_var, &v);
2033 sgn = isl_int_sgn(v);
2034 if (eq ? (sgn == 0) : (sgn >= 0))
2035 break;
2036 }
2037 isl_int_clear(v);
2038
2039 return i < tab->n_sample;
2040 }
2041
2042 /* Insert a div specified by "div" to the tableau "tab" at position "pos" and
2043 * return isl_bool_true if the div is obviously non-negative.
2044 */
context_tab_insert_div(struct isl_tab * tab,int pos,__isl_keep isl_vec * div,isl_stat (* add_ineq)(void * user,isl_int *),void * user)2045 static isl_bool context_tab_insert_div(struct isl_tab *tab, int pos,
2046 __isl_keep isl_vec *div,
2047 isl_stat (*add_ineq)(void *user, isl_int *), void *user)
2048 {
2049 int i;
2050 int r;
2051 struct isl_mat *samples;
2052 int nonneg;
2053
2054 r = isl_tab_insert_div(tab, pos, div, add_ineq, user);
2055 if (r < 0)
2056 return isl_bool_error;
2057 nonneg = tab->var[r].is_nonneg;
2058 tab->var[r].frozen = 1;
2059
2060 samples = isl_mat_extend(tab->samples,
2061 tab->n_sample, 1 + tab->n_var);
2062 tab->samples = samples;
2063 if (!samples)
2064 return isl_bool_error;
2065 for (i = tab->n_outside; i < samples->n_row; ++i) {
2066 isl_seq_inner_product(div->el + 1, samples->row[i],
2067 div->size - 1, &samples->row[i][samples->n_col - 1]);
2068 isl_int_fdiv_q(samples->row[i][samples->n_col - 1],
2069 samples->row[i][samples->n_col - 1], div->el[0]);
2070 }
2071 tab->samples = isl_mat_move_cols(tab->samples, 1 + pos,
2072 1 + tab->n_var - 1, 1);
2073 if (!tab->samples)
2074 return isl_bool_error;
2075
2076 return isl_bool_ok(nonneg);
2077 }
2078
2079 /* Add a div specified by "div" to both the main tableau and
2080 * the context tableau. In case of the main tableau, we only
2081 * need to add an extra div. In the context tableau, we also
2082 * need to express the meaning of the div.
2083 * Return the index of the div or -1 if anything went wrong.
2084 *
2085 * The new integer division is added before any unknown integer
2086 * divisions in the context to ensure that it does not get
2087 * equated to some linear combination involving unknown integer
2088 * divisions.
2089 */
add_div(struct isl_tab * tab,struct isl_context * context,__isl_keep isl_vec * div)2090 static int add_div(struct isl_tab *tab, struct isl_context *context,
2091 __isl_keep isl_vec *div)
2092 {
2093 int r;
2094 int pos;
2095 isl_bool nonneg;
2096 struct isl_tab *context_tab = context->op->peek_tab(context);
2097
2098 if (!tab || !context_tab)
2099 goto error;
2100
2101 pos = context_tab->n_var - context->n_unknown;
2102 if ((nonneg = context->op->insert_div(context, pos, div)) < 0)
2103 goto error;
2104
2105 if (!context->op->is_ok(context))
2106 goto error;
2107
2108 pos = tab->n_var - context->n_unknown;
2109 if (isl_tab_extend_vars(tab, 1) < 0)
2110 goto error;
2111 r = isl_tab_insert_var(tab, pos);
2112 if (r < 0)
2113 goto error;
2114 if (nonneg)
2115 tab->var[r].is_nonneg = 1;
2116 tab->var[r].frozen = 1;
2117 tab->n_div++;
2118
2119 return tab->n_div - 1 - context->n_unknown;
2120 error:
2121 context->op->invalidate(context);
2122 return -1;
2123 }
2124
2125 /* Return the position of the integer division that is equal to div/denom
2126 * if there is one. Otherwise, return a position beyond the integer divisions.
2127 */
find_div(struct isl_tab * tab,isl_int * div,isl_int denom)2128 static int find_div(struct isl_tab *tab, isl_int *div, isl_int denom)
2129 {
2130 int i;
2131 isl_size total = isl_basic_map_dim(tab->bmap, isl_dim_all);
2132 isl_size n_div;
2133
2134 n_div = isl_basic_map_dim(tab->bmap, isl_dim_div);
2135 if (total < 0 || n_div < 0)
2136 return -1;
2137 for (i = 0; i < n_div; ++i) {
2138 if (isl_int_ne(tab->bmap->div[i][0], denom))
2139 continue;
2140 if (!isl_seq_eq(tab->bmap->div[i] + 1, div, 1 + total))
2141 continue;
2142 return i;
2143 }
2144 return n_div;
2145 }
2146
2147 /* Return the index of a div that corresponds to "div".
2148 * We first check if we already have such a div and if not, we create one.
2149 */
get_div(struct isl_tab * tab,struct isl_context * context,struct isl_vec * div)2150 static int get_div(struct isl_tab *tab, struct isl_context *context,
2151 struct isl_vec *div)
2152 {
2153 int d;
2154 struct isl_tab *context_tab = context->op->peek_tab(context);
2155 unsigned n_div;
2156
2157 if (!context_tab)
2158 return -1;
2159
2160 n_div = isl_basic_map_dim(context_tab->bmap, isl_dim_div);
2161 d = find_div(context_tab, div->el + 1, div->el[0]);
2162 if (d < 0)
2163 return -1;
2164 if (d < n_div)
2165 return d;
2166
2167 return add_div(tab, context, div);
2168 }
2169
2170 /* Add a parametric cut to cut away the non-integral sample value
2171 * of the given row.
2172 * Let a_i be the coefficients of the constant term and the parameters
2173 * and let b_i be the coefficients of the variables or constraints
2174 * in basis of the tableau.
2175 * Let q be the div q = floor(\sum_i {-a_i} y_i).
2176 *
2177 * The cut is expressed as
2178 *
2179 * c = \sum_i -{-a_i} y_i + \sum_i {b_i} x_i + q >= 0
2180 *
2181 * If q did not already exist in the context tableau, then it is added first.
2182 * If q is in a column of the main tableau then the "+ q" can be accomplished
2183 * by setting the corresponding entry to the denominator of the constraint.
2184 * If q happens to be in a row of the main tableau, then the corresponding
2185 * row needs to be added instead (taking care of the denominators).
2186 * Note that this is very unlikely, but perhaps not entirely impossible.
2187 *
2188 * The current value of the cut is known to be negative (or at least
2189 * non-positive), so row_sign is set accordingly.
2190 *
2191 * Return the row of the cut or -1.
2192 */
add_parametric_cut(struct isl_tab * tab,int row,struct isl_context * context)2193 static int add_parametric_cut(struct isl_tab *tab, int row,
2194 struct isl_context *context)
2195 {
2196 struct isl_vec *div;
2197 int d;
2198 int i;
2199 int r;
2200 isl_int *r_row;
2201 int col;
2202 int n;
2203 unsigned off = 2 + tab->M;
2204
2205 if (!context)
2206 return -1;
2207
2208 div = get_row_parameter_div(tab, row);
2209 if (!div)
2210 return -1;
2211
2212 n = tab->n_div - context->n_unknown;
2213 d = context->op->get_div(context, tab, div);
2214 isl_vec_free(div);
2215 if (d < 0)
2216 return -1;
2217
2218 if (isl_tab_extend_cons(tab, 1) < 0)
2219 return -1;
2220 r = isl_tab_allocate_con(tab);
2221 if (r < 0)
2222 return -1;
2223
2224 r_row = tab->mat->row[tab->con[r].index];
2225 isl_int_set(r_row[0], tab->mat->row[row][0]);
2226 isl_int_neg(r_row[1], tab->mat->row[row][1]);
2227 isl_int_fdiv_r(r_row[1], r_row[1], tab->mat->row[row][0]);
2228 isl_int_neg(r_row[1], r_row[1]);
2229 if (tab->M)
2230 isl_int_set_si(r_row[2], 0);
2231 for (i = 0; i < tab->n_param; ++i) {
2232 if (tab->var[i].is_row)
2233 continue;
2234 col = tab->var[i].index;
2235 isl_int_neg(r_row[off + col], tab->mat->row[row][off + col]);
2236 isl_int_fdiv_r(r_row[off + col], r_row[off + col],
2237 tab->mat->row[row][0]);
2238 isl_int_neg(r_row[off + col], r_row[off + col]);
2239 }
2240 for (i = 0; i < tab->n_div; ++i) {
2241 if (tab->var[tab->n_var - tab->n_div + i].is_row)
2242 continue;
2243 col = tab->var[tab->n_var - tab->n_div + i].index;
2244 isl_int_neg(r_row[off + col], tab->mat->row[row][off + col]);
2245 isl_int_fdiv_r(r_row[off + col], r_row[off + col],
2246 tab->mat->row[row][0]);
2247 isl_int_neg(r_row[off + col], r_row[off + col]);
2248 }
2249 for (i = 0; i < tab->n_col; ++i) {
2250 if (tab->col_var[i] >= 0 &&
2251 (tab->col_var[i] < tab->n_param ||
2252 tab->col_var[i] >= tab->n_var - tab->n_div))
2253 continue;
2254 isl_int_fdiv_r(r_row[off + i],
2255 tab->mat->row[row][off + i], tab->mat->row[row][0]);
2256 }
2257 if (tab->var[tab->n_var - tab->n_div + d].is_row) {
2258 isl_int gcd;
2259 int d_row = tab->var[tab->n_var - tab->n_div + d].index;
2260 isl_int_init(gcd);
2261 isl_int_gcd(gcd, tab->mat->row[d_row][0], r_row[0]);
2262 isl_int_divexact(r_row[0], r_row[0], gcd);
2263 isl_int_divexact(gcd, tab->mat->row[d_row][0], gcd);
2264 isl_seq_combine(r_row + 1, gcd, r_row + 1,
2265 r_row[0], tab->mat->row[d_row] + 1,
2266 off - 1 + tab->n_col);
2267 isl_int_mul(r_row[0], r_row[0], tab->mat->row[d_row][0]);
2268 isl_int_clear(gcd);
2269 } else {
2270 col = tab->var[tab->n_var - tab->n_div + d].index;
2271 isl_int_set(r_row[off + col], tab->mat->row[row][0]);
2272 }
2273
2274 tab->con[r].is_nonneg = 1;
2275 if (isl_tab_push_var(tab, isl_tab_undo_nonneg, &tab->con[r]) < 0)
2276 return -1;
2277 if (tab->row_sign)
2278 tab->row_sign[tab->con[r].index] = isl_tab_row_neg;
2279
2280 row = tab->con[r].index;
2281
2282 if (d >= n && context->op->detect_equalities(context, tab) < 0)
2283 return -1;
2284
2285 return row;
2286 }
2287
2288 /* Construct a tableau for bmap that can be used for computing
2289 * the lexicographic minimum (or maximum) of bmap.
2290 * If not NULL, then dom is the domain where the minimum
2291 * should be computed. In this case, we set up a parametric
2292 * tableau with row signs (initialized to "unknown").
2293 * If M is set, then the tableau will use a big parameter.
2294 * If max is set, then a maximum should be computed instead of a minimum.
2295 * This means that for each variable x, the tableau will contain the variable
2296 * x' = M - x, rather than x' = M + x. This in turn means that the coefficient
2297 * of the variables in all constraints are negated prior to adding them
2298 * to the tableau.
2299 */
tab_for_lexmin(__isl_keep isl_basic_map * bmap,__isl_keep isl_basic_set * dom,unsigned M,int max)2300 static __isl_give struct isl_tab *tab_for_lexmin(__isl_keep isl_basic_map *bmap,
2301 __isl_keep isl_basic_set *dom, unsigned M, int max)
2302 {
2303 int i;
2304 struct isl_tab *tab;
2305 unsigned n_var;
2306 unsigned o_var;
2307 isl_size total;
2308
2309 total = isl_basic_map_dim(bmap, isl_dim_all);
2310 if (total < 0)
2311 return NULL;
2312 tab = isl_tab_alloc(bmap->ctx, 2 * bmap->n_eq + bmap->n_ineq + 1,
2313 total, M);
2314 if (!tab)
2315 return NULL;
2316
2317 tab->rational = ISL_F_ISSET(bmap, ISL_BASIC_MAP_RATIONAL);
2318 if (dom) {
2319 isl_size dom_total;
2320 dom_total = isl_basic_set_dim(dom, isl_dim_all);
2321 if (dom_total < 0)
2322 goto error;
2323 tab->n_param = dom_total - dom->n_div;
2324 tab->n_div = dom->n_div;
2325 tab->row_sign = isl_calloc_array(bmap->ctx,
2326 enum isl_tab_row_sign, tab->mat->n_row);
2327 if (tab->mat->n_row && !tab->row_sign)
2328 goto error;
2329 }
2330 if (ISL_F_ISSET(bmap, ISL_BASIC_MAP_EMPTY)) {
2331 if (isl_tab_mark_empty(tab) < 0)
2332 goto error;
2333 return tab;
2334 }
2335
2336 for (i = tab->n_param; i < tab->n_var - tab->n_div; ++i) {
2337 tab->var[i].is_nonneg = 1;
2338 tab->var[i].frozen = 1;
2339 }
2340 o_var = 1 + tab->n_param;
2341 n_var = tab->n_var - tab->n_param - tab->n_div;
2342 for (i = 0; i < bmap->n_eq; ++i) {
2343 if (max)
2344 isl_seq_neg(bmap->eq[i] + o_var,
2345 bmap->eq[i] + o_var, n_var);
2346 tab = add_lexmin_valid_eq(tab, bmap->eq[i]);
2347 if (max)
2348 isl_seq_neg(bmap->eq[i] + o_var,
2349 bmap->eq[i] + o_var, n_var);
2350 if (!tab || tab->empty)
2351 return tab;
2352 }
2353 if (bmap->n_eq && restore_lexmin(tab) < 0)
2354 goto error;
2355 for (i = 0; i < bmap->n_ineq; ++i) {
2356 if (max)
2357 isl_seq_neg(bmap->ineq[i] + o_var,
2358 bmap->ineq[i] + o_var, n_var);
2359 tab = add_lexmin_ineq(tab, bmap->ineq[i]);
2360 if (max)
2361 isl_seq_neg(bmap->ineq[i] + o_var,
2362 bmap->ineq[i] + o_var, n_var);
2363 if (!tab || tab->empty)
2364 return tab;
2365 }
2366 return tab;
2367 error:
2368 isl_tab_free(tab);
2369 return NULL;
2370 }
2371
2372 /* Given a main tableau where more than one row requires a split,
2373 * determine and return the "best" row to split on.
2374 *
2375 * If any of the rows requiring a split only involves
2376 * variables that also appear in the context tableau,
2377 * then the negative part is guaranteed not to have a solution.
2378 * It is therefore best to split on any of these rows first.
2379 *
2380 * Otherwise,
2381 * given two rows in the main tableau, if the inequality corresponding
2382 * to the first row is redundant with respect to that of the second row
2383 * in the current tableau, then it is better to split on the second row,
2384 * since in the positive part, both rows will be positive.
2385 * (In the negative part a pivot will have to be performed and just about
2386 * anything can happen to the sign of the other row.)
2387 *
2388 * As a simple heuristic, we therefore select the row that makes the most
2389 * of the other rows redundant.
2390 *
2391 * Perhaps it would also be useful to look at the number of constraints
2392 * that conflict with any given constraint.
2393 *
2394 * best is the best row so far (-1 when we have not found any row yet).
2395 * best_r is the number of other rows made redundant by row best.
2396 * When best is still -1, bset_r is meaningless, but it is initialized
2397 * to some arbitrary value (0) anyway. Without this redundant initialization
2398 * valgrind may warn about uninitialized memory accesses when isl
2399 * is compiled with some versions of gcc.
2400 */
best_split(struct isl_tab * tab,struct isl_tab * context_tab)2401 static int best_split(struct isl_tab *tab, struct isl_tab *context_tab)
2402 {
2403 struct isl_tab_undo *snap;
2404 int split;
2405 int row;
2406 int best = -1;
2407 int best_r = 0;
2408
2409 if (isl_tab_extend_cons(context_tab, 2) < 0)
2410 return -1;
2411
2412 snap = isl_tab_snap(context_tab);
2413
2414 for (split = tab->n_redundant; split < tab->n_row; ++split) {
2415 struct isl_tab_undo *snap2;
2416 struct isl_vec *ineq = NULL;
2417 int r = 0;
2418 int ok;
2419
2420 if (!isl_tab_var_from_row(tab, split)->is_nonneg)
2421 continue;
2422 if (tab->row_sign[split] != isl_tab_row_any)
2423 continue;
2424
2425 if (is_parametric_constant(tab, split))
2426 return split;
2427
2428 ineq = get_row_parameter_ineq(tab, split);
2429 if (!ineq)
2430 return -1;
2431 ok = isl_tab_add_ineq(context_tab, ineq->el) >= 0;
2432 isl_vec_free(ineq);
2433 if (!ok)
2434 return -1;
2435
2436 snap2 = isl_tab_snap(context_tab);
2437
2438 for (row = tab->n_redundant; row < tab->n_row; ++row) {
2439 struct isl_tab_var *var;
2440
2441 if (row == split)
2442 continue;
2443 if (!isl_tab_var_from_row(tab, row)->is_nonneg)
2444 continue;
2445 if (tab->row_sign[row] != isl_tab_row_any)
2446 continue;
2447
2448 ineq = get_row_parameter_ineq(tab, row);
2449 if (!ineq)
2450 return -1;
2451 ok = isl_tab_add_ineq(context_tab, ineq->el) >= 0;
2452 isl_vec_free(ineq);
2453 if (!ok)
2454 return -1;
2455 var = &context_tab->con[context_tab->n_con - 1];
2456 if (!context_tab->empty &&
2457 !isl_tab_min_at_most_neg_one(context_tab, var))
2458 r++;
2459 if (isl_tab_rollback(context_tab, snap2) < 0)
2460 return -1;
2461 }
2462 if (best == -1 || r > best_r) {
2463 best = split;
2464 best_r = r;
2465 }
2466 if (isl_tab_rollback(context_tab, snap) < 0)
2467 return -1;
2468 }
2469
2470 return best;
2471 }
2472
context_lex_peek_basic_set(struct isl_context * context)2473 static struct isl_basic_set *context_lex_peek_basic_set(
2474 struct isl_context *context)
2475 {
2476 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2477 if (!clex->tab)
2478 return NULL;
2479 return isl_tab_peek_bset(clex->tab);
2480 }
2481
context_lex_peek_tab(struct isl_context * context)2482 static struct isl_tab *context_lex_peek_tab(struct isl_context *context)
2483 {
2484 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2485 return clex->tab;
2486 }
2487
/* Add the equality "eq" to the tableau of the lexmin context.
 *
 * If "check" is set and none of the active samples satisfies "eq",
 * then the tableau is checked for integer feasibility.
 * If "update" is set, then the samples that do not satisfy "eq"
 * are removed.
 *
 * On error, the tableau is freed and set to NULL.
 */
static void context_lex_add_eq(struct isl_context *context, isl_int *eq,
	int check, int update)
{
	struct isl_context_lex *clex = (struct isl_context_lex *)context;

	if (isl_tab_extend_cons(clex->tab, 2) < 0 ||
	    add_lexmin_eq(clex->tab, eq) < 0)
		goto error;

	if (check) {
		int has_sample = tab_has_valid_sample(clex->tab, eq, 1);

		if (has_sample < 0)
			goto error;
		if (has_sample == 0)
			clex->tab = check_integer_feasible(clex->tab);
	}
	if (update)
		clex->tab = check_samples(clex->tab, eq, 1);
	return;
error:
	isl_tab_free(clex->tab);
	clex->tab = NULL;
}
2510
/* Add the inequality "ineq" to the tableau of the lexmin context.
 *
 * If "check" is set and none of the active samples satisfies "ineq",
 * then the tableau is checked for integer feasibility.
 * If "update" is set, then the samples that do not satisfy "ineq"
 * are removed.
 *
 * On error, the tableau is freed and set to NULL.
 */
static void context_lex_add_ineq(struct isl_context *context, isl_int *ineq,
	int check, int update)
{
	struct isl_context_lex *clex = (struct isl_context_lex *)context;

	if (isl_tab_extend_cons(clex->tab, 1) < 0)
		goto error;
	clex->tab = add_lexmin_ineq(clex->tab, ineq);

	if (check) {
		int has_sample = tab_has_valid_sample(clex->tab, ineq, 0);

		if (has_sample < 0)
			goto error;
		if (has_sample == 0)
			clex->tab = check_integer_feasible(clex->tab);
	}
	if (update)
		clex->tab = check_samples(clex->tab, ineq, 0);
	return;
error:
	isl_tab_free(clex->tab);
	clex->tab = NULL;
}
2532
context_lex_add_ineq_wrap(void * user,isl_int * ineq)2533 static isl_stat context_lex_add_ineq_wrap(void *user, isl_int *ineq)
2534 {
2535 struct isl_context *context = (struct isl_context *)user;
2536 context_lex_add_ineq(context, ineq, 0, 0);
2537 return context->op->is_ok(context) ? isl_stat_ok : isl_stat_error;
2538 }
2539
2540 /* Check which signs can be obtained by "ineq" on all the currently
2541 * active sample values. See row_sign for more information.
2542 */
tab_ineq_sign(struct isl_tab * tab,isl_int * ineq,int strict)2543 static enum isl_tab_row_sign tab_ineq_sign(struct isl_tab *tab, isl_int *ineq,
2544 int strict)
2545 {
2546 int i;
2547 int sgn;
2548 isl_int tmp;
2549 enum isl_tab_row_sign res = isl_tab_row_unknown;
2550
2551 isl_assert(tab->mat->ctx, tab->samples, return isl_tab_row_unknown);
2552 isl_assert(tab->mat->ctx, tab->samples->n_col == 1 + tab->n_var,
2553 return isl_tab_row_unknown);
2554
2555 isl_int_init(tmp);
2556 for (i = tab->n_outside; i < tab->n_sample; ++i) {
2557 isl_seq_inner_product(tab->samples->row[i], ineq,
2558 1 + tab->n_var, &tmp);
2559 sgn = isl_int_sgn(tmp);
2560 if (sgn > 0 || (sgn == 0 && strict)) {
2561 if (res == isl_tab_row_unknown)
2562 res = isl_tab_row_pos;
2563 if (res == isl_tab_row_neg)
2564 res = isl_tab_row_any;
2565 }
2566 if (sgn < 0) {
2567 if (res == isl_tab_row_unknown)
2568 res = isl_tab_row_neg;
2569 if (res == isl_tab_row_pos)
2570 res = isl_tab_row_any;
2571 }
2572 if (res == isl_tab_row_any)
2573 break;
2574 }
2575 isl_int_clear(tmp);
2576
2577 return res;
2578 }
2579
/* Determine the possible signs of "ineq" on the active samples of
 * the tableau of the lexmin context. See tab_ineq_sign.
 */
static enum isl_tab_row_sign context_lex_ineq_sign(struct isl_context *context,
	isl_int *ineq, int strict)
{
	struct isl_context_lex *clex = (struct isl_context_lex *)context;
	struct isl_tab *ctx_tab = clex->tab;

	return tab_ineq_sign(ctx_tab, ineq, strict);
}
2586
2587 /* Check whether "ineq" can be added to the tableau without rendering
2588 * it infeasible.
2589 */
context_lex_test_ineq(struct isl_context * context,isl_int * ineq)2590 static int context_lex_test_ineq(struct isl_context *context, isl_int *ineq)
2591 {
2592 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2593 struct isl_tab_undo *snap;
2594 int feasible;
2595
2596 if (!clex->tab)
2597 return -1;
2598
2599 if (isl_tab_extend_cons(clex->tab, 1) < 0)
2600 return -1;
2601
2602 snap = isl_tab_snap(clex->tab);
2603 if (isl_tab_push_basis(clex->tab) < 0)
2604 return -1;
2605 clex->tab = add_lexmin_ineq(clex->tab, ineq);
2606 clex->tab = check_integer_feasible(clex->tab);
2607 if (!clex->tab)
2608 return -1;
2609 feasible = !clex->tab->empty;
2610 if (isl_tab_rollback(clex->tab, snap) < 0)
2611 return -1;
2612
2613 return feasible;
2614 }
2615
/* Return the index of a div corresponding to "div", creating it
 * if needed. This is the get_div operation of the lexmin context and
 * simply forwards to get_div (with the arguments reordered).
 */
static int context_lex_get_div(struct isl_context *context, struct isl_tab *tab,
	struct isl_vec *div)
{
	int index = get_div(tab, context, div);

	return index;
}
2621
2622 /* Insert a div specified by "div" to the context tableau at position "pos" and
2623 * return isl_bool_true if the div is obviously non-negative.
2624 * context_tab_add_div will always return isl_bool_true, because all variables
2625 * in a isl_context_lex tableau are non-negative.
2626 * However, if we are using a big parameter in the context, then this only
2627 * reflects the non-negativity of the variable used to _encode_ the
2628 * div, i.e., div' = M + div, so we can't draw any conclusions.
2629 */
context_lex_insert_div(struct isl_context * context,int pos,__isl_keep isl_vec * div)2630 static isl_bool context_lex_insert_div(struct isl_context *context, int pos,
2631 __isl_keep isl_vec *div)
2632 {
2633 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2634 isl_bool nonneg;
2635 nonneg = context_tab_insert_div(clex->tab, pos, div,
2636 context_lex_add_ineq_wrap, context);
2637 if (nonneg < 0)
2638 return isl_bool_error;
2639 if (clex->tab->M)
2640 return isl_bool_false;
2641 return nonneg;
2642 }
2643
/* The lexmin context does not perform any equality detection.
 * Both arguments are ignored and 0 is returned unconditionally.
 */
static int context_lex_detect_equalities(struct isl_context *context,
	struct isl_tab *tab)
{
	(void) context;
	(void) tab;

	return 0;
}
2649
context_lex_best_split(struct isl_context * context,struct isl_tab * tab)2650 static int context_lex_best_split(struct isl_context *context,
2651 struct isl_tab *tab)
2652 {
2653 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2654 struct isl_tab_undo *snap;
2655 int r;
2656
2657 snap = isl_tab_snap(clex->tab);
2658 if (isl_tab_push_basis(clex->tab) < 0)
2659 return -1;
2660 r = best_split(tab, clex->tab);
2661
2662 if (r >= 0 && isl_tab_rollback(clex->tab, snap) < 0)
2663 return -1;
2664
2665 return r;
2666 }
2667
context_lex_is_empty(struct isl_context * context)2668 static int context_lex_is_empty(struct isl_context *context)
2669 {
2670 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2671 if (!clex->tab)
2672 return -1;
2673 return clex->tab->empty;
2674 }
2675
context_lex_save(struct isl_context * context)2676 static void *context_lex_save(struct isl_context *context)
2677 {
2678 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2679 struct isl_tab_undo *snap;
2680
2681 snap = isl_tab_snap(clex->tab);
2682 if (isl_tab_push_basis(clex->tab) < 0)
2683 return NULL;
2684 if (isl_tab_save_samples(clex->tab) < 0)
2685 return NULL;
2686
2687 return snap;
2688 }
2689
context_lex_restore(struct isl_context * context,void * save)2690 static void context_lex_restore(struct isl_context *context, void *save)
2691 {
2692 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2693 if (isl_tab_rollback(clex->tab, (struct isl_tab_undo *)save) < 0) {
2694 isl_tab_free(clex->tab);
2695 clex->tab = NULL;
2696 }
2697 }
2698
/* Discard a saved state of the lexmin context.
 * Nothing is done with "save" here.
 */
static void context_lex_discard(void *save)
{
	(void) save;
}
2702
context_lex_is_ok(struct isl_context * context)2703 static int context_lex_is_ok(struct isl_context *context)
2704 {
2705 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2706 return !!clex->tab;
2707 }
2708
2709 /* For each variable in the context tableau, check if the variable can
2710 * only attain non-negative values. If so, mark the parameter as non-negative
2711 * in the main tableau. This allows for a more direct identification of some
2712 * cases of violated constraints.
2713 */
tab_detect_nonnegative_parameters(struct isl_tab * tab,struct isl_tab * context_tab)2714 static struct isl_tab *tab_detect_nonnegative_parameters(struct isl_tab *tab,
2715 struct isl_tab *context_tab)
2716 {
2717 int i;
2718 struct isl_tab_undo *snap;
2719 struct isl_vec *ineq = NULL;
2720 struct isl_tab_var *var;
2721 int n;
2722
2723 if (context_tab->n_var == 0)
2724 return tab;
2725
2726 ineq = isl_vec_alloc(tab->mat->ctx, 1 + context_tab->n_var);
2727 if (!ineq)
2728 goto error;
2729
2730 if (isl_tab_extend_cons(context_tab, 1) < 0)
2731 goto error;
2732
2733 snap = isl_tab_snap(context_tab);
2734
2735 n = 0;
2736 isl_seq_clr(ineq->el, ineq->size);
2737 for (i = 0; i < context_tab->n_var; ++i) {
2738 isl_int_set_si(ineq->el[1 + i], 1);
2739 if (isl_tab_add_ineq(context_tab, ineq->el) < 0)
2740 goto error;
2741 var = &context_tab->con[context_tab->n_con - 1];
2742 if (!context_tab->empty &&
2743 !isl_tab_min_at_most_neg_one(context_tab, var)) {
2744 int j = i;
2745 if (i >= tab->n_param)
2746 j = i - tab->n_param + tab->n_var - tab->n_div;
2747 tab->var[j].is_nonneg = 1;
2748 n++;
2749 }
2750 isl_int_set_si(ineq->el[1 + i], 0);
2751 if (isl_tab_rollback(context_tab, snap) < 0)
2752 goto error;
2753 }
2754
2755 if (context_tab->M && n == context_tab->n_var) {
2756 context_tab->mat = isl_mat_drop_cols(context_tab->mat, 2, 1);
2757 context_tab->M = 0;
2758 }
2759
2760 isl_vec_free(ineq);
2761 return tab;
2762 error:
2763 isl_vec_free(ineq);
2764 isl_tab_free(tab);
2765 return NULL;
2766 }
2767
context_lex_detect_nonnegative_parameters(struct isl_context * context,struct isl_tab * tab)2768 static struct isl_tab *context_lex_detect_nonnegative_parameters(
2769 struct isl_context *context, struct isl_tab *tab)
2770 {
2771 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2772 struct isl_tab_undo *snap;
2773
2774 if (!tab)
2775 return NULL;
2776
2777 snap = isl_tab_snap(clex->tab);
2778 if (isl_tab_push_basis(clex->tab) < 0)
2779 goto error;
2780
2781 tab = tab_detect_nonnegative_parameters(tab, clex->tab);
2782
2783 if (isl_tab_rollback(clex->tab, snap) < 0)
2784 goto error;
2785
2786 return tab;
2787 error:
2788 isl_tab_free(tab);
2789 return NULL;
2790 }
2791
context_lex_invalidate(struct isl_context * context)2792 static void context_lex_invalidate(struct isl_context *context)
2793 {
2794 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2795 isl_tab_free(clex->tab);
2796 clex->tab = NULL;
2797 }
2798
context_lex_free(struct isl_context * context)2799 static __isl_null struct isl_context *context_lex_free(
2800 struct isl_context *context)
2801 {
2802 struct isl_context_lex *clex = (struct isl_context_lex *)context;
2803 isl_tab_free(clex->tab);
2804 free(clex);
2805
2806 return NULL;
2807 }
2808
/* Table of operations implementing the lexmin-based context
 * (struct isl_context_lex).
 * The initializer is positional, so the entries need to appear
 * in the order of the fields of struct isl_context_op.
 */
struct isl_context_op isl_context_lex_op = {
	context_lex_detect_nonnegative_parameters,
	context_lex_peek_basic_set,
	context_lex_peek_tab,
	context_lex_add_eq,
	context_lex_add_ineq,
	context_lex_ineq_sign,
	context_lex_test_ineq,
	context_lex_get_div,
	context_lex_insert_div,
	context_lex_detect_equalities,
	context_lex_best_split,
	context_lex_is_empty,
	context_lex_is_ok,
	context_lex_save,
	context_lex_restore,
	context_lex_discard,
	context_lex_invalidate,
	context_lex_free,
};
2829
/* Construct a context tableau for "bset".
 * The tableau is a non-parametric lexmin tableau with a big parameter
 * that keeps track of "bset" and has its samples initialized.
 *
 * Return the tableau or NULL on error.
 */
static struct isl_tab *context_tab_for_lexmin(__isl_take isl_basic_set *bset)
{
	struct isl_tab *tab;

	if (!bset)
		return NULL;

	tab = tab_for_lexmin(bset_to_bmap(bset), NULL, 1, 0);
	if (isl_tab_track_bset(tab, bset) < 0) {
		isl_tab_free(tab);
		return NULL;
	}

	return isl_tab_init_samples(tab);
}
2845
isl_context_lex_alloc(struct isl_basic_set * dom)2846 static struct isl_context *isl_context_lex_alloc(struct isl_basic_set *dom)
2847 {
2848 struct isl_context_lex *clex;
2849
2850 if (!dom)
2851 return NULL;
2852
2853 clex = isl_alloc_type(dom->ctx, struct isl_context_lex);
2854 if (!clex)
2855 return NULL;
2856
2857 clex->context.op = &isl_context_lex_op;
2858
2859 clex->tab = context_tab_for_lexmin(isl_basic_set_copy(dom));
2860 if (restore_lexmin(clex->tab) < 0)
2861 goto error;
2862 clex->tab = check_integer_feasible(clex->tab);
2863 if (!clex->tab)
2864 goto error;
2865
2866 return &clex->context;
2867 error:
2868 clex->context.op->free(&clex->context);
2869 return NULL;
2870 }
2871
/* Representation of the context when using generalized basis reduction.
 *
 * "context" is the generic part and appears first, such that
 * a pointer to a struct isl_context can be cast to a pointer
 * to a struct isl_context_gbr.
 * "tab" is the tableau that is exposed through the peek_tab and
 * peek_basic_set operations.
 * "shifted" contains the offsets of the unit hypercubes that lie inside the
 * context. Any rational point in "shifted" can therefore be rounded
 * up to an integer point in the context.
 * If the context is constrained by any equality, then "shifted" is not used
 * as it would be empty.
 * NOTE(review): the role of "cone" is not visible in this part
 * of the file -- confirm against its users.
 */
struct isl_context_gbr {
	struct isl_context context;
	struct isl_tab *tab;
	struct isl_tab *shifted;
	struct isl_tab *cone;
};
2886
context_gbr_detect_nonnegative_parameters(struct isl_context * context,struct isl_tab * tab)2887 static struct isl_tab *context_gbr_detect_nonnegative_parameters(
2888 struct isl_context *context, struct isl_tab *tab)
2889 {
2890 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
2891 if (!tab)
2892 return NULL;
2893 return tab_detect_nonnegative_parameters(tab, cgbr->tab);
2894 }
2895
context_gbr_peek_basic_set(struct isl_context * context)2896 static struct isl_basic_set *context_gbr_peek_basic_set(
2897 struct isl_context *context)
2898 {
2899 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
2900 if (!cgbr->tab)
2901 return NULL;
2902 return isl_tab_peek_bset(cgbr->tab);
2903 }
2904
context_gbr_peek_tab(struct isl_context * context)2905 static struct isl_tab *context_gbr_peek_tab(struct isl_context *context)
2906 {
2907 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
2908 return cgbr->tab;
2909 }
2910
2911 /* Initialize the "shifted" tableau of the context, which
2912 * contains the constraints of the original tableau shifted
2913 * by the sum of all negative coefficients. This ensures
2914 * that any rational point in the shifted tableau can
2915 * be rounded up to yield an integer point in the original tableau.
2916 */
gbr_init_shifted(struct isl_context_gbr * cgbr)2917 static void gbr_init_shifted(struct isl_context_gbr *cgbr)
2918 {
2919 int i, j;
2920 struct isl_vec *cst;
2921 struct isl_basic_set *bset = isl_tab_peek_bset(cgbr->tab);
2922 isl_size dim = isl_basic_set_dim(bset, isl_dim_all);
2923
2924 if (dim < 0)
2925 return;
2926 cst = isl_vec_alloc(cgbr->tab->mat->ctx, bset->n_ineq);
2927 if (!cst)
2928 return;
2929
2930 for (i = 0; i < bset->n_ineq; ++i) {
2931 isl_int_set(cst->el[i], bset->ineq[i][0]);
2932 for (j = 0; j < dim; ++j) {
2933 if (!isl_int_is_neg(bset->ineq[i][1 + j]))
2934 continue;
2935 isl_int_add(bset->ineq[i][0], bset->ineq[i][0],
2936 bset->ineq[i][1 + j]);
2937 }
2938 }
2939
2940 cgbr->shifted = isl_tab_from_basic_set(bset, 0);
2941
2942 for (i = 0; i < bset->n_ineq; ++i)
2943 isl_int_set(bset->ineq[i][0], cst->el[i]);
2944
2945 isl_vec_free(cst);
2946 }
2947
2948 /* Check if the shifted tableau is non-empty, and if so
2949 * use the sample point to construct an integer point
2950 * of the context tableau.
2951 */
gbr_get_shifted_sample(struct isl_context_gbr * cgbr)2952 static struct isl_vec *gbr_get_shifted_sample(struct isl_context_gbr *cgbr)
2953 {
2954 struct isl_vec *sample;
2955
2956 if (!cgbr->shifted)
2957 gbr_init_shifted(cgbr);
2958 if (!cgbr->shifted)
2959 return NULL;
2960 if (cgbr->shifted->empty)
2961 return isl_vec_alloc(cgbr->tab->mat->ctx, 0);
2962
2963 sample = isl_tab_get_sample_value(cgbr->shifted);
2964 sample = isl_vec_ceil(sample);
2965
2966 return sample;
2967 }
2968
drop_constant_terms(__isl_take isl_basic_set * bset)2969 static __isl_give isl_basic_set *drop_constant_terms(
2970 __isl_take isl_basic_set *bset)
2971 {
2972 int i;
2973
2974 if (!bset)
2975 return NULL;
2976
2977 for (i = 0; i < bset->n_eq; ++i)
2978 isl_int_set_si(bset->eq[i][0], 0);
2979
2980 for (i = 0; i < bset->n_ineq; ++i)
2981 isl_int_set_si(bset->ineq[i][0], 0);
2982
2983 return bset;
2984 }
2985
use_shifted(struct isl_context_gbr * cgbr)2986 static int use_shifted(struct isl_context_gbr *cgbr)
2987 {
2988 if (!cgbr->tab)
2989 return 0;
2990 return cgbr->tab->bmap->n_eq == 0 && cgbr->tab->bmap->n_div == 0;
2991 }
2992
/* Look for an integer point in the context tableau of "cgbr".
 * Return NULL in case of error.
 * The caller (check_gbr_integer_feasible) treats a zero-length result
 * as meaning that the context has no integer points.
 *
 * The following strategies are tried in order.
 * - If the current sample value of the context tableau is integer,
 *   then it is returned directly.
 * - If the "shifted" tableau can be used (see use_shifted),
 *   then the sample obtained from gbr_get_shifted_sample is returned,
 *   unless it is a zero-length vector, in which case it is discarded.
 * - Otherwise, the tableau "cone" of the recession cone is constructed
 *   (if it was not available already) and its implicit equalities
 *   are detected.  If all columns of this tableau are dead,
 *   then isl_tab_sample is applied to the context tableau itself,
 *   rolling back any changes it makes afterwards.
 *   If not, then the basic sets tracked by the context tableau and
 *   by the cone tableau are duplicated, updated from their tableaus and
 *   handed to isl_basic_set_sample_with_cone.
 */
static struct isl_vec *gbr_get_sample(struct isl_context_gbr *cgbr)
{
	struct isl_basic_set *bset;
	struct isl_basic_set *cone;

	if (isl_tab_sample_is_integer(cgbr->tab))
		return isl_tab_get_sample_value(cgbr->tab);

	if (use_shifted(cgbr)) {
		struct isl_vec *sample;

		sample = gbr_get_shifted_sample(cgbr);
		/* Either an error or an actual point: we are done. */
		if (!sample || sample->size > 0)
			return sample;

		/* The shifted tableau is empty; try something else. */
		isl_vec_free(sample);
	}

	if (!cgbr->cone) {
		bset = isl_tab_peek_bset(cgbr->tab);
		cgbr->cone = isl_tab_from_recession_cone(bset, 0);
		if (!cgbr->cone)
			return NULL;
		if (isl_tab_track_bset(cgbr->cone,
					isl_basic_set_copy(bset)) < 0)
			return NULL;
	}
	if (isl_tab_detect_implicit_equalities(cgbr->cone) < 0)
		return NULL;

	if (cgbr->cone->n_dead == cgbr->cone->n_col) {
		struct isl_vec *sample;
		struct isl_tab_undo *snap;

		if (cgbr->tab->basis) {
			/* Discard a basis whose size does not match
			 * the current number of variables.
			 */
			if (cgbr->tab->basis->n_col != 1 + cgbr->tab->n_var) {
				isl_mat_free(cgbr->tab->basis);
				cgbr->tab->basis = NULL;
			}
			cgbr->tab->n_zero = 0;
			cgbr->tab->n_unbounded = 0;
		}

		snap = isl_tab_snap(cgbr->tab);

		sample = isl_tab_sample(cgbr->tab);

		/* Undo whatever isl_tab_sample did to the context tableau. */
		if (!sample || isl_tab_rollback(cgbr->tab, snap) < 0) {
			isl_vec_free(sample);
			return NULL;
		}

		return sample;
	}

	/* Only the linear part of the constraints is kept for the cone. */
	cone = isl_basic_set_dup(isl_tab_peek_bset(cgbr->cone));
	cone = drop_constant_terms(cone);
	cone = isl_basic_set_update_from_tab(cone, cgbr->cone);
	cone = isl_basic_set_underlying_set(cone);
	cone = isl_basic_set_gauss(cone, NULL);

	bset = isl_basic_set_dup(isl_tab_peek_bset(cgbr->tab));
	bset = isl_basic_set_update_from_tab(bset, cgbr->tab);
	bset = isl_basic_set_underlying_set(bset);
	bset = isl_basic_set_gauss(bset, NULL);

	return isl_basic_set_sample_with_cone(bset, cone);
}
3061
check_gbr_integer_feasible(struct isl_context_gbr * cgbr)3062 static void check_gbr_integer_feasible(struct isl_context_gbr *cgbr)
3063 {
3064 struct isl_vec *sample;
3065
3066 if (!cgbr->tab)
3067 return;
3068
3069 if (cgbr->tab->empty)
3070 return;
3071
3072 sample = gbr_get_sample(cgbr);
3073 if (!sample)
3074 goto error;
3075
3076 if (sample->size == 0) {
3077 isl_vec_free(sample);
3078 if (isl_tab_mark_empty(cgbr->tab) < 0)
3079 goto error;
3080 return;
3081 }
3082
3083 if (isl_tab_add_sample(cgbr->tab, sample) < 0)
3084 goto error;
3085
3086 return;
3087 error:
3088 isl_tab_free(cgbr->tab);
3089 cgbr->tab = NULL;
3090 }
3091
/* Add the equality "eq" to "tab", after making sure there is room
 * for two extra constraints.
 * Return the updated tableau.
 * On error, "tab" is freed and NULL is returned.
 * A NULL "tab" is passed through as NULL.
 */
static struct isl_tab *add_gbr_eq(struct isl_tab *tab, isl_int *eq)
{
	if (!tab)
		return NULL;

	if (isl_tab_extend_cons(tab, 2) < 0 || isl_tab_add_eq(tab, eq) < 0) {
		isl_tab_free(tab);
		return NULL;
	}

	return tab;
}
3108
3109 /* Add the equality described by "eq" to the context.
3110 * If "check" is set, then we check if the context is empty after
3111 * adding the equality.
3112 * If "update" is set, then we check if the samples are still valid.
3113 *
3114 * We do not explicitly add shifted copies of the equality to
3115 * cgbr->shifted since they would conflict with each other.
3116 * Instead, we directly mark cgbr->shifted empty.
3117 */
context_gbr_add_eq(struct isl_context * context,isl_int * eq,int check,int update)3118 static void context_gbr_add_eq(struct isl_context *context, isl_int *eq,
3119 int check, int update)
3120 {
3121 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
3122
3123 cgbr->tab = add_gbr_eq(cgbr->tab, eq);
3124
3125 if (cgbr->shifted && !cgbr->shifted->empty && use_shifted(cgbr)) {
3126 if (isl_tab_mark_empty(cgbr->shifted) < 0)
3127 goto error;
3128 }
3129
3130 if (cgbr->cone && cgbr->cone->n_col != cgbr->cone->n_dead) {
3131 if (isl_tab_extend_cons(cgbr->cone, 2) < 0)
3132 goto error;
3133 if (isl_tab_add_eq(cgbr->cone, eq) < 0)
3134 goto error;
3135 }
3136
3137 if (check) {
3138 int v = tab_has_valid_sample(cgbr->tab, eq, 1);
3139 if (v < 0)
3140 goto error;
3141 if (!v)
3142 check_gbr_integer_feasible(cgbr);
3143 }
3144 if (update)
3145 cgbr->tab = check_samples(cgbr->tab, eq, 1);
3146 return;
3147 error:
3148 isl_tab_free(cgbr->tab);
3149 cgbr->tab = NULL;
3150 }
3151
/* Add the inequality "ineq" to the tableaus of "cgbr".
 *
 * The inequality is added to the main context tableau.
 * If the "shifted" tableau exists, is not empty and can be used
 * (see use_shifted), then a copy of the inequality with its constant
 * term shifted by the sum of the negative coefficients is added to it.
 * If the "cone" tableau exists and still has live columns,
 * then the inequality is added to it as well.
 *
 * The shift is applied to "ineq" in place.  It is undone again
 * before the outcome of the addition to the shifted tableau is examined,
 * so that the caller gets its constraint back unmodified
 * even if that addition fails.
 *
 * Nothing is done if the context tableau is missing.
 * On error, the context tableau is freed and cgbr->tab is set to NULL.
 */
static void add_gbr_ineq(struct isl_context_gbr *cgbr, isl_int *ineq)
{
	if (!cgbr->tab)
		return;

	if (isl_tab_extend_cons(cgbr->tab, 1) < 0)
		goto error;

	if (isl_tab_add_ineq(cgbr->tab, ineq) < 0)
		goto error;

	if (cgbr->shifted && !cgbr->shifted->empty && use_shifted(cgbr)) {
		int i;
		int added;
		isl_size dim;

		dim = isl_basic_map_dim(cgbr->tab->bmap, isl_dim_all);
		if (dim < 0)
			goto error;

		if (isl_tab_extend_cons(cgbr->shifted, 1) < 0)
			goto error;

		/* Shift the constant term. */
		for (i = 0; i < dim; ++i) {
			if (!isl_int_is_neg(ineq[1 + i]))
				continue;
			isl_int_add(ineq[0], ineq[0], ineq[1 + i]);
		}

		added = isl_tab_add_ineq(cgbr->shifted, ineq);

		/* Undo the shift, regardless of the outcome. */
		for (i = 0; i < dim; ++i) {
			if (!isl_int_is_neg(ineq[1 + i]))
				continue;
			isl_int_sub(ineq[0], ineq[0], ineq[1 + i]);
		}

		if (added < 0)
			goto error;
	}

	if (cgbr->cone && cgbr->cone->n_col != cgbr->cone->n_dead) {
		if (isl_tab_extend_cons(cgbr->cone, 1) < 0)
			goto error;
		if (isl_tab_add_ineq(cgbr->cone, ineq) < 0)
			goto error;
	}

	return;
error:
	isl_tab_free(cgbr->tab);
	cgbr->tab = NULL;
}
3201
/* Add the inequality described by "ineq" to the context.
 * If "check" is set, then check whether any of the known samples
 * still satisfies the inequality and, if not, look for a new
 * integer point in the context.
 * If "update" is set, then pass the tableau through check_samples.
 *
 * On error, the context tableau is freed and cgbr->tab is set to NULL.
 */
static void context_gbr_add_ineq(struct isl_context *context, isl_int *ineq,
		int check, int update)
{
	struct isl_context_gbr *gbr = (struct isl_context_gbr *)context;

	add_gbr_ineq(gbr, ineq);
	if (!gbr->tab)
		return;

	if (check) {
		int valid;

		valid = tab_has_valid_sample(gbr->tab, ineq, 0);
		if (valid < 0) {
			isl_tab_free(gbr->tab);
			gbr->tab = NULL;
			return;
		}
		if (valid == 0)
			check_gbr_integer_feasible(gbr);
	}

	if (update)
		gbr->tab = check_samples(gbr->tab, ineq, 0);
}
3225
context_gbr_add_ineq_wrap(void * user,isl_int * ineq)3226 static isl_stat context_gbr_add_ineq_wrap(void *user, isl_int *ineq)
3227 {
3228 struct isl_context *context = (struct isl_context *)user;
3229 context_gbr_add_ineq(context, ineq, 0, 0);
3230 return context->op->is_ok(context) ? isl_stat_ok : isl_stat_error;
3231 }
3232
/* Determine the sign of "ineq" over the context by applying
 * tab_ineq_sign to the context tableau.
 * "strict" is passed on unchanged.
 */
static enum isl_tab_row_sign context_gbr_ineq_sign(struct isl_context *context,
		isl_int *ineq, int strict)
{
	struct isl_context_gbr *gbr = (struct isl_context_gbr *)context;
	enum isl_tab_row_sign sign;

	sign = tab_ineq_sign(gbr->tab, ineq, strict);
	return sign;
}
3239
/* Check whether "ineq" can be added to the tableau without rendering
 * it infeasible.
 *
 * Return 1 if the context still has an integer point after adding "ineq",
 * 0 if it does not and -1 on error.
 *
 * The inequality is only added tentatively.  Snapshots are taken
 * of the main tableau and of the "shifted" and "cone" tableaus
 * (if they exist), the inequality is added, integer feasibility is
 * checked and then all tableaus are rolled back to their snapshots.
 * If there is no snapshot for the "shifted" or "cone" tableau
 * (in particular, if it did not exist before the test), but
 * the tableau exists after the test, then it is freed again.
 */
static int context_gbr_test_ineq(struct isl_context *context, isl_int *ineq)
{
	struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
	struct isl_tab_undo *snap;
	struct isl_tab_undo *shifted_snap = NULL;
	struct isl_tab_undo *cone_snap = NULL;
	int feasible;

	if (!cgbr->tab)
		return -1;

	/* Make room for the extra constraint before taking the snapshot. */
	if (isl_tab_extend_cons(cgbr->tab, 1) < 0)
		return -1;

	snap = isl_tab_snap(cgbr->tab);
	if (cgbr->shifted)
		shifted_snap = isl_tab_snap(cgbr->shifted);
	if (cgbr->cone)
		cone_snap = isl_tab_snap(cgbr->cone);
	add_gbr_ineq(cgbr, ineq);
	check_gbr_integer_feasible(cgbr);
	/* Both calls above signal failure by clearing cgbr->tab. */
	if (!cgbr->tab)
		return -1;
	feasible = !cgbr->tab->empty;
	if (isl_tab_rollback(cgbr->tab, snap) < 0)
		return -1;
	if (shifted_snap) {
		if (isl_tab_rollback(cgbr->shifted, shifted_snap))
			return -1;
	} else if (cgbr->shifted) {
		isl_tab_free(cgbr->shifted);
		cgbr->shifted = NULL;
	}
	if (cone_snap) {
		if (isl_tab_rollback(cgbr->cone, cone_snap))
			return -1;
	} else if (cgbr->cone) {
		isl_tab_free(cgbr->cone);
		cgbr->cone = NULL;
	}

	return feasible;
}
3286
3287 /* Return the column of the last of the variables associated to
3288 * a column that has a non-zero coefficient.
3289 * This function is called in a context where only coefficients
3290 * of parameters or divs can be non-zero.
3291 */
last_non_zero_var_col(struct isl_tab * tab,isl_int * p)3292 static int last_non_zero_var_col(struct isl_tab *tab, isl_int *p)
3293 {
3294 int i;
3295 int col;
3296
3297 if (tab->n_var == 0)
3298 return -1;
3299
3300 for (i = tab->n_var - 1; i >= 0; --i) {
3301 if (i >= tab->n_param && i < tab->n_var - tab->n_div)
3302 continue;
3303 if (tab->var[i].is_row)
3304 continue;
3305 col = tab->var[i].index;
3306 if (!isl_int_is_zero(p[col]))
3307 return col;
3308 }
3309
3310 return -1;
3311 }
3312
/* Look through all the recently added equalities in the context
 * to see if we can propagate any of them to the main tableau.
 *
 * The newly added equalities in the context are encoded as pairs
 * of inequalities starting at inequality "first".
 *
 * We tentatively add each of these equalities to the main tableau
 * and if this happens to result in a row with a final coefficient
 * that is one or negative one, we use it to kill a column
 * in the main tableau.  Otherwise, we discard the tentatively
 * added row.
 * This tentative addition of equality constraints turns
 * on the undo facility of the tableau.  Turn it off again
 * at the end, assuming it was turned off to begin with.
 *
 * Return 0 on success and -1 on failure.
 * On failure, the context tableau cgbr->tab is freed and set to NULL.
 */
static int propagate_equalities(struct isl_context_gbr *cgbr,
	struct isl_tab *tab, unsigned first)
{
	int i;
	struct isl_vec *eq = NULL;
	isl_bool needs_undo;

	needs_undo = isl_tab_need_undo(tab);
	if (needs_undo < 0)
		goto error;
	eq = isl_vec_alloc(tab->mat->ctx, 1 + tab->n_var);
	if (!eq)
		goto error;

	/* One extra row per pair of inequalities. */
	if (isl_tab_extend_cons(tab, (cgbr->tab->bmap->n_ineq - first)/2) < 0)
		goto error;

	/* The coefficients of the variables that are neither parameters
	 * nor divs are zero for every equality; the loop below only
	 * overwrites the other positions of "eq".
	 */
	isl_seq_clr(eq->el + 1 + tab->n_param,
		    tab->n_var - tab->n_param - tab->n_div);
	/* Only consider the first inequality of each pair. */
	for (i = first; i < cgbr->tab->bmap->n_ineq; i += 2) {
		int j;
		int r;
		struct isl_tab_undo *snap;
		snap = isl_tab_snap(tab);

		/* Copy the constant term and the parameter coefficients,
		 * followed by the coefficients of the divs.
		 */
		isl_seq_cpy(eq->el, cgbr->tab->bmap->ineq[i], 1 + tab->n_param);
		isl_seq_cpy(eq->el + 1 + tab->n_var - tab->n_div,
			    cgbr->tab->bmap->ineq[i] + 1 + tab->n_param,
			    tab->n_div);

		r = isl_tab_add_row(tab, eq->el);
		if (r < 0)
			goto error;
		r = tab->con[r].index;
		j = last_non_zero_var_col(tab, tab->mat->row[r] + 2 + tab->M);
		/* Discard the row unless it can be used to eliminate
		 * a live column using a unit coefficient.
		 */
		if (j < 0 || j < tab->n_dead ||
		    !isl_int_is_one(tab->mat->row[r][0]) ||
		    (!isl_int_is_one(tab->mat->row[r][2 + tab->M + j]) &&
		     !isl_int_is_negone(tab->mat->row[r][2 + tab->M + j]))) {
			if (isl_tab_rollback(tab, snap) < 0)
				goto error;
			continue;
		}
		if (isl_tab_pivot(tab, r, j) < 0)
			goto error;
		if (isl_tab_kill_col(tab, j) < 0)
			goto error;

		if (restore_lexmin(tab) < 0)
			goto error;
	}

	if (!needs_undo)
		isl_tab_clear_undo(tab);
	isl_vec_free(eq);

	return 0;
error:
	isl_vec_free(eq);
	isl_tab_free(cgbr->tab);
	cgbr->tab = NULL;
	return -1;
}
3393
context_gbr_detect_equalities(struct isl_context * context,struct isl_tab * tab)3394 static int context_gbr_detect_equalities(struct isl_context *context,
3395 struct isl_tab *tab)
3396 {
3397 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
3398 unsigned n_ineq;
3399
3400 if (!cgbr->cone) {
3401 struct isl_basic_set *bset = isl_tab_peek_bset(cgbr->tab);
3402 cgbr->cone = isl_tab_from_recession_cone(bset, 0);
3403 if (!cgbr->cone)
3404 goto error;
3405 if (isl_tab_track_bset(cgbr->cone,
3406 isl_basic_set_copy(bset)) < 0)
3407 goto error;
3408 }
3409 if (isl_tab_detect_implicit_equalities(cgbr->cone) < 0)
3410 goto error;
3411
3412 n_ineq = cgbr->tab->bmap->n_ineq;
3413 cgbr->tab = isl_tab_detect_equalities(cgbr->tab, cgbr->cone);
3414 if (!cgbr->tab)
3415 return -1;
3416 if (cgbr->tab->bmap->n_ineq > n_ineq &&
3417 propagate_equalities(cgbr, tab, n_ineq) < 0)
3418 return -1;
3419
3420 return 0;
3421 error:
3422 isl_tab_free(cgbr->tab);
3423 cgbr->tab = NULL;
3424 return -1;
3425 }
3426
/* Implementation of the "get_div" operation:
 * simply forward the request to get_div.
 */
static int context_gbr_get_div(struct isl_context *context, struct isl_tab *tab,
		struct isl_vec *div)
{
	int res;

	res = get_div(tab, context, div);
	return res;
}
3432
context_gbr_insert_div(struct isl_context * context,int pos,__isl_keep isl_vec * div)3433 static isl_bool context_gbr_insert_div(struct isl_context *context, int pos,
3434 __isl_keep isl_vec *div)
3435 {
3436 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
3437 if (cgbr->cone) {
3438 int r, o_div;
3439 isl_size n_div;
3440
3441 n_div = isl_basic_map_dim(cgbr->cone->bmap, isl_dim_div);
3442 if (n_div < 0)
3443 return isl_bool_error;
3444 o_div = cgbr->cone->n_var - n_div;
3445
3446 if (isl_tab_extend_cons(cgbr->cone, 3) < 0)
3447 return isl_bool_error;
3448 if (isl_tab_extend_vars(cgbr->cone, 1) < 0)
3449 return isl_bool_error;
3450 if ((r = isl_tab_insert_var(cgbr->cone, pos)) <0)
3451 return isl_bool_error;
3452
3453 cgbr->cone->bmap = isl_basic_map_insert_div(cgbr->cone->bmap,
3454 r - o_div, div);
3455 if (!cgbr->cone->bmap)
3456 return isl_bool_error;
3457 if (isl_tab_push_var(cgbr->cone, isl_tab_undo_bmap_div,
3458 &cgbr->cone->var[r]) < 0)
3459 return isl_bool_error;
3460 }
3461 return context_tab_insert_div(cgbr->tab, pos, div,
3462 context_gbr_add_ineq_wrap, context);
3463 }
3464
context_gbr_best_split(struct isl_context * context,struct isl_tab * tab)3465 static int context_gbr_best_split(struct isl_context *context,
3466 struct isl_tab *tab)
3467 {
3468 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
3469 struct isl_tab_undo *snap;
3470 int r;
3471
3472 snap = isl_tab_snap(cgbr->tab);
3473 r = best_split(tab, cgbr->tab);
3474
3475 if (r >= 0 && isl_tab_rollback(cgbr->tab, snap) < 0)
3476 return -1;
3477
3478 return r;
3479 }
3480
context_gbr_is_empty(struct isl_context * context)3481 static int context_gbr_is_empty(struct isl_context *context)
3482 {
3483 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
3484 if (!cgbr->tab)
3485 return -1;
3486 return cgbr->tab->empty;
3487 }
3488
/* Saved state of a struct isl_context_gbr, as created by context_gbr_save.
 *
 * "tab_snap" is a snapshot of the main context tableau.
 * "shifted_snap" and "cone_snap" are snapshots of the "shifted" and
 * "cone" tableaus, or NULL if the corresponding tableau did not exist
 * when the state was saved.
 */
struct isl_gbr_tab_undo {
	struct isl_tab_undo *tab_snap;
	struct isl_tab_undo *shifted_snap;
	struct isl_tab_undo *cone_snap;
};
3494
context_gbr_save(struct isl_context * context)3495 static void *context_gbr_save(struct isl_context *context)
3496 {
3497 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
3498 struct isl_gbr_tab_undo *snap;
3499
3500 if (!cgbr->tab)
3501 return NULL;
3502
3503 snap = isl_alloc_type(cgbr->tab->mat->ctx, struct isl_gbr_tab_undo);
3504 if (!snap)
3505 return NULL;
3506
3507 snap->tab_snap = isl_tab_snap(cgbr->tab);
3508 if (isl_tab_save_samples(cgbr->tab) < 0)
3509 goto error;
3510
3511 if (cgbr->shifted)
3512 snap->shifted_snap = isl_tab_snap(cgbr->shifted);
3513 else
3514 snap->shifted_snap = NULL;
3515
3516 if (cgbr->cone)
3517 snap->cone_snap = isl_tab_snap(cgbr->cone);
3518 else
3519 snap->cone_snap = NULL;
3520
3521 return snap;
3522 error:
3523 free(snap);
3524 return NULL;
3525 }
3526
context_gbr_restore(struct isl_context * context,void * save)3527 static void context_gbr_restore(struct isl_context *context, void *save)
3528 {
3529 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
3530 struct isl_gbr_tab_undo *snap = (struct isl_gbr_tab_undo *)save;
3531 if (!snap)
3532 goto error;
3533 if (isl_tab_rollback(cgbr->tab, snap->tab_snap) < 0)
3534 goto error;
3535
3536 if (snap->shifted_snap) {
3537 if (isl_tab_rollback(cgbr->shifted, snap->shifted_snap) < 0)
3538 goto error;
3539 } else if (cgbr->shifted) {
3540 isl_tab_free(cgbr->shifted);
3541 cgbr->shifted = NULL;
3542 }
3543
3544 if (snap->cone_snap) {
3545 if (isl_tab_rollback(cgbr->cone, snap->cone_snap) < 0)
3546 goto error;
3547 } else if (cgbr->cone) {
3548 isl_tab_free(cgbr->cone);
3549 cgbr->cone = NULL;
3550 }
3551
3552 free(snap);
3553
3554 return;
3555 error:
3556 free(snap);
3557 isl_tab_free(cgbr->tab);
3558 cgbr->tab = NULL;
3559 }
3560
/* Discard the saved state "save" (created by context_gbr_save)
 * without restoring it.
 */
static void context_gbr_discard(void *save)
{
	struct isl_gbr_tab_undo *state = (struct isl_gbr_tab_undo *)save;

	free(state);
}
3566
context_gbr_is_ok(struct isl_context * context)3567 static int context_gbr_is_ok(struct isl_context *context)
3568 {
3569 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
3570 return !!cgbr->tab;
3571 }
3572
context_gbr_invalidate(struct isl_context * context)3573 static void context_gbr_invalidate(struct isl_context *context)
3574 {
3575 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
3576 isl_tab_free(cgbr->tab);
3577 cgbr->tab = NULL;
3578 }
3579
context_gbr_free(struct isl_context * context)3580 static __isl_null struct isl_context *context_gbr_free(
3581 struct isl_context *context)
3582 {
3583 struct isl_context_gbr *cgbr = (struct isl_context_gbr *)context;
3584 isl_tab_free(cgbr->tab);
3585 isl_tab_free(cgbr->shifted);
3586 isl_tab_free(cgbr->cone);
3587 free(cgbr);
3588
3589 return NULL;
3590 }
3591
/* Operations on a context that is represented by a struct isl_context_gbr.
 * The entries are initialized positionally, so their order needs to match
 * the order of the fields of struct isl_context_op.
 * isl_context_gbr_alloc installs a pointer to this table
 * in the contexts it creates.
 */
struct isl_context_op isl_context_gbr_op = {
	context_gbr_detect_nonnegative_parameters,
	context_gbr_peek_basic_set,
	context_gbr_peek_tab,
	context_gbr_add_eq,
	context_gbr_add_ineq,
	context_gbr_ineq_sign,
	context_gbr_test_ineq,
	context_gbr_get_div,
	context_gbr_insert_div,
	context_gbr_detect_equalities,
	context_gbr_best_split,
	context_gbr_is_empty,
	context_gbr_is_ok,
	context_gbr_save,
	context_gbr_restore,
	context_gbr_discard,
	context_gbr_invalidate,
	context_gbr_free,
};
3612
/* Allocate a context for "dom" that is represented by
 * a struct isl_context_gbr.
 *
 * The context tableau is constructed from "dom" with its samples
 * initialized, while the "shifted" and "cone" tableaus are left
 * to be constructed when they are first needed.
 * The context is then checked for integer feasibility.
 *
 * Return NULL if "dom" is NULL, or if the context or its tableau
 * cannot be allocated.
 * Note that a failure inside check_gbr_integer_feasible does not
 * result in NULL being returned.  It leaves the context without
 * a tableau instead, which is reported by the "is_ok" operation.
 */
static struct isl_context *isl_context_gbr_alloc(__isl_keep isl_basic_set *dom)
{
	struct isl_context_gbr *gbr;

	if (!dom)
		return NULL;

	gbr = isl_calloc_type(dom->ctx, struct isl_context_gbr);
	if (!gbr)
		return NULL;

	gbr->context.op = &isl_context_gbr_op;
	gbr->shifted = NULL;
	gbr->cone = NULL;

	gbr->tab = isl_tab_init_samples(isl_tab_from_basic_set(dom, 1));
	if (!gbr->tab) {
		gbr->context.op->free(&gbr->context);
		return NULL;
	}

	check_gbr_integer_feasible(gbr);

	return &gbr->context;
}
3639
3640 /* Allocate a context corresponding to "dom".
3641 * The representation specific fields are initialized by
3642 * isl_context_lex_alloc or isl_context_gbr_alloc.
3643 * The shared "n_unknown" field is initialized to the number
3644 * of final unknown integer divisions in "dom".
3645 */
isl_context_alloc(__isl_keep isl_basic_set * dom)3646 static struct isl_context *isl_context_alloc(__isl_keep isl_basic_set *dom)
3647 {
3648 struct isl_context *context;
3649 int first;
3650 isl_size n_div;
3651
3652 if (!dom)
3653 return NULL;
3654
3655 if (dom->ctx->opt->context == ISL_CONTEXT_LEXMIN)
3656 context = isl_context_lex_alloc(dom);
3657 else
3658 context = isl_context_gbr_alloc(dom);
3659
3660 if (!context)
3661 return NULL;
3662
3663 first = isl_basic_set_first_unknown_div(dom);
3664 n_div = isl_basic_set_dim(dom, isl_dim_div);
3665 if (first < 0 || n_div < 0)
3666 return context->op->free(context);
3667 context->n_unknown = n_div - first;
3668
3669 return context;
3670 }
3671
3672 /* Initialize some common fields of "sol", which keeps track
3673 * of the solution of an optimization problem on "bmap" over
3674 * the domain "dom".
3675 * If "max" is set, then a maximization problem is being solved, rather than
3676 * a minimization problem, which means that the variables in the
3677 * tableau have value "M - x" rather than "M + x".
3678 */
sol_init(struct isl_sol * sol,__isl_keep isl_basic_map * bmap,__isl_keep isl_basic_set * dom,int max)3679 static isl_stat sol_init(struct isl_sol *sol, __isl_keep isl_basic_map *bmap,
3680 __isl_keep isl_basic_set *dom, int max)
3681 {
3682 sol->rational = ISL_F_ISSET(bmap, ISL_BASIC_MAP_RATIONAL);
3683 sol->dec_level.callback.run = &sol_dec_level_wrap;
3684 sol->dec_level.sol = sol;
3685 sol->max = max;
3686 sol->n_out = isl_basic_map_dim(bmap, isl_dim_out);
3687 sol->space = isl_basic_map_get_space(bmap);
3688
3689 sol->context = isl_context_alloc(dom);
3690 if (sol->n_out < 0 || !sol->space || !sol->context)
3691 return isl_stat_error;
3692
3693 return isl_stat_ok;
3694 }
3695
3696 /* Construct an isl_sol_map structure for accumulating the solution.
3697 * If track_empty is set, then we also keep track of the parts
3698 * of the context where there is no solution.
3699 * If max is set, then we are solving a maximization, rather than
3700 * a minimization problem, which means that the variables in the
3701 * tableau have value "M - x" rather than "M + x".
3702 */
sol_map_init(__isl_keep isl_basic_map * bmap,__isl_take isl_basic_set * dom,int track_empty,int max)3703 static struct isl_sol *sol_map_init(__isl_keep isl_basic_map *bmap,
3704 __isl_take isl_basic_set *dom, int track_empty, int max)
3705 {
3706 struct isl_sol_map *sol_map = NULL;
3707 isl_space *space;
3708
3709 if (!bmap)
3710 goto error;
3711
3712 sol_map = isl_calloc_type(bmap->ctx, struct isl_sol_map);
3713 if (!sol_map)
3714 goto error;
3715
3716 sol_map->sol.free = &sol_map_free;
3717 if (sol_init(&sol_map->sol, bmap, dom, max) < 0)
3718 goto error;
3719 sol_map->sol.add = &sol_map_add_wrap;
3720 sol_map->sol.add_empty = track_empty ? &sol_map_add_empty_wrap : NULL;
3721 space = isl_space_copy(sol_map->sol.space);
3722 sol_map->map = isl_map_alloc_space(space, 1, ISL_MAP_DISJOINT);
3723 if (!sol_map->map)
3724 goto error;
3725
3726 if (track_empty) {
3727 sol_map->empty = isl_set_alloc_space(isl_basic_set_get_space(dom),
3728 1, ISL_SET_DISJOINT);
3729 if (!sol_map->empty)
3730 goto error;
3731 }
3732
3733 isl_basic_set_free(dom);
3734 return &sol_map->sol;
3735 error:
3736 isl_basic_set_free(dom);
3737 sol_free(&sol_map->sol);
3738 return NULL;
3739 }
3740
3741 /* Check whether all coefficients of (non-parameter) variables
3742 * are non-positive, meaning that no pivots can be performed on the row.
3743 */
is_critical(struct isl_tab * tab,int row)3744 static int is_critical(struct isl_tab *tab, int row)
3745 {
3746 int j;
3747 unsigned off = 2 + tab->M;
3748
3749 for (j = tab->n_dead; j < tab->n_col; ++j) {
3750 if (col_is_parameter_var(tab, j))
3751 continue;
3752
3753 if (isl_int_is_pos(tab->mat->row[row][off + j]))
3754 return 0;
3755 }
3756
3757 return 1;
3758 }
3759
3760 /* Check whether the inequality represented by vec is strict over the integers,
3761 * i.e., there are no integer values satisfying the constraint with
3762 * equality. This happens if the gcd of the coefficients is not a divisor
3763 * of the constant term. If so, scale the constraint down by the gcd
3764 * of the coefficients.
3765 */
is_strict(struct isl_vec * vec)3766 static int is_strict(struct isl_vec *vec)
3767 {
3768 isl_int gcd;
3769 int strict = 0;
3770
3771 isl_int_init(gcd);
3772 isl_seq_gcd(vec->el + 1, vec->size - 1, &gcd);
3773 if (!isl_int_is_one(gcd)) {
3774 strict = !isl_int_is_divisible_by(vec->el[0], gcd);
3775 isl_int_fdiv_q(vec->el[0], vec->el[0], gcd);
3776 isl_seq_scale_down(vec->el + 1, vec->el + 1, gcd, vec->size-1);
3777 }
3778 isl_int_clear(gcd);
3779
3780 return strict;
3781 }
3782
/* Determine the sign of the given row of the main tableau.
 * The result is one of
 *	isl_tab_row_pos: always non-negative; no pivot needed
 *	isl_tab_row_neg: always non-positive; pivot
 *	isl_tab_row_any: can be both positive and negative; split
 * or isl_tab_row_unknown in case of error.
 *
 * We first handle some simple cases
 *	- the row sign may be known already
 *	- the row may be obviously non-negative
 *	- the parametric constant may be equal to that of another row
 *	  for which we know the sign.  This sign will be either "pos" or
 *	  "any".  If it had been "neg" then we would have pivoted before.
 *
 * If none of these cases hold, we check the value of the row for each
 * of the currently active samples.  Based on the signs of these values
 * we make an initial determination of the sign of the row.
 *
 *	all zero			->	unk(nown)
 *	all non-negative		->	pos
 *	all non-positive		->	neg
 *	both negative and positive	->	all
 *
 * If we end up with "all" (i.e., isl_tab_row_any), we are done.
 * Otherwise, we perform a check for positive and/or negative
 * values as follows.
 *
 *	samples	       neg	       unk	       pos
 *	<0 ?			    Y        N	    Y        N
 *					    pos    any      pos
 *	>0 ?	     Y      N	 Y     N
 *		    any    neg  any   neg
 *
 * There is no special sign for "zero", because we can usually treat zero
 * as either non-negative or non-positive, whatever works out best.
 * However, if the row is "critical", meaning that pivoting is impossible
 * then we don't want to lump zero with the non-positive case, because
 * then we would lose the solution for those values of the parameters
 * where the value of the row is zero.  Instead, we treat 0 as non-negative
 * ensuring a split if the row can attain both zero and negative values.
 * The same happens when the original constraint was one that could not
 * be satisfied with equality by any integer values of the parameters.
 * In this case, we normalize the constraint, but then a value of zero
 * for the normalized constraint is actually a positive value for the
 * original constraint, so again we need to treat zero as non-negative.
 * In both these cases, we have the following decision tree instead:
 *
 *	all non-negative		->	pos
 *	all negative			->	neg
 *	both negative and non-negative	->	all
 *
 *	samples	       neg	          	       pos
 *	<0 ?			             	    Y        N
 *					           any      pos
 *	>=0 ?	     Y      N
 *		    any    neg
 */
static enum isl_tab_row_sign row_sign(struct isl_tab *tab,
	struct isl_sol *sol, int row)
{
	struct isl_vec *ineq = NULL;
	enum isl_tab_row_sign res = isl_tab_row_unknown;
	int critical;
	int strict;
	int row2;

	if (tab->row_sign[row] != isl_tab_row_unknown)
		return tab->row_sign[row];
	if (is_obviously_nonneg(tab, row))
		return isl_tab_row_pos;
	for (row2 = tab->n_redundant; row2 < tab->n_row; ++row2) {
		if (tab->row_sign[row2] == isl_tab_row_unknown)
			continue;
		if (identical_parameter_line(tab, row, row2))
			return tab->row_sign[row2];
	}

	critical = is_critical(tab, row);

	ineq = get_row_parameter_ineq(tab, row);
	if (!ineq)
		goto error;

	/* Note that is_strict may also scale down "ineq". */
	strict = is_strict(ineq);

	/* Initial determination based on the context. */
	res = sol->context->op->ineq_sign(sol->context, ineq->el,
					  critical || strict);

	if (res == isl_tab_row_unknown || res == isl_tab_row_pos) {
		/* test for negative values */
		int feasible;
		/* Turn "ineq >= 0" into "-ineq - 1 >= 0". */
		isl_seq_neg(ineq->el, ineq->el, ineq->size);
		isl_int_sub_ui(ineq->el[0], ineq->el[0], 1);

		feasible = sol->context->op->test_ineq(sol->context, ineq->el);
		if (feasible < 0)
			goto error;
		if (!feasible)
			res = isl_tab_row_pos;
		else
			res = (res == isl_tab_row_unknown) ? isl_tab_row_neg
							   : isl_tab_row_any;
		if (res == isl_tab_row_neg) {
			/* Recover the original "ineq" for the next test. */
			isl_seq_neg(ineq->el, ineq->el, ineq->size);
			isl_int_sub_ui(ineq->el[0], ineq->el[0], 1);
		}
	}

	if (res == isl_tab_row_neg) {
		/* test for positive values */
		int feasible;
		/* Zero counts as non-negative for critical or strict rows,
		 * so only exclude it in the other cases.
		 */
		if (!critical && !strict)
			isl_int_sub_ui(ineq->el[0], ineq->el[0], 1);

		feasible = sol->context->op->test_ineq(sol->context, ineq->el);
		if (feasible < 0)
			goto error;
		if (feasible)
			res = isl_tab_row_any;
	}

	isl_vec_free(ineq);
	return res;
error:
	isl_vec_free(ineq);
	return isl_tab_row_unknown;
}
3909
/* Forward declaration: find_in_pos (defined next) calls find_solutions,
 * which in turn calls find_in_pos.
 */
static void find_solutions(struct isl_sol *sol, struct isl_tab *tab);
3911
3912 /* Find solutions for values of the parameters that satisfy the given
3913 * inequality.
3914 *
3915 * We currently take a snapshot of the context tableau that is reset
3916 * when we return from this function, while we make a copy of the main
3917 * tableau, leaving the original main tableau untouched.
3918 * These are fairly arbitrary choices. Making a copy also of the context
3919 * tableau would obviate the need to undo any changes made to it later,
3920 * while taking a snapshot of the main tableau could reduce memory usage.
3921 * If we were to switch to taking a snapshot of the main tableau,
3922 * we would have to keep in mind that we need to save the row signs
3923 * and that we need to do this before saving the current basis
 * such that the basis has been restored before we restore the row signs.
3925 */
static void find_in_pos(struct isl_sol *sol, struct isl_tab *tab, isl_int *ineq)
{
	void *saved;

	if (!sol->context)
		goto error;
	saved = sol->context->op->save(sol->context);

	/* Work on a private copy; find_solutions frees the tableau
	 * it is given, while the caller keeps using the original.
	 */
	tab = isl_tab_dup(tab);
	if (!tab) {
		/* The context has not been modified yet, so the snapshot
		 * only needs to be released.  Without this, the snapshot
		 * would never be handed back to the context operations.
		 */
		sol->context->op->discard(saved);
		goto error;
	}

	/* Restrict the context to the part where "ineq" holds. */
	sol->context->op->add_ineq(sol->context, ineq, 0, 1);

	find_solutions(sol, tab);

	/* On success, roll the context back to the snapshot;
	 * on failure, just drop the snapshot.
	 */
	if (!sol->error)
		sol->context->op->restore(sol->context, saved);
	else
		sol->context->op->discard(saved);
	return;
error:
	sol->error = 1;
}
3950
3951 /* Record the absence of solutions for those values of the parameters
3952 * that do not satisfy the given inequality with equality.
3953 */
no_sol_in_strict(struct isl_sol * sol,struct isl_tab * tab,struct isl_vec * ineq)3954 static void no_sol_in_strict(struct isl_sol *sol,
3955 struct isl_tab *tab, struct isl_vec *ineq)
3956 {
3957 int empty;
3958 void *saved;
3959
3960 if (!sol->context || sol->error)
3961 goto error;
3962 saved = sol->context->op->save(sol->context);
3963
3964 isl_int_sub_ui(ineq->el[0], ineq->el[0], 1);
3965
3966 sol->context->op->add_ineq(sol->context, ineq->el, 1, 0);
3967 if (!sol->context)
3968 goto error;
3969
3970 empty = tab->empty;
3971 tab->empty = 1;
3972 sol_add(sol, tab);
3973 tab->empty = empty;
3974
3975 isl_int_add_ui(ineq->el[0], ineq->el[0], 1);
3976
3977 sol->context->op->restore(sol->context, saved);
3978 return;
3979 error:
3980 sol->error = 1;
3981 }
3982
3983 /* Reset all row variables that are marked to have a sign that may
3984 * be both positive and negative to have an unknown sign.
3985 */
reset_any_to_unknown(struct isl_tab * tab)3986 static void reset_any_to_unknown(struct isl_tab *tab)
3987 {
3988 int row;
3989
3990 for (row = tab->n_redundant; row < tab->n_row; ++row) {
3991 if (!isl_tab_var_from_row(tab, row)->is_nonneg)
3992 continue;
3993 if (tab->row_sign[row] == isl_tab_row_any)
3994 tab->row_sign[row] = isl_tab_row_unknown;
3995 }
3996 }
3997
3998 /* Compute the lexicographic minimum of the set represented by the main
3999 * tableau "tab" within the context "sol->context_tab".
4000 * On entry the sample value of the main tableau is lexicographically
4001 * less than or equal to this lexicographic minimum.
4002 * Pivots are performed until a feasible point is found, which is then
4003 * necessarily equal to the minimum, or until the tableau is found to
4004 * be infeasible. Some pivots may need to be performed for only some
4005 * feasible values of the context tableau. If so, the context tableau
4006 * is split into a part where the pivot is needed and a part where it is not.
4007 *
4008 * Whenever we enter the main loop, the main tableau is such that no
4009 * "obvious" pivots need to be performed on it, where "obvious" means
4010 * that the given row can be seen to be negative without looking at
4011 * the context tableau. In particular, for non-parametric problems,
4012 * no pivots need to be performed on the main tableau.
4013 * The caller of find_solutions is responsible for making this property
4014 * hold prior to the first iteration of the loop, while restore_lexmin
4015 * is called before every other iteration.
4016 *
4017 * Inside the main loop, we first examine the signs of the rows of
4018 * the main tableau within the context of the context tableau.
4019 * If we find a row that is always non-positive for all values of
4020 * the parameters satisfying the context tableau and negative for at
4021 * least one value of the parameters, we perform the appropriate pivot
4022 * and start over. An exception is the case where no pivot can be
4023 * performed on the row. In this case, we require that the sign of
4024 * the row is negative for all values of the parameters (rather than just
4025 * non-positive). This special case is handled inside row_sign, which
4026 * will say that the row can have any sign if it determines that it can
4027 * attain both negative and zero values.
4028 *
4029 * If we can't find a row that always requires a pivot, but we can find
4030 * one or more rows that require a pivot for some values of the parameters
4031 * (i.e., the row can attain both positive and negative signs), then we split
4032 * the context tableau into two parts, one where we force the sign to be
 * non-negative and one where we force it to be negative.
4034 * The non-negative part is handled by a recursive call (through find_in_pos).
4035 * Upon returning from this call, we continue with the negative part and
4036 * perform the required pivot.
4037 *
4038 * If no such rows can be found, all rows are non-negative and we have
4039 * found a (rational) feasible point. If we only wanted a rational point
4040 * then we are done.
4041 * Otherwise, we check if all values of the sample point of the tableau
4042 * are integral for the variables. If so, we have found the minimal
4043 * integral point and we are done.
4044 * If the sample point is not integral, then we need to make a distinction
4045 * based on whether the constant term is non-integral or the coefficients
4046 * of the parameters. Furthermore, in order to decide how to handle
4047 * the non-integrality, we also need to know whether the coefficients
4048 * of the other columns in the tableau are integral. This leads
4049 * to the following table. The first two rows do not correspond
4050 * to a non-integral sample point and are only mentioned for completeness.
4051 *
4052 * constant parameters other
4053 *
4054 * int int int |
4055 * int int rat | -> no problem
4056 *
4057 * rat int int -> fail
4058 *
4059 * rat int rat -> cut
4060 *
4061 * int rat rat |
4062 * rat rat rat | -> parametric cut
4063 *
4064 * int rat int |
4065 * rat rat int | -> split context
4066 *
4067 * If the parametric constant is completely integral, then there is nothing
4068 * to be done. If the constant term is non-integral, but all the other
 * coefficients are integral, then there is nothing that can be done
4070 * and the tableau has no integral solution.
4071 * If, on the other hand, one or more of the other columns have rational
4072 * coefficients, but the parameter coefficients are all integral, then
4073 * we can perform a regular (non-parametric) cut.
4074 * Finally, if there is any parameter coefficient that is non-integral,
4075 * then we need to involve the context tableau. There are two cases here.
4076 * If at least one other column has a rational coefficient, then we
4077 * can perform a parametric cut in the main tableau by adding a new
4078 * integer division in the context tableau.
4079 * If all other columns have integral coefficients, then we need to
4080 * enforce that the rational combination of parameters (c + \sum a_i y_i)/m
4081 * is always integral. We do this by introducing an integer division
4082 * q = floor((c + \sum a_i y_i)/m) and stipulating that its argument should
4083 * always be integral in the context tableau, i.e., m q = c + \sum a_i y_i.
4084 * Since q is expressed in the tableau as
4085 * c + \sum a_i y_i - m q >= 0
4086 * -c - \sum a_i y_i + m q + m - 1 >= 0
4087 * it is sufficient to add the inequality
4088 * -c - \sum a_i y_i + m q >= 0
4089 * In the part of the context where this inequality does not hold, the
4090 * main tableau is marked as being empty.
4091 */
find_solutions(struct isl_sol * sol,struct isl_tab * tab)4092 static void find_solutions(struct isl_sol *sol, struct isl_tab *tab)
4093 {
4094 struct isl_context *context;
4095 int r;
4096
4097 if (!tab || sol->error)
4098 goto error;
4099
4100 context = sol->context;
4101
4102 if (tab->empty)
4103 goto done;
4104 if (context->op->is_empty(context))
4105 goto done;
4106
4107 for (r = 0; r >= 0 && tab && !tab->empty; r = restore_lexmin(tab)) {
4108 int flags;
4109 int row;
4110 enum isl_tab_row_sign sgn;
4111 int split = -1;
4112 int n_split = 0;
4113
4114 for (row = tab->n_redundant; row < tab->n_row; ++row) {
4115 if (!isl_tab_var_from_row(tab, row)->is_nonneg)
4116 continue;
4117 sgn = row_sign(tab, sol, row);
4118 if (!sgn)
4119 goto error;
4120 tab->row_sign[row] = sgn;
4121 if (sgn == isl_tab_row_any)
4122 n_split++;
4123 if (sgn == isl_tab_row_any && split == -1)
4124 split = row;
4125 if (sgn == isl_tab_row_neg)
4126 break;
4127 }
4128 if (row < tab->n_row)
4129 continue;
4130 if (split != -1) {
4131 struct isl_vec *ineq;
4132 if (n_split != 1)
4133 split = context->op->best_split(context, tab);
4134 if (split < 0)
4135 goto error;
4136 ineq = get_row_parameter_ineq(tab, split);
4137 if (!ineq)
4138 goto error;
4139 is_strict(ineq);
4140 reset_any_to_unknown(tab);
4141 tab->row_sign[split] = isl_tab_row_pos;
4142 sol_inc_level(sol);
4143 find_in_pos(sol, tab, ineq->el);
4144 tab->row_sign[split] = isl_tab_row_neg;
4145 isl_seq_neg(ineq->el, ineq->el, ineq->size);
4146 isl_int_sub_ui(ineq->el[0], ineq->el[0], 1);
4147 if (!sol->error)
4148 context->op->add_ineq(context, ineq->el, 0, 1);
4149 isl_vec_free(ineq);
4150 if (sol->error)
4151 goto error;
4152 continue;
4153 }
4154 if (tab->rational)
4155 break;
4156 row = first_non_integer_row(tab, &flags);
4157 if (row < 0)
4158 break;
4159 if (ISL_FL_ISSET(flags, I_PAR)) {
4160 if (ISL_FL_ISSET(flags, I_VAR)) {
4161 if (isl_tab_mark_empty(tab) < 0)
4162 goto error;
4163 break;
4164 }
4165 row = add_cut(tab, row);
4166 } else if (ISL_FL_ISSET(flags, I_VAR)) {
4167 struct isl_vec *div;
4168 struct isl_vec *ineq;
4169 int d;
4170 div = get_row_split_div(tab, row);
4171 if (!div)
4172 goto error;
4173 d = context->op->get_div(context, tab, div);
4174 isl_vec_free(div);
4175 if (d < 0)
4176 goto error;
4177 ineq = ineq_for_div(context->op->peek_basic_set(context), d);
4178 if (!ineq)
4179 goto error;
4180 sol_inc_level(sol);
4181 no_sol_in_strict(sol, tab, ineq);
4182 isl_seq_neg(ineq->el, ineq->el, ineq->size);
4183 context->op->add_ineq(context, ineq->el, 1, 1);
4184 isl_vec_free(ineq);
4185 if (sol->error || !context->op->is_ok(context))
4186 goto error;
4187 tab = set_row_cst_to_div(tab, row, d);
4188 if (context->op->is_empty(context))
4189 break;
4190 } else
4191 row = add_parametric_cut(tab, row, context);
4192 if (row < 0)
4193 goto error;
4194 }
4195 if (r < 0)
4196 goto error;
4197 done:
4198 sol_add(sol, tab);
4199 isl_tab_free(tab);
4200 return;
4201 error:
4202 isl_tab_free(tab);
4203 sol->error = 1;
4204 }
4205
4206 /* Does "sol" contain a pair of partial solutions that could potentially
4207 * be merged?
4208 *
4209 * We currently only check that "sol" is not in an error state
4210 * and that there are at least two partial solutions of which the final two
4211 * are defined at the same level.
4212 */
sol_has_mergeable_solutions(struct isl_sol * sol)4213 static int sol_has_mergeable_solutions(struct isl_sol *sol)
4214 {
4215 if (sol->error)
4216 return 0;
4217 if (!sol->partial)
4218 return 0;
4219 if (!sol->partial->next)
4220 return 0;
4221 return sol->partial->level == sol->partial->next->level;
4222 }
4223
4224 /* Compute the lexicographic minimum of the set represented by the main
4225 * tableau "tab" within the context "sol->context_tab".
4226 *
4227 * As a preprocessing step, we first transfer all the purely parametric
4228 * equalities from the main tableau to the context tableau, i.e.,
4229 * parameters that have been pivoted to a row.
4230 * These equalities are ignored by the main algorithm, because the
4231 * corresponding rows may not be marked as being non-negative.
4232 * In parts of the context where the added equality does not hold,
4233 * the main tableau is marked as being empty.
4234 *
4235 * Before we embark on the actual computation, we save a copy
4236 * of the context. When we return, we check if there are any
4237 * partial solutions that can potentially be merged. If so,
4238 * we perform a rollback to the initial state of the context.
4239 * The merging of partial solutions happens inside calls to
4240 * sol_dec_level that are pushed onto the undo stack of the context.
4241 * If there are no partial solutions that can potentially be merged
4242 * then the rollback is skipped as it would just be wasted effort.
4243 */
find_solutions_main(struct isl_sol * sol,struct isl_tab * tab)4244 static void find_solutions_main(struct isl_sol *sol, struct isl_tab *tab)
4245 {
4246 int row;
4247 void *saved;
4248
4249 if (!tab)
4250 goto error;
4251
4252 sol->level = 0;
4253
4254 for (row = tab->n_redundant; row < tab->n_row; ++row) {
4255 int p;
4256 struct isl_vec *eq;
4257
4258 if (!row_is_parameter_var(tab, row))
4259 continue;
4260 if (tab->row_var[row] < tab->n_param)
4261 p = tab->row_var[row];
4262 else
4263 p = tab->row_var[row]
4264 + tab->n_param - (tab->n_var - tab->n_div);
4265
4266 eq = isl_vec_alloc(tab->mat->ctx, 1+tab->n_param+tab->n_div);
4267 if (!eq)
4268 goto error;
4269 get_row_parameter_line(tab, row, eq->el);
4270 isl_int_neg(eq->el[1 + p], tab->mat->row[row][0]);
4271 eq = isl_vec_normalize(eq);
4272
4273 sol_inc_level(sol);
4274 no_sol_in_strict(sol, tab, eq);
4275
4276 isl_seq_neg(eq->el, eq->el, eq->size);
4277 sol_inc_level(sol);
4278 no_sol_in_strict(sol, tab, eq);
4279 isl_seq_neg(eq->el, eq->el, eq->size);
4280
4281 sol->context->op->add_eq(sol->context, eq->el, 1, 1);
4282
4283 isl_vec_free(eq);
4284
4285 if (isl_tab_mark_redundant(tab, row) < 0)
4286 goto error;
4287
4288 if (sol->context->op->is_empty(sol->context))
4289 break;
4290
4291 row = tab->n_redundant - 1;
4292 }
4293
4294 saved = sol->context->op->save(sol->context);
4295
4296 find_solutions(sol, tab);
4297
4298 if (sol_has_mergeable_solutions(sol))
4299 sol->context->op->restore(sol->context, saved);
4300 else
4301 sol->context->op->discard(saved);
4302
4303 sol->level = 0;
4304 sol_pop(sol);
4305
4306 return;
4307 error:
4308 isl_tab_free(tab);
4309 sol->error = 1;
4310 }
4311
4312 /* Check if integer division "div" of "dom" also occurs in "bmap".
4313 * If so, return its position within the divs.
4314 * Otherwise, return a position beyond the integer divisions.
4315 */
static int find_context_div(__isl_keep isl_basic_map *bmap,
	__isl_keep isl_basic_set *dom, unsigned div)
{
	isl_size bmap_off, dom_off;
	isl_size n_bmap_div;
	isl_int *dom_div;
	int pos;

	bmap_off = isl_basic_map_var_offset(bmap, isl_dim_div);
	dom_off = isl_basic_set_var_offset(dom, isl_dim_div);
	n_bmap_div = isl_basic_map_dim(bmap, isl_dim_div);
	if (bmap_off < 0 || dom_off < 0 || n_bmap_div < 0)
		return -1;

	dom_div = dom->div[div];

	/* A div with a zero denominator, or one that involves other
	 * divs of "dom", is reported as not occurring in "bmap".
	 */
	if (isl_int_is_zero(dom_div[0]) ||
	    isl_seq_first_non_zero(dom_div + 2 + dom_off, dom->n_div) != -1)
		return n_bmap_div;

	for (pos = 0; pos < n_bmap_div; ++pos) {
		isl_int *cand = bmap->div[pos];

		if (isl_int_is_zero(cand[0]))
			continue;
		/* The candidate may only involve the variables
		 * that precede the divs of "dom".
		 */
		if (isl_seq_first_non_zero(cand + 2 + dom_off,
				(bmap_off - dom_off) + n_bmap_div) != -1)
			continue;
		if (isl_seq_eq(cand, dom_div, 2 + dom_off))
			return pos;
	}
	return n_bmap_div;
}
4346
4347 /* The correspondence between the variables in the main tableau,
4348 * the context tableau, and the input map and domain is as follows.
4349 * The first n_param and the last n_div variables of the main tableau
4350 * form the variables of the context tableau.
4351 * In the basic map, these n_param variables correspond to the
4352 * parameters and the input dimensions. In the domain, they correspond
4353 * to the parameters and the set dimensions.
4354 * The n_div variables correspond to the integer divisions in the domain.
4355 * To ensure that everything lines up, we may need to copy some of the
4356 * integer divisions of the domain to the map. These have to be placed
4357 * in the same order as those in the context and they have to be placed
4358 * after any other integer divisions that the map may have.
4359 * This function performs the required reordering.
4360 */
align_context_divs(__isl_take isl_basic_map * bmap,__isl_keep isl_basic_set * dom)4361 static __isl_give isl_basic_map *align_context_divs(
4362 __isl_take isl_basic_map *bmap, __isl_keep isl_basic_set *dom)
4363 {
4364 int i;
4365 int common = 0;
4366 int other;
4367 unsigned bmap_n_div;
4368
4369 bmap_n_div = isl_basic_map_dim(bmap, isl_dim_div);
4370
4371 for (i = 0; i < dom->n_div; ++i) {
4372 int pos;
4373
4374 pos = find_context_div(bmap, dom, i);
4375 if (pos < 0)
4376 return isl_basic_map_free(bmap);
4377 if (pos < bmap_n_div)
4378 common++;
4379 }
4380 other = bmap_n_div - common;
4381 if (dom->n_div - common > 0) {
4382 bmap = isl_basic_map_extend(bmap, dom->n_div - common, 0, 0);
4383 if (!bmap)
4384 return NULL;
4385 }
4386 for (i = 0; i < dom->n_div; ++i) {
4387 int pos = find_context_div(bmap, dom, i);
4388 if (pos < 0)
4389 bmap = isl_basic_map_free(bmap);
4390 if (pos >= bmap_n_div) {
4391 pos = isl_basic_map_alloc_div(bmap);
4392 if (pos < 0)
4393 goto error;
4394 isl_int_set_si(bmap->div[pos][0], 0);
4395 bmap_n_div++;
4396 }
4397 if (pos != other + i)
4398 bmap = isl_basic_map_swap_div(bmap, pos, other + i);
4399 }
4400 return bmap;
4401 error:
4402 isl_basic_map_free(bmap);
4403 return NULL;
4404 }
4405
4406 /* Base case of isl_tab_basic_map_partial_lexopt, after removing
4407 * some obvious symmetries.
4408 *
4409 * We make sure the divs in the domain are properly ordered,
4410 * because they will be added one by one in the given order
4411 * during the construction of the solution map.
4412 * Furthermore, make sure that the known integer divisions
4413 * appear before any unknown integer division because the solution
4414 * may depend on the known integer divisions, while anything that
4415 * depends on any variable starting from the first unknown integer
4416 * division is ignored in sol_pma_add.
4417 */
static struct isl_sol *basic_map_partial_lexopt_base_sol(
	__isl_take isl_basic_map *bmap, __isl_take isl_basic_set *dom,
	__isl_give isl_set **empty, int max,
	struct isl_sol *(*init)(__isl_keep isl_basic_map *bmap,
		__isl_take isl_basic_set *dom, int track_empty, int max))
{
	struct isl_sol *sol = NULL;
	struct isl_context *context;

	/* Sort the divs of the domain and line up those of "bmap". */
	if (dom->n_div) {
		dom = isl_basic_set_sort_divs(dom);
		bmap = align_context_divs(bmap, dom);
	}
	/* The empty part is tracked only if the caller asked for it. */
	sol = init(bmap, dom, !!empty, max);
	if (!sol)
		goto error;

	context = sol->context;
	if (!isl_basic_set_plain_is_empty(
				context->op->peek_basic_set(context))) {
		if (!isl_basic_map_plain_is_empty(bmap)) {
			struct isl_tab *tab;

			tab = tab_for_lexmin(bmap,
				context->op->peek_basic_set(context), 1, max);
			tab = context->op->detect_nonnegative_parameters(
								context, tab);
			find_solutions_main(sol, tab);
		} else if (sol->add_empty) {
			/* No solutions at all: the entire context is empty. */
			sol->add_empty(sol,
			    isl_basic_set_copy(
				context->op->peek_basic_set(context)));
		}
	}
	if (sol->error)
		goto error;

	isl_basic_map_free(bmap);
	return sol;
error:
	sol_free(sol);
	isl_basic_map_free(bmap);
	return NULL;
}
4459
4460 /* Base case of isl_tab_basic_map_partial_lexopt, after removing
4461 * some obvious symmetries.
4462 *
4463 * We call basic_map_partial_lexopt_base_sol and extract the results.
4464 */
basic_map_partial_lexopt_base(__isl_take isl_basic_map * bmap,__isl_take isl_basic_set * dom,__isl_give isl_set ** empty,int max)4465 static __isl_give isl_map *basic_map_partial_lexopt_base(
4466 __isl_take isl_basic_map *bmap, __isl_take isl_basic_set *dom,
4467 __isl_give isl_set **empty, int max)
4468 {
4469 isl_map *result = NULL;
4470 struct isl_sol *sol;
4471 struct isl_sol_map *sol_map;
4472
4473 sol = basic_map_partial_lexopt_base_sol(bmap, dom, empty, max,
4474 &sol_map_init);
4475 if (!sol)
4476 return NULL;
4477 sol_map = (struct isl_sol_map *) sol;
4478
4479 result = isl_map_copy(sol_map->map);
4480 if (empty)
4481 *empty = isl_set_copy(sol_map->empty);
4482 sol_free(&sol_map->sol);
4483 return result;
4484 }
4485
4486 /* Return a count of the number of occurrences of the "n" first
4487 * variables in the inequality constraints of "bmap".
4488 */
count_occurrences(__isl_keep isl_basic_map * bmap,int n)4489 static __isl_give int *count_occurrences(__isl_keep isl_basic_map *bmap,
4490 int n)
4491 {
4492 int i, j;
4493 isl_ctx *ctx;
4494 int *occurrences;
4495
4496 if (!bmap)
4497 return NULL;
4498 ctx = isl_basic_map_get_ctx(bmap);
4499 occurrences = isl_calloc_array(ctx, int, n);
4500 if (!occurrences)
4501 return NULL;
4502
4503 for (i = 0; i < bmap->n_ineq; ++i) {
4504 for (j = 0; j < n; ++j) {
4505 if (!isl_int_is_zero(bmap->ineq[i][1 + j]))
4506 occurrences[j]++;
4507 }
4508 }
4509
4510 return occurrences;
4511 }
4512
4513 /* Do all of the "n" variables with non-zero coefficients in "c"
4514 * occur in exactly a single constraint.
4515 * "occurrences" is an array of length "n" containing the number
4516 * of occurrences of each of the variables in the inequality constraints.
4517 */
static int single_occurrence(int n, isl_int *c, int *occurrences)
{
	int var = 0;

	/* Fail on the first variable that is used in "c" but
	 * whose occurrence count differs from one.
	 */
	while (var < n) {
		if (!isl_int_is_zero(c[var]) && occurrences[var] != 1)
			return 0;
		++var;
	}

	return 1;
}
4531
4532 /* Do all of the "n" initial variables that occur in inequality constraint
4533 * "ineq" of "bmap" only occur in that constraint?
4534 */
static int all_single_occurrence(__isl_keep isl_basic_map *bmap, int ineq,
	int n)
{
	int var, other;

	for (var = 0; var < n; ++var) {
		/* Variables that "ineq" does not involve are irrelevant. */
		if (isl_int_is_zero(bmap->ineq[ineq][1 + var]))
			continue;
		/* No other inequality may involve this variable. */
		for (other = 0; other < bmap->n_ineq; ++other)
			if (other != ineq &&
			    !isl_int_is_zero(bmap->ineq[other][1 + var]))
				return 0;
	}

	return 1;
}
4553
4554 /* Structure used during detection of parallel constraints.
4555 * n_in: number of "input" variables: isl_dim_param + isl_dim_in
4556 * n_out: number of "output" variables: isl_dim_out + isl_dim_div
4557 * val: the coefficients of the output variables
4558 */
/* Passed as the "val" argument to constraint_equal during hash table
 * lookups in parallel_constraints.
 */
struct isl_constraint_equal_info {
	/* number of coefficients (after the constant term) to skip */
	unsigned n_in;
	/* number of coefficients compared, starting at "val" */
	unsigned n_out;
	/* first output coefficient of the constraint being looked up */
	isl_int *val;
};
4564
4565 /* Check whether the coefficients of the output variables
4566 * of the constraint in "entry" are equal to info->val.
4567 */
constraint_equal(const void * entry,const void * val)4568 static isl_bool constraint_equal(const void *entry, const void *val)
4569 {
4570 isl_int **row = (isl_int **)entry;
4571 const struct isl_constraint_equal_info *info = val;
4572 int eq;
4573
4574 eq = isl_seq_eq((*row) + 1 + info->n_in, info->val, info->n_out);
4575 return isl_bool_ok(eq);
4576 }
4577
4578 /* Check whether "bmap" has a pair of constraints that have
4579 * the same coefficients for the output variables.
4580 * Note that the coefficients of the existentially quantified
4581 * variables need to be zero since the existentially quantified
 * variables of the result are usually not the same as those of the input.
4583 * Furthermore, check that each of the input variables that occur
4584 * in those constraints does not occur in any other constraint.
4585 * If so, return true and return the row indices of the two constraints
4586 * in *first and *second.
4587 */
parallel_constraints(__isl_keep isl_basic_map * bmap,int * first,int * second)4588 static isl_bool parallel_constraints(__isl_keep isl_basic_map *bmap,
4589 int *first, int *second)
4590 {
4591 int i;
4592 isl_ctx *ctx;
4593 int *occurrences = NULL;
4594 struct isl_hash_table *table = NULL;
4595 struct isl_hash_table_entry *entry;
4596 struct isl_constraint_equal_info info;
4597 isl_size nparam, n_in, n_out, n_div;
4598
4599 ctx = isl_basic_map_get_ctx(bmap);
4600 table = isl_hash_table_alloc(ctx, bmap->n_ineq);
4601 if (!table)
4602 goto error;
4603
4604 nparam = isl_basic_map_dim(bmap, isl_dim_param);
4605 n_in = isl_basic_map_dim(bmap, isl_dim_in);
4606 n_out = isl_basic_map_dim(bmap, isl_dim_out);
4607 n_div = isl_basic_map_dim(bmap, isl_dim_div);
4608 if (nparam < 0 || n_in < 0 || n_out < 0 || n_div < 0)
4609 goto error;
4610 info.n_in = nparam + n_in;
4611 occurrences = count_occurrences(bmap, info.n_in);
4612 if (info.n_in && !occurrences)
4613 goto error;
4614 info.n_out = n_out + n_div;
4615 for (i = 0; i < bmap->n_ineq; ++i) {
4616 uint32_t hash;
4617
4618 info.val = bmap->ineq[i] + 1 + info.n_in;
4619 if (isl_seq_first_non_zero(info.val, n_out) < 0)
4620 continue;
4621 if (isl_seq_first_non_zero(info.val + n_out, n_div) >= 0)
4622 continue;
4623 if (!single_occurrence(info.n_in, bmap->ineq[i] + 1,
4624 occurrences))
4625 continue;
4626 hash = isl_seq_get_hash(info.val, info.n_out);
4627 entry = isl_hash_table_find(ctx, table, hash,
4628 constraint_equal, &info, 1);
4629 if (!entry)
4630 goto error;
4631 if (entry->data)
4632 break;
4633 entry->data = &bmap->ineq[i];
4634 }
4635
4636 if (i < bmap->n_ineq) {
4637 *first = ((isl_int **)entry->data) - bmap->ineq;
4638 *second = i;
4639 }
4640
4641 isl_hash_table_free(ctx, table);
4642 free(occurrences);
4643
4644 return isl_bool_ok(i < bmap->n_ineq);
4645 error:
4646 isl_hash_table_free(ctx, table);
4647 free(occurrences);
4648 return isl_bool_error;
4649 }
4650
4651 /* Given a set of upper bounds in "var", add constraints to "bset"
4652 * that make the i-th bound smallest.
4653 *
4654 * In particular, if there are n bounds b_i, then add the constraints
4655 *
4656 * b_i <= b_j for j > i
4657 * b_i < b_j for j < i
4658 */
select_minimum(__isl_take isl_basic_set * bset,__isl_keep isl_mat * var,int i)4659 static __isl_give isl_basic_set *select_minimum(__isl_take isl_basic_set *bset,
4660 __isl_keep isl_mat *var, int i)
4661 {
4662 isl_ctx *ctx;
4663 int j, k;
4664
4665 ctx = isl_mat_get_ctx(var);
4666
4667 for (j = 0; j < var->n_row; ++j) {
4668 if (j == i)
4669 continue;
4670 k = isl_basic_set_alloc_inequality(bset);
4671 if (k < 0)
4672 goto error;
4673 isl_seq_combine(bset->ineq[k], ctx->one, var->row[j],
4674 ctx->negone, var->row[i], var->n_col);
4675 isl_int_set_si(bset->ineq[k][var->n_col], 0);
4676 if (j < i)
4677 isl_int_sub_ui(bset->ineq[k][0], bset->ineq[k][0], 1);
4678 }
4679
4680 bset = isl_basic_set_finalize(bset);
4681
4682 return bset;
4683 error:
4684 isl_basic_set_free(bset);
4685 return NULL;
4686 }
4687
4688 /* Given a set of upper bounds on the last "input" variable m,
4689 * construct a set that assigns the minimal upper bound to m, i.e.,
4690 * construct a set that divides the space into cells where one
4691 * of the upper bounds is smaller than all the others and assign
4692 * this upper bound to m.
4693 *
4694 * In particular, if there are n bounds b_i, then the result
4695 * consists of n basic sets, each one of the form
4696 *
4697 * m = b_i
4698 * b_i <= b_j for j > i
4699 * b_i < b_j for j < i
4700 */
set_minimum(__isl_take isl_space * space,__isl_take isl_mat * var)4701 static __isl_give isl_set *set_minimum(__isl_take isl_space *space,
4702 __isl_take isl_mat *var)
4703 {
4704 int i, k;
4705 isl_basic_set *bset = NULL;
4706 isl_set *set = NULL;
4707
4708 if (!space || !var)
4709 goto error;
4710
4711 set = isl_set_alloc_space(isl_space_copy(space),
4712 var->n_row, ISL_SET_DISJOINT);
4713
4714 for (i = 0; i < var->n_row; ++i) {
4715 bset = isl_basic_set_alloc_space(isl_space_copy(space), 0,
4716 1, var->n_row - 1);
4717 k = isl_basic_set_alloc_equality(bset);
4718 if (k < 0)
4719 goto error;
4720 isl_seq_cpy(bset->eq[k], var->row[i], var->n_col);
4721 isl_int_set_si(bset->eq[k][var->n_col], -1);
4722 bset = select_minimum(bset, var, i);
4723 set = isl_set_add_basic_set(set, bset);
4724 }
4725
4726 isl_space_free(space);
4727 isl_mat_free(var);
4728 return set;
4729 error:
4730 isl_basic_set_free(bset);
4731 isl_set_free(set);
4732 isl_space_free(space);
4733 isl_mat_free(var);
4734 return NULL;
4735 }
4736
4737 /* Given that the last input variable of "bmap" represents the minimum
4738 * of the bounds in "cst", check whether we need to split the domain
4739 * based on which bound attains the minimum.
4740 *
4741 * A split is needed when the minimum appears in an integer division
4742 * or in an equality. Otherwise, it is only needed if it appears in
4743 * an upper bound that is different from the upper bounds on which it
4744 * is defined.
4745 */
need_split_basic_map(__isl_keep isl_basic_map * bmap,__isl_keep isl_mat * cst)4746 static isl_bool need_split_basic_map(__isl_keep isl_basic_map *bmap,
4747 __isl_keep isl_mat *cst)
4748 {
4749 int i, j;
4750 isl_size total;
4751 unsigned pos;
4752
4753 pos = cst->n_col - 1;
4754 total = isl_basic_map_dim(bmap, isl_dim_all);
4755 if (total < 0)
4756 return isl_bool_error;
4757
4758 for (i = 0; i < bmap->n_div; ++i)
4759 if (!isl_int_is_zero(bmap->div[i][2 + pos]))
4760 return isl_bool_true;
4761
4762 for (i = 0; i < bmap->n_eq; ++i)
4763 if (!isl_int_is_zero(bmap->eq[i][1 + pos]))
4764 return isl_bool_true;
4765
4766 for (i = 0; i < bmap->n_ineq; ++i) {
4767 if (isl_int_is_nonneg(bmap->ineq[i][1 + pos]))
4768 continue;
4769 if (!isl_int_is_negone(bmap->ineq[i][1 + pos]))
4770 return isl_bool_true;
4771 if (isl_seq_first_non_zero(bmap->ineq[i] + 1 + pos + 1,
4772 total - pos - 1) >= 0)
4773 return isl_bool_true;
4774
4775 for (j = 0; j < cst->n_row; ++j)
4776 if (isl_seq_eq(bmap->ineq[i], cst->row[j], cst->n_col))
4777 break;
4778 if (j >= cst->n_row)
4779 return isl_bool_true;
4780 }
4781
4782 return isl_bool_false;
4783 }
4784
4785 /* Given that the last set variable of "bset" represents the minimum
4786 * of the bounds in "cst", check whether we need to split the domain
4787 * based on which bound attains the minimum.
4788 *
4789 * We simply call need_split_basic_map here. This is safe because
4790 * the position of the minimum is computed from "cst" and not
4791 * from "bmap".
4792 */
need_split_basic_set(__isl_keep isl_basic_set * bset,__isl_keep isl_mat * cst)4793 static isl_bool need_split_basic_set(__isl_keep isl_basic_set *bset,
4794 __isl_keep isl_mat *cst)
4795 {
4796 return need_split_basic_map(bset_to_bmap(bset), cst);
4797 }
4798
4799 /* Given that the last set variable of "set" represents the minimum
4800 * of the bounds in "cst", check whether we need to split the domain
4801 * based on which bound attains the minimum.
4802 */
need_split_set(__isl_keep isl_set * set,__isl_keep isl_mat * cst)4803 static isl_bool need_split_set(__isl_keep isl_set *set, __isl_keep isl_mat *cst)
4804 {
4805 int i;
4806
4807 for (i = 0; i < set->n; ++i) {
4808 isl_bool split;
4809
4810 split = need_split_basic_set(set->p[i], cst);
4811 if (split < 0 || split)
4812 return split;
4813 }
4814
4815 return isl_bool_false;
4816 }
4817
4818 /* Given a map of which the last input variable is the minimum
4819 * of the bounds in "cst", split each basic set in the set
4820 * in pieces where one of the bounds is (strictly) smaller than the others.
4821 * This subdivision is given in "min_expr".
4822 * The variable is subsequently projected out.
4823 *
4824 * We only do the split when it is needed.
4825 * For example if the last input variable m = min(a,b) and the only
4826 * constraints in the given basic set are lower bounds on m,
4827 * i.e., l <= m = min(a,b), then we can simply project out m
4828 * to obtain l <= a and l <= b, without having to split on whether
4829 * m is equal to a or b.
4830 */
split_domain(__isl_take isl_map * opt,__isl_take isl_set * min_expr,__isl_take isl_mat * cst)4831 static __isl_give isl_map *split_domain(__isl_take isl_map *opt,
4832 __isl_take isl_set *min_expr, __isl_take isl_mat *cst)
4833 {
4834 isl_size n_in;
4835 int i;
4836 isl_space *space;
4837 isl_map *res;
4838
4839 n_in = isl_map_dim(opt, isl_dim_in);
4840 if (n_in < 0 || !min_expr || !cst)
4841 goto error;
4842
4843 space = isl_map_get_space(opt);
4844 space = isl_space_drop_dims(space, isl_dim_in, n_in - 1, 1);
4845 res = isl_map_empty(space);
4846
4847 for (i = 0; i < opt->n; ++i) {
4848 isl_map *map;
4849 isl_bool split;
4850
4851 map = isl_map_from_basic_map(isl_basic_map_copy(opt->p[i]));
4852 split = need_split_basic_map(opt->p[i], cst);
4853 if (split < 0)
4854 map = isl_map_free(map);
4855 else if (split)
4856 map = isl_map_intersect_domain(map,
4857 isl_set_copy(min_expr));
4858 map = isl_map_remove_dims(map, isl_dim_in, n_in - 1, 1);
4859
4860 res = isl_map_union_disjoint(res, map);
4861 }
4862
4863 isl_map_free(opt);
4864 isl_set_free(min_expr);
4865 isl_mat_free(cst);
4866 return res;
4867 error:
4868 isl_map_free(opt);
4869 isl_set_free(min_expr);
4870 isl_mat_free(cst);
4871 return NULL;
4872 }
4873
4874 /* Given a set of which the last set variable is the minimum
4875 * of the bounds in "cst", split each basic set in the set
4876 * in pieces where one of the bounds is (strictly) smaller than the others.
4877 * This subdivision is given in "min_expr".
4878 * The variable is subsequently projected out.
4879 */
split(__isl_take isl_set * empty,__isl_take isl_set * min_expr,__isl_take isl_mat * cst)4880 static __isl_give isl_set *split(__isl_take isl_set *empty,
4881 __isl_take isl_set *min_expr, __isl_take isl_mat *cst)
4882 {
4883 isl_map *map;
4884
4885 map = isl_map_from_domain(empty);
4886 map = split_domain(map, min_expr, cst);
4887 empty = isl_map_domain(map);
4888
4889 return empty;
4890 }
4891
4892 static __isl_give isl_map *basic_map_partial_lexopt(
4893 __isl_take isl_basic_map *bmap, __isl_take isl_basic_set *dom,
4894 __isl_give isl_set **empty, int max);
4895
4896 /* This function is called from basic_map_partial_lexopt_symm.
4897 * The last variable of "bmap" and "dom" corresponds to the minimum
4898 * of the bounds in "cst". "map_space" is the space of the original
4899 * input relation (of basic_map_partial_lexopt_symm) and "set_space"
4900 * is the space of the original domain.
4901 *
4902 * We recursively call basic_map_partial_lexopt and then plug in
4903 * the definition of the minimum in the result.
4904 */
basic_map_partial_lexopt_symm_core(__isl_take isl_basic_map * bmap,__isl_take isl_basic_set * dom,__isl_give isl_set ** empty,int max,__isl_take isl_mat * cst,__isl_take isl_space * map_space,__isl_take isl_space * set_space)4905 static __isl_give isl_map *basic_map_partial_lexopt_symm_core(
4906 __isl_take isl_basic_map *bmap, __isl_take isl_basic_set *dom,
4907 __isl_give isl_set **empty, int max, __isl_take isl_mat *cst,
4908 __isl_take isl_space *map_space, __isl_take isl_space *set_space)
4909 {
4910 isl_map *opt;
4911 isl_set *min_expr;
4912
4913 min_expr = set_minimum(isl_basic_set_get_space(dom), isl_mat_copy(cst));
4914
4915 opt = basic_map_partial_lexopt(bmap, dom, empty, max);
4916
4917 if (empty) {
4918 *empty = split(*empty,
4919 isl_set_copy(min_expr), isl_mat_copy(cst));
4920 *empty = isl_set_reset_space(*empty, set_space);
4921 }
4922
4923 opt = split_domain(opt, min_expr, cst);
4924 opt = isl_map_reset_space(opt, map_space);
4925
4926 return opt;
4927 }
4928
4929 /* Extract a domain from "bmap" for the purpose of computing
4930 * a lexicographic optimum.
4931 *
4932 * This function is only called when the caller wants to compute a full
4933 * lexicographic optimum, i.e., without specifying a domain. In this case,
4934 * the caller is not interested in the part of the domain space where
4935 * there is no solution and the domain can be initialized to those constraints
4936 * of "bmap" that only involve the parameters and the input dimensions.
4937 * This relieves the parametric programming engine from detecting those
4938 * inequalities and transferring them to the context. More importantly,
4939 * it ensures that those inequalities are transferred first and not
4940 * intermixed with inequalities that actually split the domain.
4941 *
4942 * If the caller does not require the absence of existentially quantified
4943 * variables in the result (i.e., if ISL_OPT_QE is not set in "flags"),
4944 * then the actual domain of "bmap" can be used. This ensures that
4945 * the domain does not need to be split at all just to separate out
4946 * pieces of the domain that do not have a solution from piece that do.
4947 * This domain cannot be used in general because it may involve
4948 * (unknown) existentially quantified variables which will then also
4949 * appear in the solution.
4950 */
extract_domain(__isl_keep isl_basic_map * bmap,unsigned flags)4951 static __isl_give isl_basic_set *extract_domain(__isl_keep isl_basic_map *bmap,
4952 unsigned flags)
4953 {
4954 isl_size n_div;
4955 isl_size n_out;
4956
4957 n_div = isl_basic_map_dim(bmap, isl_dim_div);
4958 n_out = isl_basic_map_dim(bmap, isl_dim_out);
4959 if (n_div < 0 || n_out < 0)
4960 return NULL;
4961 bmap = isl_basic_map_copy(bmap);
4962 if (ISL_FL_ISSET(flags, ISL_OPT_QE)) {
4963 bmap = isl_basic_map_drop_constraints_involving_dims(bmap,
4964 isl_dim_div, 0, n_div);
4965 bmap = isl_basic_map_drop_constraints_involving_dims(bmap,
4966 isl_dim_out, 0, n_out);
4967 }
4968 return isl_basic_map_domain(bmap);
4969 }
4970
4971 #undef TYPE
4972 #define TYPE isl_map
4973 #undef SUFFIX
4974 #define SUFFIX
4975 #include "isl_tab_lexopt_templ.c"
4976
4977 /* Extract the subsequence of the sample value of "tab"
4978 * starting at "pos" and of length "len".
4979 */
extract_sample_sequence(struct isl_tab * tab,int pos,int len)4980 static __isl_give isl_vec *extract_sample_sequence(struct isl_tab *tab,
4981 int pos, int len)
4982 {
4983 int i;
4984 isl_ctx *ctx;
4985 isl_vec *v;
4986
4987 ctx = isl_tab_get_ctx(tab);
4988 v = isl_vec_alloc(ctx, len);
4989 if (!v)
4990 return NULL;
4991 for (i = 0; i < len; ++i) {
4992 if (!tab->var[pos + i].is_row) {
4993 isl_int_set_si(v->el[i], 0);
4994 } else {
4995 int row;
4996
4997 row = tab->var[pos + i].index;
4998 isl_int_divexact(v->el[i], tab->mat->row[row][1],
4999 tab->mat->row[row][0]);
5000 }
5001 }
5002
5003 return v;
5004 }
5005
5006 /* Check if the sequence of variables starting at "pos"
5007 * represents a trivial solution according to "trivial".
5008 * That is, is the result of applying "trivial" to this sequence
5009 * equal to the zero vector?
5010 */
region_is_trivial(struct isl_tab * tab,int pos,__isl_keep isl_mat * trivial)5011 static isl_bool region_is_trivial(struct isl_tab *tab, int pos,
5012 __isl_keep isl_mat *trivial)
5013 {
5014 isl_size n, len;
5015 isl_vec *v;
5016 isl_bool is_trivial;
5017
5018 n = isl_mat_rows(trivial);
5019 if (n < 0)
5020 return isl_bool_error;
5021
5022 if (n == 0)
5023 return isl_bool_false;
5024
5025 len = isl_mat_cols(trivial);
5026 if (len < 0)
5027 return isl_bool_error;
5028 v = extract_sample_sequence(tab, pos, len);
5029 v = isl_mat_vec_product(isl_mat_copy(trivial), v);
5030 is_trivial = isl_vec_is_zero(v);
5031 isl_vec_free(v);
5032
5033 return is_trivial;
5034 }
5035
5036 /* Global internal data for isl_tab_basic_set_non_trivial_lexmin.
5037 *
5038 * "n_op" is the number of initial coordinates to optimize,
5039 * as passed to isl_tab_basic_set_non_trivial_lexmin.
5040 * "region" is the "n_region"-sized array of regions passed
5041 * to isl_tab_basic_set_non_trivial_lexmin.
5042 *
5043 * "tab" is the tableau that corresponds to the ILP problem.
5044 * "local" is an array of local data structure, one for each
5045 * (potential) level of the backtracking procedure of
5046 * isl_tab_basic_set_non_trivial_lexmin.
5047 * "v" is a pre-allocated vector that can be used for adding
5048 * constraints to the tableau.
5049 *
5050 * "sol" contains the best solution found so far.
5051 * It is initialized to a vector of size zero.
5052 */
5053 struct isl_lexmin_data {
5054 int n_op;
5055 int n_region;
5056 struct isl_trivial_region *region;
5057
5058 struct isl_tab *tab;
5059 struct isl_local_region *local;
5060 isl_vec *v;
5061
5062 isl_vec *sol;
5063 };
5064
5065 /* Return the index of the first trivial region, "n_region" if all regions
5066 * are non-trivial or -1 in case of error.
5067 */
first_trivial_region(struct isl_lexmin_data * data)5068 static int first_trivial_region(struct isl_lexmin_data *data)
5069 {
5070 int i;
5071
5072 for (i = 0; i < data->n_region; ++i) {
5073 isl_bool trivial;
5074 trivial = region_is_trivial(data->tab, data->region[i].pos,
5075 data->region[i].trivial);
5076 if (trivial < 0)
5077 return -1;
5078 if (trivial)
5079 return i;
5080 }
5081
5082 return data->n_region;
5083 }
5084
5085 /* Check if the solution is optimal, i.e., whether the first
5086 * n_op entries are zero.
5087 */
is_optimal(__isl_keep isl_vec * sol,int n_op)5088 static int is_optimal(__isl_keep isl_vec *sol, int n_op)
5089 {
5090 int i;
5091
5092 for (i = 0; i < n_op; ++i)
5093 if (!isl_int_is_zero(sol->el[1 + i]))
5094 return 0;
5095 return 1;
5096 }
5097
5098 /* Add constraints to "tab" that ensure that any solution is significantly
5099 * better than that represented by "sol". That is, find the first
5100 * relevant (within first n_op) non-zero coefficient and force it (along
5101 * with all previous coefficients) to be zero.
5102 * If the solution is already optimal (all relevant coefficients are zero),
5103 * then just mark the table as empty.
5104 * "n_zero" is the number of coefficients that have been forced zero
5105 * by previous calls to this function at the same level.
5106 * Return the updated number of forced zero coefficients or -1 on error.
5107 *
5108 * This function assumes that at least 2 * (n_op - n_zero) more rows and
5109 * at least 2 * (n_op - n_zero) more elements in the constraint array
5110 * are available in the tableau.
5111 */
force_better_solution(struct isl_tab * tab,__isl_keep isl_vec * sol,int n_op,int n_zero)5112 static int force_better_solution(struct isl_tab *tab,
5113 __isl_keep isl_vec *sol, int n_op, int n_zero)
5114 {
5115 int i, n;
5116 isl_ctx *ctx;
5117 isl_vec *v = NULL;
5118
5119 if (!sol)
5120 return -1;
5121
5122 for (i = n_zero; i < n_op; ++i)
5123 if (!isl_int_is_zero(sol->el[1 + i]))
5124 break;
5125
5126 if (i == n_op) {
5127 if (isl_tab_mark_empty(tab) < 0)
5128 return -1;
5129 return n_op;
5130 }
5131
5132 ctx = isl_vec_get_ctx(sol);
5133 v = isl_vec_alloc(ctx, 1 + tab->n_var);
5134 if (!v)
5135 return -1;
5136
5137 n = i + 1;
5138 for (; i >= n_zero; --i) {
5139 v = isl_vec_clr(v);
5140 isl_int_set_si(v->el[1 + i], -1);
5141 if (add_lexmin_eq(tab, v->el) < 0)
5142 goto error;
5143 }
5144
5145 isl_vec_free(v);
5146 return n;
5147 error:
5148 isl_vec_free(v);
5149 return -1;
5150 }
5151
5152 /* Fix triviality direction "dir" of the given region to zero.
5153 *
5154 * This function assumes that at least two more rows and at least
5155 * two more elements in the constraint array are available in the tableau.
5156 */
fix_zero(struct isl_tab * tab,struct isl_trivial_region * region,int dir,struct isl_lexmin_data * data)5157 static isl_stat fix_zero(struct isl_tab *tab, struct isl_trivial_region *region,
5158 int dir, struct isl_lexmin_data *data)
5159 {
5160 isl_size len;
5161
5162 data->v = isl_vec_clr(data->v);
5163 if (!data->v)
5164 return isl_stat_error;
5165 len = isl_mat_cols(region->trivial);
5166 if (len < 0)
5167 return isl_stat_error;
5168 isl_seq_cpy(data->v->el + 1 + region->pos, region->trivial->row[dir],
5169 len);
5170 if (add_lexmin_eq(tab, data->v->el) < 0)
5171 return isl_stat_error;
5172
5173 return isl_stat_ok;
5174 }
5175
5176 /* This function selects case "side" for non-triviality region "region",
5177 * assuming all the equality constraints have been imposed already.
5178 * In particular, the triviality direction side/2 is made positive
5179 * if side is even and made negative if side is odd.
5180 *
5181 * This function assumes that at least one more row and at least
5182 * one more element in the constraint array are available in the tableau.
5183 */
pos_neg(struct isl_tab * tab,struct isl_trivial_region * region,int side,struct isl_lexmin_data * data)5184 static struct isl_tab *pos_neg(struct isl_tab *tab,
5185 struct isl_trivial_region *region,
5186 int side, struct isl_lexmin_data *data)
5187 {
5188 isl_size len;
5189
5190 data->v = isl_vec_clr(data->v);
5191 if (!data->v)
5192 goto error;
5193 isl_int_set_si(data->v->el[0], -1);
5194 len = isl_mat_cols(region->trivial);
5195 if (len < 0)
5196 goto error;
5197 if (side % 2 == 0)
5198 isl_seq_cpy(data->v->el + 1 + region->pos,
5199 region->trivial->row[side / 2], len);
5200 else
5201 isl_seq_neg(data->v->el + 1 + region->pos,
5202 region->trivial->row[side / 2], len);
5203 return add_lexmin_ineq(tab, data->v->el);
5204 error:
5205 isl_tab_free(tab);
5206 return NULL;
5207 }
5208
/* Local data at each level of the backtracking procedure of
 * isl_tab_basic_set_non_trivial_lexmin.
 */
struct isl_local_region {
	/* Set if a solution has been found in the current case
	 * of this level, such that a better solution needs to be enforced
	 * in the next case.
	 */
	int update;
	/* Number of initial coordinates that have already
	 * been forced to be zero at this level.
	 */
	int n_zero;
	/* The non-triviality region considered at this level. */
	int region;
	/* Index of the current case at this level. */
	int side;
	/* Number of triviality directions. */
	int n;
	/* Snapshot of the tableau holding a state that needs
	 * to be satisfied by all subsequent cases.
	 */
	struct isl_tab_undo *snap;
};
5231
5232 /* Initialize the global data structure "data" used while solving
5233 * the ILP problem "bset".
5234 */
init_lexmin_data(struct isl_lexmin_data * data,__isl_keep isl_basic_set * bset)5235 static isl_stat init_lexmin_data(struct isl_lexmin_data *data,
5236 __isl_keep isl_basic_set *bset)
5237 {
5238 isl_ctx *ctx;
5239
5240 ctx = isl_basic_set_get_ctx(bset);
5241
5242 data->tab = tab_for_lexmin(bset, NULL, 0, 0);
5243 if (!data->tab)
5244 return isl_stat_error;
5245
5246 data->v = isl_vec_alloc(ctx, 1 + data->tab->n_var);
5247 if (!data->v)
5248 return isl_stat_error;
5249 data->local = isl_calloc_array(ctx, struct isl_local_region,
5250 data->n_region);
5251 if (data->n_region && !data->local)
5252 return isl_stat_error;
5253
5254 data->sol = isl_vec_alloc(ctx, 0);
5255
5256 return isl_stat_ok;
5257 }
5258
5259 /* Mark all outer levels as requiring a better solution
5260 * in the next cases.
5261 */
update_outer_levels(struct isl_lexmin_data * data,int level)5262 static void update_outer_levels(struct isl_lexmin_data *data, int level)
5263 {
5264 int i;
5265
5266 for (i = 0; i < level; ++i)
5267 data->local[i].update = 1;
5268 }
5269
5270 /* Initialize "local" to refer to region "region" and
5271 * to initiate processing at this level.
5272 */
init_local_region(struct isl_local_region * local,int region,struct isl_lexmin_data * data)5273 static isl_stat init_local_region(struct isl_local_region *local, int region,
5274 struct isl_lexmin_data *data)
5275 {
5276 isl_size n = isl_mat_rows(data->region[region].trivial);
5277
5278 if (n < 0)
5279 return isl_stat_error;
5280 local->n = n;
5281 local->region = region;
5282 local->side = 0;
5283 local->update = 0;
5284 local->n_zero = 0;
5285
5286 return isl_stat_ok;
5287 }
5288
/* What to do next after entering a level of the backtracking procedure.
 */
enum isl_next {
	/* Some error has occurred; abort. */
	isl_next_error = -1,
	/* An optimal solution has been found; stop the search. */
	isl_next_done = 0,
	/* Backtrack to the previous level. */
	isl_next_backtrack = 1,
	/* Add the constraints for the current level and
	 * move to the next level.
	 */
	isl_next_handle = 2,
};
5303
5304 /* Have all cases of the current region been considered?
5305 * If there are n directions, then there are 2n cases.
5306 *
5307 * The constraints in the current tableau are imposed
5308 * in all subsequent cases. This means that if the current
5309 * tableau is empty, then none of those cases should be considered
5310 * anymore and all cases have effectively been considered.
5311 */
finished_all_cases(struct isl_local_region * local,struct isl_lexmin_data * data)5312 static int finished_all_cases(struct isl_local_region *local,
5313 struct isl_lexmin_data *data)
5314 {
5315 if (data->tab->empty)
5316 return 1;
5317 return local->side >= 2 * local->n;
5318 }
5319
5320 /* Enter level "level" of the backtracking search and figure out
5321 * what to do next. "init" is set if the level was entered
5322 * from a higher level and needs to be initialized.
5323 * Otherwise, the level is entered as a result of backtracking and
5324 * the tableau needs to be restored to a position that can
5325 * be used for the next case at this level.
5326 * The snapshot is assumed to have been saved in the previous case,
5327 * before the constraints specific to that case were added.
5328 *
5329 * In the initialization case, the local region is initialized
5330 * to point to the first violated region.
5331 * If the constraints of all regions are satisfied by the current
5332 * sample of the tableau, then tell the caller to continue looking
5333 * for a better solution or to stop searching if an optimal solution
5334 * has been found.
5335 *
5336 * If the tableau is empty or if all cases at the current level
5337 * have been considered, then the caller needs to backtrack as well.
5338 */
enter_level(int level,int init,struct isl_lexmin_data * data)5339 static enum isl_next enter_level(int level, int init,
5340 struct isl_lexmin_data *data)
5341 {
5342 struct isl_local_region *local = &data->local[level];
5343
5344 if (init) {
5345 int r;
5346
5347 data->tab = cut_to_integer_lexmin(data->tab, CUT_ONE);
5348 if (!data->tab)
5349 return isl_next_error;
5350 if (data->tab->empty)
5351 return isl_next_backtrack;
5352 r = first_trivial_region(data);
5353 if (r < 0)
5354 return isl_next_error;
5355 if (r == data->n_region) {
5356 update_outer_levels(data, level);
5357 isl_vec_free(data->sol);
5358 data->sol = isl_tab_get_sample_value(data->tab);
5359 if (!data->sol)
5360 return isl_next_error;
5361 if (is_optimal(data->sol, data->n_op))
5362 return isl_next_done;
5363 return isl_next_backtrack;
5364 }
5365 if (level >= data->n_region)
5366 isl_die(isl_vec_get_ctx(data->v), isl_error_internal,
5367 "nesting level too deep",
5368 return isl_next_error);
5369 if (init_local_region(local, r, data) < 0)
5370 return isl_next_error;
5371 if (isl_tab_extend_cons(data->tab,
5372 2 * local->n + 2 * data->n_op) < 0)
5373 return isl_next_error;
5374 } else {
5375 if (isl_tab_rollback(data->tab, local->snap) < 0)
5376 return isl_next_error;
5377 }
5378
5379 if (finished_all_cases(local, data))
5380 return isl_next_backtrack;
5381 return isl_next_handle;
5382 }
5383
5384 /* If a solution has been found in the previous case at this level
5385 * (marked by local->update being set), then add constraints
5386 * that enforce a better solution in the present and all following cases.
5387 * The constraints only need to be imposed once because they are
5388 * included in the snapshot (taken in pick_side) that will be used in
5389 * subsequent cases.
5390 */
better_next_side(struct isl_local_region * local,struct isl_lexmin_data * data)5391 static isl_stat better_next_side(struct isl_local_region *local,
5392 struct isl_lexmin_data *data)
5393 {
5394 if (!local->update)
5395 return isl_stat_ok;
5396
5397 local->n_zero = force_better_solution(data->tab,
5398 data->sol, data->n_op, local->n_zero);
5399 if (local->n_zero < 0)
5400 return isl_stat_error;
5401
5402 local->update = 0;
5403
5404 return isl_stat_ok;
5405 }
5406
5407 /* Add constraints to data->tab that select the current case (local->side)
5408 * at the current level.
5409 *
5410 * If the linear combinations v should not be zero, then the cases are
5411 * v_0 >= 1
5412 * v_0 <= -1
5413 * v_0 = 0 and v_1 >= 1
5414 * v_0 = 0 and v_1 <= -1
5415 * v_0 = 0 and v_1 = 0 and v_2 >= 1
5416 * v_0 = 0 and v_1 = 0 and v_2 <= -1
5417 * ...
5418 * in this order.
5419 *
5420 * A snapshot is taken after the equality constraint (if any) has been added
5421 * such that the next case can start off from this position.
5422 * The rollback to this position is performed in enter_level.
5423 */
pick_side(struct isl_local_region * local,struct isl_lexmin_data * data)5424 static isl_stat pick_side(struct isl_local_region *local,
5425 struct isl_lexmin_data *data)
5426 {
5427 struct isl_trivial_region *region;
5428 int side, base;
5429
5430 region = &data->region[local->region];
5431 side = local->side;
5432 base = 2 * (side/2);
5433
5434 if (side == base && base >= 2 &&
5435 fix_zero(data->tab, region, base / 2 - 1, data) < 0)
5436 return isl_stat_error;
5437
5438 local->snap = isl_tab_snap(data->tab);
5439 if (isl_tab_push_basis(data->tab) < 0)
5440 return isl_stat_error;
5441
5442 data->tab = pos_neg(data->tab, region, side, data);
5443 if (!data->tab)
5444 return isl_stat_error;
5445 return isl_stat_ok;
5446 }
5447
5448 /* Free the memory associated to "data".
5449 */
clear_lexmin_data(struct isl_lexmin_data * data)5450 static void clear_lexmin_data(struct isl_lexmin_data *data)
5451 {
5452 free(data->local);
5453 isl_vec_free(data->v);
5454 isl_tab_free(data->tab);
5455 }
5456
5457 /* Return the lexicographically smallest non-trivial solution of the
5458 * given ILP problem.
5459 *
5460 * All variables are assumed to be non-negative.
5461 *
5462 * n_op is the number of initial coordinates to optimize.
5463 * That is, once a solution has been found, we will only continue looking
5464 * for solutions that result in significantly better values for those
5465 * initial coordinates. That is, we only continue looking for solutions
5466 * that increase the number of initial zeros in this sequence.
5467 *
5468 * A solution is non-trivial, if it is non-trivial on each of the
5469 * specified regions. Each region represents a sequence of
5470 * triviality directions on a sequence of variables that starts
5471 * at a given position. A solution is non-trivial on such a region if
5472 * at least one of the triviality directions is non-zero
5473 * on that sequence of variables.
5474 *
5475 * Whenever a conflict is encountered, all constraints involved are
5476 * reported to the caller through a call to "conflict".
5477 *
5478 * We perform a simple branch-and-bound backtracking search.
5479 * Each level in the search represents an initially trivial region
5480 * that is forced to be non-trivial.
5481 * At each level we consider 2 * n cases, where n
5482 * is the number of triviality directions.
5483 * In terms of those n directions v_i, we consider the cases
5484 * v_0 >= 1
5485 * v_0 <= -1
5486 * v_0 = 0 and v_1 >= 1
5487 * v_0 = 0 and v_1 <= -1
5488 * v_0 = 0 and v_1 = 0 and v_2 >= 1
5489 * v_0 = 0 and v_1 = 0 and v_2 <= -1
5490 * ...
5491 * in this order.
5492 */
isl_tab_basic_set_non_trivial_lexmin(__isl_take isl_basic_set * bset,int n_op,int n_region,struct isl_trivial_region * region,int (* conflict)(int con,void * user),void * user)5493 __isl_give isl_vec *isl_tab_basic_set_non_trivial_lexmin(
5494 __isl_take isl_basic_set *bset, int n_op, int n_region,
5495 struct isl_trivial_region *region,
5496 int (*conflict)(int con, void *user), void *user)
5497 {
5498 struct isl_lexmin_data data = { n_op, n_region, region };
5499 int level, init;
5500
5501 if (!bset)
5502 return NULL;
5503
5504 if (init_lexmin_data(&data, bset) < 0)
5505 goto error;
5506 data.tab->conflict = conflict;
5507 data.tab->conflict_user = user;
5508
5509 level = 0;
5510 init = 1;
5511
5512 while (level >= 0) {
5513 enum isl_next next;
5514 struct isl_local_region *local = &data.local[level];
5515
5516 next = enter_level(level, init, &data);
5517 if (next < 0)
5518 goto error;
5519 if (next == isl_next_done)
5520 break;
5521 if (next == isl_next_backtrack) {
5522 level--;
5523 init = 0;
5524 continue;
5525 }
5526
5527 if (better_next_side(local, &data) < 0)
5528 goto error;
5529 if (pick_side(local, &data) < 0)
5530 goto error;
5531
5532 local->side++;
5533 level++;
5534 init = 1;
5535 }
5536
5537 clear_lexmin_data(&data);
5538 isl_basic_set_free(bset);
5539
5540 return data.sol;
5541 error:
5542 clear_lexmin_data(&data);
5543 isl_basic_set_free(bset);
5544 isl_vec_free(data.sol);
5545 return NULL;
5546 }
5547
5548 /* Wrapper for a tableau that is used for computing
5549 * the lexicographically smallest rational point of a non-negative set.
5550 * This point is represented by the sample value of "tab",
5551 * unless "tab" is empty.
5552 */
5553 struct isl_tab_lexmin {
5554 isl_ctx *ctx;
5555 struct isl_tab *tab;
5556 };
5557
5558 /* Free "tl" and return NULL.
5559 */
isl_tab_lexmin_free(__isl_take isl_tab_lexmin * tl)5560 __isl_null isl_tab_lexmin *isl_tab_lexmin_free(__isl_take isl_tab_lexmin *tl)
5561 {
5562 if (!tl)
5563 return NULL;
5564 isl_ctx_deref(tl->ctx);
5565 isl_tab_free(tl->tab);
5566 free(tl);
5567
5568 return NULL;
5569 }
5570
5571 /* Construct an isl_tab_lexmin for computing
5572 * the lexicographically smallest rational point in "bset",
5573 * assuming that all variables are non-negative.
5574 */
isl_tab_lexmin_from_basic_set(__isl_take isl_basic_set * bset)5575 __isl_give isl_tab_lexmin *isl_tab_lexmin_from_basic_set(
5576 __isl_take isl_basic_set *bset)
5577 {
5578 isl_ctx *ctx;
5579 isl_tab_lexmin *tl;
5580
5581 if (!bset)
5582 return NULL;
5583
5584 ctx = isl_basic_set_get_ctx(bset);
5585 tl = isl_calloc_type(ctx, struct isl_tab_lexmin);
5586 if (!tl)
5587 goto error;
5588 tl->ctx = ctx;
5589 isl_ctx_ref(ctx);
5590 tl->tab = tab_for_lexmin(bset, NULL, 0, 0);
5591 isl_basic_set_free(bset);
5592 if (!tl->tab)
5593 return isl_tab_lexmin_free(tl);
5594 return tl;
5595 error:
5596 isl_basic_set_free(bset);
5597 isl_tab_lexmin_free(tl);
5598 return NULL;
5599 }
5600
5601 /* Return the dimension of the set represented by "tl".
5602 */
isl_tab_lexmin_dim(__isl_keep isl_tab_lexmin * tl)5603 int isl_tab_lexmin_dim(__isl_keep isl_tab_lexmin *tl)
5604 {
5605 return tl ? tl->tab->n_var : -1;
5606 }
5607
5608 /* Add the equality with coefficients "eq" to "tl", updating the optimal
5609 * solution if needed.
5610 * The equality is added as two opposite inequality constraints.
5611 */
isl_tab_lexmin_add_eq(__isl_take isl_tab_lexmin * tl,isl_int * eq)5612 __isl_give isl_tab_lexmin *isl_tab_lexmin_add_eq(__isl_take isl_tab_lexmin *tl,
5613 isl_int *eq)
5614 {
5615 unsigned n_var;
5616
5617 if (!tl || !eq)
5618 return isl_tab_lexmin_free(tl);
5619
5620 if (isl_tab_extend_cons(tl->tab, 2) < 0)
5621 return isl_tab_lexmin_free(tl);
5622 n_var = tl->tab->n_var;
5623 isl_seq_neg(eq, eq, 1 + n_var);
5624 tl->tab = add_lexmin_ineq(tl->tab, eq);
5625 isl_seq_neg(eq, eq, 1 + n_var);
5626 tl->tab = add_lexmin_ineq(tl->tab, eq);
5627
5628 if (!tl->tab)
5629 return isl_tab_lexmin_free(tl);
5630
5631 return tl;
5632 }
5633
5634 /* Add cuts to "tl" until the sample value reaches an integer value or
5635 * until the result becomes empty.
5636 */
isl_tab_lexmin_cut_to_integer(__isl_take isl_tab_lexmin * tl)5637 __isl_give isl_tab_lexmin *isl_tab_lexmin_cut_to_integer(
5638 __isl_take isl_tab_lexmin *tl)
5639 {
5640 if (!tl)
5641 return NULL;
5642 tl->tab = cut_to_integer_lexmin(tl->tab, CUT_ONE);
5643 if (!tl->tab)
5644 return isl_tab_lexmin_free(tl);
5645 return tl;
5646 }
5647
5648 /* Return the lexicographically smallest rational point in the basic set
5649 * from which "tl" was constructed.
5650 * If the original input was empty, then return a zero-length vector.
5651 */
isl_tab_lexmin_get_solution(__isl_keep isl_tab_lexmin * tl)5652 __isl_give isl_vec *isl_tab_lexmin_get_solution(__isl_keep isl_tab_lexmin *tl)
5653 {
5654 if (!tl)
5655 return NULL;
5656 if (tl->tab->empty)
5657 return isl_vec_alloc(tl->ctx, 0);
5658 else
5659 return isl_tab_get_sample_value(tl->tab);
5660 }
5661
5662 struct isl_sol_pma {
5663 struct isl_sol sol;
5664 isl_pw_multi_aff *pma;
5665 isl_set *empty;
5666 };
5667
sol_pma_free(struct isl_sol * sol)5668 static void sol_pma_free(struct isl_sol *sol)
5669 {
5670 struct isl_sol_pma *sol_pma = (struct isl_sol_pma *) sol;
5671 isl_pw_multi_aff_free(sol_pma->pma);
5672 isl_set_free(sol_pma->empty);
5673 }
5674
5675 /* This function is called for parts of the context where there is
5676 * no solution, with "bset" corresponding to the context tableau.
5677 * Simply add the basic set to the set "empty".
5678 */
sol_pma_add_empty(struct isl_sol_pma * sol,__isl_take isl_basic_set * bset)5679 static void sol_pma_add_empty(struct isl_sol_pma *sol,
5680 __isl_take isl_basic_set *bset)
5681 {
5682 if (!bset || !sol->empty)
5683 goto error;
5684
5685 sol->empty = isl_set_grow(sol->empty, 1);
5686 bset = isl_basic_set_simplify(bset);
5687 bset = isl_basic_set_finalize(bset);
5688 sol->empty = isl_set_add_basic_set(sol->empty, bset);
5689 if (!sol->empty)
5690 sol->sol.error = 1;
5691 return;
5692 error:
5693 isl_basic_set_free(bset);
5694 sol->sol.error = 1;
5695 }
5696
5697 /* Given a basic set "dom" that represents the context and a tuple of
5698 * affine expressions "maff" defined over this domain, construct
5699 * an isl_pw_multi_aff with a single cell corresponding to "dom" and
5700 * the affine expressions in "maff".
5701 */
sol_pma_add(struct isl_sol_pma * sol,__isl_take isl_basic_set * dom,__isl_take isl_multi_aff * maff)5702 static void sol_pma_add(struct isl_sol_pma *sol,
5703 __isl_take isl_basic_set *dom, __isl_take isl_multi_aff *maff)
5704 {
5705 isl_pw_multi_aff *pma;
5706
5707 dom = isl_basic_set_simplify(dom);
5708 dom = isl_basic_set_finalize(dom);
5709 pma = isl_pw_multi_aff_alloc(isl_set_from_basic_set(dom), maff);
5710 sol->pma = isl_pw_multi_aff_add_disjoint(sol->pma, pma);
5711 if (!sol->pma)
5712 sol->sol.error = 1;
5713 }
5714
/* Wrapper around sol_pma_add_empty that takes a generic
 * struct isl_sol pointer, for use as an "add_empty" callback.
 * "sol" is assumed to be embedded in a struct isl_sol_pma.
 */
static void sol_pma_add_empty_wrap(struct isl_sol *sol,
	__isl_take isl_basic_set *bset)
{
	struct isl_sol_pma *sol_pma = (struct isl_sol_pma *) sol;

	sol_pma_add_empty(sol_pma, bset);
}
5720
/* Wrapper around sol_pma_add that takes a generic
 * struct isl_sol pointer, for use as an "add" callback.
 * "sol" is assumed to be embedded in a struct isl_sol_pma.
 */
static void sol_pma_add_wrap(struct isl_sol *sol,
	__isl_take isl_basic_set *dom, __isl_take isl_multi_aff *ma)
{
	struct isl_sol_pma *sol_pma = (struct isl_sol_pma *) sol;

	sol_pma_add(sol_pma, dom, ma);
}
5726
5727 /* Construct an isl_sol_pma structure for accumulating the solution.
5728 * If track_empty is set, then we also keep track of the parts
5729 * of the context where there is no solution.
5730 * If max is set, then we are solving a maximization, rather than
5731 * a minimization problem, which means that the variables in the
5732 * tableau have value "M - x" rather than "M + x".
5733 */
sol_pma_init(__isl_keep isl_basic_map * bmap,__isl_take isl_basic_set * dom,int track_empty,int max)5734 static struct isl_sol *sol_pma_init(__isl_keep isl_basic_map *bmap,
5735 __isl_take isl_basic_set *dom, int track_empty, int max)
5736 {
5737 struct isl_sol_pma *sol_pma = NULL;
5738 isl_space *space;
5739
5740 if (!bmap)
5741 goto error;
5742
5743 sol_pma = isl_calloc_type(bmap->ctx, struct isl_sol_pma);
5744 if (!sol_pma)
5745 goto error;
5746
5747 sol_pma->sol.free = &sol_pma_free;
5748 if (sol_init(&sol_pma->sol, bmap, dom, max) < 0)
5749 goto error;
5750 sol_pma->sol.add = &sol_pma_add_wrap;
5751 sol_pma->sol.add_empty = track_empty ? &sol_pma_add_empty_wrap : NULL;
5752 space = isl_space_copy(sol_pma->sol.space);
5753 sol_pma->pma = isl_pw_multi_aff_empty(space);
5754 if (!sol_pma->pma)
5755 goto error;
5756
5757 if (track_empty) {
5758 sol_pma->empty = isl_set_alloc_space(isl_basic_set_get_space(dom),
5759 1, ISL_SET_DISJOINT);
5760 if (!sol_pma->empty)
5761 goto error;
5762 }
5763
5764 isl_basic_set_free(dom);
5765 return &sol_pma->sol;
5766 error:
5767 isl_basic_set_free(dom);
5768 sol_free(&sol_pma->sol);
5769 return NULL;
5770 }
5771
5772 /* Base case of isl_tab_basic_map_partial_lexopt, after removing
5773 * some obvious symmetries.
5774 *
5775 * We call basic_map_partial_lexopt_base_sol and extract the results.
5776 */
basic_map_partial_lexopt_base_pw_multi_aff(__isl_take isl_basic_map * bmap,__isl_take isl_basic_set * dom,__isl_give isl_set ** empty,int max)5777 static __isl_give isl_pw_multi_aff *basic_map_partial_lexopt_base_pw_multi_aff(
5778 __isl_take isl_basic_map *bmap, __isl_take isl_basic_set *dom,
5779 __isl_give isl_set **empty, int max)
5780 {
5781 isl_pw_multi_aff *result = NULL;
5782 struct isl_sol *sol;
5783 struct isl_sol_pma *sol_pma;
5784
5785 sol = basic_map_partial_lexopt_base_sol(bmap, dom, empty, max,
5786 &sol_pma_init);
5787 if (!sol)
5788 return NULL;
5789 sol_pma = (struct isl_sol_pma *) sol;
5790
5791 result = isl_pw_multi_aff_copy(sol_pma->pma);
5792 if (empty)
5793 *empty = isl_set_copy(sol_pma->empty);
5794 sol_free(&sol_pma->sol);
5795 return result;
5796 }
5797
5798 /* Given that the last input variable of "maff" represents the minimum
5799 * of some bounds, check whether we need to plug in the expression
5800 * of the minimum.
5801 *
5802 * In particular, check if the last input variable appears in any
5803 * of the expressions in "maff".
5804 */
need_substitution(__isl_keep isl_multi_aff * maff)5805 static isl_bool need_substitution(__isl_keep isl_multi_aff *maff)
5806 {
5807 int i;
5808 isl_size n_in;
5809 unsigned pos;
5810
5811 n_in = isl_multi_aff_dim(maff, isl_dim_in);
5812 if (n_in < 0)
5813 return isl_bool_error;
5814 pos = n_in - 1;
5815
5816 for (i = 0; i < maff->n; ++i) {
5817 isl_bool involves;
5818
5819 involves = isl_aff_involves_dims(maff->u.p[i],
5820 isl_dim_in, pos, 1);
5821 if (involves < 0 || involves)
5822 return involves;
5823 }
5824
5825 return isl_bool_false;
5826 }
5827
5828 /* Given a set of upper bounds on the last "input" variable m,
5829 * construct a piecewise affine expression that selects
5830 * the minimal upper bound to m, i.e.,
5831 * divide the space into cells where one
5832 * of the upper bounds is smaller than all the others and select
5833 * this upper bound on that cell.
5834 *
5835 * In particular, if there are n bounds b_i, then the result
5836 * consists of n cell, each one of the form
5837 *
5838 * b_i <= b_j for j > i
5839 * b_i < b_j for j < i
5840 *
5841 * The affine expression on this cell is
5842 *
5843 * b_i
5844 */
set_minimum_pa(__isl_take isl_space * space,__isl_take isl_mat * var)5845 static __isl_give isl_pw_aff *set_minimum_pa(__isl_take isl_space *space,
5846 __isl_take isl_mat *var)
5847 {
5848 int i;
5849 isl_aff *aff = NULL;
5850 isl_basic_set *bset = NULL;
5851 isl_pw_aff *paff = NULL;
5852 isl_space *pw_space;
5853 isl_local_space *ls = NULL;
5854
5855 if (!space || !var)
5856 goto error;
5857
5858 ls = isl_local_space_from_space(isl_space_copy(space));
5859 pw_space = isl_space_copy(space);
5860 pw_space = isl_space_from_domain(pw_space);
5861 pw_space = isl_space_add_dims(pw_space, isl_dim_out, 1);
5862 paff = isl_pw_aff_alloc_size(pw_space, var->n_row);
5863
5864 for (i = 0; i < var->n_row; ++i) {
5865 isl_pw_aff *paff_i;
5866
5867 aff = isl_aff_alloc(isl_local_space_copy(ls));
5868 bset = isl_basic_set_alloc_space(isl_space_copy(space), 0,
5869 0, var->n_row - 1);
5870 if (!aff || !bset)
5871 goto error;
5872 isl_int_set_si(aff->v->el[0], 1);
5873 isl_seq_cpy(aff->v->el + 1, var->row[i], var->n_col);
5874 isl_int_set_si(aff->v->el[1 + var->n_col], 0);
5875 bset = select_minimum(bset, var, i);
5876 paff_i = isl_pw_aff_alloc(isl_set_from_basic_set(bset), aff);
5877 paff = isl_pw_aff_add_disjoint(paff, paff_i);
5878 }
5879
5880 isl_local_space_free(ls);
5881 isl_space_free(space);
5882 isl_mat_free(var);
5883 return paff;
5884 error:
5885 isl_aff_free(aff);
5886 isl_basic_set_free(bset);
5887 isl_pw_aff_free(paff);
5888 isl_local_space_free(ls);
5889 isl_space_free(space);
5890 isl_mat_free(var);
5891 return NULL;
5892 }
5893
5894 /* Given a piecewise multi-affine expression of which the last input variable
5895 * is the minimum of the bounds in "cst", plug in the value of the minimum.
5896 * This minimum expression is given in "min_expr_pa".
5897 * The set "min_expr" contains the same information, but in the form of a set.
5898 * The variable is subsequently projected out.
5899 *
5900 * The implementation is similar to those of "split" and "split_domain".
5901 * If the variable appears in a given expression, then minimum expression
5902 * is plugged in. Otherwise, if the variable appears in the constraints
5903 * and a split is required, then the domain is split. Otherwise, no split
5904 * is performed.
5905 */
split_domain_pma(__isl_take isl_pw_multi_aff * opt,__isl_take isl_pw_aff * min_expr_pa,__isl_take isl_set * min_expr,__isl_take isl_mat * cst)5906 static __isl_give isl_pw_multi_aff *split_domain_pma(
5907 __isl_take isl_pw_multi_aff *opt, __isl_take isl_pw_aff *min_expr_pa,
5908 __isl_take isl_set *min_expr, __isl_take isl_mat *cst)
5909 {
5910 isl_size n_in;
5911 int i;
5912 isl_space *space;
5913 isl_pw_multi_aff *res;
5914
5915 if (!opt || !min_expr || !cst)
5916 goto error;
5917
5918 n_in = isl_pw_multi_aff_dim(opt, isl_dim_in);
5919 if (n_in < 0)
5920 goto error;
5921 space = isl_pw_multi_aff_get_space(opt);
5922 space = isl_space_drop_dims(space, isl_dim_in, n_in - 1, 1);
5923 res = isl_pw_multi_aff_empty(space);
5924
5925 for (i = 0; i < opt->n; ++i) {
5926 isl_bool subs;
5927 isl_pw_multi_aff *pma;
5928
5929 pma = isl_pw_multi_aff_alloc(isl_set_copy(opt->p[i].set),
5930 isl_multi_aff_copy(opt->p[i].maff));
5931 subs = need_substitution(opt->p[i].maff);
5932 if (subs < 0) {
5933 pma = isl_pw_multi_aff_free(pma);
5934 } else if (subs) {
5935 pma = isl_pw_multi_aff_substitute(pma,
5936 isl_dim_in, n_in - 1, min_expr_pa);
5937 } else {
5938 isl_bool split;
5939 split = need_split_set(opt->p[i].set, cst);
5940 if (split < 0)
5941 pma = isl_pw_multi_aff_free(pma);
5942 else if (split)
5943 pma = isl_pw_multi_aff_intersect_domain(pma,
5944 isl_set_copy(min_expr));
5945 }
5946 pma = isl_pw_multi_aff_project_out(pma,
5947 isl_dim_in, n_in - 1, 1);
5948
5949 res = isl_pw_multi_aff_add_disjoint(res, pma);
5950 }
5951
5952 isl_pw_multi_aff_free(opt);
5953 isl_pw_aff_free(min_expr_pa);
5954 isl_set_free(min_expr);
5955 isl_mat_free(cst);
5956 return res;
5957 error:
5958 isl_pw_multi_aff_free(opt);
5959 isl_pw_aff_free(min_expr_pa);
5960 isl_set_free(min_expr);
5961 isl_mat_free(cst);
5962 return NULL;
5963 }
5964
5965 static __isl_give isl_pw_multi_aff *basic_map_partial_lexopt_pw_multi_aff(
5966 __isl_take isl_basic_map *bmap, __isl_take isl_basic_set *dom,
5967 __isl_give isl_set **empty, int max);
5968
5969 /* This function is called from basic_map_partial_lexopt_symm.
5970 * The last variable of "bmap" and "dom" corresponds to the minimum
5971 * of the bounds in "cst". "map_space" is the space of the original
5972 * input relation (of basic_map_partial_lexopt_symm) and "set_space"
5973 * is the space of the original domain.
5974 *
5975 * We recursively call basic_map_partial_lexopt and then plug in
5976 * the definition of the minimum in the result.
5977 */
5978 static __isl_give isl_pw_multi_aff *
basic_map_partial_lexopt_symm_core_pw_multi_aff(__isl_take isl_basic_map * bmap,__isl_take isl_basic_set * dom,__isl_give isl_set ** empty,int max,__isl_take isl_mat * cst,__isl_take isl_space * map_space,__isl_take isl_space * set_space)5979 basic_map_partial_lexopt_symm_core_pw_multi_aff(
5980 __isl_take isl_basic_map *bmap, __isl_take isl_basic_set *dom,
5981 __isl_give isl_set **empty, int max, __isl_take isl_mat *cst,
5982 __isl_take isl_space *map_space, __isl_take isl_space *set_space)
5983 {
5984 isl_pw_multi_aff *opt;
5985 isl_pw_aff *min_expr_pa;
5986 isl_set *min_expr;
5987
5988 min_expr = set_minimum(isl_basic_set_get_space(dom), isl_mat_copy(cst));
5989 min_expr_pa = set_minimum_pa(isl_basic_set_get_space(dom),
5990 isl_mat_copy(cst));
5991
5992 opt = basic_map_partial_lexopt_pw_multi_aff(bmap, dom, empty, max);
5993
5994 if (empty) {
5995 *empty = split(*empty,
5996 isl_set_copy(min_expr), isl_mat_copy(cst));
5997 *empty = isl_set_reset_space(*empty, set_space);
5998 }
5999
6000 opt = split_domain_pma(opt, min_expr_pa, min_expr, cst);
6001 opt = isl_pw_multi_aff_reset_space(opt, map_space);
6002
6003 return opt;
6004 }
6005
6006 #undef TYPE
6007 #define TYPE isl_pw_multi_aff
6008 #undef SUFFIX
6009 #define SUFFIX _pw_multi_aff
6010 #include "isl_tab_lexopt_templ.c"
6011