dependence_graph.cc

   1 #include <isl/val.h>
   2 #include <isl/space.h>
   3 #include <isl/aff.h>
   4 #include <isl/set.h>
   5 #include <isl/map.h>
   6 #include <isl/printer.h>
   7 #include <isa/pdg.h>
   8 #include "dependence_graph.h"
   9
  10 void edge::dump(void)
  11 {
  12         isl_ctx *ctx;
  13         isl_printer *prn;
  14         const char *s;
  15         switch (type) {
  16         case normal:            s = ""; break;
  17         case expansion:         s = "expansion "; break;
  18         }
  19         fprintf(stderr, "\tpos: %d, source: %d,%s %s[%p]\n",
  20                         pos, source->location, source->operation, s, source);
  21         ctx = isl_map_get_ctx(relation);
  22         prn = isl_printer_to_file(ctx, stderr);
  23         prn = isl_printer_set_indent(prn, 8);
  24         prn = isl_printer_print_map(prn, relation);
  25         prn = isl_printer_end_line(prn);
  26         isl_printer_free(prn);
  27 }
  28
  29 void computation::dump(void)
  30 {
  31         isl_ctx *ctx;
  32         isl_printer *prn;
  33         const char *s;
  34         if (input)
  35                 s = "input ";
  36         else if (is_expanded)
  37                 s = "is_expanded ";
  38         else
  39                 s = "";
  40         fprintf(stderr, "op: %d,%s/%d %s[%p]\n",
  41                         location, operation, arity, s, this);
  42         ctx = isl_set_get_ctx(domain);
  43         prn = isl_printer_to_file(ctx, stderr);
  44         prn = isl_printer_print_set(prn, domain);
  45         prn = isl_printer_end_line(prn);
  46         isl_printer_free(prn);
  47
  48         for (int i = 0; i < edges.size(); ++i) {
  49                 fprintf(stderr, "edge %d:\n", i);
  50                 edges[i]->dump();
  51         }
  52 }
  53
  54 void dependence_graph::dump(void)
  55 {
  56         for (int i = 0; i < vertices.size(); ++i)
  57                 vertices[i]->dump();
  58         out->dump();
  59 }
  60
  61 static void add_input_edges(isl_ctx *ctx, int pos, pdg::dependence *dep,
  62                         computation *comp, computation *source)
  63 {
  64         pdg::access *a = dep->to_access;
  65         assert(source);
  66         isl_map *map = a->map->get_isl_map(ctx);
  67         isl_map *relation = dep->relation->get_isl_map(ctx);
  68         isl_set *domain = isl_map_range(relation);
  69         map = isl_map_intersect_domain(map, domain);
  70
  71         edge *e = new edge;
  72         e->source = source;
  73         e->pos = pos;
  74         e->relation = map;
  75         comp->edges.push_back(e);
  76 }
  77
  78 /* For each basic map in relation, add an edge to comp with
  79  * given source and pos.
  80  */
  81 static void add_split_edge(computation *comp, computation *source,
  82         int pos, isl_map *relation, std::vector<computation **> *missing,
  83         enum edge::type type = edge::normal)
  84 {
  85         edge *e = new edge;
  86         e->source = source;
  87         if (!source) {
  88                 assert(missing);
  89                 missing->push_back(&e->source);
  90         }
  91         e->pos = pos;
  92         e->relation = relation;
  93         e->type = type;
  94         comp->edges.push_back(e);
  95 }
  96
  97 /* For each (flow) dependence with write access a, and an
  98  * edge to computation comp.
  99  * Note that in the pdg, the dependences have as "input" the source (read)
 100  * and as "output" the sink (write), while in the dependence_graph,
 101  * we want edges that point from sink to source.
 102  *
 103  * If the (read) access has an extension, i.e., if the access
 104  * reads a row or an even larger chunk of an array, then we introduces
 105  * an extra "expansion" edge to an extra node that corresponds to the
 106  * reading of the whole array.  The iteration domain of this extra node
 107  * has extra dimensions, as many as were missing from the access.
 108  * The extra edge maps each iteration of the statement in which
 109  * the read appears to all iterations in the extended iteration domain
 110  * with the same values for the first iterators.
 111  * The remaining iterators range over the elements of the array chunk.
 112  * All dependences in which the given access is involved are attached
 113  * to the new node, where we need to be careful to use the extended_relation
 114  * instead of the projected "standard" relations.
 115  * The operation associated with the new node is the
 116  * empty string since the new node can be treated as a copy operation.
 117  * The edge connecting the original computation and the new node
 118  * is marked as an "expansion" edge because it needs to be treated
 119  * in a special way.
 120  */
 121 static void add_dep_edges(dependence_graph *dg, pdg::PDG *pdg,
 122                 std::map<pdg::access *, computation *> &s2c,
 123                 std::map<pdg::array *, computation *> &a2c,
 124                 std::map<pdg::access *, std::vector<computation **> > &missing,
 125                 int pos, pdg::access *a, computation *comp)
 126 {
 127         isl_ctx *ctx = pdg->get_isl_ctx();
 128         if (a->extension) {
 129                 isl_map *ext = a->extension->get_isl_map(ctx);
 130
 131                 computation *child = new computation();
 132                 child->domain = isl_set_apply(isl_set_copy(comp->domain),
 133                                                 isl_map_copy(ext));
 134                 child->operation = strdup("");
 135                 child->arity = 1;
 136                 child->location = comp->location;
 137                 dg->vertices.push_back(child);
 138
 139                 add_split_edge(comp, child, pos, ext, NULL, edge::expansion);
 140                 comp->is_expanded = 1;
 141                 comp = child;
 142                 pos = 0;
 143         }
 144         for (int i = 0; i < pdg->dependences.size(); ++i) {
 145                 pdg::dependence *dep = pdg->dependences[i];
 146                 if (dep->to_access != a)
 147                         continue;
 148
 149                 if (dep->type == pdg::dependence::uninitialized) {
 150                         add_input_edges(ctx, pos, dep, comp, a2c[dep->array]);
 151                         continue;
 152                 }
 153                 assert(dep->type == pdg::dependence::flow);
 154
 155                 isl_map *relation;
 156                 if (!dep->extended_relation)
 157                         relation = dep->relation->get_isl_map(ctx);
 158                 else
 159                         relation = dep->extended_relation->get_isl_map(ctx);
 160                 relation = isl_map_reverse(relation);
 161                 add_split_edge(comp, s2c[dep->from_access], pos, relation,
 162                                 &missing[dep->from_access]);
 163         }
 164 }
 165
 166 /* Each access without an associated array corresponds to a read
 167  * of an (affine combination of) iterator value(s).
 168  * The expression in terms of the iterators is given by the access map.
 169  * For each of these accesses, we add an edge to a special
 170  * "input computation" that is not associated to any particular
 171  * (input) array.  The map of the edge is the access map,
 172  * with the domain intersected with the domain of the current computation.
 173  * This ensures that corresponding reads are considered equal iff the
 174  * value they read is the same for both programs.
 175  *
 176  * In the special case where the affine expression is a mere integer constant
 177  * that appears as an argument to a #test operation, the domain of "comp"
 178  * may reference an argument that may not be present in "a" if it was
 179  * created by c2pdg from an integer expression.
 180  * In this case, we not only need to intersect the domain of
 181  * the access relation, but also introduce a reference to the argument.
 182  */
 183 static void add_iterator_edges(pdg::PDG *pdg,
 184                             std::map<pdg::array *, computation *> &a2c,
 185                             int pos,
 186                             pdg::access *a, computation *comp)
 187 {
 188         isl_ctx *ctx = pdg->get_isl_ctx();
 189         computation *Z = a2c[NULL];
 190         isl_map *map = a->map->get_isl_map(ctx);
 191         isl_set *domain = isl_set_copy(comp->domain);
 192         if (isl_set_is_wrapping(domain) && !isl_map_domain_is_wrapping(map)) {
 193                 isl_map *domain_map;
 194                 domain_map = isl_map_domain_map(isl_set_unwrap(domain));
 195                 map = isl_map_apply_range(domain_map, map);
 196         } else
 197                 map = isl_map_intersect_domain(map, domain);
 198         add_split_edge(comp, Z, pos, map, NULL);
 199 }
 200
 201 static void add_access_edges(dependence_graph *dg, pdg::PDG *pdg,
 202                 std::map<pdg::access *, computation *> &s2c,
 203                 std::map<pdg::array *, computation *> &a2c,
 204                 std::map<pdg::access *, std::vector<computation **> > &missing,
 205                 int pos, pdg::access *a, computation *comp)
 206 {
 207         if (a->array)
 208                 add_dep_edges(dg, pdg, s2c, a2c, missing, pos, a, comp);
 209         else
 210                 add_iterator_edges(pdg, a2c, pos, a, comp);
 211 }
 212
 213 static int add_edges_at_pos(dependence_graph *dg, pdg::PDG *pdg,
 214                 std::map<pdg::access *, computation *> &s2c,
 215                 std::map<pdg::array *, computation *> &a2c,
 216                 std::map<pdg::access *, std::vector<computation **> > &missing,
 217                 int pos, pdg::call_or_access *coa, computation *comp);
 218
 219 /* Add a new copy computation to dependence graph dg with given
 220  * domain and location and return a pointer to the copy computation.
 221  */
 222 static computation *add_copy_computation(dependence_graph *dg,
 223                 isl_set *domain, int location)
 224 {
 225         computation *copy;
 226         copy = new computation();
 227         copy->domain = domain;
 228         copy->operation = strdup("");
 229         copy->arity = 1;
 230         copy->location = location;
 231         dg->vertices.push_back(copy);
 232         return copy;
 233 }
 234
 235 /* Create a "#NEST computation, with n + 1 arguments, where n is the
 236  * number of nested accesses.
 237  * The first n arguments correspond to the nested accesses and
 238  * edges for these arguments are added as usual.
 239  * Note that if the access "a" appears in a "#test" function,
 240  * then some of the nested accesses will already have been
 241  * added by an outer #NEST computation and should therefore be skipped.
 242  * The final argument corresponds to the expansion and for this position
 243  * a single expansion edge is added to the given copy computation.
 244  * The mapping on the expansion edge is the identity
 245  * mapping on the domain, with the range extended by one dimension for
 246  * each of nested accesses.  The range of values in each of these dimensions
 247  * is given by the value_bounds on the corresponding array.
 248  * The iteration domain of the given copy computation is adjusted accordingly.
 249  */
 250 static computation *add_nest_computation(dependence_graph *dg, pdg::PDG *pdg,
 251                 std::map<pdg::access *, computation *> &s2c,
 252                 std::map<pdg::array *, computation *> &a2c,
 253                 std::map<pdg::access *, std::vector<computation **> > &missing,
 254                 pdg::access *a, computation *copy)
 255 {
 256         isl_ctx *ctx = pdg->get_isl_ctx();
 257         computation *nest = new computation();
 258         nest->domain = isl_set_copy(copy->domain);
 259         nest->operation = strdup("#NEST");
 260         nest->arity = a->nested.size() + 1;
 261         nest->location = copy->location;
 262         dg->vertices.push_back(nest);
 263
 264         int nested_dim = a->map->input() - isl_set_dim(copy->domain, isl_dim_set);
 265         assert(nested_dim > 0 && nested_dim <= a->nested.size());
 266         int skip_dim = a->nested.size() - nested_dim;
 267
 268         isl_space *dim;
 269         isl_set *bounds;
 270         isl_map *ext;
 271         int pos = 0;
 272
 273         dim = isl_set_get_space(copy->domain);
 274         dim = isl_space_drop_dims(dim, isl_dim_set,
 275                                         0, isl_space_dim(dim, isl_dim_set));
 276         bounds = isl_set_universe(dim);
 277
 278         for (int i = skip_dim; i < a->nested.size(); ++i) {
 279                 pdg::call_or_access *coa = a->nested[i];
 280
 281                 if (add_edges_at_pos(dg, pdg, s2c, a2c,
 282                                      missing, pos, coa, nest))
 283                         ++pos;
 284
 285                 assert(coa->type == pdg::call_or_access::t_access);
 286                 pdg::access *nested = coa->access;
 287                 assert(nested->array->value_bounds);
 288                 isl_set *bounds_i;
 289                 bounds_i = nested->array->value_bounds->get_isl_set(ctx);
 290
 291                 bounds = isl_set_flat_product(bounds, bounds_i);
 292         }
 293
 294         dim = isl_set_get_space(copy->domain);
 295         copy->domain = isl_set_product(copy->domain, isl_set_copy(bounds));
 296         bounds = isl_set_product(isl_set_universe(dim), bounds);
 297         ext = isl_map_reverse(isl_map_domain_map(isl_set_unwrap(bounds)));
 298
 299         add_split_edge(nest, copy, pos, ext, NULL, edge::expansion);
 300         nest->is_expanded = 1;
 301
 302         return nest;
 303 }
 304
 305 /* Add an edge to "comp" at position "pos" according to access "a",
 306  * where "a" is has nested accesses.
 307  * We first create a copy computation where the actual access
 308  * will be attached.  Then we create a "#NEST" computation that
 309  * sits between "comp" and the copy computation.
 310  */
 311 static void add_nested_access_edge(dependence_graph *dg, pdg::PDG *pdg,
 312                 std::map<pdg::access *, computation *> &s2c,
 313                 std::map<pdg::array *, computation *> &a2c,
 314                 std::map<pdg::access *, std::vector<computation **> > &missing,
 315                 int pos, pdg::access *a, computation *comp)
 316 {
 317         computation *copy;
 318         copy = add_copy_computation(dg, isl_set_copy(comp->domain),
 319                                     comp->location);
 320
 321         computation *nest;
 322         nest = add_nest_computation(dg, pdg, s2c, a2c, missing, a, copy);
 323
 324         edge *e = new edge;
 325         e->pos = pos;
 326         e->source = nest;
 327         isl_space *dim = isl_space_map_from_set(isl_set_get_space(comp->domain));
 328         e->relation = isl_map_identity(dim);
 329         comp->edges.push_back(e);
 330
 331         add_access_edges(dg, pdg, s2c, a2c, missing, 0, a, copy);
 332 }
 333
 334 /* "Invocations" of integer constants are replaced by accesses
 335  * to the "input computation", so we can treat them like and combine them
 336  * with iterator accesses.
 337  */
 338 static void add_constant_edge(pdg::PDG *pdg,
 339                             std::map<pdg::array *, computation *> &a2c,
 340                             int pos, long cst, computation *comp)
 341 {
 342         isl_ctx *ctx = pdg->get_isl_ctx();
 343         computation *Z = a2c[NULL];
 344
 345         isl_map *map = isl_map_from_range(isl_set_copy(comp->domain));
 346         map = isl_map_reverse(map);
 347         map = isl_map_add_dims(map, isl_dim_out, 1);
 348         map = isl_map_fix_si(map, isl_dim_out, 0, cst);
 349         add_split_edge(comp, Z, pos, map, NULL);
 350 }
 351
 352 static void add_edges(dependence_graph *dg, pdg::PDG *pdg,
 353                 std::map<pdg::access *, computation *> &s2c,
 354                 std::map<pdg::array *, computation *> &a2c,
 355                 std::map<pdg::access *, std::vector<computation **> > &missing,
 356                 pdg::function_call *call, computation *comp);
 357
 358 /* Scale the single output dimension of bmap by a factor of f */
 359 static __isl_give isl_map *scale(__isl_take isl_map *map, __isl_take isl_val *f)
 360 {
 361         isl_multi_aff *scaling;
 362         isl_space *space;
 363
 364         space = isl_map_get_space(map);
 365         space = isl_space_range(space);
 366         space = isl_space_map_from_set(space);
 367         scaling = isl_multi_aff_identity(space);
 368         scaling = isl_multi_aff_scale_val(scaling, f);
 369
 370         map = isl_map_apply_range(map, isl_map_from_multi_aff(scaling));
 371
 372         return map;
 373 }
 374
 375 /* Compute the mapping along the given edge to the Z computation,
 376  * where the Z computation may be either the source of the edge
 377  * or it may be the source of the single edge leaving the copy
 378  * computation that is the source of the given edge.
 379  */
 380 static isl_map *map_to_Z(edge *edge, computation *Z)
 381 {
 382         if (edge->source == Z)
 383                 return isl_map_copy(edge->relation);
 384         assert(edge->source->is_copy());
 385         assert(edge->source->edges.size() == 1);
 386         assert(edge->source->edges[0]->source == Z);
 387         return isl_map_apply_range(
 388                 isl_map_copy(edge->relation),
 389                 isl_map_copy(edge->source->edges[0]->relation));
 390 }
 391
 392 static isl_map *affine_expression_div(computation *comp, computation *Z)
 393 {
 394         isl_map *map = NULL;
 395         isl_val *v;
 396         isl_map *rel = map_to_Z(comp->edges[1], Z);
 397
 398         v = isl_map_plain_get_val_if_fixed(rel, isl_dim_out, 0);
 399         if (isl_val_is_int(v)) {
 400                 map = isl_map_floordiv_val(
 401                     isl_map_copy(comp->edges[0]->relation), v);
 402         } else
 403                 isl_val_free(v);
 404         isl_map_free(rel);
 405         return map;
 406 }
 407
 408 /* Construct a map for CLooG's ceild operation.
 409  *
 410  * We simply apply the identity
 411  *
 412  *      ceil(a/b) = - floor(-a/b)
 413  */
 414 static isl_map *affine_expression_ceildiv(computation *comp, computation *Z)
 415 {
 416         isl_map *map = NULL;
 417         isl_map *map2;
 418         isl_val *v;
 419
 420         map2 = map_to_Z(comp->edges[1], Z);
 421         v = isl_map_plain_get_val_if_fixed(map2, isl_dim_out, 0);
 422         if (isl_val_is_int(v)) {
 423                 map = isl_map_neg(map_to_Z(comp->edges[0], Z));
 424                 map = isl_map_neg(isl_map_floordiv_val(map, v));
 425         } else
 426                 isl_val_free(v);
 427
 428         isl_map_free(map2);
 429         return map;
 430 }
 431
 432 /* Construct a mapping for the maximum of two mappings.
 433  *
 434  * In particular, given two mappings in the arguments of "comp"
 435  *
 436  *      [input] -> [a]
 437  *      [input] -> [b]
 438  *
 439  * construct
 440  *
 441  *      [input] -> [a] : a >= b; [input] -> [b] : a < b
 442  *
 443  * We first construct
 444  *
 445  *      [input] -> [[a] -> [b]]
 446  *
 447  * intersect the range with [a] -> [b] : a >= b and [a] -> [b] : a < b
 448  * and then map the range to its domain and range in the respective results.
 449  */
 450 static isl_map *affine_expression_max(computation *comp, computation *Z)
 451 {
 452         isl_space *dim;
 453         isl_map *map, *ge, *lt;
 454         isl_map *map1, *map2;
 455
 456         map1 = map_to_Z(comp->edges[0], Z);
 457         map2 = map_to_Z(comp->edges[1], Z);
 458
 459         dim = isl_map_get_space(map1);
 460         dim = isl_space_range(dim);
 461
 462         map = isl_map_range_product(map1, map2);
 463
 464         ge = isl_map_lex_ge(isl_space_copy(dim));
 465         lt = isl_map_lex_lt(isl_space_copy(dim));
 466
 467         ge = isl_map_intersect_range(isl_map_copy(map), isl_map_wrap(ge));
 468         lt = isl_map_intersect_range(map, isl_map_wrap(lt));
 469
 470         dim = isl_space_map_from_set(dim);
 471         map = isl_map_universe(isl_space_copy(dim));
 472         map = isl_map_domain_map(map);
 473         ge = isl_map_apply_range(ge, map);
 474
 475         map = isl_map_universe(dim);
 476         map = isl_map_range_map(map);
 477         lt = isl_map_apply_range(lt, map);
 478
 479         map = isl_map_union(ge, lt);
 480
 481         return map;
 482 }
 483
 484 /* Given two maps A -> f(A) and B -> g(B), construct a map
 485  * A -> f(A) * g(B) or B -> f(A) * g(B), if at least one of
 486  * "rel0" or "rel1" maps to a constant value.
 487  * Otherwise, return NULL.
 488  */
 489 static __isl_give isl_map *map_mul(__isl_take isl_map *rel0,
 490         __isl_take isl_map *rel1)
 491 {
 492         isl_val *v;
 493
 494         v = isl_map_plain_get_val_if_fixed(rel0, isl_dim_out, 0);
 495         if (isl_val_is_int(v)) {
 496                 isl_map_free(rel0);
 497                 return scale(rel1, v);
 498         }
 499         isl_val_free(v);
 500
 501         v = isl_map_plain_get_val_if_fixed(rel1, isl_dim_out, 0);
 502         if (isl_val_is_int(v)) {
 503                 isl_map_free(rel1);
 504                 return scale(rel0, v);
 505         }
 506         isl_val_free(v);
 507
 508         isl_map_free(rel0);
 509         isl_map_free(rel1);
 510
 511         return NULL;
 512 }
 513
 514 /* If comp represents an operation on affine expressions that can
 515  * be represented by a single affine expression, then return a mapping
 516  * encoding this single affine expression.  Otherwise return NULL.
 517  */
 518 static isl_map *affine_expression(computation *comp, computation *Z)
 519 {
 520         if (comp->arity != comp->edges.size())
 521                 return NULL;
 522         for (int i = 0; i < comp->edges.size(); ++i) {
 523                 computation *source = comp->edges[i]->source;
 524                 if (source == Z)
 525                         continue;
 526                 if (source && source->is_copy() && source->edges.size() == 1 &&
 527                     source->edges[0]->source == Z)
 528                         continue;
 529                 return NULL;
 530         }
 531         if (!strcmp(comp->operation, "+") && comp->arity == 2)
 532                 return isl_map_sum(map_to_Z(comp->edges[0], Z),
 533                                          map_to_Z(comp->edges[1], Z));
 534         if (!strcmp(comp->operation, "-") && comp->arity == 2)
 535                 return isl_map_sum(
 536                         map_to_Z(comp->edges[0], Z),
 537                         isl_map_neg(map_to_Z(comp->edges[1], Z)));
 538         if (!strcmp(comp->operation, "-") && comp->arity == 1)
 539                 return isl_map_neg(map_to_Z(comp->edges[0], Z));
 540         if (!strcmp(comp->operation, "/") && comp->arity == 2)
 541                 return affine_expression_div(comp, Z);
 542         if (!strcmp(comp->operation, "floord") && comp->arity == 2)
 543                 return affine_expression_div(comp, Z);
 544         if (!strcmp(comp->operation, "ceild") && comp->arity == 2)
 545                 return affine_expression_ceildiv(comp, Z);
 546         if (!strcmp(comp->operation, "max") && comp->arity == 2)
 547                 return affine_expression_max(comp, Z);
 548         if (!strcmp(comp->operation, "*") && comp->arity == 2) {
 549                 isl_map *rel0 = map_to_Z(comp->edges[0], Z);
 550                 isl_map *rel1 = map_to_Z(comp->edges[1], Z);
 551                 return map_mul(rel0, rel1);
 552         }
 553         return NULL;
 554 }
 555
 556 static void add_computation_edge(dependence_graph *dg, pdg::PDG *pdg,
 557                 std::map<pdg::access *, computation *> &s2c,
 558                 std::map<pdg::array *, computation *> &a2c,
 559                 std::map<pdg::access *, std::vector<computation **> > &missing,
 560                 pdg::function_call *call, computation *comp, int pos)
 561 {
 562         char *endp;
 563         long int cst;
 564         cst = strtol(call->name->s.c_str(), &endp, 0);
 565         if (*call->name->s.c_str() && !*endp) {
 566                 add_constant_edge(pdg, a2c, pos, cst, comp);
 567                 return;
 568         }
 569
 570         computation *child = new computation();
 571         child->domain = isl_set_copy(comp->domain);
 572         child->operation = strdup(call->name->s.c_str());
 573         child->arity = call->arguments.size();
 574         child->location = comp->location;
 575
 576         edge *e = new edge;
 577         e->pos = pos;
 578         comp->edges.push_back(e);
 579
 580         add_edges(dg, pdg, s2c, a2c, missing, call, child);
 581
 582         isl_map *expr = affine_expression(child, a2c[NULL]);
 583         if (expr) {
 584                 delete child;
 585                 e->source = a2c[NULL];
 586                 e->relation = expr;
 587         } else {
 588                 dg->vertices.push_back(child);
 589                 e->source = child;
 590                 isl_space *dim = isl_set_get_space(comp->domain);
 591                 e->relation = isl_map_identity(isl_space_map_from_set(dim));
 592         }
 593 }
 594
 595 /* Add and edge from computation "at" to the integer computation "Z".
 596  * The edge maps the domain of "at" to the value of its dimension "index_dim".
 597  */
 598 static void add_index_edge(dependence_graph *dg,
 599         computation *at, computation *Z, int pos, unsigned index_dim)
 600 {
 601         unsigned total_out = isl_set_dim(at->domain, isl_dim_out);
 602         isl_space *dim = isl_set_get_space(at->domain);
 603         isl_map *id = isl_map_identity(isl_space_map_from_set(dim));
 604         id = isl_map_remove_dims(id, isl_dim_out, index_dim + 1,
 605                                      total_out - index_dim - 1);
 606         id = isl_map_remove_dims(id, isl_dim_out, 0, index_dim);
 607         add_split_edge(at, Z, pos, id, NULL);
 608 }
 609
 610 /* Given a write access "a" inside the arguments of a function call
 611  * that was translated into computation "comp", make "a" point to
 612  * "comp" as its computation and fill in locations collected in
 613  * "missing" that should refer to the computation of "a".
 614  *
 615  * If the write access has an extension, i.e., if a whole row or
 616  * an even larger chunk of an array is written, then we introduce
 617  * a new node that corresponds to selecting the individual elements.
 618  * Dependences that flow from the write are then turned into edges that
 619  * point to the new computation.
 620  * If the write access extends the dimension by s, i.e., if the
 621  * chunk written is of dimension s, then the new computation with
 622  * operation "#at" has 1 + s arguments, one for the chunk itself
 623  * and one for each index in the chunk.
 624  * There is exactly one edge for each arguments position, each
 625  * selecting the appropriate dimensions from the domain.
 626  * The first argument ensures that the values of the chunks
 627  * are the same in both programs, while the remaining arguments
 628  * ensure that the same element from this chunk is selected.
 629  */
 630 static void set_write_access(dependence_graph *dg, pdg::PDG *pdg,
 631                 std::map<pdg::access *, computation *> &s2c,
 632                 std::map<pdg::array *, computation *> &a2c,
 633                 std::map<pdg::access *, std::vector<computation **> > &missing,
 634                 pdg::access *a, computation *comp)
 635 {
 636         if (a->extension) {
 637                 isl_ctx *ctx = pdg->get_isl_ctx();
 638                 isl_map *ext = a->extension->get_isl_map(ctx);
 639                 unsigned dim = isl_map_dim(ext, isl_dim_in);
 640                 unsigned e_dim = isl_map_dim(ext, isl_dim_out);
 641
 642                 computation *at = new computation();
 643                 at->domain = isl_set_apply(isl_set_copy(comp->domain),
 644                                                 isl_map_copy(ext));
 645                 at->operation = strdup("#at");
 646                 at->arity = 1 + (e_dim - dim);
 647                 at->location = comp->location;
 648                 dg->vertices.push_back(at);
 649
 650                 ext = isl_map_reverse(ext);
 651                 add_split_edge(at, comp, 0, ext, NULL);
 652                 for (int i = 0; i < e_dim - dim; ++i)
 653                         add_index_edge(dg, at, a2c[NULL], 1 + i, dim + i);
 654                 comp = at;
 655         }
 656         s2c[a] = comp;
 657         for (int k = 0; k < missing[a].size(); ++k)
 658                 *missing[a][k] = comp;
 659 }
 660
 661 /* For a given call or access "coa" which appears as argument "pos" of
 662  * a function call, add one or more edges to computation comp.
 663  * In case the argument is an access, the edges corresponding to
 664  * the dependences are added in add_dep_edges.
 665  * If it is itself a function call, then a single edge is added
 666  * to a new child and add_edges is called recursively on the
 667  * nested function call.
 668  * Return 1 if any edges were added for this position and 0 if not.
 669  * In particular, a write access should not be considered as an
 670  * argument and is therefore skipped.
 671  */
 672 static int add_edges_at_pos(dependence_graph *dg, pdg::PDG *pdg,
 673                 std::map<pdg::access *, computation *> &s2c,
 674                 std::map<pdg::array *, computation *> &a2c,
 675                 std::map<pdg::access *, std::vector<computation **> > &missing,
 676                 int pos, pdg::call_or_access *coa, computation *comp)
 677 {
 678         if (coa->type == pdg::call_or_access::t_access) {
 679                 pdg::access *a = coa->access;
 680                 if (a->type == pdg::access::write) {
 681                         set_write_access(dg, pdg, s2c, a2c, missing, a, comp);
 682                         comp->arity--;
 683                         return 0;
 684                 }
 685                 int nested_dim = a->map->input() -
 686                                         isl_set_dim(comp->domain, isl_dim_set);
 687                 if (nested_dim > 0)
 688                         add_nested_access_edge(dg, pdg, s2c, a2c, missing,
 689                                                 pos, coa->access, comp);
 690                 else
 691                         add_access_edges(dg, pdg, s2c, a2c, missing,
 692                                          pos, coa->access, comp);
 693         } else {
 694                 add_computation_edge(dg, pdg, s2c, a2c, missing,
 695                                         coa->call, comp, pos);
 696         }
 697         return 1;
 698 }
 699
 700 /* For each argument of function call call, we add one or more edges to
 701  * computation comp.
 702  */
 703 static void add_edges(dependence_graph *dg, pdg::PDG *pdg,
 704                 std::map<pdg::access *, computation *> &s2c,
 705                 std::map<pdg::array *, computation *> &a2c,
 706                 std::map<pdg::access *, std::vector<computation **> > &missing,
 707                 pdg::function_call *call, computation *comp)
 708 {
 709         int pos = 0;
 710         for (int i = 0; i < call->arguments.size(); ++i) {
 711                 pdg::call_or_access *coa = call->arguments[i];
 712
 713                 if (add_edges_at_pos(dg, pdg, s2c, a2c,
 714                                      missing, pos, coa, comp))
 715                         ++pos;
 716         }
 717
 718         return;
 719 }
 720
 721 /* Add an edge from the output computation (out) to a computation computing
 722  * (part of) an output array.  node is pdg node corresponding to this
 723  * computation.  It is assumed to have a single write access, corresponding
 724  * to the output array.  exposed is that part of the node domain that
 725  * is not the source of an output dependence, i.e., those for which
 726  * the computed array elements are not overwritten.
 727  * Let f(i) be the index expression of the write access and let
 728  * pos be the position of the output array in the sorted list of
 729  * output arrays, then an edge is added to out with relation
 730  *
 731  *      { [ f(i), 0, pos ] -> [i] | i \in exposed }
 732  *
 733  * where the total dimension of the domain is out_dim, and this domain
 734  * is added to the domain of the output computation.
 735  */
 736 static void add_output_edge(isl_ctx *ctx, computation *out, pdg::node *node,
 737         std::map<pdg::array *, int> &array2pos,
 738         computation *last,
 739         isl_set *exposed, unsigned nparam, unsigned out_dim)
 740 {
 741         pdg::statement *s = node->statement;
 742         int j;
 743         for (j = 0;  j < s->accesses.size(); ++j)
 744                 if (s->accesses[j]->type == pdg::access::write &&
 745                     s->accesses[j]->array->type == pdg::array::output)
 746                         break;
 747         pdg::array *array = s->accesses[j]->array;
 748         int pos = array2pos[array];
 749         isl_map *rel;
 750         if (!s->accesses[j]->extended_map)
 751                 rel = isl_map_reverse(s->accesses[j]->map->get_isl_map(ctx));
 752         else
 753                 rel = isl_map_reverse(s->accesses[j]->extended_map->get_isl_map(ctx));
 754         rel = isl_map_add_dims(rel, isl_dim_in,
 755                                 out_dim - isl_map_dim(rel, isl_dim_in));
 756         rel = isl_map_intersect_range(rel, exposed);
 757         rel = isl_map_fix_input_si(rel, out_dim-1, pos);
 758         for (int k = array->dims.size(); k < out_dim-1; ++k)
 759                 rel = isl_map_fix_input_si(rel, k, 0);
 760
 761         out->domain = isl_set_union_disjoint(out->domain,
 762                                         isl_map_domain(isl_map_copy(rel)));
 763         add_split_edge(out, last, 0, rel, NULL);
 764 }
 765
 766 static void connect_top_level_outputs(computation *comp,
 767         std::map<pdg::access *, computation *> &s2c,
 768         std::map<pdg::access *, std::vector<computation **> > &missing,
 769         pdg::node *node)
 770 {
 771         pdg::statement *s = node->statement;
 772
 773         for (int j = 0; j < s->top_outputs.size(); ++j) {
 774                 pdg::access *a = s->top_outputs[j];
 775                 s2c[a] = comp;
 776                 for (int k = 0; k < missing[a].size(); ++k)
 777                         *missing[a][k] = comp;
 778         }
 779 }
 780
 781 /* Add some computations to model a "#test" operation generated
 782  * by pers for data dependent assignments.
 783  * The test operation has three arguments.
 784  * The first is an "iteration" access with nested accesses corresponding
 785  * to the data dependent constructs in the conditions of the assignment.
 786  * The access relation maps iteration in the extended domain that
 787  * satisfy the conditions to 1, and those that do not satisfy the
 788  * conditions to 0.
 789  * The other two arguments are the operations or accesses performed
 790  * when the conditions hold (second argument) or do not hold (third
 791  * argument).
 792  *
 793  * We first create a copy computation and put it inside a #NEST
 794  * computation that add the required dimensions.
 795  * Then we split the extended iteration domain according to
 796  * the data dependent conditions using two child copy computations
 797  * with the appropriate dependence relations.
 798  * The second and third arguments of the "#test" operation are
 799  * then attached to these two child copy computations.
 800  */
 801 static void add_test_computation(dependence_graph *dg, pdg::PDG *pdg,
 802         std::map<pdg::access *, computation *> &s2c,
 803         std::map<pdg::array *, computation *> &a2c,
 804         std::map<pdg::access *, std::vector<computation **> > &missing,
 805         pdg::node *node)
 806 {
 807         isl_ctx *ctx = pdg->get_isl_ctx();
 808         pdg::statement *s = node->statement;
 809
 810         computation *copy;
 811         copy = add_copy_computation(dg, node->source->get_isl_set(ctx),
 812                                     s->line);
 813
 814         assert(s->top_function->arguments.size() == 3);
 815         pdg::call_or_access *coa = s->top_function->arguments[0];
 816         assert(coa->type == pdg::call_or_access::t_access);
 817         pdg::access *a = coa->access;
 818
 819         computation *nest;
 820         nest = add_nest_computation(dg, pdg, s2c, a2c, missing, a, copy);
 821
 822         isl_map *map_true = a->map->get_isl_map(ctx);
 823         isl_map *map_false = isl_map_copy(map_true);
 824
 825         map_true = isl_map_fix_si(map_true, isl_dim_out, 0, 1);
 826         map_false = isl_map_fix_si(map_false, isl_dim_out, 0, 0);
 827
 828         isl_space *dim = isl_space_domain(isl_map_get_space(map_true));
 829         dim = isl_space_map_from_set(dim);
 830         map_true = isl_map_intersect_domain(isl_map_identity(isl_space_copy(dim)),
 831                                             isl_map_domain(map_true));
 832         map_false = isl_map_intersect_domain(isl_map_identity(dim),
 833                                             isl_map_domain(map_false));
 834
 835         computation *copy_true;
 836         copy_true = add_copy_computation(dg, isl_set_copy(copy->domain),
 837                                          copy->location);
 838         computation *copy_false;
 839         copy_false = add_copy_computation(dg, isl_set_copy(copy->domain),
 840                                          copy->location);
 841
 842         add_split_edge(copy, copy_true, 0, map_true, NULL);
 843         add_split_edge(copy, copy_false, 0, map_false, NULL);
 844
 845         add_edges_at_pos(dg, pdg, s2c, a2c, missing, 0,
 846                                 s->top_function->arguments[1], copy_true);
 847         add_edges_at_pos(dg, pdg, s2c, a2c, missing, 0,
 848                                 s->top_function->arguments[2], copy_false);
 849
 850         connect_top_level_outputs(nest, s2c, missing, node);
 851 }
 852
 853 static void add_top_level_computation(dependence_graph *dg, pdg::PDG *pdg,
 854         std::map<pdg::access *, computation *> &s2c,
 855         std::map<pdg::array *, computation *> &a2c,
 856         std::map<pdg::access *, std::vector<computation **> > &missing,
 857         pdg::node *node, __isl_keep isl_set *context)
 858 {
 859         isl_ctx *ctx = pdg->get_isl_ctx();
 860         pdg::statement *s = node->statement;
 861
 862         if (!strcmp(s->top_function->name->s.c_str(), "#test")) {
 863                 add_test_computation(dg, pdg, s2c, a2c, missing, node);
 864                 return;
 865         }
 866
 867         computation *comp = new computation();
 868         comp->domain = node->source->get_isl_set(ctx);
 869         comp->domain = isl_set_intersect_params(comp->domain,
 870                                                 isl_set_copy(context));
 871         comp->location = s->line;
 872
 873         char *endp;
 874         long int cst;
 875         cst = strtol(s->top_function->name->s.c_str(), &endp, 0);
 876         if (*s->top_function->name->s.c_str() && !*endp) {
 877                 comp->arity = 1;
 878                 comp->operation = strdup("");
 879                 add_constant_edge(pdg, a2c, 0, cst, comp);
 880         } else {
 881                 comp->arity = s->top_function->arguments.size();
 882                 comp->operation = strdup(s->top_function->name->s.c_str());
 883                 add_edges(dg, pdg, s2c, a2c, missing, s->top_function, comp);
 884                 isl_map *expr = affine_expression(comp, a2c[NULL]);
 885                 if (expr) {
 886                         delete comp;
 887                         comp = new computation();
 888                         comp->domain = node->source->get_isl_set(ctx);
 889                         comp->domain = isl_set_intersect_params(comp->domain,
 890                                                         isl_set_copy(context));
 891                         comp->location = s->line;
 892                         comp->arity = 1;
 893                         comp->operation = strdup("");
 894
 895                         edge *e = new edge;
 896                         e->pos = 0;
 897                         e->source = a2c[NULL];
 898                         e->relation = expr;
 899                         comp->edges.push_back(e);
 900                 }
 901         }
 902
 903         connect_top_level_outputs(comp, s2c, missing, node);
 904
 905         dg->vertices.push_back(comp);
 906 }
 907
 908 static void ensure_output_deps(pdg::PDG *pdg, pdg::array *array)
 909 {
 910         for (int i = 0; i < array->analysis_performed.size(); ++i)
 911                 if (array->analysis_performed[i]->type ==
 912                                                     pdg::dependence::output)
 913                         return;
 914         fprintf(stderr, "no output dependence analysis performed on array %s\n",
 915                 array->name->s.c_str());
 916         exit(-1);
 917 }
 918
 919 struct less_name : public std::binary_function<pdg::array*, pdg::array*, bool> {
 920         bool operator()(pdg::array* x, pdg::array* y) {
 921                 return strcmp(x->name->s.c_str(), y->name->s.c_str()) < 0;
 922         }
 923 };
 924
 925 /* Convert a pdg to a dependence_graph containing all the information
 926  * needed for equivalence checking.
 927  *
 928  * We first compute the total dimension of the output computation
 929  * and create input computations for each input array.
 930  * Then we create computations for each node in the pdg and
 931  * a special output computation.
 932  * For each node, we subsequently compute all the edges emanating
 933  * from the corresponding computation.
 934  * Finally, for each node writing to an output array, we compute
 935  * that part of the domain that computes part of the final
 936  * contents of the output array and add corresponding edges
 937  * to the output computation.
 938  */
 939 dependence_graph *pdg_to_dg(pdg::PDG *pdg, unsigned out_dim,
 940         __isl_take isl_set *context)
 941 {
 942         isl_space *dims;
 943         isl_ctx *ctx = pdg->get_isl_ctx();
 944         unsigned nparam = pdg->params.size();
 945         dependence_graph *dg = new dependence_graph;
 946         std::map<pdg::access *, computation *> s2c;
 947         std::map<pdg::array *, computation *> a2c;
 948         std::map<pdg::access *, std::vector<computation **> > missing;
 949
 950         std::vector<pdg::array *> output_arrays;
 951         std::map<pdg::array *, int> array2pos;
 952         std::map<pdg::access *, isl_set *> exposed;
 953
 954         if (context)
 955                 context = isl_set_intersect(context, pdg->get_context_isl_set());
 956         else
 957                 context = pdg->get_context_isl_set();
 958
 959         /* add a special "input computation"; see add_iterator_edges */
 960         computation *comp;
 961         dims = isl_space_set_alloc(ctx, nparam, 1);
 962         isl_dim_set_parameter_names(dims, pdg->params);
 963         comp = new input_array("", dims);
 964         a2c[NULL] = comp;
 965         dg->vertices.push_back(comp);
 966
 967         for (int i = 0; i < pdg->arrays.size(); ++i) {
 968                 pdg::array *array = pdg->arrays[i];
 969                 if (array->type == pdg::array::output) {
 970                         output_arrays.push_back(array);
 971                         ensure_output_deps(pdg, array);
 972                 }
 973
 974                 if (array->type != pdg::array::input)
 975                         continue;
 976
 977                 computation *comp;
 978                 dims = isl_space_set_alloc(ctx, nparam, array->dims.size());
 979                 isl_dim_set_parameter_names(dims, pdg->params);
 980                 comp = new input_array(array->name->s.c_str(), dims);
 981                 a2c[array] = comp;
 982                 dg->vertices.push_back(comp);
 983                 dg->input_computations.push_back(comp);
 984         }
 985         if (!out_dim) {
 986                 fprintf(stderr, "no output arrays\n");
 987                 exit(-1);
 988         }
 989         std::sort(output_arrays.begin(), output_arrays.end(), less_name());
 990         for (int i = 0; i < output_arrays.size(); ++i) {
 991                 dg->output_arrays.push_back(strdup(output_arrays[i]->name->s.c_str()));
 992                 dg->output_array_dims.push_back(output_arrays[i]->dims.size());
 993                 array2pos[output_arrays[i]] = i;
 994         }
 995         dg->out = new computation();
 996         dims = isl_space_set_alloc(ctx, nparam, out_dim);
 997         isl_dim_set_parameter_names(dims, pdg->params);
 998         dg->out->domain = isl_set_empty(dims);
 999         dg->out->operation = strdup("#Out");
1000         dg->out->arity = 1;
1001         dg->out->location = -1;
1002         for (int i = 0; i < pdg->nodes.size(); ++i) {
1003                 pdg::node *node = pdg->nodes[i];
1004                 pdg::statement *s = node->statement;
1005
1006                 add_top_level_computation(dg, pdg, s2c, a2c, missing, node,
1007                                             context);
1008
1009                 for (int j = 0; j < s->accesses.size(); ++j) {
1010                         if (s->accesses[j]->type != pdg::access::write)
1011                                 continue;
1012                         pdg::access *a = s->accesses[j];
1013
1014                         if (s->accesses[j]->array->type != pdg::array::output)
1015                                 continue;
1016
1017                         exposed[a] = node->source->get_isl_set(ctx);
1018                         if (a->extension) {
1019                                 isl_map *ext = a->extension->get_isl_map(ctx);
1020                                 exposed[a] = isl_set_apply(exposed[a], ext);
1021                         }
1022                         exposed[a] = isl_set_intersect_params(exposed[a],
1023                                                         isl_set_copy(context));
1024                 }
1025         }
1026         for (int i = 0; i < pdg->dependences.size(); ++i) {
1027                 pdg::dependence *dep = pdg->dependences[i];
1028                 if (dep->type != pdg::dependence::output)
1029                         continue;
1030                 pdg::access *a = dep->from_access;
1031                 if (!exposed[a] || isl_set_is_empty(exposed[a]))
1032                         continue;
1033                 isl_map *rel;
1034                 if (!dep->extended_relation)
1035                         rel = dep->relation->get_isl_map(ctx);
1036                 else
1037                         rel = dep->extended_relation->get_isl_map(ctx);
1038                 exposed[a] = isl_set_subtract(exposed[a], isl_map_domain(rel));
1039         }
1040         for (int i = 0; i < pdg->nodes.size(); ++i) {
1041                 pdg::node *node = pdg->nodes[i];
1042                 pdg::statement *s = node->statement;
1043                 for (int j = 0;  j < s->accesses.size(); ++j) {
1044                         pdg::access *a = s->accesses[j];
1045                         if (!exposed[a] || isl_set_is_empty(exposed[a])) {
1046                                 isl_set_free(exposed[a]);
1047                                 continue;
1048                         }
1049                         add_output_edge(ctx, dg->out, node, array2pos,
1050                                         s2c[a], exposed[a], nparam, out_dim);
1051                 }
1052         }
1053         dg->context = context;
1054         return dg;
1055 }