doc/implementation.tex

   1 \section{Sets and Relations}
   2
   3 \begin{definition}[Polyhedral Set]
   4 A {\em polyhedral set}\index{polyhedral set} $S$ is a finite union of basic sets
   5 $S = \bigcup_i S_i$, each of which can be represented using affine
   6 constraints
   7 $$
   8 S_i : \Q^n \to 2^{\Q^d} : \vec s \mapsto
   9 S_i(\vec s) =
  10 \{\, \vec x \in \Z^d \mid \exists \vec z \in \Z^e :
  11 A \vec x + B \vec s + D \vec z + \vec c \geq \vec 0 \,\}
  12 ,
  13 $$
  14 with $A \in \Z^{m \times d}$,
  15 $B \in \Z^{m \times n}$,
  16 $D \in \Z^{m \times e}$
  17 and $\vec c \in \Z^m$.
  18 \end{definition}
  19
  20 \begin{definition}[Parameter Domain of a Set]
  21 Let $S \in \Q^n \to 2^{\Q^d}$ be a set.
  22 The {\em parameter domain} of $S$ is the set
  23 $$\pdom S \coloneqq \{\, \vec s \in \Z^n \mid S(\vec s) \ne \emptyset \,\}.$$
  24 \end{definition}
  25
  26 \begin{definition}[Polyhedral Relation]
  27 A {\em polyhedral relation}\index{polyhedral relation}
  28 $R$ is a finite union of basic relations
  29 $R = \bigcup_i R_i$ of type
  30 $\Q^n \to 2^{\Q^{d_1+d_2}}$,
  31 each of which can be represented using affine
  32 constraints
  33 $$
  34 R_i = \vec s \mapsto
  35 R_i(\vec s) =
  36 \{\, \vec x_1 \to \vec x_2 \in \Z^{d_1} \times \Z^{d_2}
  37 \mid \exists \vec z \in \Z^e :
  38 A_1 \vec x_1 + A_2 \vec x_2 + B \vec s + D \vec z + \vec c \geq \vec 0 \,\}
  39 ,
  40 $$
  41 with $A_i \in \Z^{m \times d_i}$,
  42 $B \in \Z^{m \times n}$,
  43 $D \in \Z^{m \times e}$
  44 and $\vec c \in \Z^m$.
  45 \end{definition}
  46
  47 \begin{definition}[Parameter Domain of a Relation]
  48 Let $R \in \Q^n \to 2^{\Q^{d+d}}$ be a relation.
  49 The {\em parameter domain} of $R$ is the set
  50 $$\pdom R \coloneqq \{\, \vec s \in \Z^n \mid R(\vec s) \ne \emptyset \,\}.$$
  51 \end{definition}
  52
  53 \begin{definition}[Domain of a Relation]
  54 Let $R \in \Q^n \to 2^{\Q^{d+d}}$ be a relation.
  55 The {\em domain} of $R$ is the polyhedral set
  56 $$\domain R \coloneqq \vec s \mapsto
  57 \{\, \vec x_1 \in \Z^{d_1} \mid \exists \vec x_2 \in \Z^{d_2} :
  58 (\vec x_1, \vec x_2) \in R(\vec s) \,\}
  59 .
  60 $$
  61 \end{definition}
  62
  63 \begin{definition}[Range of a Relation]
  64 Let $R \in \Q^n \to 2^{\Q^{d+d}}$ be a relation.
  65 The {\em range} of $R$ is the polyhedral set
  66 $$
  67 \range R \coloneqq \vec s \mapsto
  68 \{\, \vec x_2 \in \Z^{d_2} \mid \exists \vec x_1 \in \Z^{d_1} :
  69 (\vec x_1, \vec x_2) \in R(\vec s) \,\}
  70 .
  71 $$
  72 \end{definition}
  73
  74 \begin{definition}[Composition of Relations]
  75 Let $R \in \Q^n \to 2^{\Q^{d_1+d_2}}$ and
  76 $S \in \Q^n \to 2^{\Q^{d_2+d_3}}$ be two relations,
  77 then the composition of
  78 $R$ and $S$ is defined as
  79 $$
  80 S \circ R \coloneqq
  81 \vec s \mapsto
  82 \{\, \vec x_1 \to \vec x_3 \in \Z^{d_1} \times \Z^{d_3}
  83 \mid \exists \vec x_2 \in \Z^{d_2} :
  84 \vec x_1 \to \vec x_2 \in R(\vec s) \wedge
  85 \vec x_2 \to \vec x_3 \in S(\vec s)
  86 \,\}
  87 .
  88 $$
  89 \end{definition}
  90
  91 \begin{definition}[Difference Set of a Relation]
  92 Let $R \in \Q^n \to 2^{\Q^{d+d}}$ be a relation.
  93 The difference set ($\Delta \, R$) of $R$ is the set
  94 of differences between image elements and the corresponding
  95 domain elements,
  96 $$
  97 \Delta \, R \coloneqq
  98 \vec s \mapsto
  99 \{\, \vec \delta \in \Z^{d} \mid \exists \vec x \to \vec y \in R :
 100 \vec \delta = \vec y - \vec x
 101 \,\}
 102 $$
 103 \end{definition}
 104
 105 \section{Coalescing}\label{s:coalescing}
 106
 107 See \shortciteN{Verdoolaege2009isl}, for now.
 108 More details will be added later.
 109
 110 \section{Transitive Closure}
 111
 112 \subsection{Introduction}
 113
 114 \begin{definition}[Power of a Relation]
 115 Let $R \in \Q^n \to 2^{\Q^{d+d}}$ be a relation and
 116 $k \in \Z_{\ge 1}$
 117 a positive number, then power $k$ of relation $R$ is defined as
 118 \begin{equation}
 119 \label{eq:transitive:power}
 120 R^k \coloneqq
 121 \begin{cases}
 122 R & \text{if $k = 1$}
 123 \\
 124 R \circ R^{k-1} & \text{if $k \ge 2$}
 125 .
 126 \end{cases}
 127 \end{equation}
 128 \end{definition}
 129
 130 \begin{definition}[Transitive Closure of a Relation]
 131 Let $R \in \Q^n \to 2^{\Q^{d+d}}$ be a relation,
 132 then the transitive closure $R^+$ of $R$ is the union
 133 of all positive powers of $R$,
 134 $$
 135 R^+ \coloneqq \bigcup_{k \ge 1} R^k
 136 .
 137 $$
 138 \end{definition}
 139 Alternatively, the transitive closure may be defined
 140 inductively as
 141 \begin{equation}
 142 \label{eq:transitive:inductive}
 143 R^+ \coloneqq R \cup \left(R \circ R^+\right)
 144 .
 145 \end{equation}
 146
 147 Since the transitive closure of a polyhedral relation
 148 may no longer be a polyhedral relation \shortcite{Kelly1996closure},
 149 we can, in the general case, only compute an approximation
 150 of the transitive closure.
 151 Whereas \shortciteN{Kelly1996closure} compute underapproximations,
 152 we, like \shortciteN{Beletska2009}, compute overapproximations.
 153 That is, given a relation $R$, we will compute a relation $T$
 154 such that $R^+ \subseteq T$.  Of course, we want this approximation
 155 to be as close as possible to the actual transitive closure
 156 $R^+$ and we want to detect the cases where the approximation is
 157 exact, i.e., where $T = R^+$.
 158
 159 For computing an approximation of the transitive closure of $R$,
 160 we follow the same general strategy as \shortciteN{Beletska2009}
 161 and first compute an approximation of $R^k$ for $k \ge 1$ and then project
 162 out the parameter $k$ from the resulting relation.
 163
 164 \begin{example}
 165 As a trivial example, consider the relation
 166 $R = \{\, x \to x + 1 \,\}$.  The $k$th power of this map
 167 for arbitrary $k$ is
 168 $$
 169 R^k = k \mapsto \{\, x \to x + k \mid k \ge 1 \,\}
 170 .
 171 $$
 172 The transitive closure is then
 173 $$
 174 \begin{aligned}
 175 R^+ & = \{\, x \to y \mid \exists k \in \Z_{\ge 1} : y = x + k \,\}
 176 \\
 177 & = \{\, x \to y \mid y \ge x + 1 \,\}
 178 .
 179 \end{aligned}
 180 $$
 181 \end{example}
 182
 183 \subsection{Computing an Approximation of $R^k$}
 184 \label{s:power}
 185
 186 There are some special cases where the computation of $R^k$ is very easy.
 187 One such case is that where $R$ does not compose with itself,
 188 i.e., $R \circ R = \emptyset$ or $\domain R \cap \range R = \emptyset$.
 189 In this case, $R^k$ is only non-empty for $k=1$ where it is equal
 190 to $R$ itself.
 191
 192 In general, it is impossible to construct a closed form
 193 of $R^k$ as a polyhedral relation.
 194 We will therefore need to make some approximations.
 195 As a first approximations, we will consider each of the basic
 196 relations in $R$ as simply adding one or more offsets to a domain element
 197 to arrive at an image element and ignore the fact that some of these
 198 offsets may only be applied to some of the domain elements.
 199 That is, we will only consider the difference set $\Delta\,R$ of the relation.
 200 In particular, we will first construct a collection $P$ of paths
 201 that move through
 202 a total of $k$ offsets and then intersect domain and range of this
 203 collection with those of $R$.
 204 That is,
 205 \begin{equation}
 206 \label{eq:transitive:approx}
 207 K = P \cap \left(\domain R \to \range R\right)
 208 ,
 209 \end{equation}
 210 with
 211 \begin{equation}
 212 \label{eq:transitive:path}
 213 P = \vec s \mapsto \{\, \vec x \to \vec y \mid
 214 \exists k_i \in \Z_{\ge 0} :
 215 \vec y = \vec x + \sum_i k_i \, \Delta_i(\vec s)
 216 \wedge
 217 \sum_i k_i = k > 0
 218 \,\}
 219 \end{equation}
 220 and with $\Delta_i$ the basic sets that compose
 221 the difference set $\Delta\,R$.
 222 Note that the number of basic sets $\Delta_i$ need not be
 223 the same as the number of basic relations in $R$.
 224 Also note that since addition is commutative, it does not
 225 matter in which order we add the offsets and so we are allowed
 226 to group them as we did in \eqref{eq:transitive:path}.
 227
 228 If all the $\Delta_i$s are singleton sets
 229 $\Delta_i = \{\, \vec \delta_i \,\}$ with $\vec \delta_i \in \Z^d$,
 230 then \eqref{eq:transitive:path} simplifies to
 231 \begin{equation}
 232 \label{eq:transitive:singleton}
 233 P = \{\, \vec x \to \vec y \mid
 234 \exists k_i \in \Z_{\ge 0} :
 235 \vec y = \vec x + \sum_i k_i \, \vec \delta_i
 236 \wedge
 237 \sum_i k_i = k > 0
 238 \,\}
 239 \end{equation}
 240 and then the approximation computed in \eqref{eq:transitive:approx}
 241 is essentially the same as that of \shortciteN{Beletska2009}.
 242 If some of $\Delta_i$s are not singleton sets or if
 243 some of $\vec \delta_i$s are parametric, then we need
 244 to resort to further approximations.
 245
 246 To ease both the exposition and the implementation, we will for
 247 the remainder of this section work with extended offsets
 248 $\Delta_i' = \Delta_i \times \{\, 1 \,\}$.
 249 That is, each offset is extended with an extra coordinate that is
 250 set equal to one.  The paths constructed by summing such extended
 251 offsets have the length encoded as the difference of their
 252 final coordinates.  The path $P'$ can then be decomposed into
 253 paths $P_i'$, one for each $\Delta_i$,
 254 \begin{equation}
 255 \label{eq:transitive:decompose}
 256 P' = \left(
 257 (P_m' \cup \identity) \circ \cdots \circ
 258 (P_2' \cup \identity) \circ
 259 (P_1' \cup \identity)
 260 \right) \cap
 261 \{\,
 262 \vec x' \to \vec y' \mid y_{d+1} - x_{d+1} = k > 0
 263 \,\}
 264 ,
 265 \end{equation}
 266 with
 267 $$
 268 P_i' = \vec s \mapsto \{\, \vec x' \to \vec y' \mid
 269 \exists k \in \Z_{\ge 1} :
 270 \vec y' = \vec x' + k \, \Delta_i'(\vec s)
 271 \,\}
 272 .
 273 $$
 274 Note that each $P_i'$ contains paths of length at least one.
 275 We therefore need to take the union with the identity relation
 276 when composing the $P_i'$s to allow for paths that do not contain
 277 any offsets from one or more $\Delta_i'$.
 278 The path that consists of only identity relations is removed
 279 by imposing the constraint $y_{d+1} - x_{d+1} > 0$.
 280 Taking the union with the identity relation means that
 281 that the relations we compose in \eqref{eq:transitive:decompose}
 282 each consist of two basic relations.  If there are $m$
 283 disjuncts in the input relation, then a direct application
 284 of the composition operation may therefore result in a relation
 285 with $2^m$ disjuncts, which is prohibitively expensive.
 286 It is therefore crucial to apply coalescing (\autoref{s:coalescing})
 287 after each composition.
 288
 289 Let us now consider how to compute an overapproximation of $P_i'$.
 290 Those that correspond to singleton $\Delta_i$s are grouped together
 291 and handled as in \eqref{eq:transitive:singleton}.
 292 Note that this is just an optimization.  The procedure described
 293 below would produce results that are at least as accurate.
 294 For simplicity, we first assume that no constraint in $\Delta_i'$
 295 involves any existentially quantified variables.
 296 We will return to existentially quantified variables at the end
 297 of this section.
 298 Without existentially quantified variables, we can classify
 299 the constraints of $\Delta_i'$ as follows
 300 \begin{enumerate}
 301 \item non-parametric constraints
 302 \begin{equation}
 303 \label{eq:transitive:non-parametric}
 304 A_1 \vec x + \vec c_1 \geq \vec 0
 305 \end{equation}
 306 \item purely parametric constraints
 307 \begin{equation}
 308 \label{eq:transitive:parametric}
 309 B_2 \vec s + \vec c_2 \geq \vec 0
 310 \end{equation}
 311 \item negative mixed constraints
 312 \begin{equation}
 313 \label{eq:transitive:mixed}
 314 A_3 \vec x + B_3 \vec s + \vec c_3 \geq \vec 0
 315 \end{equation}
 316 such that for each row $j$ and for all $\vec s$,
 317 $$
 318 \Delta_i'(\vec s) \cap
 319 \{\, \vec x' \to \vec y' \mid B_{3,j} \vec s + c_{3,j} > 0 \,\}
 320 = \emptyset
 321 $$
 322 \item positive mixed constraints
 323 $$
 324 A_4 \vec x + B_4 \vec s + \vec c_4 \geq \vec 0
 325 $$
 326 such that for each row $j$, there is at least one $\vec s$ such that
 327 $$
 328 \Delta_i'(\vec s) \cap
 329 \{\, \vec x' \to \vec y' \mid B_{4,j} \vec s + c_{4,j} > 0 \,\}
 330 \ne \emptyset
 331 $$
 332 \end{enumerate}
 333 We will use the following approximation $Q_i$ for $P_i'$:
 334 \begin{equation}
 335 \label{eq:transitive:Q}
 336 \begin{aligned}
 337 Q_i = \vec s \mapsto
 338 \{\,
 339 \vec x' \to \vec y'
 340 \mid {} & \exists k \in \Z_{\ge 1}, \vec f \in \Z^d :
 341 \vec y' = \vec x' + (\vec f, k)
 342 \wedge {}
 343 \\
 344 &
 345 A_1 \vec f + k \vec c_1 \geq \vec 0
 346 \wedge
 347 B_2 \vec s + \vec c_2 \geq \vec 0
 348 \wedge
 349 A_3 \vec f + B_3 \vec s + \vec c_3 \geq \vec 0
 350 \,\}
 351 .
 352 \end{aligned}
 353 \end{equation}
 354 To prove that $Q_i$ is indeed an overapproximation of $P_i'$,
 355 we need to show that for every $\vec s \in \Z^n$, for every
 356 $k \in \Z_{\ge 1}$ and for every $\vec f \in k \, \Delta_i(\vec s)$
 357 we have that
 358 $(\vec f, k)$ satisfies the constraints in \eqref{eq:transitive:Q}.
 359 If $\Delta_i(\vec s)$ is non-empty, then $\vec s$ must satisfy
 360 the constraints in \eqref{eq:transitive:parametric}.
 361 Each element $(\vec f, k) \in k \, \Delta_i'(\vec s)$ is a sum
 362 of $k$ elements $(\vec f_j, 1)$ in $\Delta_i'(\vec s)$.
 363 Each of these elements satisfies the constraints in
 364 \eqref{eq:transitive:non-parametric}, i.e.,
 365 $$
 366 \left[
 367 \begin{matrix}
 368 A_1 & \vec c_1
 369 \end{matrix}
 370 \right]
 371 \left[
 372 \begin{matrix}
 373 \vec f_j \\ 1
 374 \end{matrix}
 375 \right]
 376 \ge \vec 0
 377 .
 378 $$
 379 The sum of these elements therefore satisfies the same set of inequalities,
 380 i.e., $A_1 \vec f + k \vec c_1 \geq \vec 0$.
 381 Finally, the constraints in \eqref{eq:transitive:mixed} are such
 382 that for any $\vec s$ in the parameter domain of $\Delta$,
 383 we have $-\vec r(\vec s) \coloneqq B_3 \vec s + \vec c_3 \le \vec 0$,
 384 i.e., $A_3 \vec f_j \ge \vec r(\vec s) \ge \vec 0$
 385 and therefore also $A_3 \vec f \ge \vec r(\vec s)$.
 386 Note that if there are no mixed constraints and if the
 387 rational relaxation of $\Delta_i(\vec s)$, i.e.,
 388 $\{\, \vec x \in \Q^d \mid A_1 \vec x + \vec c_1 \ge \vec 0\,\}$,
 389 has integer vertices, then the approximation is exact, i.e.,
 390 $Q_i = P_i'$.  In this case, the vertices of $\Delta'_i(\vec s)$
 391 generate the rational cone
 392 $\{\, \vec x' \in \Q^{d+1} \mid \left[
 393 \begin{matrix}
 394 A_1 & \vec c_1
 395 \end{matrix}
 396 \right] \vec x' \,\}$ and therefore $\Delta'_i(\vec s)$ is
 397 a Hilbert basis of this cone \shortcite[Theorem~16.4]{Schrijver1986}.
 398
 399 Existentially quantified variables can be handled by
 400 classifying them into variables that are uniquely
 401 determined by the parameters, variables that are independent
 402 of the parameters and others.  The first set can be treated
 403 as parameters and the second as variables.  Constraints involving
 404 the other existentially quantified variables are removed.
 405
 406 \begin{example}
 407 Consider the relation
 408 $$
 409 R =
 410 n \to \{\, x \to y \mid \exists \, \alpha_0, \alpha_1: 7\alpha_0 = -2 + n \wedge 5\alpha_1 = -1 - x + y \wedge y \ge 6 + x \,\}
 411 .
 412 $$
 413 The difference set of this relation is
 414 $$
 415 \Delta = \Delta \, R =
 416 n \to \{\, x \mid \exists \, \alpha_0, \alpha_1: 7\alpha_0 = -2 + n \wedge 5\alpha_1 = -1 + x \wedge x \ge 6 \,\}
 417 .
 418 $$
 419 The existentially quantified variables can be defined in terms
 420 of the parameters and variables as
 421 $$
 422 \alpha_0 = \floor{\frac{-2 + n}7}
 423 \qquad
 424 \text{and}
 425 \qquad
 426 \alpha_1 = \floor{\frac{-1 + x}5}
 427 .
 428 $$
 429 $\alpha_0$ can therefore be treated as a parameter,
 430 while $\alpha_1$ can be treated as a variable.
 431 This in turn means that $7\alpha_0 = -2 + n$ can be treated as
 432 a purely parametric constraint, while the other two constraints are
 433 non-parametric.
 434 The corresponding $Q$~\eqref{eq:transitive:Q} is therefore
 435 $$
 436 \begin{aligned}
 437 n \to \{\, (x,z) \to (y,w) \mid
 438 \exists\, \alpha_0, \alpha_1, k, f : {} &
 439 k \ge 1 \wedge
 440 y = x + f \wedge
 441 w = z + k \wedge {} \\
 442 &
 443 7\alpha_0 = -2 + n \wedge
 444 5\alpha_1 = -k + x \wedge
 445 x \ge 6 k
 446 \,\}
 447 .
 448 \end{aligned}
 449 $$
 450 Projecting out the final coordinates encoding the length of the paths,
 451 results in the exact transitive closure
 452 $$
 453 R^+ =
 454 n \to \{\, x \to y \mid \exists \, \alpha_0, \alpha_1: 7\alpha_1 = -2 + n \wedge 6\alpha_0 \ge -x + y \wedge 5\alpha_0 \le -1 - x + y \,\}
 455 .
 456 $$
 457 \end{example}
 458
 459 \subsection{Checking Exactness}
 460
 461 The approximation $T$ for the transitive closure $R^+$ can be obtained
 462 by projecting out the parameter $k$ from the approximation $K$
 463 \eqref{eq:transitive:approx} of the power $R^k$.
 464 Since $K$ is an overapproximation of $R^k$, $T$ will also be an
 465 overapproximation of $R^+$.
 466 To check whether the results are exact, we need to consider two
 467 cases depending on whether $R$ is {\em cyclic}, where $R$ is defined
 468 to be cyclic if $R^+$ maps any element to itself, i.e.,
 469 $R^+ \cap \identity \ne \emptyset$.
 470 If $R$ is acyclic, then the inductive definition of
 471 \eqref{eq:transitive:inductive} is equivalent to its completion,
 472 i.e.,
 473 $$
 474 R^+ = R \cup \left(R \circ R^+\right)
 475 $$
 476 is a defining property.
 477 Since $T$ is known to be an overapproximation, we only need to check
 478 whether
 479 $$
 480 T \subseteq R \cup \left(R \circ T\right)
 481 .
 482 $$
 483 This is essentially Theorem~5 of \shortciteN{Kelly1996closure}.
 484 The only difference is that they only consider lexicographically
 485 forward relations, a special case of acyclic relations.
 486
 487 If, on the other hand, $R$ is cyclic, then we have to resort
 488 to checking whether the approximation $K$ of the power is exact.
 489 Note that $T$ may be exact even if $K$ is not exact, so the check
 490 is sound, but incomplete.
 491 To check exactness of the power, we simply need to check
 492 \eqref{eq:transitive:power}.  Since again $K$ is known
 493 to be an overapproximation, we only need to check whether
 494 $$
 495 \begin{aligned}
 496 K'|_{y_{d+1} - x_{d+1} = 1} & \subseteq R'
 497 \\
 498 K'|_{y_{d+1} - x_{d+1} \ge 2} & \subseteq R' \circ K'|_{y_{d+1} - x_{d+1} \ge 1}
 499 ,
 500 \end{aligned}
 501 $$
 502 where $R' = \{\, \vec x' \to \vec y' \mid \vec x \to \vec y \in R
 503 \wedge y_{d+1} - x_{d+1} = 1\,\}$, i.e., $R$ extended with path
 504 lengths equal to 1.
 505
 506 All that remains is to explain how to check the cyclicity of $R$.
 507 Note that the exactness on the power is always sound, even
 508 in the acyclic case, so we only need to be careful that we find
 509 all cyclic cases.  Now, if $R$ is cyclic, i.e.,
 510 $R^+ \cap \identity \ne \emptyset$, then, since $T$ is
 511 an overapproximation of $R^+$, also
 512 $T \cap \identity \ne \emptyset$.  This in turn means
 513 that $\Delta \, K'$ contains a point whose first $d$ coordinates
 514 are zero and whose final coordinate is positive.
 515 In the implementation we currently perform this test on $P'$ instead of $K'$.
 516 Note that if $R^+$ is acyclic and $T$ is not, then the approximation
 517 is clearly not exact and the approximation of the power $K$
 518 will not be exact either.
 519
 520 \subsection{Decomposing $R$ into strongly connected components}
 521
 522 If the input relation $R$ is a union of several basic relations
 523 that can be partially ordered
 524 then the accuracy of the approximation may be improved by computing
 525 an approximation of each strongly connected components separately.
 526 For example, if $R = R_1 \cup R_2$ and $R_1 \circ R_2 = \emptyset$,
 527 then we know that any path that passes through $R_2$ cannot later
 528 pass through $R_1$, i.e.,
 529 $$
 530 R^+ = R_1^+ \cup R_2^+ \cup \left(R_2^+ \circ R_1^+\right)
 531 .
 532 $$
 533 We can therefore compute (approximations of) transitive closures
 534 of $R_1$ and $R_2$ separately.
 535 Note, however, that the condition $R_1 \circ R_2 = \emptyset$
 536 is actually too strong.
 537 If $R_1 \circ R_2$ is a subset of $R_2 \circ R_1$
 538 then we can reorder the segments
 539 in any path that moves through both $R_1$ and $R_2$ to
 540 first move through $R_1$ and then through $R_2$.
 541
 542 This idea can be generalized to relations that are unions
 543 of more than two basic relations by constructing the
 544 strongly connected components in the graph with as vertices
 545 the basic relations and an edge between two basic relations
 546 $R_i$ and $R_j$ if $R_i$ needs to follow $R_j$ in some paths.
 547 That is, there is an edge from $R_i$ to $R_j$ iff
 548 \begin{equation}
 549 \label{eq:transitive:edge}
 550 R_i \circ R_j
 551 \not\subseteq
 552 R_j \circ R_i
 553 .
 554 \end{equation}
 555 The components can be obtained from the graph by applying
 556 Tarjan's algorithm \shortcite{Tarjan1972}.
 557
 558 In practice, we compute the (extended) powers $K_i'$ of each component
 559 separately and then compose them as in \eqref{eq:transitive:decompose}.
 560 Note, however, that in this case the order in which we apply them is
 561 important and should correspond to a topological ordering of the
 562 strongly connected components.  Simply applying Tarjan's
 563 algorithm will produce topologically sorted strongly connected components.
 564 The graph on which Tarjan's algorithm is applied is constructed on-the-fly.
 565 That is, whenever the algorithm checks if there is an edge between
 566 two vertices, we evaluate \eqref{eq:transitive:edge}.
 567 The exactness check is performed on each component separately.
 568 If the approximation turns out to be inexact for any of the components,
 569 then the entire result is marked inexact and the exactness check
 570 is skipped on the components that still need to be handled.
 571
 572 \begin{figure}
 573 \begin{center}
 574 \begin{tikzpicture}[x=0.5cm,y=0.5cm,>=stealth,shorten >=1pt]
 575 \foreach \x in {1,...,10}{
 576     \foreach \y in {1,...,10}{
 577         \draw[->] (\x,\y) -- (\x,\y+1);
 578     }
 579 }
 580 \foreach \x in {1,...,20}{
 581     \foreach \y in {5,...,15}{
 582         \draw[->] (\x,\y) -- (\x+1,\y);
 583     }
 584 }
 585 \end{tikzpicture}
 586 \end{center}
 587 \caption{The relation from \autoref{ex:closure4}}
 588 \label{f:closure4}
 589 \end{figure}
 590 \begin{example}
 591 \label{ex:closure4}
 592 Consider the relation in example {\tt closure4} that comes with
 593 the Omega calculator~\shortcite{Omega_calc}, $R = R_1 \cup R_2$,
 594 with
 595 $$
 596 \begin{aligned}
 597 R_1 & = \{\, (x,y) \to (x,y+1) \mid 1 \le x,y \le 10 \,\}
 598 \\
 599 R_2 & = \{\, (x,y) \to (x+1,y) \mid 1 \le x \le 20 \wedge 5 \le y \le 15 \,\}
 600 .
 601 \end{aligned}
 602 $$
 603 This relation is shown graphically in \autoref{f:closure4}.
 604 We have
 605 $$
 606 \begin{aligned}
 607 R_1 \circ R_2 &=
 608 \{\, (x,y) \to (x+1,y+1) \mid 1 \le x \le 9 \wedge 5 \le y \le 10 \,\}
 609 \\
 610 R_2 \circ R_1 &=
 611 \{\, (x,y) \to (x+1,y+1) \mid 1 \le x \le 10 \wedge 4 \le y \le 10 \,\}
 612 .
 613 \end{aligned}
 614 $$
 615 Clearly, $R_1 \circ R_2 \subseteq R_2 \circ R_1$ and so
 616 $$
 617 \left(
 618 R_1 \cup R_2
 619 \right)^+
 620 =
 621 \left(R_2^+ \circ R_1^+\right)
 622 \cup R_1^+
 623 \cup R_2^+
 624 .
 625 $$
 626 \end{example}
 627
 628 \begin{figure}
 629 \newcounter{n}
 630 \newcounter{t1}
 631 \newcounter{t2}
 632 \newcounter{t3}
 633 \newcounter{t4}
 634 \begin{center}
 635 \begin{tikzpicture}[>=stealth,shorten >=1pt]
 636 \setcounter{n}{7}
 637 \foreach \i in {1,...,\value{n}}{
 638     \foreach \j in {1,...,\value{n}}{
 639         \setcounter{t1}{2 * \j - 4 - \i + 1}
 640         \setcounter{t2}{\value{n} - 3 - \i + 1}
 641         \setcounter{t3}{2 * \i - 1 - \j + 1}
 642         \setcounter{t4}{\value{n} - \j + 1}
 643         \ifnum\value{t1}>0\ifnum\value{t2}>0
 644         \ifnum\value{t3}>0\ifnum\value{t4}>0
 645             \draw[thick,->] (\i,\j) to[out=20] (\i+3,\j);
 646         \fi\fi\fi\fi
 647         \setcounter{t1}{2 * \j - 1 - \i + 1}
 648         \setcounter{t2}{\value{n} - \i + 1}
 649         \setcounter{t3}{2 * \i - 4 - \j + 1}
 650         \setcounter{t4}{\value{n} - 3 - \j + 1}
 651         \ifnum\value{t1}>0\ifnum\value{t2}>0
 652         \ifnum\value{t3}>0\ifnum\value{t4}>0
 653             \draw[thick,->] (\i,\j) to[in=-20,out=20] (\i,\j+3);
 654         \fi\fi\fi\fi
 655         \setcounter{t1}{2 * \j - 1 - \i + 1}
 656         \setcounter{t2}{\value{n} - 1 - \i + 1}
 657         \setcounter{t3}{2 * \i - 1 - \j + 1}
 658         \setcounter{t4}{\value{n} - 1 - \j + 1}
 659         \ifnum\value{t1}>0\ifnum\value{t2}>0
 660         \ifnum\value{t3}>0\ifnum\value{t4}>0
 661             \draw[thick,->] (\i,\j) to (\i+1,\j+1);
 662         \fi\fi\fi\fi
 663     }
 664 }
 665 \end{tikzpicture}
 666 \end{center}
 667 \caption{The relation from \autoref{ex:decomposition}}
 668 \label{f:decomposition}
 669 \end{figure}
 670 \begin{example}
 671 \label{ex:decomposition}
 672 Consider the relation on the right of \shortciteN[Figure~2]{Beletska2009},
 673 reproduced in \autoref{f:decomposition}.
 674 The relation can be described as $R = R_1 \cup R_2 \cup R_3$,
 675 with
 676 $$
 677 \begin{aligned}
 678 R_1 &= n \mapsto \{\, (i,j) \to (i+3,j) \mid
 679 i \le 2 j - 4 \wedge
 680 i \le n - 3 \wedge
 681 j \le 2 i - 1 \wedge
 682 j \le n \,\}
 683 \\
 684 R_2 &= n \mapsto \{\, (i,j) \to (i,j+3) \mid
 685 i \le 2 j - 1 \wedge
 686 i \le n \wedge
 687 j \le 2 i - 4 \wedge
 688 j \le n - 3 \,\}
 689 \\
 690 R_3 &= n \mapsto \{\, (i,j) \to (i+1,j+1) \mid
 691 i \le 2 j - 1 \wedge
 692 i \le n - 1 \wedge
 693 j \le 2 i - 1 \wedge
 694 j \le n - 1\,\}
 695 .
 696 \end{aligned}
 697 $$
 698 The figure shows this relation for $n = 7$.
 699 Both
 700 $R_3 \circ R_1 \subseteq R_1 \circ R_3$
 701 and
 702 $R_3 \circ R_2 \subseteq R_2 \circ R_3$,
 703 which the reader can verify using the {\tt iscc} calculator:
 704 \begin{verbatim}
 705 R1 := [n] -> { [i,j] -> [i+3,j] : i <= 2 j - 4 and i <= n - 3 and
 706                                   j <= 2 i - 1 and j <= n };
 707 R2 := [n] -> { [i,j] -> [i,j+3] : i <= 2 j - 1 and i <= n and
 708                                   j <= 2 i - 4 and j <= n - 3 };
 709 R3 := [n] -> { [i,j] -> [i+1,j+1] : i <= 2 j - 1 and i <= n - 1 and
 710                                     j <= 2 i - 1 and j <= n - 1 };
 711 (R1 . R3) - (R3 . R1);
 712 (R2 . R3) - (R3 . R2);
 713 \end{verbatim}
 714 $R_3$ can therefore be moved forward in any path.
 715 For the other two basic relations, we have both
 716 $R_2 \circ R_1 \not\subseteq R_1 \circ R_2$
 717 and
 718 $R_1 \circ R_2 \not\subseteq R_2 \circ R_1$
 719 and so $R_1$ and $R_2$ form a strongly connected component.
 720 By computing the power of $R_3$ and $R_1 \cup R_2$ separately
 721 and composing the results, the power of $R$ can be computed exactly
 722 using \eqref{eq:transitive:singleton}.
 723 As explained by \shortciteN{Beletska2009}, applying the same formula
 724 to $R$ directly, without a decomposition, would result in
 725 an overapproximation of the power.
 726 \end{example}
 727
 728 \subsection{An {\tt Omega}-like implementation}
 729
 730 While the main algorithm of \shortciteN{Kelly1996closure} is
 731 designed to compute and underapproximation of the transitive closure,
 732 the authors mention that they could also compute overapproximations.
 733 In this section, we describe our implementation of an algorithm
 734 that is based on their ideas.
 735 Note that the {\tt Omega} library computes underapproximations
 736 \shortcite[Section 6.4]{Omega_lib}.
 737
 738 The main tool is Equation~(2) of \shortciteN{Kelly1996closure}.
 739 The input relation $R$ is first overapproximated by a ``d-form'' relation
 740 $$
 741 \{\, \vec i \to \vec j \mid \exists \vec \alpha :
 742 \vec L \le \vec j - \vec i \le \vec U
 743 \wedge
 744 (\forall p : j_p - i_p = M_p \alpha_p)
 745 \,\}
 746 ,
 747 $$
 748 where $p$ ranges over the dimensions and $\vec L$, $\vec U$ and
 749 $\vec M$ are constant integer vectors.  The elements of $\vec U$
 750 may be $\infty$, meaning that there is no upper bound corresponding
 751 to that element, and similarly for $\vec L$.
 752 Such an overapproximation can be obtained by computing strides,
 753 lower and upper bounds on the difference set $\Delta \, R$.
 754 The transitive closure of such a ``d-form'' relation is
 755 \begin{equation}
 756 \label{eq:omega}
 757 \{\, \vec i \to \vec j \mid \exists \vec \alpha, k :
 758 k \ge 1 \wedge
 759 k \, \vec L \le \vec j - \vec i \le k \, \vec U
 760 \wedge
 761 (\forall p : j_p - i_p = M_p \alpha_p)
 762 \,\}
 763 .
 764 \end{equation}
 765 The domain and range of this transitive closure are then
 766 intersected with those of the input relation.
 767 This is a special case of the algorithm in \autoref{s:power}.
 768
 769 In their algorithm for computing lower bounds, the authors
 770 use the above algorithm as a substep on the disjuncts in the relation.
 771 At the end, they say
 772 \begin{quote}
 773 If an upper bound is required, it can be calculated in a manner
 774 similar to that of a single conjunct [sic] relation.
 775 \end{quote}
 776 Presumably, the authors mean that a ``d-form'' approximation
 777 of the whole input relation should be used.
 778 However, the accuracy can be improved by also using the following
 779 idea from the same paper.  If $R$ is a union of $m$ basic maps,
 780 $$
 781 R = \bigcup_i R_i
 782 ,
 783 $$
 784 and if we can find an $R_i$ such that for all other $R_j$ we have
 785 that
 786 $$
 787 R_i^* \circ R_j \circ R_i^*
 788 $$
 789 can be represented as a single basic map, i.e., without a union,
 790 then we can compute $R^+$ as
 791 $$
 792 R^+ = R_i^+ \cup
 793 \left(
 794 \bigcup_{j \ne i}
 795 R_i^* \circ R_j \circ R_i^*
 796 \right)^+
 797 ,
 798 $$
 799 reducing the number of disjuncts in the argument of the transitive
 800 closure by one.
 801 An overapproximation of $R_i^*$ can be obtained by
 802 allowing the value zero for $k$ in \eqref{eq:omega},
 803 i.e., by computing
 804 $$
 805 \{\, \vec i \to \vec j \mid \exists \vec \alpha, k :
 806 k \ge 0 \wedge
 807 k \, \vec L \le \vec j - \vec i \le k \, \vec U
 808 \wedge
 809 (\forall p : j_p - i_p = M_p \alpha_p)
 810 \,\}
 811 .
 812 $$
 813 However, when we intersect domain and range of this relation
 814 with those of the input relation, then the result only contains
 815 the identity mapping on the intersection of domain and range.
 816 \shortciteN{Kelly1996closure} propose to intersect domain
 817 and range with then {\em union} of domain and range of the input
 818 relation instead and call the result $R_i^?$.
 819 Now, this union of domain and range of $R_i$ may not contain
 820 the domains and ranges of the whole of $R$.
 821 We can therefore not always replace
 822 $R_i^* \circ R_j \circ R_i^*$ by
 823 $R_i^? \circ R_j \circ R_i^?$.
 824 \shortciteN{Kelly1996closure} propose to check the following
 825 conditions to decide whether this replacement is justified:
 826 $R_i^? - R_i^+$ is not a union and for each $j \ne i$
 827 the condition
 828 $$
 829 \left(R_i^? - R_i^+\right)
 830 \circ
 831 R_j
 832 \circ
 833 \left(R_i^? - R_i^+\right)
 834 =
 835 R_j
 836 $$
 837 holds.