• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // Copyright (c) 2018 Google LLC.
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 //     http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 
15 #include "source/opt/loop_dependence.h"
16 
17 #include <functional>
18 #include <memory>
19 #include <numeric>
20 #include <string>
21 #include <utility>
22 #include <vector>
23 
24 #include "source/opt/instruction.h"
25 #include "source/opt/scalar_analysis.h"
26 #include "source/opt/scalar_analysis_nodes.h"
27 
28 namespace spvtools {
29 namespace opt {
30 
31 using SubscriptPair = std::pair<SENode*, SENode*>;
32 
33 namespace {
34 
35 // Calculate the greatest common divisor of a & b using Stein's algorithm.
36 // https://en.wikipedia.org/wiki/Binary_GCD_algorithm
GreatestCommonDivisor(int64_t a,int64_t b)37 int64_t GreatestCommonDivisor(int64_t a, int64_t b) {
38   // Simple cases
39   if (a == b) {
40     return a;
41   } else if (a == 0) {
42     return b;
43   } else if (b == 0) {
44     return a;
45   }
46 
47   // Both even
48   if (a % 2 == 0 && b % 2 == 0) {
49     return 2 * GreatestCommonDivisor(a / 2, b / 2);
50   }
51 
52   // Even a, odd b
53   if (a % 2 == 0 && b % 2 == 1) {
54     return GreatestCommonDivisor(a / 2, b);
55   }
56 
57   // Odd a, even b
58   if (a % 2 == 1 && b % 2 == 0) {
59     return GreatestCommonDivisor(a, b / 2);
60   }
61 
62   // Both odd, reduce the larger argument
63   if (a > b) {
64     return GreatestCommonDivisor((a - b) / 2, b);
65   } else {
66     return GreatestCommonDivisor((b - a) / 2, a);
67   }
68 }
69 
70 // Check if node is affine, ie in the form: a0*i0 + a1*i1 + ... an*in + c
71 // and contains only the following types of nodes: SERecurrentNode, SEAddNode
72 // and SEConstantNode
IsInCorrectFormForGCDTest(SENode * node)73 bool IsInCorrectFormForGCDTest(SENode* node) {
74   bool children_ok = true;
75 
76   if (auto add_node = node->AsSEAddNode()) {
77     for (auto child : add_node->GetChildren()) {
78       children_ok &= IsInCorrectFormForGCDTest(child);
79     }
80   }
81 
82   bool this_ok = node->AsSERecurrentNode() || node->AsSEAddNode() ||
83                  node->AsSEConstantNode();
84 
85   return children_ok && this_ok;
86 }
87 
88 // If |node| is an SERecurrentNode then returns |node| or if |node| is an
89 // SEAddNode returns a vector of SERecurrentNode that are its children.
GetAllTopLevelRecurrences(SENode * node)90 std::vector<SERecurrentNode*> GetAllTopLevelRecurrences(SENode* node) {
91   auto nodes = std::vector<SERecurrentNode*>{};
92   if (auto recurrent_node = node->AsSERecurrentNode()) {
93     nodes.push_back(recurrent_node);
94   }
95 
96   if (auto add_node = node->AsSEAddNode()) {
97     for (auto child : add_node->GetChildren()) {
98       auto child_nodes = GetAllTopLevelRecurrences(child);
99       nodes.insert(nodes.end(), child_nodes.begin(), child_nodes.end());
100     }
101   }
102 
103   return nodes;
104 }
105 
106 // If |node| is an SEConstantNode then returns |node| or if |node| is an
107 // SEAddNode returns a vector of SEConstantNode that are its children.
GetAllTopLevelConstants(SENode * node)108 std::vector<SEConstantNode*> GetAllTopLevelConstants(SENode* node) {
109   auto nodes = std::vector<SEConstantNode*>{};
110   if (auto recurrent_node = node->AsSEConstantNode()) {
111     nodes.push_back(recurrent_node);
112   }
113 
114   if (auto add_node = node->AsSEAddNode()) {
115     for (auto child : add_node->GetChildren()) {
116       auto child_nodes = GetAllTopLevelConstants(child);
117       nodes.insert(nodes.end(), child_nodes.begin(), child_nodes.end());
118     }
119   }
120 
121   return nodes;
122 }
123 
AreOffsetsAndCoefficientsConstant(const std::vector<SERecurrentNode * > & nodes)124 bool AreOffsetsAndCoefficientsConstant(
125     const std::vector<SERecurrentNode*>& nodes) {
126   for (auto node : nodes) {
127     if (!node->GetOffset()->AsSEConstantNode() ||
128         !node->GetOffset()->AsSEConstantNode()) {
129       return false;
130     }
131   }
132   return true;
133 }
134 
135 // Fold all SEConstantNode that appear in |recurrences| and |constants| into a
136 // single integer value.
CalculateConstantTerm(const std::vector<SERecurrentNode * > & recurrences,const std::vector<SEConstantNode * > & constants)137 int64_t CalculateConstantTerm(const std::vector<SERecurrentNode*>& recurrences,
138                               const std::vector<SEConstantNode*>& constants) {
139   int64_t constant_term = 0;
140   for (auto recurrence : recurrences) {
141     constant_term +=
142         recurrence->GetOffset()->AsSEConstantNode()->FoldToSingleValue();
143   }
144 
145   for (auto constant : constants) {
146     constant_term += constant->FoldToSingleValue();
147   }
148 
149   return constant_term;
150 }
151 
CalculateGCDFromCoefficients(const std::vector<SERecurrentNode * > & recurrences,int64_t running_gcd)152 int64_t CalculateGCDFromCoefficients(
153     const std::vector<SERecurrentNode*>& recurrences, int64_t running_gcd) {
154   for (SERecurrentNode* recurrence : recurrences) {
155     auto coefficient = recurrence->GetCoefficient()->AsSEConstantNode();
156 
157     running_gcd = GreatestCommonDivisor(
158         running_gcd, std::abs(coefficient->FoldToSingleValue()));
159   }
160 
161   return running_gcd;
162 }
163 
164 // Compare 2 fractions while first normalizing them, e.g. 2/4 and 4/8 will both
165 // be simplified to 1/2 and then determined to be equal.
NormalizeAndCompareFractions(int64_t numerator_0,int64_t denominator_0,int64_t numerator_1,int64_t denominator_1)166 bool NormalizeAndCompareFractions(int64_t numerator_0, int64_t denominator_0,
167                                   int64_t numerator_1, int64_t denominator_1) {
168   auto gcd_0 =
169       GreatestCommonDivisor(std::abs(numerator_0), std::abs(denominator_0));
170   auto gcd_1 =
171       GreatestCommonDivisor(std::abs(numerator_1), std::abs(denominator_1));
172 
173   auto normalized_numerator_0 = numerator_0 / gcd_0;
174   auto normalized_denominator_0 = denominator_0 / gcd_0;
175   auto normalized_numerator_1 = numerator_1 / gcd_1;
176   auto normalized_denominator_1 = denominator_1 / gcd_1;
177 
178   return normalized_numerator_0 == normalized_numerator_1 &&
179          normalized_denominator_0 == normalized_denominator_1;
180 }
181 
182 }  // namespace
183 
GetDependence(const Instruction * source,const Instruction * destination,DistanceVector * distance_vector)184 bool LoopDependenceAnalysis::GetDependence(const Instruction* source,
185                                            const Instruction* destination,
186                                            DistanceVector* distance_vector) {
187   // Start off by finding and marking all the loops in |loops_| that are
188   // irrelevant to the dependence analysis.
189   MarkUnsusedDistanceEntriesAsIrrelevant(source, destination, distance_vector);
190 
191   Instruction* source_access_chain = GetOperandDefinition(source, 0);
192   Instruction* destination_access_chain = GetOperandDefinition(destination, 0);
193 
194   auto num_access_chains =
195       (source_access_chain->opcode() == SpvOpAccessChain) +
196       (destination_access_chain->opcode() == SpvOpAccessChain);
197 
198   // If neither is an access chain, then they are load/store to a variable.
199   if (num_access_chains == 0) {
200     if (source_access_chain != destination_access_chain) {
201       // Not the same location, report independence
202       return true;
203     } else {
204       // Accessing the same variable
205       for (auto& entry : distance_vector->GetEntries()) {
206         entry = DistanceEntry();
207       }
208       return false;
209     }
210   }
211 
212   // If only one is an access chain, it could be accessing a part of a struct
213   if (num_access_chains == 1) {
214     auto source_is_chain = source_access_chain->opcode() == SpvOpAccessChain;
215     auto access_chain =
216         source_is_chain ? source_access_chain : destination_access_chain;
217     auto variable =
218         source_is_chain ? destination_access_chain : source_access_chain;
219 
220     auto location_in_chain = GetOperandDefinition(access_chain, 0);
221 
222     if (variable != location_in_chain) {
223       // Not the same location, report independence
224       return true;
225     } else {
226       // Accessing the same variable
227       for (auto& entry : distance_vector->GetEntries()) {
228         entry = DistanceEntry();
229       }
230       return false;
231     }
232   }
233 
234   // If the access chains aren't collecting from the same structure there is no
235   // dependence.
236   Instruction* source_array = GetOperandDefinition(source_access_chain, 0);
237   Instruction* destination_array =
238       GetOperandDefinition(destination_access_chain, 0);
239 
240   // Nested access chains are not supported yet, bail out.
241   if (source_array->opcode() == SpvOpAccessChain ||
242       destination_array->opcode() == SpvOpAccessChain) {
243     for (auto& entry : distance_vector->GetEntries()) {
244       entry = DistanceEntry();
245     }
246     return false;
247   }
248 
249   if (source_array != destination_array) {
250     PrintDebug("Proved independence through different arrays.");
251     return true;
252   }
253 
254   // To handle multiple subscripts we must get every operand in the access
255   // chains past the first.
256   std::vector<Instruction*> source_subscripts = GetSubscripts(source);
257   std::vector<Instruction*> destination_subscripts = GetSubscripts(destination);
258 
259   auto sets_of_subscripts =
260       PartitionSubscripts(source_subscripts, destination_subscripts);
261 
262   auto first_coupled = std::partition(
263       std::begin(sets_of_subscripts), std::end(sets_of_subscripts),
264       [](const std::set<std::pair<Instruction*, Instruction*>>& set) {
265         return set.size() == 1;
266       });
267 
268   // Go through each subscript testing for independence.
269   // If any subscript results in independence, we prove independence between the
270   // load and store.
271   // If we can't prove independence we store what information we can gather in
272   // a DistanceVector.
273   for (auto it = std::begin(sets_of_subscripts); it < first_coupled; ++it) {
274     auto source_subscript = std::get<0>(*(*it).begin());
275     auto destination_subscript = std::get<1>(*(*it).begin());
276 
277     SENode* source_node = scalar_evolution_.SimplifyExpression(
278         scalar_evolution_.AnalyzeInstruction(source_subscript));
279     SENode* destination_node = scalar_evolution_.SimplifyExpression(
280         scalar_evolution_.AnalyzeInstruction(destination_subscript));
281 
282     // Check the loops are in a form we support.
283     auto subscript_pair = std::make_pair(source_node, destination_node);
284 
285     const Loop* loop = GetLoopForSubscriptPair(subscript_pair);
286     if (loop) {
287       if (!IsSupportedLoop(loop)) {
288         PrintDebug(
289             "GetDependence found an unsupported loop form. Assuming <=> for "
290             "loop.");
291         DistanceEntry* distance_entry =
292             GetDistanceEntryForSubscriptPair(subscript_pair, distance_vector);
293         if (distance_entry) {
294           distance_entry->direction = DistanceEntry::Directions::ALL;
295         }
296         continue;
297       }
298     }
299 
300     // If either node is simplified to a CanNotCompute we can't perform any
301     // analysis so must assume <=> dependence and return.
302     if (source_node->GetType() == SENode::CanNotCompute ||
303         destination_node->GetType() == SENode::CanNotCompute) {
304       // Record the <=> dependence if we can get a DistanceEntry
305       PrintDebug(
306           "GetDependence found source_node || destination_node as "
307           "CanNotCompute. Abandoning evaluation for this subscript.");
308       DistanceEntry* distance_entry =
309           GetDistanceEntryForSubscriptPair(subscript_pair, distance_vector);
310       if (distance_entry) {
311         distance_entry->direction = DistanceEntry::Directions::ALL;
312       }
313       continue;
314     }
315 
316     // We have no induction variables so can apply a ZIV test.
317     if (IsZIV(subscript_pair)) {
318       PrintDebug("Found a ZIV subscript pair");
319       if (ZIVTest(subscript_pair)) {
320         PrintDebug("Proved independence with ZIVTest.");
321         return true;
322       }
323     }
324 
325     // We have only one induction variable so should attempt an SIV test.
326     if (IsSIV(subscript_pair)) {
327       PrintDebug("Found a SIV subscript pair.");
328       if (SIVTest(subscript_pair, distance_vector)) {
329         PrintDebug("Proved independence with SIVTest.");
330         return true;
331       }
332     }
333 
334     // We have multiple induction variables so should attempt an MIV test.
335     if (IsMIV(subscript_pair)) {
336       PrintDebug("Found a MIV subscript pair.");
337       if (GCDMIVTest(subscript_pair)) {
338         PrintDebug("Proved independence with the GCD test.");
339         auto current_loops = CollectLoops(source_node, destination_node);
340 
341         for (auto current_loop : current_loops) {
342           auto distance_entry =
343               GetDistanceEntryForLoop(current_loop, distance_vector);
344           distance_entry->direction = DistanceEntry::Directions::NONE;
345         }
346         return true;
347       }
348     }
349   }
350 
351   for (auto it = first_coupled; it < std::end(sets_of_subscripts); ++it) {
352     auto coupled_instructions = *it;
353     std::vector<SubscriptPair> coupled_subscripts{};
354 
355     for (const auto& elem : coupled_instructions) {
356       auto source_subscript = std::get<0>(elem);
357       auto destination_subscript = std::get<1>(elem);
358 
359       SENode* source_node = scalar_evolution_.SimplifyExpression(
360           scalar_evolution_.AnalyzeInstruction(source_subscript));
361       SENode* destination_node = scalar_evolution_.SimplifyExpression(
362           scalar_evolution_.AnalyzeInstruction(destination_subscript));
363 
364       coupled_subscripts.push_back({source_node, destination_node});
365     }
366 
367     auto supported = true;
368 
369     for (const auto& subscript : coupled_subscripts) {
370       auto loops = CollectLoops(std::get<0>(subscript), std::get<1>(subscript));
371 
372       auto is_subscript_supported =
373           std::all_of(std::begin(loops), std::end(loops),
374                       [this](const Loop* l) { return IsSupportedLoop(l); });
375 
376       supported = supported && is_subscript_supported;
377     }
378 
379     if (DeltaTest(coupled_subscripts, distance_vector)) {
380       return true;
381     }
382   }
383 
384   // We were unable to prove independence so must gather all of the direction
385   // information we found.
386   PrintDebug(
387       "Couldn't prove independence.\n"
388       "All possible direction information has been collected in the input "
389       "DistanceVector.");
390 
391   return false;
392 }
393 
ZIVTest(const std::pair<SENode *,SENode * > & subscript_pair)394 bool LoopDependenceAnalysis::ZIVTest(
395     const std::pair<SENode*, SENode*>& subscript_pair) {
396   auto source = std::get<0>(subscript_pair);
397   auto destination = std::get<1>(subscript_pair);
398 
399   PrintDebug("Performing ZIVTest");
400   // If source == destination, dependence with direction = and distance 0.
401   if (source == destination) {
402     PrintDebug("ZIVTest found EQ dependence.");
403     return false;
404   } else {
405     PrintDebug("ZIVTest found independence.");
406     // Otherwise we prove independence.
407     return true;
408   }
409 }
410 
SIVTest(const std::pair<SENode *,SENode * > & subscript_pair,DistanceVector * distance_vector)411 bool LoopDependenceAnalysis::SIVTest(
412     const std::pair<SENode*, SENode*>& subscript_pair,
413     DistanceVector* distance_vector) {
414   DistanceEntry* distance_entry =
415       GetDistanceEntryForSubscriptPair(subscript_pair, distance_vector);
416   if (!distance_entry) {
417     PrintDebug(
418         "SIVTest could not find a DistanceEntry for subscript_pair. Exiting");
419   }
420 
421   SENode* source_node = std::get<0>(subscript_pair);
422   SENode* destination_node = std::get<1>(subscript_pair);
423 
424   int64_t source_induction_count = CountInductionVariables(source_node);
425   int64_t destination_induction_count =
426       CountInductionVariables(destination_node);
427 
428   // If the source node has no induction variables we can apply a
429   // WeakZeroSrcTest.
430   if (source_induction_count == 0) {
431     PrintDebug("Found source has no induction variable.");
432     if (WeakZeroSourceSIVTest(
433             source_node, destination_node->AsSERecurrentNode(),
434             destination_node->AsSERecurrentNode()->GetCoefficient(),
435             distance_entry)) {
436       PrintDebug("Proved independence with WeakZeroSourceSIVTest.");
437       distance_entry->dependence_information =
438           DistanceEntry::DependenceInformation::DIRECTION;
439       distance_entry->direction = DistanceEntry::Directions::NONE;
440       return true;
441     }
442   }
443 
444   // If the destination has no induction variables we can apply a
445   // WeakZeroDestTest.
446   if (destination_induction_count == 0) {
447     PrintDebug("Found destination has no induction variable.");
448     if (WeakZeroDestinationSIVTest(
449             source_node->AsSERecurrentNode(), destination_node,
450             source_node->AsSERecurrentNode()->GetCoefficient(),
451             distance_entry)) {
452       PrintDebug("Proved independence with WeakZeroDestinationSIVTest.");
453       distance_entry->dependence_information =
454           DistanceEntry::DependenceInformation::DIRECTION;
455       distance_entry->direction = DistanceEntry::Directions::NONE;
456       return true;
457     }
458   }
459 
460   // We now need to collect the SERecurrentExpr nodes from source and
461   // destination. We do not handle cases where source or destination have
462   // multiple SERecurrentExpr nodes.
463   std::vector<SERecurrentNode*> source_recurrent_nodes =
464       source_node->CollectRecurrentNodes();
465   std::vector<SERecurrentNode*> destination_recurrent_nodes =
466       destination_node->CollectRecurrentNodes();
467 
468   if (source_recurrent_nodes.size() == 1 &&
469       destination_recurrent_nodes.size() == 1) {
470     PrintDebug("Found source and destination have 1 induction variable.");
471     SERecurrentNode* source_recurrent_expr = *source_recurrent_nodes.begin();
472     SERecurrentNode* destination_recurrent_expr =
473         *destination_recurrent_nodes.begin();
474 
475     // If the coefficients are identical we can apply a StrongSIVTest.
476     if (source_recurrent_expr->GetCoefficient() ==
477         destination_recurrent_expr->GetCoefficient()) {
478       PrintDebug("Found source and destination share coefficient.");
479       if (StrongSIVTest(source_node, destination_node,
480                         source_recurrent_expr->GetCoefficient(),
481                         distance_entry)) {
482         PrintDebug("Proved independence with StrongSIVTest");
483         distance_entry->dependence_information =
484             DistanceEntry::DependenceInformation::DIRECTION;
485         distance_entry->direction = DistanceEntry::Directions::NONE;
486         return true;
487       }
488     }
489 
490     // If the coefficients are of equal magnitude and opposite sign we can
491     // apply a WeakCrossingSIVTest.
492     if (source_recurrent_expr->GetCoefficient() ==
493         scalar_evolution_.CreateNegation(
494             destination_recurrent_expr->GetCoefficient())) {
495       PrintDebug("Found source coefficient = -destination coefficient.");
496       if (WeakCrossingSIVTest(source_node, destination_node,
497                               source_recurrent_expr->GetCoefficient(),
498                               distance_entry)) {
499         PrintDebug("Proved independence with WeakCrossingSIVTest");
500         distance_entry->dependence_information =
501             DistanceEntry::DependenceInformation::DIRECTION;
502         distance_entry->direction = DistanceEntry::Directions::NONE;
503         return true;
504       }
505     }
506   }
507 
508   return false;
509 }
510 
StrongSIVTest(SENode * source,SENode * destination,SENode * coefficient,DistanceEntry * distance_entry)511 bool LoopDependenceAnalysis::StrongSIVTest(SENode* source, SENode* destination,
512                                            SENode* coefficient,
513                                            DistanceEntry* distance_entry) {
514   PrintDebug("Performing StrongSIVTest.");
515   // If both source and destination are SERecurrentNodes we can perform tests
516   // based on distance.
517   // If either source or destination contain value unknown nodes or if one or
518   // both are not SERecurrentNodes we must attempt a symbolic test.
519   std::vector<SEValueUnknown*> source_value_unknown_nodes =
520       source->CollectValueUnknownNodes();
521   std::vector<SEValueUnknown*> destination_value_unknown_nodes =
522       destination->CollectValueUnknownNodes();
523   if (source_value_unknown_nodes.size() > 0 ||
524       destination_value_unknown_nodes.size() > 0) {
525     PrintDebug(
526         "StrongSIVTest found symbolics. Will attempt SymbolicStrongSIVTest.");
527     return SymbolicStrongSIVTest(source, destination, coefficient,
528                                  distance_entry);
529   }
530 
531   if (!source->AsSERecurrentNode() || !destination->AsSERecurrentNode()) {
532     PrintDebug(
533         "StrongSIVTest could not simplify source and destination to "
534         "SERecurrentNodes so will exit.");
535     distance_entry->direction = DistanceEntry::Directions::ALL;
536     return false;
537   }
538 
539   // Build an SENode for distance.
540   std::pair<SENode*, SENode*> subscript_pair =
541       std::make_pair(source, destination);
542   const Loop* subscript_loop = GetLoopForSubscriptPair(subscript_pair);
543   SENode* source_constant_term =
544       GetConstantTerm(subscript_loop, source->AsSERecurrentNode());
545   SENode* destination_constant_term =
546       GetConstantTerm(subscript_loop, destination->AsSERecurrentNode());
547   if (!source_constant_term || !destination_constant_term) {
548     PrintDebug(
549         "StrongSIVTest could not collect the constant terms of either source "
550         "or destination so will exit.");
551     return false;
552   }
553   SENode* constant_term_delta =
554       scalar_evolution_.SimplifyExpression(scalar_evolution_.CreateSubtraction(
555           destination_constant_term, source_constant_term));
556 
557   // Scalar evolution doesn't perform division, so we must fold to constants and
558   // do it manually.
559   // We must check the offset delta and coefficient are constants.
560   int64_t distance = 0;
561   SEConstantNode* delta_constant = constant_term_delta->AsSEConstantNode();
562   SEConstantNode* coefficient_constant = coefficient->AsSEConstantNode();
563   if (delta_constant && coefficient_constant) {
564     int64_t delta_value = delta_constant->FoldToSingleValue();
565     int64_t coefficient_value = coefficient_constant->FoldToSingleValue();
566     PrintDebug(
567         "StrongSIVTest found delta value and coefficient value as constants "
568         "with values:\n"
569         "\tdelta value: " +
570         ToString(delta_value) +
571         "\n\tcoefficient value: " + ToString(coefficient_value) + "\n");
572     // Check if the distance is not integral to try to prove independence.
573     if (delta_value % coefficient_value != 0) {
574       PrintDebug(
575           "StrongSIVTest proved independence through distance not being an "
576           "integer.");
577       distance_entry->dependence_information =
578           DistanceEntry::DependenceInformation::DIRECTION;
579       distance_entry->direction = DistanceEntry::Directions::NONE;
580       return true;
581     } else {
582       distance = delta_value / coefficient_value;
583       PrintDebug("StrongSIV test found distance as " + ToString(distance));
584     }
585   } else {
586     // If we can't fold delta and coefficient to single values we can't produce
587     // distance.
588     // As a result we can't perform the rest of the pass and must assume
589     // dependence in all directions.
590     PrintDebug("StrongSIVTest could not produce a distance. Must exit.");
591     distance_entry->distance = DistanceEntry::Directions::ALL;
592     return false;
593   }
594 
595   // Next we gather the upper and lower bounds as constants if possible. If
596   // distance > upper_bound - lower_bound we prove independence.
597   SENode* lower_bound = GetLowerBound(subscript_loop);
598   SENode* upper_bound = GetUpperBound(subscript_loop);
599   if (lower_bound && upper_bound) {
600     PrintDebug("StrongSIVTest found bounds.");
601     SENode* bounds = scalar_evolution_.SimplifyExpression(
602         scalar_evolution_.CreateSubtraction(upper_bound, lower_bound));
603 
604     if (bounds->GetType() == SENode::SENodeType::Constant) {
605       int64_t bounds_value = bounds->AsSEConstantNode()->FoldToSingleValue();
606       PrintDebug(
607           "StrongSIVTest found upper_bound - lower_bound as a constant with "
608           "value " +
609           ToString(bounds_value));
610 
611       // If the absolute value of the distance is > upper bound - lower bound
612       // then we prove independence.
613       if (llabs(distance) > llabs(bounds_value)) {
614         PrintDebug(
615             "StrongSIVTest proved independence through distance escaping the "
616             "loop bounds.");
617         distance_entry->dependence_information =
618             DistanceEntry::DependenceInformation::DISTANCE;
619         distance_entry->direction = DistanceEntry::Directions::NONE;
620         distance_entry->distance = distance;
621         return true;
622       }
623     }
624   } else {
625     PrintDebug("StrongSIVTest was unable to gather lower and upper bounds.");
626   }
627 
628   // Otherwise we can get a direction as follows
629   //             { < if distance > 0
630   // direction = { = if distance == 0
631   //             { > if distance < 0
632   PrintDebug(
633       "StrongSIVTest could not prove independence. Gathering direction "
634       "information.");
635   if (distance > 0) {
636     distance_entry->dependence_information =
637         DistanceEntry::DependenceInformation::DISTANCE;
638     distance_entry->direction = DistanceEntry::Directions::LT;
639     distance_entry->distance = distance;
640     return false;
641   }
642   if (distance == 0) {
643     distance_entry->dependence_information =
644         DistanceEntry::DependenceInformation::DISTANCE;
645     distance_entry->direction = DistanceEntry::Directions::EQ;
646     distance_entry->distance = 0;
647     return false;
648   }
649   if (distance < 0) {
650     distance_entry->dependence_information =
651         DistanceEntry::DependenceInformation::DISTANCE;
652     distance_entry->direction = DistanceEntry::Directions::GT;
653     distance_entry->distance = distance;
654     return false;
655   }
656 
657   // We were unable to prove independence or discern any additional information
658   // Must assume <=> direction.
659   PrintDebug(
660       "StrongSIVTest was unable to determine any dependence information.");
661   distance_entry->direction = DistanceEntry::Directions::ALL;
662   return false;
663 }
664 
SymbolicStrongSIVTest(SENode * source,SENode * destination,SENode * coefficient,DistanceEntry * distance_entry)665 bool LoopDependenceAnalysis::SymbolicStrongSIVTest(
666     SENode* source, SENode* destination, SENode* coefficient,
667     DistanceEntry* distance_entry) {
668   PrintDebug("Performing SymbolicStrongSIVTest.");
669   SENode* source_destination_delta = scalar_evolution_.SimplifyExpression(
670       scalar_evolution_.CreateSubtraction(source, destination));
671   // By cancelling out the induction variables by subtracting the source and
672   // destination we can produce an expression of symbolics and constants. This
673   // expression can be compared to the loop bounds to find if the offset is
674   // outwith the bounds.
675   std::pair<SENode*, SENode*> subscript_pair =
676       std::make_pair(source, destination);
677   const Loop* subscript_loop = GetLoopForSubscriptPair(subscript_pair);
678   if (IsProvablyOutsideOfLoopBounds(subscript_loop, source_destination_delta,
679                                     coefficient)) {
680     PrintDebug(
681         "SymbolicStrongSIVTest proved independence through loop bounds.");
682     distance_entry->dependence_information =
683         DistanceEntry::DependenceInformation::DIRECTION;
684     distance_entry->direction = DistanceEntry::Directions::NONE;
685     return true;
686   }
687   // We were unable to prove independence or discern any additional information.
688   // Must assume <=> direction.
689   PrintDebug(
690       "SymbolicStrongSIVTest was unable to determine any dependence "
691       "information.");
692   distance_entry->direction = DistanceEntry::Directions::ALL;
693   return false;
694 }
695 
WeakZeroSourceSIVTest(SENode * source,SERecurrentNode * destination,SENode * coefficient,DistanceEntry * distance_entry)696 bool LoopDependenceAnalysis::WeakZeroSourceSIVTest(
697     SENode* source, SERecurrentNode* destination, SENode* coefficient,
698     DistanceEntry* distance_entry) {
699   PrintDebug("Performing WeakZeroSourceSIVTest.");
700   std::pair<SENode*, SENode*> subscript_pair =
701       std::make_pair(source, destination);
702   const Loop* subscript_loop = GetLoopForSubscriptPair(subscript_pair);
703   // Build an SENode for distance.
704   SENode* destination_constant_term =
705       GetConstantTerm(subscript_loop, destination);
706   SENode* delta = scalar_evolution_.SimplifyExpression(
707       scalar_evolution_.CreateSubtraction(source, destination_constant_term));
708 
709   // Scalar evolution doesn't perform division, so we must fold to constants and
710   // do it manually.
711   int64_t distance = 0;
712   SEConstantNode* delta_constant = delta->AsSEConstantNode();
713   SEConstantNode* coefficient_constant = coefficient->AsSEConstantNode();
714   if (delta_constant && coefficient_constant) {
715     PrintDebug(
716         "WeakZeroSourceSIVTest folding delta and coefficient to constants.");
717     int64_t delta_value = delta_constant->FoldToSingleValue();
718     int64_t coefficient_value = coefficient_constant->FoldToSingleValue();
719     // Check if the distance is not integral.
720     if (delta_value % coefficient_value != 0) {
721       PrintDebug(
722           "WeakZeroSourceSIVTest proved independence through distance not "
723           "being an integer.");
724       distance_entry->dependence_information =
725           DistanceEntry::DependenceInformation::DIRECTION;
726       distance_entry->direction = DistanceEntry::Directions::NONE;
727       return true;
728     } else {
729       distance = delta_value / coefficient_value;
730       PrintDebug(
731           "WeakZeroSourceSIVTest calculated distance with the following "
732           "values\n"
733           "\tdelta value: " +
734           ToString(delta_value) +
735           "\n\tcoefficient value: " + ToString(coefficient_value) +
736           "\n\tdistance: " + ToString(distance) + "\n");
737     }
738   } else {
739     PrintDebug(
740         "WeakZeroSourceSIVTest was unable to fold delta and coefficient to "
741         "constants.");
742   }
743 
744   // If we can prove the distance is outside the bounds we prove independence.
745   SEConstantNode* lower_bound =
746       GetLowerBound(subscript_loop)->AsSEConstantNode();
747   SEConstantNode* upper_bound =
748       GetUpperBound(subscript_loop)->AsSEConstantNode();
749   if (lower_bound && upper_bound) {
750     PrintDebug("WeakZeroSourceSIVTest found bounds as SEConstantNodes.");
751     int64_t lower_bound_value = lower_bound->FoldToSingleValue();
752     int64_t upper_bound_value = upper_bound->FoldToSingleValue();
753     if (!IsWithinBounds(llabs(distance), lower_bound_value,
754                         upper_bound_value)) {
755       PrintDebug(
756           "WeakZeroSourceSIVTest proved independence through distance escaping "
757           "the loop bounds.");
758       PrintDebug(
759           "Bound values were as follow\n"
760           "\tlower bound value: " +
761           ToString(lower_bound_value) +
762           "\n\tupper bound value: " + ToString(upper_bound_value) +
763           "\n\tdistance value: " + ToString(distance) + "\n");
764       distance_entry->dependence_information =
765           DistanceEntry::DependenceInformation::DISTANCE;
766       distance_entry->direction = DistanceEntry::Directions::NONE;
767       distance_entry->distance = distance;
768       return true;
769     }
770   } else {
771     PrintDebug(
772         "WeakZeroSourceSIVTest was unable to find lower and upper bound as "
773         "SEConstantNodes.");
774   }
775 
776   // Now we want to see if we can detect to peel the first or last iterations.
777 
778   // We get the FirstTripValue as GetFirstTripInductionNode() +
779   // GetConstantTerm(destination)
780   SENode* first_trip_SENode =
781       scalar_evolution_.SimplifyExpression(scalar_evolution_.CreateAddNode(
782           GetFirstTripInductionNode(subscript_loop),
783           GetConstantTerm(subscript_loop, destination)));
784 
785   // If source == FirstTripValue, peel_first.
786   if (first_trip_SENode) {
787     PrintDebug("WeakZeroSourceSIVTest built first_trip_SENode.");
788     if (first_trip_SENode->AsSEConstantNode()) {
789       PrintDebug(
790           "WeakZeroSourceSIVTest has found first_trip_SENode as an "
791           "SEConstantNode with value: " +
792           ToString(first_trip_SENode->AsSEConstantNode()->FoldToSingleValue()) +
793           "\n");
794     }
795     if (source == first_trip_SENode) {
796       // We have found that peeling the first iteration will break dependency.
797       PrintDebug(
798           "WeakZeroSourceSIVTest has found peeling first iteration will break "
799           "dependency");
800       distance_entry->dependence_information =
801           DistanceEntry::DependenceInformation::PEEL;
802       distance_entry->peel_first = true;
803       return false;
804     }
805   } else {
806     PrintDebug("WeakZeroSourceSIVTest was unable to build first_trip_SENode");
807   }
808 
809   // We get the LastTripValue as GetFinalTripInductionNode(coefficient) +
810   // GetConstantTerm(destination)
811   SENode* final_trip_SENode =
812       scalar_evolution_.SimplifyExpression(scalar_evolution_.CreateAddNode(
813           GetFinalTripInductionNode(subscript_loop, coefficient),
814           GetConstantTerm(subscript_loop, destination)));
815 
816   // If source == LastTripValue, peel_last.
817   if (final_trip_SENode) {
818     PrintDebug("WeakZeroSourceSIVTest built final_trip_SENode.");
819     if (first_trip_SENode->AsSEConstantNode()) {
820       PrintDebug(
821           "WeakZeroSourceSIVTest has found final_trip_SENode as an "
822           "SEConstantNode with value: " +
823           ToString(final_trip_SENode->AsSEConstantNode()->FoldToSingleValue()) +
824           "\n");
825     }
826     if (source == final_trip_SENode) {
827       // We have found that peeling the last iteration will break dependency.
828       PrintDebug(
829           "WeakZeroSourceSIVTest has found peeling final iteration will break "
830           "dependency");
831       distance_entry->dependence_information =
832           DistanceEntry::DependenceInformation::PEEL;
833       distance_entry->peel_last = true;
834       return false;
835     }
836   } else {
837     PrintDebug("WeakZeroSourceSIVTest was unable to build final_trip_SENode");
838   }
839 
840   // We were unable to prove independence or discern any additional information.
841   // Must assume <=> direction.
842   PrintDebug(
843       "WeakZeroSourceSIVTest was unable to determine any dependence "
844       "information.");
845   distance_entry->direction = DistanceEntry::Directions::ALL;
846   return false;
847 }
848 
WeakZeroDestinationSIVTest(SERecurrentNode * source,SENode * destination,SENode * coefficient,DistanceEntry * distance_entry)849 bool LoopDependenceAnalysis::WeakZeroDestinationSIVTest(
850     SERecurrentNode* source, SENode* destination, SENode* coefficient,
851     DistanceEntry* distance_entry) {
852   PrintDebug("Performing WeakZeroDestinationSIVTest.");
853   // Build an SENode for distance.
854   std::pair<SENode*, SENode*> subscript_pair =
855       std::make_pair(source, destination);
856   const Loop* subscript_loop = GetLoopForSubscriptPair(subscript_pair);
857   SENode* source_constant_term = GetConstantTerm(subscript_loop, source);
858   SENode* delta = scalar_evolution_.SimplifyExpression(
859       scalar_evolution_.CreateSubtraction(destination, source_constant_term));
860 
861   // Scalar evolution doesn't perform division, so we must fold to constants and
862   // do it manually.
863   int64_t distance = 0;
864   SEConstantNode* delta_constant = delta->AsSEConstantNode();
865   SEConstantNode* coefficient_constant = coefficient->AsSEConstantNode();
866   if (delta_constant && coefficient_constant) {
867     PrintDebug(
868         "WeakZeroDestinationSIVTest folding delta and coefficient to "
869         "constants.");
870     int64_t delta_value = delta_constant->FoldToSingleValue();
871     int64_t coefficient_value = coefficient_constant->FoldToSingleValue();
872     // Check if the distance is not integral.
873     if (delta_value % coefficient_value != 0) {
874       PrintDebug(
875           "WeakZeroDestinationSIVTest proved independence through distance not "
876           "being an integer.");
877       distance_entry->dependence_information =
878           DistanceEntry::DependenceInformation::DIRECTION;
879       distance_entry->direction = DistanceEntry::Directions::NONE;
880       return true;
881     } else {
882       distance = delta_value / coefficient_value;
883       PrintDebug(
884           "WeakZeroDestinationSIVTest calculated distance with the following "
885           "values\n"
886           "\tdelta value: " +
887           ToString(delta_value) +
888           "\n\tcoefficient value: " + ToString(coefficient_value) +
889           "\n\tdistance: " + ToString(distance) + "\n");
890     }
891   } else {
892     PrintDebug(
893         "WeakZeroDestinationSIVTest was unable to fold delta and coefficient "
894         "to constants.");
895   }
896 
897   // If we can prove the distance is outside the bounds we prove independence.
898   SEConstantNode* lower_bound =
899       GetLowerBound(subscript_loop)->AsSEConstantNode();
900   SEConstantNode* upper_bound =
901       GetUpperBound(subscript_loop)->AsSEConstantNode();
902   if (lower_bound && upper_bound) {
903     PrintDebug("WeakZeroDestinationSIVTest found bounds as SEConstantNodes.");
904     int64_t lower_bound_value = lower_bound->FoldToSingleValue();
905     int64_t upper_bound_value = upper_bound->FoldToSingleValue();
906     if (!IsWithinBounds(llabs(distance), lower_bound_value,
907                         upper_bound_value)) {
908       PrintDebug(
909           "WeakZeroDestinationSIVTest proved independence through distance "
910           "escaping the loop bounds.");
911       PrintDebug(
912           "Bound values were as follows\n"
913           "\tlower bound value: " +
914           ToString(lower_bound_value) +
915           "\n\tupper bound value: " + ToString(upper_bound_value) +
916           "\n\tdistance value: " + ToString(distance));
917       distance_entry->dependence_information =
918           DistanceEntry::DependenceInformation::DISTANCE;
919       distance_entry->direction = DistanceEntry::Directions::NONE;
920       distance_entry->distance = distance;
921       return true;
922     }
923   } else {
924     PrintDebug(
925         "WeakZeroDestinationSIVTest was unable to find lower and upper bound "
926         "as SEConstantNodes.");
927   }
928 
929   // Now we want to see if we can detect to peel the first or last iterations.
930 
931   // We get the FirstTripValue as GetFirstTripInductionNode() +
932   // GetConstantTerm(source)
933   SENode* first_trip_SENode = scalar_evolution_.SimplifyExpression(
934       scalar_evolution_.CreateAddNode(GetFirstTripInductionNode(subscript_loop),
935                                       GetConstantTerm(subscript_loop, source)));
936 
937   // If destination == FirstTripValue, peel_first.
938   if (first_trip_SENode) {
939     PrintDebug("WeakZeroDestinationSIVTest built first_trip_SENode.");
940     if (first_trip_SENode->AsSEConstantNode()) {
941       PrintDebug(
942           "WeakZeroDestinationSIVTest has found first_trip_SENode as an "
943           "SEConstantNode with value: " +
944           ToString(first_trip_SENode->AsSEConstantNode()->FoldToSingleValue()) +
945           "\n");
946     }
947     if (destination == first_trip_SENode) {
948       // We have found that peeling the first iteration will break dependency.
949       PrintDebug(
950           "WeakZeroDestinationSIVTest has found peeling first iteration will "
951           "break dependency");
952       distance_entry->dependence_information =
953           DistanceEntry::DependenceInformation::PEEL;
954       distance_entry->peel_first = true;
955       return false;
956     }
957   } else {
958     PrintDebug(
959         "WeakZeroDestinationSIVTest was unable to build first_trip_SENode");
960   }
961 
962   // We get the LastTripValue as GetFinalTripInductionNode(coefficient) +
963   // GetConstantTerm(source)
964   SENode* final_trip_SENode =
965       scalar_evolution_.SimplifyExpression(scalar_evolution_.CreateAddNode(
966           GetFinalTripInductionNode(subscript_loop, coefficient),
967           GetConstantTerm(subscript_loop, source)));
968 
969   // If destination == LastTripValue, peel_last.
970   if (final_trip_SENode) {
971     PrintDebug("WeakZeroDestinationSIVTest built final_trip_SENode.");
972     if (final_trip_SENode->AsSEConstantNode()) {
973       PrintDebug(
974           "WeakZeroDestinationSIVTest has found final_trip_SENode as an "
975           "SEConstantNode with value: " +
976           ToString(final_trip_SENode->AsSEConstantNode()->FoldToSingleValue()) +
977           "\n");
978     }
979     if (destination == final_trip_SENode) {
980       // We have found that peeling the last iteration will break dependency.
981       PrintDebug(
982           "WeakZeroDestinationSIVTest has found peeling final iteration will "
983           "break dependency");
984       distance_entry->dependence_information =
985           DistanceEntry::DependenceInformation::PEEL;
986       distance_entry->peel_last = true;
987       return false;
988     }
989   } else {
990     PrintDebug(
991         "WeakZeroDestinationSIVTest was unable to build final_trip_SENode");
992   }
993 
994   // We were unable to prove independence or discern any additional information.
995   // Must assume <=> direction.
996   PrintDebug(
997       "WeakZeroDestinationSIVTest was unable to determine any dependence "
998       "information.");
999   distance_entry->direction = DistanceEntry::Directions::ALL;
1000   return false;
1001 }
1002 
WeakCrossingSIVTest(SENode * source,SENode * destination,SENode * coefficient,DistanceEntry * distance_entry)1003 bool LoopDependenceAnalysis::WeakCrossingSIVTest(
1004     SENode* source, SENode* destination, SENode* coefficient,
1005     DistanceEntry* distance_entry) {
1006   PrintDebug("Performing WeakCrossingSIVTest.");
1007   // We currently can't handle symbolic WeakCrossingSIVTests. If either source
1008   // or destination are not SERecurrentNodes we must exit.
1009   if (!source->AsSERecurrentNode() || !destination->AsSERecurrentNode()) {
1010     PrintDebug(
1011         "WeakCrossingSIVTest found source or destination != SERecurrentNode. "
1012         "Exiting");
1013     distance_entry->direction = DistanceEntry::Directions::ALL;
1014     return false;
1015   }
1016 
1017   // Build an SENode for distance.
1018   SENode* offset_delta =
1019       scalar_evolution_.SimplifyExpression(scalar_evolution_.CreateSubtraction(
1020           destination->AsSERecurrentNode()->GetOffset(),
1021           source->AsSERecurrentNode()->GetOffset()));
1022 
1023   // Scalar evolution doesn't perform division, so we must fold to constants and
1024   // do it manually.
1025   int64_t distance = 0;
1026   SEConstantNode* delta_constant = offset_delta->AsSEConstantNode();
1027   SEConstantNode* coefficient_constant = coefficient->AsSEConstantNode();
1028   if (delta_constant && coefficient_constant) {
1029     PrintDebug(
1030         "WeakCrossingSIVTest folding offset_delta and coefficient to "
1031         "constants.");
1032     int64_t delta_value = delta_constant->FoldToSingleValue();
1033     int64_t coefficient_value = coefficient_constant->FoldToSingleValue();
1034     // Check if the distance is not integral or if it has a non-integral part
1035     // equal to 1/2.
1036     if (delta_value % (2 * coefficient_value) != 0 &&
1037         static_cast<float>(delta_value % (2 * coefficient_value)) /
1038                 static_cast<float>(2 * coefficient_value) !=
1039             0.5) {
1040       PrintDebug(
1041           "WeakCrossingSIVTest proved independence through distance escaping "
1042           "the loop bounds.");
1043       distance_entry->dependence_information =
1044           DistanceEntry::DependenceInformation::DIRECTION;
1045       distance_entry->direction = DistanceEntry::Directions::NONE;
1046       return true;
1047     } else {
1048       distance = delta_value / (2 * coefficient_value);
1049     }
1050 
1051     if (distance == 0) {
1052       PrintDebug("WeakCrossingSIVTest found EQ dependence.");
1053       distance_entry->dependence_information =
1054           DistanceEntry::DependenceInformation::DISTANCE;
1055       distance_entry->direction = DistanceEntry::Directions::EQ;
1056       distance_entry->distance = 0;
1057       return false;
1058     }
1059   } else {
1060     PrintDebug(
1061         "WeakCrossingSIVTest was unable to fold offset_delta and coefficient "
1062         "to constants.");
1063   }
1064 
1065   // We were unable to prove independence or discern any additional information.
1066   // Must assume <=> direction.
1067   PrintDebug(
1068       "WeakCrossingSIVTest was unable to determine any dependence "
1069       "information.");
1070   distance_entry->direction = DistanceEntry::Directions::ALL;
1071   return false;
1072 }
1073 
1074 // Perform the GCD test if both, the source and the destination nodes, are in
1075 // the form a0*i0 + a1*i1 + ... an*in + c.
GCDMIVTest(const std::pair<SENode *,SENode * > & subscript_pair)1076 bool LoopDependenceAnalysis::GCDMIVTest(
1077     const std::pair<SENode*, SENode*>& subscript_pair) {
1078   auto source = std::get<0>(subscript_pair);
1079   auto destination = std::get<1>(subscript_pair);
1080 
1081   // Bail out if source/destination is in an unexpected form.
1082   if (!IsInCorrectFormForGCDTest(source) ||
1083       !IsInCorrectFormForGCDTest(destination)) {
1084     return false;
1085   }
1086 
1087   auto source_recurrences = GetAllTopLevelRecurrences(source);
1088   auto dest_recurrences = GetAllTopLevelRecurrences(destination);
1089 
1090   // Bail out if all offsets and coefficients aren't constant.
1091   if (!AreOffsetsAndCoefficientsConstant(source_recurrences) ||
1092       !AreOffsetsAndCoefficientsConstant(dest_recurrences)) {
1093     return false;
1094   }
1095 
1096   // Calculate the GCD of all coefficients.
1097   auto source_constants = GetAllTopLevelConstants(source);
1098   int64_t source_constant =
1099       CalculateConstantTerm(source_recurrences, source_constants);
1100 
1101   auto dest_constants = GetAllTopLevelConstants(destination);
1102   int64_t destination_constant =
1103       CalculateConstantTerm(dest_recurrences, dest_constants);
1104 
1105   int64_t delta = std::abs(source_constant - destination_constant);
1106 
1107   int64_t running_gcd = 0;
1108 
1109   running_gcd = CalculateGCDFromCoefficients(source_recurrences, running_gcd);
1110   running_gcd = CalculateGCDFromCoefficients(dest_recurrences, running_gcd);
1111 
1112   return delta % running_gcd != 0;
1113 }
1114 
1115 using PartitionedSubscripts =
1116     std::vector<std::set<std::pair<Instruction*, Instruction*>>>;
PartitionSubscripts(const std::vector<Instruction * > & source_subscripts,const std::vector<Instruction * > & destination_subscripts)1117 PartitionedSubscripts LoopDependenceAnalysis::PartitionSubscripts(
1118     const std::vector<Instruction*>& source_subscripts,
1119     const std::vector<Instruction*>& destination_subscripts) {
1120   PartitionedSubscripts partitions{};
1121 
1122   auto num_subscripts = source_subscripts.size();
1123 
1124   // Create initial partitions with one subscript pair per partition.
1125   for (size_t i = 0; i < num_subscripts; ++i) {
1126     partitions.push_back({{source_subscripts[i], destination_subscripts[i]}});
1127   }
1128 
1129   // Iterate over the loops to create all partitions
1130   for (auto loop : loops_) {
1131     int64_t k = -1;
1132 
1133     for (size_t j = 0; j < partitions.size(); ++j) {
1134       auto& current_partition = partitions[j];
1135 
1136       // Does |loop| appear in |current_partition|
1137       auto it = std::find_if(
1138           current_partition.begin(), current_partition.end(),
1139           [loop,
1140            this](const std::pair<Instruction*, Instruction*>& elem) -> bool {
1141             auto source_recurrences =
1142                 scalar_evolution_.AnalyzeInstruction(std::get<0>(elem))
1143                     ->CollectRecurrentNodes();
1144             auto destination_recurrences =
1145                 scalar_evolution_.AnalyzeInstruction(std::get<1>(elem))
1146                     ->CollectRecurrentNodes();
1147 
1148             source_recurrences.insert(source_recurrences.end(),
1149                                       destination_recurrences.begin(),
1150                                       destination_recurrences.end());
1151 
1152             auto loops_in_pair = CollectLoops(source_recurrences);
1153             auto end_it = loops_in_pair.end();
1154 
1155             return std::find(loops_in_pair.begin(), end_it, loop) != end_it;
1156           });
1157 
1158       auto has_loop = it != current_partition.end();
1159 
1160       if (has_loop) {
1161         if (k == -1) {
1162           k = j;
1163         } else {
1164           // Add |partitions[j]| to |partitions[k]| and discard |partitions[j]|
1165           partitions[static_cast<size_t>(k)].insert(current_partition.begin(),
1166                                                     current_partition.end());
1167           current_partition.clear();
1168         }
1169       }
1170     }
1171   }
1172 
1173   // Remove empty (discarded) partitions
1174   partitions.erase(
1175       std::remove_if(
1176           partitions.begin(), partitions.end(),
1177           [](const std::set<std::pair<Instruction*, Instruction*>>& partition) {
1178             return partition.empty();
1179           }),
1180       partitions.end());
1181 
1182   return partitions;
1183 }
1184 
IntersectConstraints(Constraint * constraint_0,Constraint * constraint_1,const SENode * lower_bound,const SENode * upper_bound)1185 Constraint* LoopDependenceAnalysis::IntersectConstraints(
1186     Constraint* constraint_0, Constraint* constraint_1,
1187     const SENode* lower_bound, const SENode* upper_bound) {
1188   if (constraint_0->AsDependenceNone()) {
1189     return constraint_1;
1190   } else if (constraint_1->AsDependenceNone()) {
1191     return constraint_0;
1192   }
1193 
1194   // Both constraints are distances. Either the same distance or independent.
1195   if (constraint_0->AsDependenceDistance() &&
1196       constraint_1->AsDependenceDistance()) {
1197     auto dist_0 = constraint_0->AsDependenceDistance();
1198     auto dist_1 = constraint_1->AsDependenceDistance();
1199 
1200     if (*dist_0->GetDistance() == *dist_1->GetDistance()) {
1201       return constraint_0;
1202     } else {
1203       return make_constraint<DependenceEmpty>();
1204     }
1205   }
1206 
1207   // Both constraints are points. Either the same point or independent.
1208   if (constraint_0->AsDependencePoint() && constraint_1->AsDependencePoint()) {
1209     auto point_0 = constraint_0->AsDependencePoint();
1210     auto point_1 = constraint_1->AsDependencePoint();
1211 
1212     if (*point_0->GetSource() == *point_1->GetSource() &&
1213         *point_0->GetDestination() == *point_1->GetDestination()) {
1214       return constraint_0;
1215     } else {
1216       return make_constraint<DependenceEmpty>();
1217     }
1218   }
1219 
1220   // Both constraints are lines/distances.
1221   if ((constraint_0->AsDependenceDistance() ||
1222        constraint_0->AsDependenceLine()) &&
1223       (constraint_1->AsDependenceDistance() ||
1224        constraint_1->AsDependenceLine())) {
1225     auto is_distance_0 = constraint_0->AsDependenceDistance() != nullptr;
1226     auto is_distance_1 = constraint_1->AsDependenceDistance() != nullptr;
1227 
1228     auto a0 = is_distance_0 ? scalar_evolution_.CreateConstant(1)
1229                             : constraint_0->AsDependenceLine()->GetA();
1230     auto b0 = is_distance_0 ? scalar_evolution_.CreateConstant(-1)
1231                             : constraint_0->AsDependenceLine()->GetB();
1232     auto c0 =
1233         is_distance_0
1234             ? scalar_evolution_.SimplifyExpression(
1235                   scalar_evolution_.CreateNegation(
1236                       constraint_0->AsDependenceDistance()->GetDistance()))
1237             : constraint_0->AsDependenceLine()->GetC();
1238 
1239     auto a1 = is_distance_1 ? scalar_evolution_.CreateConstant(1)
1240                             : constraint_1->AsDependenceLine()->GetA();
1241     auto b1 = is_distance_1 ? scalar_evolution_.CreateConstant(-1)
1242                             : constraint_1->AsDependenceLine()->GetB();
1243     auto c1 =
1244         is_distance_1
1245             ? scalar_evolution_.SimplifyExpression(
1246                   scalar_evolution_.CreateNegation(
1247                       constraint_1->AsDependenceDistance()->GetDistance()))
1248             : constraint_1->AsDependenceLine()->GetC();
1249 
1250     if (a0->AsSEConstantNode() && b0->AsSEConstantNode() &&
1251         c0->AsSEConstantNode() && a1->AsSEConstantNode() &&
1252         b1->AsSEConstantNode() && c1->AsSEConstantNode()) {
1253       auto constant_a0 = a0->AsSEConstantNode()->FoldToSingleValue();
1254       auto constant_b0 = b0->AsSEConstantNode()->FoldToSingleValue();
1255       auto constant_c0 = c0->AsSEConstantNode()->FoldToSingleValue();
1256 
1257       auto constant_a1 = a1->AsSEConstantNode()->FoldToSingleValue();
1258       auto constant_b1 = b1->AsSEConstantNode()->FoldToSingleValue();
1259       auto constant_c1 = c1->AsSEConstantNode()->FoldToSingleValue();
1260 
1261       // a & b can't both be zero, otherwise it wouldn't be line.
1262       if (NormalizeAndCompareFractions(constant_a0, constant_b0, constant_a1,
1263                                        constant_b1)) {
1264         // Slopes are equal, either parallel lines or the same line.
1265 
1266         if (constant_b0 == 0 && constant_b1 == 0) {
1267           if (NormalizeAndCompareFractions(constant_c0, constant_a0,
1268                                            constant_c1, constant_a1)) {
1269             return constraint_0;
1270           }
1271 
1272           return make_constraint<DependenceEmpty>();
1273         } else if (NormalizeAndCompareFractions(constant_c0, constant_b0,
1274                                                 constant_c1, constant_b1)) {
1275           // Same line.
1276           return constraint_0;
1277         } else {
1278           // Parallel lines can't intersect, report independence.
1279           return make_constraint<DependenceEmpty>();
1280         }
1281 
1282       } else {
1283         // Lines are not parallel, therefore, they must intersect.
1284 
1285         // Calculate intersection.
1286         if (upper_bound->AsSEConstantNode() &&
1287             lower_bound->AsSEConstantNode()) {
1288           auto constant_lower_bound =
1289               lower_bound->AsSEConstantNode()->FoldToSingleValue();
1290           auto constant_upper_bound =
1291               upper_bound->AsSEConstantNode()->FoldToSingleValue();
1292 
1293           auto up = constant_b1 * constant_c0 - constant_b0 * constant_c1;
1294           // Both b or both a can't be 0, so down is never 0
1295           // otherwise would have entered the parallel line section.
1296           auto down = constant_b1 * constant_a0 - constant_b0 * constant_a1;
1297 
1298           auto x_coord = up / down;
1299 
1300           int64_t y_coord = 0;
1301           int64_t arg1 = 0;
1302           int64_t const_b_to_use = 0;
1303 
1304           if (constant_b1 != 0) {
1305             arg1 = constant_c1 - constant_a1 * x_coord;
1306             y_coord = arg1 / constant_b1;
1307             const_b_to_use = constant_b1;
1308           } else if (constant_b0 != 0) {
1309             arg1 = constant_c0 - constant_a0 * x_coord;
1310             y_coord = arg1 / constant_b0;
1311             const_b_to_use = constant_b0;
1312           }
1313 
1314           if (up % down == 0 &&
1315               arg1 % const_b_to_use == 0 &&  // Coordinates are integers.
1316               constant_lower_bound <=
1317                   x_coord &&  // x_coord is within loop bounds.
1318               x_coord <= constant_upper_bound &&
1319               constant_lower_bound <=
1320                   y_coord &&  // y_coord is within loop bounds.
1321               y_coord <= constant_upper_bound) {
1322             // Lines intersect at integer coordinates.
1323             return make_constraint<DependencePoint>(
1324                 scalar_evolution_.CreateConstant(x_coord),
1325                 scalar_evolution_.CreateConstant(y_coord),
1326                 constraint_0->GetLoop());
1327 
1328           } else {
1329             return make_constraint<DependenceEmpty>();
1330           }
1331 
1332         } else {
1333           // Not constants, bail out.
1334           return make_constraint<DependenceNone>();
1335         }
1336       }
1337 
1338     } else {
1339       // Not constants, bail out.
1340       return make_constraint<DependenceNone>();
1341     }
1342   }
1343 
1344   // One constraint is a line/distance and the other is a point.
1345   if ((constraint_0->AsDependencePoint() &&
1346        (constraint_1->AsDependenceLine() ||
1347         constraint_1->AsDependenceDistance())) ||
1348       (constraint_1->AsDependencePoint() &&
1349        (constraint_0->AsDependenceLine() ||
1350         constraint_0->AsDependenceDistance()))) {
1351     auto point_0 = constraint_0->AsDependencePoint() != nullptr;
1352 
1353     auto point = point_0 ? constraint_0->AsDependencePoint()
1354                          : constraint_1->AsDependencePoint();
1355 
1356     auto line_or_distance = point_0 ? constraint_1 : constraint_0;
1357 
1358     auto is_distance = line_or_distance->AsDependenceDistance() != nullptr;
1359 
1360     auto a = is_distance ? scalar_evolution_.CreateConstant(1)
1361                          : line_or_distance->AsDependenceLine()->GetA();
1362     auto b = is_distance ? scalar_evolution_.CreateConstant(-1)
1363                          : line_or_distance->AsDependenceLine()->GetB();
1364     auto c =
1365         is_distance
1366             ? scalar_evolution_.SimplifyExpression(
1367                   scalar_evolution_.CreateNegation(
1368                       line_or_distance->AsDependenceDistance()->GetDistance()))
1369             : line_or_distance->AsDependenceLine()->GetC();
1370 
1371     auto x = point->GetSource();
1372     auto y = point->GetDestination();
1373 
1374     if (a->AsSEConstantNode() && b->AsSEConstantNode() &&
1375         c->AsSEConstantNode() && x->AsSEConstantNode() &&
1376         y->AsSEConstantNode()) {
1377       auto constant_a = a->AsSEConstantNode()->FoldToSingleValue();
1378       auto constant_b = b->AsSEConstantNode()->FoldToSingleValue();
1379       auto constant_c = c->AsSEConstantNode()->FoldToSingleValue();
1380 
1381       auto constant_x = x->AsSEConstantNode()->FoldToSingleValue();
1382       auto constant_y = y->AsSEConstantNode()->FoldToSingleValue();
1383 
1384       auto left_hand_side = constant_a * constant_x + constant_b * constant_y;
1385 
1386       if (left_hand_side == constant_c) {
1387         // Point is on line, return point
1388         return point_0 ? constraint_0 : constraint_1;
1389       } else {
1390         // Point not on line, report independence (empty constraint).
1391         return make_constraint<DependenceEmpty>();
1392       }
1393 
1394     } else {
1395       // Not constants, bail out.
1396       return make_constraint<DependenceNone>();
1397     }
1398   }
1399 
1400   return nullptr;
1401 }
1402 
1403 // Propagate constraints function as described in section 5 of Practical
1404 // Dependence Testing, Goff, Kennedy, Tseng, 1991.
PropagateConstraints(const SubscriptPair & subscript_pair,const std::vector<Constraint * > & constraints)1405 SubscriptPair LoopDependenceAnalysis::PropagateConstraints(
1406     const SubscriptPair& subscript_pair,
1407     const std::vector<Constraint*>& constraints) {
1408   SENode* new_first = subscript_pair.first;
1409   SENode* new_second = subscript_pair.second;
1410 
1411   for (auto& constraint : constraints) {
1412     // In the paper this is a[k]. We're extracting the coefficient ('a') of a
1413     // recurrent expression with respect to the loop 'k'.
1414     SENode* coefficient_of_recurrent =
1415         scalar_evolution_.GetCoefficientFromRecurrentTerm(
1416             new_first, constraint->GetLoop());
1417 
1418     // In the paper this is a'[k].
1419     SENode* coefficient_of_recurrent_prime =
1420         scalar_evolution_.GetCoefficientFromRecurrentTerm(
1421             new_second, constraint->GetLoop());
1422 
1423     if (constraint->GetType() == Constraint::Distance) {
1424       DependenceDistance* as_distance = constraint->AsDependenceDistance();
1425 
1426       // In the paper this is a[k]*d
1427       SENode* rhs = scalar_evolution_.CreateMultiplyNode(
1428           coefficient_of_recurrent, as_distance->GetDistance());
1429 
1430       // In the paper this is a[k] <- 0
1431       SENode* zeroed_coefficient =
1432           scalar_evolution_.BuildGraphWithoutRecurrentTerm(
1433               new_first, constraint->GetLoop());
1434 
1435       // In the paper this is e <- e - a[k]*d.
1436       new_first = scalar_evolution_.CreateSubtraction(zeroed_coefficient, rhs);
1437       new_first = scalar_evolution_.SimplifyExpression(new_first);
1438 
1439       // In the paper this is a'[k] - a[k].
1440       SENode* new_child = scalar_evolution_.SimplifyExpression(
1441           scalar_evolution_.CreateSubtraction(coefficient_of_recurrent_prime,
1442                                               coefficient_of_recurrent));
1443 
1444       // In the paper this is a'[k]'i[k].
1445       SERecurrentNode* prime_recurrent =
1446           scalar_evolution_.GetRecurrentTerm(new_second, constraint->GetLoop());
1447 
1448       if (!prime_recurrent) continue;
1449 
1450       // As we hash the nodes we need to create a new node when we update a
1451       // child.
1452       SENode* new_recurrent = scalar_evolution_.CreateRecurrentExpression(
1453           constraint->GetLoop(), prime_recurrent->GetOffset(), new_child);
1454       // In the paper this is a'[k] <- a'[k] - a[k].
1455       new_second = scalar_evolution_.UpdateChildNode(
1456           new_second, prime_recurrent, new_recurrent);
1457     }
1458   }
1459 
1460   new_second = scalar_evolution_.SimplifyExpression(new_second);
1461   return std::make_pair(new_first, new_second);
1462 }
1463 
DeltaTest(const std::vector<SubscriptPair> & coupled_subscripts,DistanceVector * dv_entry)1464 bool LoopDependenceAnalysis::DeltaTest(
1465     const std::vector<SubscriptPair>& coupled_subscripts,
1466     DistanceVector* dv_entry) {
1467   std::vector<Constraint*> constraints(loops_.size());
1468 
1469   std::vector<bool> loop_appeared(loops_.size());
1470 
1471   std::generate(std::begin(constraints), std::end(constraints),
1472                 [this]() { return make_constraint<DependenceNone>(); });
1473 
1474   // Separate SIV and MIV subscripts
1475   std::vector<SubscriptPair> siv_subscripts{};
1476   std::vector<SubscriptPair> miv_subscripts{};
1477 
1478   for (const auto& subscript_pair : coupled_subscripts) {
1479     if (IsSIV(subscript_pair)) {
1480       siv_subscripts.push_back(subscript_pair);
1481     } else {
1482       miv_subscripts.push_back(subscript_pair);
1483     }
1484   }
1485 
1486   // Delta Test
1487   while (!siv_subscripts.empty()) {
1488     std::vector<bool> results(siv_subscripts.size());
1489 
1490     std::vector<DistanceVector> current_distances(
1491         siv_subscripts.size(), DistanceVector(loops_.size()));
1492 
1493     // Apply SIV test to all SIV subscripts, report independence if any of them
1494     // is independent
1495     std::transform(
1496         std::begin(siv_subscripts), std::end(siv_subscripts),
1497         std::begin(current_distances), std::begin(results),
1498         [this](SubscriptPair& p, DistanceVector& d) { return SIVTest(p, &d); });
1499 
1500     if (std::accumulate(std::begin(results), std::end(results), false,
1501                         std::logical_or<bool>{})) {
1502       return true;
1503     }
1504 
1505     // Derive new constraint vector.
1506     std::vector<std::pair<Constraint*, size_t>> all_new_constrants{};
1507 
1508     for (size_t i = 0; i < siv_subscripts.size(); ++i) {
1509       auto loop = GetLoopForSubscriptPair(siv_subscripts[i]);
1510 
1511       auto loop_id =
1512           std::distance(std::begin(loops_),
1513                         std::find(std::begin(loops_), std::end(loops_), loop));
1514 
1515       loop_appeared[loop_id] = true;
1516       auto distance_entry = current_distances[i].GetEntries()[loop_id];
1517 
1518       if (distance_entry.dependence_information ==
1519           DistanceEntry::DependenceInformation::DISTANCE) {
1520         // Construct a DependenceDistance.
1521         auto node = scalar_evolution_.CreateConstant(distance_entry.distance);
1522 
1523         all_new_constrants.push_back(
1524             {make_constraint<DependenceDistance>(node, loop), loop_id});
1525       } else {
1526         // Construct a DependenceLine.
1527         const auto& subscript_pair = siv_subscripts[i];
1528         SENode* source_node = std::get<0>(subscript_pair);
1529         SENode* destination_node = std::get<1>(subscript_pair);
1530 
1531         int64_t source_induction_count = CountInductionVariables(source_node);
1532         int64_t destination_induction_count =
1533             CountInductionVariables(destination_node);
1534 
1535         SENode* a = nullptr;
1536         SENode* b = nullptr;
1537         SENode* c = nullptr;
1538 
1539         if (destination_induction_count != 0) {
1540           a = destination_node->AsSERecurrentNode()->GetCoefficient();
1541           c = scalar_evolution_.CreateNegation(
1542               destination_node->AsSERecurrentNode()->GetOffset());
1543         } else {
1544           a = scalar_evolution_.CreateConstant(0);
1545           c = scalar_evolution_.CreateNegation(destination_node);
1546         }
1547 
1548         if (source_induction_count != 0) {
1549           b = scalar_evolution_.CreateNegation(
1550               source_node->AsSERecurrentNode()->GetCoefficient());
1551           c = scalar_evolution_.CreateAddNode(
1552               c, source_node->AsSERecurrentNode()->GetOffset());
1553         } else {
1554           b = scalar_evolution_.CreateConstant(0);
1555           c = scalar_evolution_.CreateAddNode(c, source_node);
1556         }
1557 
1558         a = scalar_evolution_.SimplifyExpression(a);
1559         b = scalar_evolution_.SimplifyExpression(b);
1560         c = scalar_evolution_.SimplifyExpression(c);
1561 
1562         all_new_constrants.push_back(
1563             {make_constraint<DependenceLine>(a, b, c, loop), loop_id});
1564       }
1565     }
1566 
1567     // Calculate the intersection between the new and existing constraints.
1568     std::vector<Constraint*> intersection = constraints;
1569     for (const auto& constraint_to_intersect : all_new_constrants) {
1570       auto loop_id = std::get<1>(constraint_to_intersect);
1571       auto loop = loops_[loop_id];
1572       intersection[loop_id] = IntersectConstraints(
1573           intersection[loop_id], std::get<0>(constraint_to_intersect),
1574           GetLowerBound(loop), GetUpperBound(loop));
1575     }
1576 
1577     // Report independence if an empty constraint (DependenceEmpty) is found.
1578     auto first_empty =
1579         std::find_if(std::begin(intersection), std::end(intersection),
1580                      [](Constraint* constraint) {
1581                        return constraint->AsDependenceEmpty() != nullptr;
1582                      });
1583     if (first_empty != std::end(intersection)) {
1584       return true;
1585     }
1586     std::vector<SubscriptPair> new_siv_subscripts{};
1587     std::vector<SubscriptPair> new_miv_subscripts{};
1588 
1589     auto equal =
1590         std::equal(std::begin(constraints), std::end(constraints),
1591                    std::begin(intersection),
1592                    [](Constraint* a, Constraint* b) { return *a == *b; });
1593 
1594     // If any constraints have changed, propagate them into the rest of the
1595     // subscripts possibly creating new ZIV/SIV subscripts.
1596     if (!equal) {
1597       std::vector<SubscriptPair> new_subscripts(miv_subscripts.size());
1598 
1599       // Propagate constraints into MIV subscripts
1600       std::transform(std::begin(miv_subscripts), std::end(miv_subscripts),
1601                      std::begin(new_subscripts),
1602                      [this, &intersection](SubscriptPair& subscript_pair) {
1603                        return PropagateConstraints(subscript_pair,
1604                                                    intersection);
1605                      });
1606 
1607       // If a ZIV subscript is returned, apply test, otherwise, update untested
1608       // subscripts.
1609       for (auto& subscript : new_subscripts) {
1610         if (IsZIV(subscript) && ZIVTest(subscript)) {
1611           return true;
1612         } else if (IsSIV(subscript)) {
1613           new_siv_subscripts.push_back(subscript);
1614         } else {
1615           new_miv_subscripts.push_back(subscript);
1616         }
1617       }
1618     }
1619 
1620     // Set new constraints and subscripts to test.
1621     std::swap(siv_subscripts, new_siv_subscripts);
1622     std::swap(miv_subscripts, new_miv_subscripts);
1623     std::swap(constraints, intersection);
1624   }
1625 
1626   // Create the dependence vector from the constraints.
1627   for (size_t i = 0; i < loops_.size(); ++i) {
1628     // Don't touch entries for loops that weren't tested.
1629     if (loop_appeared[i]) {
1630       auto current_constraint = constraints[i];
1631       auto& current_distance_entry = (*dv_entry).GetEntries()[i];
1632 
1633       if (auto dependence_distance =
1634               current_constraint->AsDependenceDistance()) {
1635         if (auto constant_node =
1636                 dependence_distance->GetDistance()->AsSEConstantNode()) {
1637           current_distance_entry.dependence_information =
1638               DistanceEntry::DependenceInformation::DISTANCE;
1639 
1640           current_distance_entry.distance = constant_node->FoldToSingleValue();
1641           if (current_distance_entry.distance == 0) {
1642             current_distance_entry.direction = DistanceEntry::Directions::EQ;
1643           } else if (current_distance_entry.distance < 0) {
1644             current_distance_entry.direction = DistanceEntry::Directions::GT;
1645           } else {
1646             current_distance_entry.direction = DistanceEntry::Directions::LT;
1647           }
1648         }
1649       } else if (auto dependence_point =
1650                      current_constraint->AsDependencePoint()) {
1651         auto source = dependence_point->GetSource();
1652         auto destination = dependence_point->GetDestination();
1653 
1654         if (source->AsSEConstantNode() && destination->AsSEConstantNode()) {
1655           current_distance_entry = DistanceEntry(
1656               source->AsSEConstantNode()->FoldToSingleValue(),
1657               destination->AsSEConstantNode()->FoldToSingleValue());
1658         }
1659       }
1660     }
1661   }
1662 
1663   // Test any remaining MIV subscripts and report independence if found.
1664   std::vector<bool> results(miv_subscripts.size());
1665 
1666   std::transform(std::begin(miv_subscripts), std::end(miv_subscripts),
1667                  std::begin(results),
1668                  [this](const SubscriptPair& p) { return GCDMIVTest(p); });
1669 
1670   return std::accumulate(std::begin(results), std::end(results), false,
1671                          std::logical_or<bool>{});
1672 }
1673 
1674 }  // namespace opt
1675 }  // namespace spvtools
1676