1
0
mirror of https://github.com/danog/psalm.git synced 2025-01-10 15:09:04 +01:00
psalm/src/Psalm/Internal/Algebra.php

675 lines
23 KiB
PHP
Raw Normal View History

2018-05-07 07:26:06 +02:00
<?php
2020-11-03 22:15:44 +01:00
namespace Psalm\Internal;
2018-05-07 07:26:06 +02:00
2021-06-08 04:55:21 +02:00
use Psalm\Exception\ComplicatedExpressionException;
use Psalm\Storage\Assertion;
use Psalm\Storage\Assertion\Falsy;
2021-12-03 21:40:18 +01:00
use UnexpectedValueException;
2021-06-08 04:55:21 +02:00
2019-07-05 22:24:00 +02:00
use function array_filter;
use function array_intersect_key;
2019-07-05 22:24:00 +02:00
use function array_keys;
use function array_map;
use function array_merge;
use function array_pop;
use function array_values;
use function count;
use function in_array;
2021-12-03 21:07:25 +01:00
use function mt_rand;
2022-03-13 04:33:58 +01:00
use function reset;
2018-05-07 07:26:06 +02:00
2022-01-03 07:55:32 +01:00
/**
* @internal
*/
2018-05-07 07:26:06 +02:00
class Algebra
{
/**
* @param array<string, non-empty-list<non-empty-list<Assertion>>> $all_types
2018-05-07 07:26:06 +02:00
*
* @return array<string, non-empty-list<non-empty-list<Assertion>>>
2020-08-23 19:52:31 +02:00
*
* @psalm-pure
2018-05-07 07:26:06 +02:00
*/
public static function negateTypes(array $all_types): array
2018-05-07 07:26:06 +02:00
{
return array_filter(
array_map(
/**
* @param non-empty-list<non-empty-list<Assertion>> $anded_types
*
* @return list<non-empty-list<Assertion>>
*/
function (array $anded_types): array {
if (count($anded_types) > 1) {
$new_anded_types = [];
foreach ($anded_types as $orred_types) {
if (count($orred_types) > 1) {
return [];
}
$new_anded_types[] = $orred_types[0]->getNegation();
}
return [$new_anded_types];
}
$new_orred_types = [];
foreach ($anded_types[0] as $orred_type) {
$new_orred_types[] = [$orred_type->getNegation()];
}
return $new_orred_types;
},
$all_types
)
2018-05-07 07:26:06 +02:00
);
}
/**
* This is a very simple simplification heuristic
* for CNF formulae.
*
* It simplifies formulae:
* ($a) && ($a || $b) => $a
* (!$a) && (!$b) && ($a || $b || $c) => $c
*
2020-10-17 18:36:44 +02:00
* @param list<Clause> $clauses
2018-05-07 07:26:06 +02:00
*
2019-10-09 00:44:46 +02:00
* @return list<Clause>
*
* @psalm-pure
2018-05-07 07:26:06 +02:00
*/
public static function simplifyCNF(array $clauses): array
2018-05-07 07:26:06 +02:00
{
$clause_count = count($clauses);
//65536 seems to be a significant threshold, when put at 65537, the code https://psalm.dev/r/216f362ea6 goes
//from seconds in analysis to many minutes
if ($clause_count > 65_536) {
return [];
}
if ($clause_count > 50) {
$all_has_unknown = true;
foreach ($clauses as $clause) {
$clause_has_unknown = false;
foreach ($clause->possibilities as $key => $_) {
if ($key[0] === '*') {
$clause_has_unknown = true;
break;
}
}
if (!$clause_has_unknown) {
$all_has_unknown = false;
break;
}
}
if ($all_has_unknown) {
return $clauses;
}
}
2018-05-07 07:26:06 +02:00
$cloned_clauses = [];
// avoid strict duplicates
foreach ($clauses as $clause) {
$cloned_clauses[$clause->hash] = $clause;
2018-05-07 07:26:06 +02:00
}
// remove impossible types
2020-10-24 18:23:59 +02:00
foreach ($cloned_clauses as $clause_a_hash => $clause_a) {
if (!$clause_a->reconcilable || $clause_a->wedge) {
2018-05-07 07:26:06 +02:00
continue;
}
if (count($clause_a->possibilities) !== 1 || count(array_values($clause_a->possibilities)[0]) !== 1) {
2020-10-24 18:23:59 +02:00
foreach ($cloned_clauses as $clause_b) {
if ($clause_a === $clause_b || !$clause_b->reconcilable || $clause_b->wedge) {
continue;
}
if (array_keys($clause_a->possibilities) === array_keys($clause_b->possibilities)) {
$opposing_keys = [];
foreach ($clause_a->possibilities as $key => $a_possibilities) {
$b_possibilities = $clause_b->possibilities[$key];
2022-03-13 04:33:58 +01:00
if (array_keys($clause_a->possibilities[$key])
=== array_keys($clause_b->possibilities[$key])
) {
continue;
}
if (count($a_possibilities) === 1 && count($b_possibilities) === 1) {
if (reset($a_possibilities)->isNegationOf(reset($b_possibilities))) {
$opposing_keys[] = $key;
continue;
}
}
continue 2;
}
if (count($opposing_keys) === 1) {
2020-10-24 18:23:59 +02:00
unset($cloned_clauses[$clause_a_hash]);
$clause_a = $clause_a->removePossibilities($opposing_keys[0]);
2020-10-24 17:37:08 +02:00
2020-10-24 18:23:59 +02:00
if (!$clause_a) {
continue 2;
2020-10-24 17:37:08 +02:00
}
2020-10-24 18:23:59 +02:00
$cloned_clauses[$clause_a->hash] = $clause_a;
}
}
}
2018-05-07 07:26:06 +02:00
continue;
}
$clause_var = array_keys($clause_a->possibilities)[0];
$only_type = array_pop(array_values($clause_a->possibilities)[0]);
$negated_clause_type = $only_type->getNegation();
$negated_clause_type_string = (string)$negated_clause_type;
2018-05-07 07:26:06 +02:00
2020-10-24 18:23:59 +02:00
foreach ($cloned_clauses as $clause_b_hash => $clause_b) {
2018-05-07 07:26:06 +02:00
if ($clause_a === $clause_b || !$clause_b->reconcilable || $clause_b->wedge) {
continue;
}
if (isset($clause_b->possibilities[$clause_var])) {
$unmatched = [];
$matched = [];
foreach ($clause_b->possibilities[$clause_var] as $k => $possible_type) {
if ((string)$possible_type === $negated_clause_type_string) {
$matched[] = $possible_type;
} else {
$unmatched[$k] = $possible_type;
}
}
2018-05-07 07:26:06 +02:00
if ($matched) {
$clause_var_possibilities = $unmatched;
2020-08-26 22:41:40 +02:00
unset($cloned_clauses[$clause_b_hash]);
if (!$clause_var_possibilities) {
$updated_clause = $clause_b->removePossibilities($clause_var);
if ($updated_clause) {
$cloned_clauses[$updated_clause->hash] = $updated_clause;
}
} else {
$updated_clause = $clause_b->addPossibilities(
$clause_var,
$clause_var_possibilities
);
2020-08-26 22:41:40 +02:00
$cloned_clauses[$updated_clause->hash] = $updated_clause;
}
2018-05-07 07:26:06 +02:00
}
}
}
}
$simplified_clauses = [];
2020-08-26 22:41:40 +02:00
foreach ($cloned_clauses as $clause_a) {
2018-05-07 07:26:06 +02:00
$is_redundant = false;
2020-08-26 22:41:40 +02:00
foreach ($cloned_clauses as $clause_b) {
2018-05-14 22:29:51 +02:00
if ($clause_a === $clause_b
|| !$clause_b->reconcilable
|| $clause_b->wedge
|| $clause_a->wedge
) {
2018-05-07 07:26:06 +02:00
continue;
}
if ($clause_a->contains($clause_b)) {
$is_redundant = true;
break;
}
}
if (!$is_redundant) {
$simplified_clauses[$clause_a->hash] = $clause_a;
2018-05-07 07:26:06 +02:00
}
}
$clause_count = count($simplified_clauses);
// simplify (A || X) && (!A || Y) && (X || Y)
// to
// simplify (A || X) && (!A || Y)
// where X and Y are sets of orred terms
if ($clause_count > 2 && $clause_count < 256) {
$clauses = array_values($simplified_clauses);
for ($i = 0; $i < $clause_count; $i++) {
$clause_a = $clauses[$i];
for ($k = $i + 1; $k < $clause_count; $k++) {
$clause_b = $clauses[$k];
$common_keys = array_keys(
array_intersect_key($clause_a->possibilities, $clause_b->possibilities)
);
if ($common_keys) {
$common_negated_keys = [];
foreach ($common_keys as $common_key) {
if (count($clause_a->possibilities[$common_key]) === 1
&& count($clause_b->possibilities[$common_key]) === 1
&& reset($clause_a->possibilities[$common_key])->isNegationOf(
reset($clause_b->possibilities[$common_key])
)
) {
$common_negated_keys[] = $common_key;
}
}
if ($common_negated_keys) {
$new_possibilities = [];
foreach ($clause_a->possibilities as $var_id => $possibilities) {
if (in_array($var_id, $common_negated_keys, true)) {
continue;
}
if (!isset($new_possibilities[$var_id])) {
$new_possibilities[$var_id] = $possibilities;
} else {
$new_possibilities[$var_id] = array_merge(
$new_possibilities[$var_id],
$possibilities,
);
}
}
foreach ($clause_b->possibilities as $var_id => $possibilities) {
if (in_array($var_id, $common_negated_keys, true)) {
continue;
}
if (!isset($new_possibilities[$var_id])) {
$new_possibilities[$var_id] = $possibilities;
} else {
$new_possibilities[$var_id] = array_merge(
$new_possibilities[$var_id],
$possibilities,
);
}
}
/** @psalm-suppress MixedArgumentTypeCoercion due I think to Psalm bug */
$conflict_clause = (new Clause(
$new_possibilities,
$clause_a->creating_conditional_id,
$clause_a->creating_conditional_id,
false,
true,
true,
[]
));
unset($simplified_clauses[$conflict_clause->hash]);
}
}
}
}
}
return array_values($simplified_clauses);
2018-05-07 07:26:06 +02:00
}
/**
* Look for clauses with only one possible value
*
2019-10-09 00:44:46 +02:00
* @param list<Clause> $clauses
* @param array<string, bool> $cond_referenced_var_ids
* @param array<string, array<int, array<int, Assertion>>> $active_truths
2018-05-07 07:26:06 +02:00
*
* @return array<string, list<list<Assertion>>>
2018-05-07 07:26:06 +02:00
*/
public static function getTruthsFromFormula(
array $clauses,
2020-08-26 21:35:29 +02:00
?int $creating_conditional_id = null,
array &$cond_referenced_var_ids = [],
array &$active_truths = []
): array {
2018-05-07 07:26:06 +02:00
$truths = [];
$active_truths = [];
2018-05-07 07:26:06 +02:00
if ($clauses === []) {
2018-05-07 07:26:06 +02:00
return [];
}
foreach ($clauses as $clause) {
2020-12-21 18:14:25 +01:00
if (!$clause->reconcilable || count($clause->possibilities) !== 1) {
2018-05-07 07:26:06 +02:00
continue;
}
foreach ($clause->possibilities as $var => $possible_types) {
2020-11-03 22:44:24 +01:00
if ($var[0] === '*') {
continue;
}
2018-05-07 07:26:06 +02:00
// if there's only one possible type, return it
2020-12-21 18:14:25 +01:00
if (count($possible_types) === 1) {
$possible_type = array_pop($possible_types);
if (isset($truths[$var]) && !isset($clause->redefined_vars[$var])) {
$truths[$var][] = [$possible_type];
2018-05-07 07:26:06 +02:00
} else {
$truths[$var] = [[$possible_type]];
}
2020-08-26 21:35:29 +02:00
if ($creating_conditional_id && $creating_conditional_id === $clause->creating_conditional_id) {
if (!isset($active_truths[$var])) {
$active_truths[$var] = [];
}
$active_truths[$var][count($truths[$var]) - 1] = [$possible_type];
2018-05-07 07:26:06 +02:00
}
2020-12-21 18:14:25 +01:00
} else {
2018-05-07 07:26:06 +02:00
// if there's only one active clause, return all the non-negation clause members ORed together
$things_that_can_be_said = [];
2018-05-07 07:26:06 +02:00
foreach ($possible_types as $assertion) {
if ($assertion instanceof Falsy || !$assertion->isNegation()) {
$things_that_can_be_said[(string)$assertion] = $assertion;
}
}
2018-05-07 07:26:06 +02:00
if ($things_that_can_be_said && count($things_that_can_be_said) === count($possible_types)) {
if ($clause->generated && count($possible_types) > 1) {
unset($cond_referenced_var_ids[$var]);
}
$truths[$var] = [array_values($things_that_can_be_said)];
2020-08-26 21:35:29 +02:00
if ($creating_conditional_id && $creating_conditional_id === $clause->creating_conditional_id) {
$active_truths[$var] = [array_values($things_that_can_be_said)];
}
2018-05-07 07:26:06 +02:00
}
}
}
}
return $truths;
}
/**
2020-10-17 18:36:44 +02:00
* @param non-empty-list<Clause> $clauses
2018-05-07 07:26:06 +02:00
*
2020-10-17 18:36:44 +02:00
* @return list<Clause>
*
* @psalm-pure
2018-05-07 07:26:06 +02:00
*/
public static function groupImpossibilities(array $clauses): array
2018-05-07 07:26:06 +02:00
{
$complexity = 1;
$seed_clauses = [];
2018-05-07 07:26:06 +02:00
$clause = array_pop($clauses);
2018-05-07 07:26:06 +02:00
if (!$clause->wedge) {
if ($clause->impossibilities === null) {
2021-12-03 21:40:18 +01:00
throw new UnexpectedValueException('$clause->impossibilities should not be null');
}
foreach ($clause->impossibilities as $var => $impossible_types) {
foreach ($impossible_types as $impossible_type) {
$seed_clause = new Clause(
[$var => [(string)$impossible_type => $impossible_type]],
2020-08-26 21:35:29 +02:00
$clause->creating_conditional_id,
$clause->creating_object_id
);
2018-05-07 07:26:06 +02:00
$seed_clauses[] = $seed_clause;
2018-05-07 07:26:06 +02:00
++$complexity;
}
2018-05-07 07:26:06 +02:00
}
}
if (!$clauses || !$seed_clauses) {
return $seed_clauses;
}
while ($clauses) {
$clause = array_pop($clauses);
$new_clauses = [];
2018-05-07 07:26:06 +02:00
foreach ($seed_clauses as $grouped_clause) {
2018-05-07 07:26:06 +02:00
if ($clause->impossibilities === null) {
2021-12-03 21:40:18 +01:00
throw new UnexpectedValueException('$clause->impossibilities should not be null');
2018-05-07 07:26:06 +02:00
}
foreach ($clause->impossibilities as $var => $impossible_types) {
foreach ($impossible_types as $impossible_type) {
$new_clause_possibilities = $grouped_clause->possibilities;
if (isset($new_clause_possibilities[$var])) {
$impossible_type_string = (string)$impossible_type;
$new_clause_possibilities[$var][$impossible_type_string] = $impossible_type;
foreach ($new_clause_possibilities[$var] as $ak => $av) {
foreach ($new_clause_possibilities[$var] as $bk => $bv) {
if ($ak == $bk) {
break;
}
if ($ak !== $impossible_type_string && $bk !== $impossible_type_string) {
continue;
}
if ($av->isNegationOf($bv)) {
break 3;
}
}
}
2018-05-07 07:26:06 +02:00
} else {
$new_clause_possibilities[$var] = [(string)$impossible_type => $impossible_type];
2018-05-07 07:26:06 +02:00
}
$new_clause = new Clause(
$new_clause_possibilities,
$grouped_clause->creating_conditional_id,
2020-08-26 21:35:29 +02:00
$clause->creating_object_id,
false,
true,
true,
2020-08-26 21:35:29 +02:00
[]
);
2018-05-07 07:26:06 +02:00
$new_clauses[] = $new_clause;
++$complexity;
if ($complexity > 20_000) {
throw new ComplicatedExpressionException();
}
2018-05-07 07:26:06 +02:00
}
}
}
$seed_clauses = $new_clauses;
2018-05-07 07:26:06 +02:00
}
return $seed_clauses;
2018-05-07 07:26:06 +02:00
}
/**
2020-10-16 17:17:52 +02:00
* @param list<Clause> $left_clauses
* @param list<Clause> $right_clauses
2018-05-07 07:26:06 +02:00
*
2020-10-16 17:17:52 +02:00
* @return list<Clause>
*
* @psalm-pure
2018-05-07 07:26:06 +02:00
*/
public static function combineOredClauses(
array $left_clauses,
array $right_clauses,
int $conditional_object_id
): array {
if (count($left_clauses) > 60_000 || count($right_clauses) > 60_000) {
return [];
}
2018-05-07 07:26:06 +02:00
$clauses = [];
$all_wedges = true;
2018-05-14 22:29:51 +02:00
$has_wedge = false;
2018-05-07 07:26:06 +02:00
foreach ($left_clauses as $left_clause) {
foreach ($right_clauses as $right_clause) {
2018-05-14 22:29:51 +02:00
$all_wedges = $all_wedges && ($left_clause->wedge && $right_clause->wedge);
$has_wedge = $has_wedge || ($left_clause->wedge && $right_clause->wedge);
}
}
if ($all_wedges) {
2020-08-26 21:35:29 +02:00
return [new Clause([], $conditional_object_id, $conditional_object_id, true)];
2018-05-14 22:29:51 +02:00
}
foreach ($left_clauses as $left_clause) {
foreach ($right_clauses as $right_clause) {
if ($left_clause->wedge && $right_clause->wedge) {
// handled below
continue;
}
/** @var array<string, non-empty-array<string, Assertion>> */
2018-05-07 07:26:06 +02:00
$possibilities = [];
$can_reconcile = true;
if ($left_clause->wedge ||
$right_clause->wedge ||
!$left_clause->reconcilable ||
!$right_clause->reconcilable
) {
$can_reconcile = false;
}
foreach ($left_clause->possibilities as $var => $possible_types) {
if (isset($right_clause->redefined_vars[$var])) {
continue;
}
2018-05-07 07:26:06 +02:00
if (isset($possibilities[$var])) {
$possibilities[$var] = array_merge($possibilities[$var], $possible_types);
} else {
$possibilities[$var] = $possible_types;
}
}
foreach ($right_clause->possibilities as $var => $possible_types) {
if (isset($possibilities[$var])) {
$possibilities[$var] = array_merge($possibilities[$var], $possible_types);
} else {
$possibilities[$var] = $possible_types;
}
}
foreach ($possibilities as $var_possibilities) {
if (count($var_possibilities) === 2) {
$vals = array_values($var_possibilities);
/** @psalm-suppress PossiblyUndefinedIntArrayOffset */
if ($vals[0]->isNegationOf($vals[1])) {
continue 2;
}
}
}
2020-08-26 22:27:35 +02:00
$creating_conditional_id =
$right_clause->creating_conditional_id === $left_clause->creating_conditional_id
2020-08-26 21:35:29 +02:00
? $right_clause->creating_conditional_id
: $conditional_object_id;
2018-05-07 20:52:45 +02:00
$clauses[] = new Clause(
$possibilities,
2020-08-26 21:35:29 +02:00
$creating_conditional_id,
$creating_conditional_id,
2018-05-07 20:52:45 +02:00
false,
$can_reconcile,
$right_clause->generated
|| $left_clause->generated
|| count($left_clauses) > 1
|| count($right_clauses) > 1,
2020-08-26 21:35:29 +02:00
[]
2018-05-07 20:52:45 +02:00
);
2018-05-07 07:26:06 +02:00
}
}
2018-05-14 22:29:51 +02:00
if ($has_wedge) {
2020-08-26 21:35:29 +02:00
$clauses[] = new Clause([], $conditional_object_id, $conditional_object_id, true);
2018-05-07 07:26:06 +02:00
}
return $clauses;
}
/**
* Negates a set of clauses
* negateClauses([$a || $b]) => !$a && !$b
* negateClauses([$a, $b]) => !$a || !$b
* negateClauses([$a, $b || $c]) =>
* (!$a || !$b) &&
* (!$a || !$c)
* negateClauses([$a, $b || $c, $d || $e || $f]) =>
* (!$a || !$b || !$d) &&
* (!$a || !$b || !$e) &&
* (!$a || !$b || !$f) &&
* (!$a || !$c || !$d) &&
* (!$a || !$c || !$e) &&
* (!$a || !$c || !$f)
*
2020-10-17 18:36:44 +02:00
* @param list<Clause> $clauses
2018-05-07 07:26:06 +02:00
*
* @return non-empty-list<Clause>
2018-05-07 07:26:06 +02:00
*/
public static function negateFormula(array $clauses): array
2018-05-07 07:26:06 +02:00
{
2020-11-03 22:44:24 +01:00
$clauses = array_filter(
$clauses,
2022-01-05 23:45:11 +01:00
fn($clause) => $clause->reconcilable
2020-11-03 22:44:24 +01:00
);
if (!$clauses) {
$cond_id = mt_rand(0, 100_000_000);
2020-08-26 21:35:29 +02:00
return [new Clause([], $cond_id, $cond_id, true)];
}
$clauses_with_impossibilities = [];
2018-05-07 07:26:06 +02:00
foreach ($clauses as $clause) {
$clauses_with_impossibilities[] = $clause->calculateNegation();
2018-05-07 07:26:06 +02:00
}
unset($clauses);
$impossible_clauses = self::groupImpossibilities($clauses_with_impossibilities);
if (!$impossible_clauses) {
$cond_id = mt_rand(0, 100_000_000);
2020-08-26 21:35:29 +02:00
return [new Clause([], $cond_id, $cond_id, true)];
}
$negated = self::simplifyCNF($impossible_clauses);
2019-07-05 22:24:00 +02:00
if (!$negated) {
$cond_id = mt_rand(0, 100_000_000);
2020-08-26 21:35:29 +02:00
return [new Clause([], $cond_id, $cond_id, true)];
}
return $negated;
2018-05-07 07:26:06 +02:00
}
}