1
0
mirror of https://github.com/danog/psalm.git synced 2025-01-10 15:09:04 +01:00
psalm/src/Psalm/Internal/Algebra.php

633 lines
21 KiB
PHP
Raw Normal View History

2018-05-07 07:26:06 +02:00
<?php
2020-11-03 22:15:44 +01:00
namespace Psalm\Internal;
2018-05-07 07:26:06 +02:00
2021-06-08 04:55:21 +02:00
use Psalm\Exception\ComplicatedExpressionException;
2021-12-03 21:40:18 +01:00
use UnexpectedValueException;
2021-06-08 04:55:21 +02:00
2021-12-03 21:07:25 +01:00
use function array_diff_key;
2019-07-05 22:24:00 +02:00
use function array_filter;
use function array_keys;
use function array_map;
use function array_merge;
use function array_pop;
use function array_unique;
use function array_values;
use function count;
use function in_array;
2021-12-03 21:07:25 +01:00
use function mt_rand;
2019-07-05 22:24:00 +02:00
use function substr;
2018-05-07 07:26:06 +02:00
2022-01-03 07:55:32 +01:00
/**
* @internal
*/
2018-05-07 07:26:06 +02:00
class Algebra
{
/**
2020-08-23 19:52:31 +02:00
* @param array<string, non-empty-list<non-empty-list<string>>> $all_types
2018-05-07 07:26:06 +02:00
*
* @return array<string, non-empty-list<non-empty-list<string>>>
2020-08-23 19:52:31 +02:00
*
* @psalm-pure
2018-05-07 07:26:06 +02:00
*/
public static function negateTypes(array $all_types): array
2018-05-07 07:26:06 +02:00
{
return array_filter(
array_map(
/**
* @param non-empty-list<non-empty-list<string>> $anded_types
*
* @return list<non-empty-list<string>>
*/
function (array $anded_types): array {
if (count($anded_types) > 1) {
$new_anded_types = [];
foreach ($anded_types as $orred_types) {
if (count($orred_types) > 1) {
return [];
}
$new_anded_types[] = self::negateType($orred_types[0]);
}
return [$new_anded_types];
}
$new_orred_types = [];
foreach ($anded_types[0] as $orred_type) {
$new_orred_types[] = [self::negateType($orred_type)];
}
return $new_orred_types;
},
$all_types
)
2018-05-07 07:26:06 +02:00
);
}
/**
2020-08-23 19:52:31 +02:00
* @psalm-pure
2018-05-07 07:26:06 +02:00
*/
public static function negateType(string $type): string
2018-05-07 07:26:06 +02:00
{
if ($type === 'mixed') {
return $type;
}
return $type[0] === '!' ? substr($type, 1) : '!' . $type;
2018-05-07 07:26:06 +02:00
}
/**
* This is a very simple simplification heuristic
* for CNF formulae.
*
* It simplifies formulae:
* ($a) && ($a || $b) => $a
* (!$a) && (!$b) && ($a || $b || $c) => $c
*
2020-10-17 18:36:44 +02:00
* @param list<Clause> $clauses
2018-05-07 07:26:06 +02:00
*
2019-10-09 00:44:46 +02:00
* @return list<Clause>
*
* @psalm-pure
2018-05-07 07:26:06 +02:00
*/
public static function simplifyCNF(array $clauses): array
2018-05-07 07:26:06 +02:00
{
$clause_count = count($clauses);
//65536 seems to be a significant threshold, when put at 65537, the code https://psalm.dev/r/216f362ea6 goes
//from seconds in analysis to many minutes
if ($clause_count > 65_536) {
return [];
}
if ($clause_count > 50) {
$all_has_unknown = true;
foreach ($clauses as $clause) {
$clause_has_unknown = false;
foreach ($clause->possibilities as $key => $_) {
if ($key[0] === '*') {
$clause_has_unknown = true;
break;
}
}
if (!$clause_has_unknown) {
$all_has_unknown = false;
break;
}
}
if ($all_has_unknown) {
return $clauses;
}
}
2018-05-07 07:26:06 +02:00
$cloned_clauses = [];
// avoid strict duplicates
foreach ($clauses as $clause) {
$unique_clause = $clause->makeUnique();
$cloned_clauses[$unique_clause->hash] = $unique_clause;
2018-05-07 07:26:06 +02:00
}
// remove impossible types
2020-10-24 18:23:59 +02:00
foreach ($cloned_clauses as $clause_a_hash => $clause_a) {
if (!$clause_a->reconcilable || $clause_a->wedge) {
2018-05-07 07:26:06 +02:00
continue;
}
if (count($clause_a->possibilities) !== 1 || count(array_values($clause_a->possibilities)[0]) !== 1) {
2020-10-24 18:23:59 +02:00
foreach ($cloned_clauses as $clause_b) {
if ($clause_a === $clause_b || !$clause_b->reconcilable || $clause_b->wedge) {
continue;
}
if (array_keys($clause_a->possibilities) === array_keys($clause_b->possibilities)) {
$opposing_keys = [];
foreach ($clause_a->possibilities as $key => $a_possibilities) {
$b_possibilities = $clause_b->possibilities[$key];
if ($a_possibilities === $b_possibilities) {
continue;
}
if (count($a_possibilities) === 1 && count($b_possibilities) === 1) {
if ($a_possibilities[0] === '!' . $b_possibilities[0]
|| $b_possibilities[0] === '!' . $a_possibilities[0]
) {
$opposing_keys[] = $key;
continue;
}
}
continue 2;
}
if (count($opposing_keys) === 1) {
2020-10-24 18:23:59 +02:00
unset($cloned_clauses[$clause_a_hash]);
$clause_a = $clause_a->removePossibilities($opposing_keys[0]);
2020-10-24 17:37:08 +02:00
2020-10-24 18:23:59 +02:00
if (!$clause_a) {
continue 2;
2020-10-24 17:37:08 +02:00
}
2020-10-24 18:23:59 +02:00
$cloned_clauses[$clause_a->hash] = $clause_a;
}
}
}
2018-05-07 07:26:06 +02:00
continue;
}
$clause_var = array_keys($clause_a->possibilities)[0];
$only_type = array_pop(array_values($clause_a->possibilities)[0]);
$negated_clause_type = self::negateType($only_type);
2020-10-24 18:23:59 +02:00
foreach ($cloned_clauses as $clause_b_hash => $clause_b) {
2018-05-07 07:26:06 +02:00
if ($clause_a === $clause_b || !$clause_b->reconcilable || $clause_b->wedge) {
continue;
}
if (isset($clause_b->possibilities[$clause_var]) &&
in_array($negated_clause_type, $clause_b->possibilities[$clause_var], true)
) {
$clause_var_possibilities = array_values(
array_filter(
$clause_b->possibilities[$clause_var],
function (string $possible_type) use ($negated_clause_type): bool {
return $possible_type !== $negated_clause_type;
}
)
2018-05-07 07:26:06 +02:00
);
2020-10-24 18:23:59 +02:00
unset($cloned_clauses[$clause_b_hash]);
2020-08-26 22:41:40 +02:00
if (!$clause_var_possibilities) {
2020-08-26 22:41:40 +02:00
$updated_clause = $clause_b->removePossibilities($clause_var);
if ($updated_clause) {
$cloned_clauses[$updated_clause->hash] = $updated_clause;
}
} else {
2020-08-26 22:41:40 +02:00
$updated_clause = $clause_b->addPossibilities(
$clause_var,
$clause_var_possibilities
);
2020-08-26 22:41:40 +02:00
$cloned_clauses[$updated_clause->hash] = $updated_clause;
2018-05-07 07:26:06 +02:00
}
}
}
}
$simplified_clauses = [];
2020-08-26 22:41:40 +02:00
foreach ($cloned_clauses as $clause_a) {
2018-05-07 07:26:06 +02:00
$is_redundant = false;
2020-08-26 22:41:40 +02:00
foreach ($cloned_clauses as $clause_b) {
2018-05-14 22:29:51 +02:00
if ($clause_a === $clause_b
|| !$clause_b->reconcilable
|| $clause_b->wedge
|| $clause_a->wedge
) {
2018-05-07 07:26:06 +02:00
continue;
}
if ($clause_a->contains($clause_b)) {
$is_redundant = true;
break;
}
}
if (!$is_redundant) {
$simplified_clauses[] = $clause_a;
}
}
return $simplified_clauses;
}
/**
* Look for clauses with only one possible value
*
2019-10-09 00:44:46 +02:00
* @param list<Clause> $clauses
* @param array<string, bool> $cond_referenced_var_ids
* @param array<string, array<int, array<int, string>>> $active_truths
2018-05-07 07:26:06 +02:00
*
2020-10-17 18:36:44 +02:00
* @return array<string, list<array<int, string>>>
2018-05-07 07:26:06 +02:00
*/
public static function getTruthsFromFormula(
array $clauses,
2020-08-26 21:35:29 +02:00
?int $creating_conditional_id = null,
array &$cond_referenced_var_ids = [],
array &$active_truths = []
): array {
2018-05-07 07:26:06 +02:00
$truths = [];
$active_truths = [];
2018-05-07 07:26:06 +02:00
if ($clauses === []) {
2018-05-07 07:26:06 +02:00
return [];
}
foreach ($clauses as $clause) {
2020-12-21 18:14:25 +01:00
if (!$clause->reconcilable || count($clause->possibilities) !== 1) {
2018-05-07 07:26:06 +02:00
continue;
}
foreach ($clause->possibilities as $var => $possible_types) {
2020-11-03 22:44:24 +01:00
if ($var[0] === '*') {
continue;
}
2018-05-07 07:26:06 +02:00
// if there's only one possible type, return it
2020-12-21 18:14:25 +01:00
if (count($possible_types) === 1) {
$possible_type = array_pop($possible_types);
if (isset($truths[$var]) && !isset($clause->redefined_vars[$var])) {
$truths[$var][] = [$possible_type];
2018-05-07 07:26:06 +02:00
} else {
$truths[$var] = [[$possible_type]];
}
2020-08-26 21:35:29 +02:00
if ($creating_conditional_id && $creating_conditional_id === $clause->creating_conditional_id) {
if (!isset($active_truths[$var])) {
$active_truths[$var] = [];
}
$active_truths[$var][count($truths[$var]) - 1] = [$possible_type];
2018-05-07 07:26:06 +02:00
}
2020-12-21 18:14:25 +01:00
} else {
2018-05-07 07:26:06 +02:00
// if there's only one active clause, return all the non-negation clause members ORed together
$things_that_can_be_said = array_filter(
$possible_types,
function (string $possible_type): bool {
2018-05-07 07:26:06 +02:00
return $possible_type[0] !== '!';
}
);
if ($things_that_can_be_said && count($things_that_can_be_said) === count($possible_types)) {
$things_that_can_be_said = array_unique($things_that_can_be_said);
if ($clause->generated && count($possible_types) > 1) {
unset($cond_referenced_var_ids[$var]);
}
/** @var array<int, string> $things_that_can_be_said */
$truths[$var] = [$things_that_can_be_said];
2020-08-26 21:35:29 +02:00
if ($creating_conditional_id && $creating_conditional_id === $clause->creating_conditional_id) {
$active_truths[$var] = [$things_that_can_be_said];
}
2018-05-07 07:26:06 +02:00
}
}
}
}
return $truths;
}
/**
2020-10-17 18:36:44 +02:00
* @param non-empty-list<Clause> $clauses
2018-05-07 07:26:06 +02:00
*
2020-10-17 18:36:44 +02:00
* @return list<Clause>
*
* @psalm-pure
2018-05-07 07:26:06 +02:00
*/
public static function groupImpossibilities(array $clauses): array
2018-05-07 07:26:06 +02:00
{
$complexity = 1;
$seed_clauses = [];
2018-05-07 07:26:06 +02:00
$clause = array_pop($clauses);
2018-05-07 07:26:06 +02:00
if (!$clause->wedge) {
if ($clause->impossibilities === null) {
2021-12-03 21:40:18 +01:00
throw new UnexpectedValueException('$clause->impossibilities should not be null');
}
foreach ($clause->impossibilities as $var => $impossible_types) {
foreach ($impossible_types as $impossible_type) {
$seed_clause = new Clause(
[$var => [$impossible_type]],
2020-08-26 21:35:29 +02:00
$clause->creating_conditional_id,
$clause->creating_object_id
);
2018-05-07 07:26:06 +02:00
$seed_clauses[] = $seed_clause;
2018-05-07 07:26:06 +02:00
++$complexity;
}
2018-05-07 07:26:06 +02:00
}
}
if (!$clauses || !$seed_clauses) {
return $seed_clauses;
}
while ($clauses) {
$clause = array_pop($clauses);
$new_clauses = [];
2018-05-07 07:26:06 +02:00
foreach ($seed_clauses as $grouped_clause) {
2018-05-07 07:26:06 +02:00
if ($clause->impossibilities === null) {
2021-12-03 21:40:18 +01:00
throw new UnexpectedValueException('$clause->impossibilities should not be null');
2018-05-07 07:26:06 +02:00
}
foreach ($clause->impossibilities as $var => $impossible_types) {
foreach ($impossible_types as $impossible_type) {
$new_clause_possibilities = $grouped_clause->possibilities;
if (isset($grouped_clause->possibilities[$var])) {
$new_clause_possibilities[$var] = array_values(
array_unique(
array_merge([$impossible_type], $new_clause_possibilities[$var])
)
);
$removed_indexes = [];
for ($i = 0, $l = count($new_clause_possibilities[$var]); $i < $l; $i++) {
for ($j = $i + 1; $j < $l; $j++) {
$ith = $new_clause_possibilities[$var][$i];
$jth = $new_clause_possibilities[$var][$j];
if ($ith === '!' . $jth || $jth === '!' . $ith) {
$removed_indexes[$i] = true;
$removed_indexes[$j] = true;
}
}
}
if ($removed_indexes) {
2020-10-24 18:23:59 +02:00
$new_possibilities = array_values(
2021-12-03 21:07:25 +01:00
array_diff_key(
2020-10-24 18:23:59 +02:00
$new_clause_possibilities[$var],
$removed_indexes
)
);
2020-10-24 18:23:59 +02:00
if (!$new_possibilities) {
unset($new_clause_possibilities[$var]);
} else {
2020-10-24 18:23:59 +02:00
$new_clause_possibilities[$var] = $new_possibilities;
}
}
2018-05-07 07:26:06 +02:00
} else {
$new_clause_possibilities[$var] = [$impossible_type];
}
if (!$new_clause_possibilities) {
continue;
}
$new_clause = new Clause(
$new_clause_possibilities,
$grouped_clause->creating_conditional_id,
2020-08-26 21:35:29 +02:00
$clause->creating_object_id,
false,
true,
true,
2020-08-26 21:35:29 +02:00
[]
);
2018-05-07 07:26:06 +02:00
$new_clauses[] = $new_clause;
++$complexity;
if ($complexity > 20_000) {
throw new ComplicatedExpressionException();
}
2018-05-07 07:26:06 +02:00
}
}
}
$seed_clauses = $new_clauses;
2018-05-07 07:26:06 +02:00
}
return $seed_clauses;
2018-05-07 07:26:06 +02:00
}
/**
2020-10-16 17:17:52 +02:00
* @param list<Clause> $left_clauses
* @param list<Clause> $right_clauses
2018-05-07 07:26:06 +02:00
*
2020-10-16 17:17:52 +02:00
* @return list<Clause>
*
* @psalm-pure
2018-05-07 07:26:06 +02:00
*/
public static function combineOredClauses(
array $left_clauses,
array $right_clauses,
int $conditional_object_id
): array {
if (count($left_clauses) > 60_000 || count($right_clauses) > 60_000) {
return [];
}
2018-05-07 07:26:06 +02:00
$clauses = [];
$all_wedges = true;
2018-05-14 22:29:51 +02:00
$has_wedge = false;
2018-05-07 07:26:06 +02:00
foreach ($left_clauses as $left_clause) {
foreach ($right_clauses as $right_clause) {
2018-05-14 22:29:51 +02:00
$all_wedges = $all_wedges && ($left_clause->wedge && $right_clause->wedge);
$has_wedge = $has_wedge || ($left_clause->wedge && $right_clause->wedge);
}
}
if ($all_wedges) {
2020-08-26 21:35:29 +02:00
return [new Clause([], $conditional_object_id, $conditional_object_id, true)];
2018-05-14 22:29:51 +02:00
}
foreach ($left_clauses as $left_clause) {
foreach ($right_clauses as $right_clause) {
if ($left_clause->wedge && $right_clause->wedge) {
// handled below
continue;
}
/** @var array<string, non-empty-list<string>> */
2018-05-07 07:26:06 +02:00
$possibilities = [];
$can_reconcile = true;
if ($left_clause->wedge ||
$right_clause->wedge ||
!$left_clause->reconcilable ||
!$right_clause->reconcilable
) {
$can_reconcile = false;
}
foreach ($left_clause->possibilities as $var => $possible_types) {
if (isset($right_clause->redefined_vars[$var])) {
continue;
}
2018-05-07 07:26:06 +02:00
if (isset($possibilities[$var])) {
$possibilities[$var] = array_merge($possibilities[$var], $possible_types);
} else {
$possibilities[$var] = $possible_types;
}
}
foreach ($right_clause->possibilities as $var => $possible_types) {
if (isset($possibilities[$var])) {
$possibilities[$var] = array_merge($possibilities[$var], $possible_types);
} else {
$possibilities[$var] = $possible_types;
}
}
2018-05-07 20:52:45 +02:00
if (count($left_clauses) > 1 || count($right_clauses) > 1) {
foreach ($possibilities as $var => $p) {
$possibilities[$var] = array_values(array_unique($p));
2018-05-07 20:52:45 +02:00
}
}
foreach ($possibilities as $var_possibilities) {
if (count($var_possibilities) === 2) {
if ($var_possibilities[0] === '!' . $var_possibilities[1]
|| $var_possibilities[1] === '!' . $var_possibilities[0]
) {
continue 2;
}
}
}
2020-08-26 22:27:35 +02:00
$creating_conditional_id =
$right_clause->creating_conditional_id === $left_clause->creating_conditional_id
2020-08-26 21:35:29 +02:00
? $right_clause->creating_conditional_id
: $conditional_object_id;
2018-05-07 20:52:45 +02:00
$clauses[] = new Clause(
$possibilities,
2020-08-26 21:35:29 +02:00
$creating_conditional_id,
$creating_conditional_id,
2018-05-07 20:52:45 +02:00
false,
$can_reconcile,
$right_clause->generated
|| $left_clause->generated
|| count($left_clauses) > 1
|| count($right_clauses) > 1,
2020-08-26 21:35:29 +02:00
[]
2018-05-07 20:52:45 +02:00
);
2018-05-07 07:26:06 +02:00
}
}
2018-05-14 22:29:51 +02:00
if ($has_wedge) {
2020-08-26 21:35:29 +02:00
$clauses[] = new Clause([], $conditional_object_id, $conditional_object_id, true);
2018-05-07 07:26:06 +02:00
}
return $clauses;
}
/**
* Negates a set of clauses
* negateClauses([$a || $b]) => !$a && !$b
* negateClauses([$a, $b]) => !$a || !$b
* negateClauses([$a, $b || $c]) =>
* (!$a || !$b) &&
* (!$a || !$c)
* negateClauses([$a, $b || $c, $d || $e || $f]) =>
* (!$a || !$b || !$d) &&
* (!$a || !$b || !$e) &&
* (!$a || !$b || !$f) &&
* (!$a || !$c || !$d) &&
* (!$a || !$c || !$e) &&
* (!$a || !$c || !$f)
*
2020-10-17 18:36:44 +02:00
* @param list<Clause> $clauses
2018-05-07 07:26:06 +02:00
*
* @return non-empty-list<Clause>
2018-05-07 07:26:06 +02:00
*/
public static function negateFormula(array $clauses): array
2018-05-07 07:26:06 +02:00
{
2020-11-03 22:44:24 +01:00
$clauses = array_filter(
$clauses,
function ($clause) {
return $clause->reconcilable;
}
);
if (!$clauses) {
$cond_id = mt_rand(0, 100_000_000);
2020-08-26 21:35:29 +02:00
return [new Clause([], $cond_id, $cond_id, true)];
}
$clauses_with_impossibilities = [];
2018-05-07 07:26:06 +02:00
foreach ($clauses as $clause) {
$clauses_with_impossibilities[] = $clause->calculateNegation();
2018-05-07 07:26:06 +02:00
}
unset($clauses);
$impossible_clauses = self::groupImpossibilities($clauses_with_impossibilities);
if (!$impossible_clauses) {
$cond_id = mt_rand(0, 100_000_000);
2020-08-26 21:35:29 +02:00
return [new Clause([], $cond_id, $cond_id, true)];
}
$negated = self::simplifyCNF($impossible_clauses);
2019-07-05 22:24:00 +02:00
if (!$negated) {
$cond_id = mt_rand(0, 100_000_000);
2020-08-26 21:35:29 +02:00
return [new Clause([], $cond_id, $cond_id, true)];
}
return $negated;
2018-05-07 07:26:06 +02:00
}
}