1
0
mirror of https://github.com/danog/psalm.git synced 2025-01-10 15:09:04 +01:00
psalm/src/Psalm/Internal/Analyzer/Statements/Expression/ArrayAnalyzer.php

598 lines
23 KiB
PHP
Raw Normal View History

2018-01-14 18:09:40 +01:00
<?php
2018-11-06 03:57:36 +01:00
namespace Psalm\Internal\Analyzer\Statements\Expression;
2018-01-14 18:09:40 +01:00
use PhpParser;
2021-06-08 04:55:21 +02:00
use Psalm\CodeLocation;
use Psalm\Codebase;
2021-06-08 04:55:21 +02:00
use Psalm\Context;
2018-11-06 03:57:36 +01:00
use Psalm\Internal\Analyzer\Statements\ExpressionAnalyzer;
use Psalm\Internal\Analyzer\StatementsAnalyzer;
2021-12-03 20:11:20 +01:00
use Psalm\Internal\Codebase\TaintFlowGraph;
use Psalm\Internal\Codebase\VariableUseGraph;
use Psalm\Internal\DataFlow\DataFlowNode;
2021-06-08 04:55:21 +02:00
use Psalm\Internal\Type\TypeCombiner;
use Psalm\Issue\DuplicateArrayKey;
use Psalm\Issue\InvalidArrayOffset;
use Psalm\Issue\MixedArrayOffset;
2021-12-03 20:11:20 +01:00
use Psalm\Issue\ParseError;
use Psalm\IssueBuffer;
use Psalm\Plugin\EventHandler\Event\AddRemoveTaintsEvent;
2021-06-08 04:55:21 +02:00
use Psalm\Type;
2021-12-13 04:45:57 +01:00
use Psalm\Type\Atomic\TArray;
use Psalm\Type\Atomic\TArrayKey;
use Psalm\Type\Atomic\TBool;
use Psalm\Type\Atomic\TFalse;
use Psalm\Type\Atomic\TFloat;
use Psalm\Type\Atomic\TGenericObject;
use Psalm\Type\Atomic\TInt;
use Psalm\Type\Atomic\TIterable;
use Psalm\Type\Atomic\TKeyedArray;
use Psalm\Type\Atomic\TList;
use Psalm\Type\Atomic\TLiteralClassString;
use Psalm\Type\Atomic\TLiteralFloat;
use Psalm\Type\Atomic\TLiteralInt;
use Psalm\Type\Atomic\TLiteralString;
use Psalm\Type\Atomic\TMixed;
use Psalm\Type\Atomic\TNonEmptyArray;
use Psalm\Type\Atomic\TNonEmptyList;
use Psalm\Type\Atomic\TObjectWithProperties;
use Psalm\Type\Atomic\TString;
use Psalm\Type\Atomic\TTemplateParam;
use Psalm\Type\Atomic\TTrue;
2021-12-13 16:28:14 +01:00
use Psalm\Type\Union;
use function array_merge;
use function array_values;
use function count;
2021-12-03 21:07:25 +01:00
use function in_array;
use function is_string;
2021-06-08 04:55:21 +02:00
use function preg_match;
use const PHP_INT_MAX;
2018-01-14 18:09:40 +01:00
/**
* @internal
*/
2018-11-06 03:57:36 +01:00
class ArrayAnalyzer
2018-01-14 18:09:40 +01:00
{
/**
 * Infers the type of an array literal and stores it in the analyzer's node data.
 *
 * Every item is analysed through analyzeArrayItem(), which accumulates key/value
 * information in an ArrayCreationInfo. From that information one of the following
 * types is produced:
 *  - the empty-array type when the literal has no items;
 *  - a sealed TKeyedArray when a keyed array can still be created and property
 *    types were recorded;
 *  - a TList / TNonEmptyList when every item was a list item;
 *  - a TNonEmptyArray otherwise (invalid key types are reported and replaced first).
 *
 * Data-flow parent nodes collected while analysing the items are attached to the
 * resulting union.
 *
 * @return bool false only when the literal contains an empty element (reported as a
 *              ParseError); true in every other case
 */
public static function analyze(
    StatementsAnalyzer $statements_analyzer,
    PhpParser\Node\Expr\Array_ $stmt,
    Context $context
): bool {
    // if the array is empty, this special type allows us to match any other array type against it
    if (empty($stmt->items)) {
        $statements_analyzer->node_data->setType($stmt, Type::getEmptyArray());

        return true;
    }

    $codebase = $statements_analyzer->getCodebase();

    $array_creation_info = new ArrayCreationInfo();

    foreach ($stmt->items as $item) {
        if ($item === null) {
            IssueBuffer::add(
                new ParseError(
                    'Array element cannot be empty',
                    new CodeLocation($statements_analyzer, $stmt)
                )
            );

            return false;
        }

        self::analyzeArrayItem(
            $statements_analyzer,
            $context,
            $array_creation_info,
            $item,
            $codebase
        );
    }

    // Only combine when something was collected; null means "nothing known".
    $item_key_type = $array_creation_info->item_key_atomic_types
        ? TypeCombiner::combine(
            $array_creation_info->item_key_atomic_types,
            $codebase,
            false,
            true,
            30
        )
        : null;

    $item_value_type = $array_creation_info->item_value_atomic_types
        ? TypeCombiner::combine(
            $array_creation_info->item_value_atomic_types,
            $codebase,
            false,
            true,
            30
        )
        : null;

    if ($item_value_type
        && $item_key_type
        && ($item_key_type->hasString() || $item_key_type->hasInt())
        && $array_creation_info->can_create_objectlike
        && $array_creation_info->property_types
    ) {
        // if this array looks like an object-like array, let's return that instead
        $array_type = new TKeyedArray(
            $array_creation_info->property_types,
            $array_creation_info->class_strings
        );
        $array_type->sealed = true;
        $array_type->is_list = $array_creation_info->all_list;
    } elseif ($array_creation_info->all_list) {
        if (empty($array_creation_info->item_key_atomic_types)) {
            $array_type = new TList($item_value_type ?? Type::getMixed());
        } else {
            $array_type = new TNonEmptyList($item_value_type ?? Type::getMixed());
            $array_type->count = count($array_creation_info->property_types);
        }
    } else {
        if ($item_key_type) {
            // Reports unusable key types and swaps them for what PHP would coerce them to.
            self::substituteInvalidKeyTypes($statements_analyzer, $stmt, $item_key_type, $codebase);
        }

        $array_type = new TNonEmptyArray([
            $item_key_type && !$item_key_type->hasMixed() ? $item_key_type : Type::getArrayKey(),
            $item_value_type ?? Type::getMixed(),
        ]);
        $array_type->count = count($array_creation_info->property_types);
    }

    $stmt_type = new Union([$array_type]);

    if ($array_creation_info->parent_taint_nodes) {
        $stmt_type->parent_nodes = $array_creation_info->parent_taint_nodes;
    }

    $statements_analyzer->node_data->setType($stmt, $stmt_type);

    return true;
}

/**
 * Reports key atomics that cannot be used as array offsets and substitutes them
 * in place inside $item_key_type.
 *
 * A mixed key raises MixedArrayOffset and is replaced by array-key. Any other atomic
 * that is not a string, int, array-key, template param or an object-with-properties
 * declaring __toString raises InvalidArrayOffset and is replaced as follows:
 * false => 0, true => 1, bool => 0|1, literal float => its int cast, float => int,
 * anything else => array-key.
 */
private static function substituteInvalidKeyTypes(
    StatementsAnalyzer $statements_analyzer,
    PhpParser\Node\Expr\Array_ $stmt,
    Union $item_key_type,
    Codebase $codebase
): void {
    $bad_types = [];
    $good_types = [];

    foreach ($item_key_type->getAtomicTypes() as $atomic_key_type) {
        if ($atomic_key_type instanceof TMixed) {
            IssueBuffer::maybeAdd(
                new MixedArrayOffset(
                    'Cannot create mixed offset – expecting array-key',
                    new CodeLocation($statements_analyzer->getSource(), $stmt)
                ),
                $statements_analyzer->getSuppressedIssues()
            );

            $bad_types[] = $atomic_key_type;
            $good_types[] = new TArrayKey();

            continue;
        }

        $is_valid_offset = $atomic_key_type instanceof TString
            || $atomic_key_type instanceof TInt
            || $atomic_key_type instanceof TArrayKey
            || $atomic_key_type instanceof TTemplateParam
            || (
                $atomic_key_type instanceof TObjectWithProperties
                && isset($atomic_key_type->methods['__toString'])
            );

        if ($is_valid_offset) {
            continue;
        }

        IssueBuffer::maybeAdd(
            new InvalidArrayOffset(
                'Cannot create offset of type ' . $item_key_type->getKey() . ', expecting array-key',
                new CodeLocation($statements_analyzer->getSource(), $stmt)
            ),
            $statements_analyzer->getSuppressedIssues()
        );

        $bad_types[] = $atomic_key_type;

        // The more specific classes are tested before their more general
        // counterparts (TFalse/TTrue before TBool, TLiteralFloat before TFloat).
        if ($atomic_key_type instanceof TFalse) {
            $good_types[] = new TLiteralInt(0);
        } elseif ($atomic_key_type instanceof TTrue) {
            $good_types[] = new TLiteralInt(1);
        } elseif ($atomic_key_type instanceof TBool) {
            $good_types[] = new TLiteralInt(0);
            $good_types[] = new TLiteralInt(1);
        } elseif ($atomic_key_type instanceof TLiteralFloat) {
            $good_types[] = new TLiteralInt((int) $atomic_key_type->value);
        } elseif ($atomic_key_type instanceof TFloat) {
            $good_types[] = new TInt();
        } else {
            $good_types[] = new TArrayKey();
        }
    }

    if ($bad_types && $good_types) {
        $item_key_type->substitute(
            TypeCombiner::combine($bad_types, $codebase),
            TypeCombiner::combine($good_types, $codebase)
        );
    }
}
2020-11-27 20:19:55 +01:00
/**
 * Analyses one item of an array literal and folds what it learns into
 * $array_creation_info.
 *
 * Unpacked items (`...$expr`) are delegated to handleUnpackedArray(). For regular
 * items the key (if any) and the value are analysed, the key/value atomic types are
 * appended to the accumulator, duplicate literal keys are reported, data-flow nodes
 * are created for values and non-literal keys, and by-reference values invalidate
 * the referenced variable in $context.
 *
 * The method returns early, without recording anything further, when analysing the
 * key or value expression fails.
 */
private static function analyzeArrayItem(
    StatementsAnalyzer $statements_analyzer,
    Context $context,
    ArrayCreationInfo $array_creation_info,
    PhpParser\Node\Expr\ArrayItem $item,
    Codebase $codebase
): void {
    if ($item->unpack) {
        if (ExpressionAnalyzer::analyze($statements_analyzer, $item->value, $context) === false) {
            return;
        }

        $unpacked_array_type = $statements_analyzer->node_data->getType($item->value);

        if (!$unpacked_array_type) {
            return;
        }

        self::handleUnpackedArray(
            $statements_analyzer,
            $array_creation_info,
            $item,
            $unpacked_array_type,
            $codebase
        );

        if (($data_flow_graph = $statements_analyzer->data_flow_graph)
            && $data_flow_graph instanceof VariableUseGraph
            && $unpacked_array_type->parent_nodes
        ) {
            $var_location = new CodeLocation($statements_analyzer->getSource(), $item->value);

            $new_parent_node = DataFlowNode::getForAssignment(
                'array',
                $var_location
            );

            $data_flow_graph->addNode($new_parent_node);

            foreach ($unpacked_array_type->parent_nodes as $parent_node) {
                $data_flow_graph->addPath(
                    $parent_node,
                    $new_parent_node,
                    'arrayvalue-assignment'
                );
            }

            $array_creation_info->parent_taint_nodes += [$new_parent_node->id => $new_parent_node];
        }

        return;
    }

    $item_key_value = null;
    $item_key_type = null;
    $item_is_list_item = false;

    if ($item->key) {
        // The key expression is analysed with inside_general_use forced on; the previous
        // value is restored on both the failure and the success path.
        $was_inside_general_use = $context->inside_general_use;
        $context->inside_general_use = true;

        if (ExpressionAnalyzer::analyze($statements_analyzer, $item->key, $context) === false) {
            $context->inside_general_use = $was_inside_general_use;

            return;
        }

        $context->inside_general_use = $was_inside_general_use;

        if ($item_key_type = $statements_analyzer->node_data->getType($item->key)) {
            $key_type = $item_key_type;

            if ($key_type->isNull()) {
                // a null key is treated as the empty string
                $key_type = Type::getString('');
            }

            // Canonical decimal integer strings that fit into an int are treated as int keys.
            if ($item->key instanceof PhpParser\Node\Scalar\String_
                && preg_match('/^(0|[1-9][0-9]*)$/', $item->key->value)
                && (
                    (int) $item->key->value < PHP_INT_MAX ||
                    $item->key->value === (string) PHP_INT_MAX
                )
            ) {
                $key_type = Type::getInt(false, (int) $item->key->value);
            }

            $array_creation_info->item_key_atomic_types = array_merge(
                $array_creation_info->item_key_atomic_types,
                array_values($key_type->getAtomicTypes())
            );

            if ($key_type->isSingleStringLiteral()) {
                $item_key_literal_type = $key_type->getSingleStringLiteral();
                $item_key_value = $item_key_literal_type->value;

                if ($item_key_literal_type instanceof TLiteralClassString) {
                    $array_creation_info->class_strings[$item_key_value] = true;
                }
            } elseif ($key_type->isSingleIntLiteral()) {
                $item_key_value = $key_type->getSingleIntLiteral()->value;

                if ($item_key_value >= $array_creation_info->int_offset) {
                    // Only a key equal to the next expected offset keeps the array list-like.
                    if ($item_key_value === $array_creation_info->int_offset) {
                        $item_is_list_item = true;
                    }

                    $array_creation_info->int_offset = $item_key_value + 1;
                }
            }
        }
    } else {
        // No explicit key: the item takes the next integer offset.
        $item_is_list_item = true;
        $item_key_value = $array_creation_info->int_offset++;
        $array_creation_info->item_key_atomic_types[] = new TLiteralInt($item_key_value);
    }

    if (ExpressionAnalyzer::analyze($statements_analyzer, $item->value, $context) === false) {
        return;
    }

    $array_creation_info->all_list = $array_creation_info->all_list && $item_is_list_item;

    if ($item_key_value !== null) {
        if (isset($array_creation_info->array_keys[$item_key_value])) {
            IssueBuffer::maybeAdd(
                new DuplicateArrayKey(
                    'Key \'' . $item_key_value . '\' already exists on array',
                    new CodeLocation($statements_analyzer->getSource(), $item)
                ),
                $statements_analyzer->getSuppressedIssues()
            );
        }

        $array_creation_info->array_keys[$item_key_value] = true;
    }

    if (($data_flow_graph = $statements_analyzer->data_flow_graph)
        && ($data_flow_graph instanceof VariableUseGraph
            // strict comparison: issue names are strings, never match them loosely
            || !in_array('TaintedInput', $statements_analyzer->getSuppressedIssues(), true))
    ) {
        if ($item_value_type = $statements_analyzer->node_data->getType($item->value)) {
            // Single literal values are skipped when the graph is a TaintFlowGraph.
            if ($item_value_type->parent_nodes
                && !($item_value_type->isSingle()
                    && $item_value_type->hasLiteralValue()
                    && $data_flow_graph instanceof TaintFlowGraph)
            ) {
                $var_location = new CodeLocation($statements_analyzer->getSource(), $item);

                $new_parent_node = DataFlowNode::getForAssignment(
                    'array'
                        . ($item_key_value !== null ? '[\'' . $item_key_value . '\']' : ''),
                    $var_location
                );

                $data_flow_graph->addNode($new_parent_node);

                $event = new AddRemoveTaintsEvent($item, $context, $statements_analyzer, $codebase);

                $added_taints = $codebase->config->eventDispatcher->dispatchAddTaints($event);
                $removed_taints = $codebase->config->eventDispatcher->dispatchRemoveTaints($event);

                foreach ($item_value_type->parent_nodes as $parent_node) {
                    $data_flow_graph->addPath(
                        $parent_node,
                        $new_parent_node,
                        'arrayvalue-assignment'
                            . ($item_key_value !== null ? '-\'' . $item_key_value . '\'' : ''),
                        $added_taints,
                        $removed_taints
                    );
                }

                $array_creation_info->parent_taint_nodes += [$new_parent_node->id => $new_parent_node];
            }

            // Keys only contribute a data-flow node when their literal value is unknown.
            if ($item_key_type
                && $item_key_type->parent_nodes
                && $item_key_value === null
                && !($item_key_type->isSingle()
                    && $item_key_type->hasLiteralValue()
                    && $data_flow_graph instanceof TaintFlowGraph)
            ) {
                $var_location = new CodeLocation($statements_analyzer->getSource(), $item);

                $new_parent_node = DataFlowNode::getForAssignment(
                    'array',
                    $var_location
                );

                $data_flow_graph->addNode($new_parent_node);

                $event = new AddRemoveTaintsEvent($item, $context, $statements_analyzer, $codebase);

                $added_taints = $codebase->config->eventDispatcher->dispatchAddTaints($event);
                $removed_taints = $codebase->config->eventDispatcher->dispatchRemoveTaints($event);

                foreach ($item_key_type->parent_nodes as $parent_node) {
                    $data_flow_graph->addPath(
                        $parent_node,
                        $new_parent_node,
                        'arraykey-assignment',
                        $added_taints,
                        $removed_taints
                    );
                }

                $array_creation_info->parent_taint_nodes += [$new_parent_node->id => $new_parent_node];
            }
        }
    }

    if ($item->byRef) {
        $var_id = ExpressionIdentifier::getArrayVarId(
            $item->value,
            $statements_analyzer->getFQCLN(),
            $statements_analyzer
        );

        if ($var_id) {
            // The referenced variable is reset to mixed once it is stored by reference.
            $context->removeDescendents(
                $var_id,
                $context->vars_in_scope[$var_id] ?? null,
                null,
                $statements_analyzer
            );

            $context->vars_in_scope[$var_id] = Type::getMixed();
        }
    }

    $item_value_type = $statements_analyzer->node_data->getType($item->value);

    // A keyed array can only be built while every key is a known literal and the
    // number of recorded properties stays within the limit checked here.
    if ($item_key_value !== null && count($array_creation_info->property_types) <= 100) {
        $array_creation_info->property_types[$item_key_value] = $item_value_type ?? Type::getMixed();
    } else {
        $array_creation_info->can_create_objectlike = false;
    }

    if ($item_value_type) {
        $array_creation_info->item_value_atomic_types = array_merge(
            $array_creation_info->item_value_atomic_types,
            array_values($item_value_type->getAtomicTypes())
        );
    } else {
        // No type was inferred for the value: fall back to mixed.
        $array_creation_info->item_value_atomic_types[] = new TMixed();
    }
}
/**
 * Merges the type of an unpacked (`...$expr`) array item into $array_creation_info.
 *
 * Keyed arrays contribute each property individually: integer keys are renumbered
 * from the running integer offset, string keys are kept. Generic arrays, iterables,
 * two-parameter traversable generic objects and lists contribute only their key and
 * value types and prevent a keyed array from being created.
 *
 * When the analysed PHP version id is 80000 or lower, string keys are reported as
 * unsupported and processing of this item stops immediately.
 */
private static function handleUnpackedArray(
    StatementsAnalyzer $statements_analyzer,
    ArrayCreationInfo $array_creation_info,
    PhpParser\Node\Expr\ArrayItem $item,
    Union $unpacked_array_type,
    Codebase $codebase
): void {
    foreach ($unpacked_array_type->getAtomicTypes() as $unpacked_atomic_type) {
        if ($unpacked_atomic_type instanceof TKeyedArray) {
            foreach ($unpacked_atomic_type->properties as $key => $property_value) {
                if (is_string($key)) {
                    if ($codebase->analysis_php_version_id <= 80000) {
                        IssueBuffer::maybeAdd(
                            new DuplicateArrayKey(
                                'String keys are not supported in unpacked arrays',
                                new CodeLocation($statements_analyzer->getSource(), $item->value)
                            ),
                            $statements_analyzer->getSuppressedIssues()
                        );

                        return;
                    }

                    $new_offset = $key;
                    $array_creation_info->item_key_atomic_types[] = new TLiteralString($new_offset);

                    // A preserved string key means the resulting array cannot be a list.
                    $array_creation_info->all_list = false;
                } else {
                    // Integer keys are renumbered from the running offset.
                    $new_offset = $array_creation_info->int_offset++;
                    $array_creation_info->item_key_atomic_types[] = new TLiteralInt($new_offset);
                }

                $array_creation_info->item_value_atomic_types = array_merge(
                    $array_creation_info->item_value_atomic_types,
                    array_values($property_value->getAtomicTypes())
                );

                $array_creation_info->array_keys[$new_offset] = true;
                $array_creation_info->property_types[$new_offset] = $property_value;
            }

            continue;
        }

        if ($unpacked_atomic_type instanceof TArray
            || $unpacked_atomic_type instanceof TIterable
            || (
                $unpacked_atomic_type instanceof TGenericObject
                && $unpacked_atomic_type->hasTraversableInterface($codebase)
                && count($unpacked_atomic_type->type_params) === 2
            )
        ) {
            /** @psalm-suppress PossiblyUndefinedArrayOffset provably true, but Psalm can’t see it */
            if ($unpacked_atomic_type->type_params[1]->isEmpty()) {
                continue;
            }

            // The individual keys are unknown, so no keyed array can be produced.
            $array_creation_info->can_create_objectlike = false;

            if ($unpacked_atomic_type->type_params[0]->hasString()) {
                if ($codebase->analysis_php_version_id <= 80000) {
                    IssueBuffer::maybeAdd(
                        new DuplicateArrayKey(
                            'String keys are not supported in unpacked arrays',
                            new CodeLocation($statements_analyzer->getSource(), $item->value)
                        ),
                        $statements_analyzer->getSuppressedIssues()
                    );

                    return;
                }

                $array_creation_info->item_key_atomic_types[] = new TString();

                // Possible string keys mean the resulting array cannot be a list.
                $array_creation_info->all_list = false;
            } elseif ($unpacked_atomic_type->type_params[0]->hasInt()) {
                $array_creation_info->item_key_atomic_types[] = new TInt();
            }

            $array_creation_info->item_value_atomic_types = array_merge(
                $array_creation_info->item_value_atomic_types,
                array_values(
                    isset($unpacked_atomic_type->type_params[1])
                        ? $unpacked_atomic_type->type_params[1]->getAtomicTypes()
                        : [new TMixed()]
                )
            );
        } elseif ($unpacked_atomic_type instanceof TList) {
            if ($unpacked_atomic_type->type_param->isEmpty()) {
                continue;
            }

            $array_creation_info->can_create_objectlike = false;

            $array_creation_info->item_key_atomic_types[] = new TInt();

            $array_creation_info->item_value_atomic_types = array_merge(
                $array_creation_info->item_value_atomic_types,
                array_values($unpacked_atomic_type->type_param->getAtomicTypes())
            );
        }
    }
}
2018-01-14 18:09:40 +01:00
}