1: | <?php declare(strict_types = 1); |
2: | |
3: | namespace PHPStan\Type\Php; |
4: | |
5: | use PhpParser\Node\Expr; |
6: | use PHPStan\Analyser\Scope; |
7: | use PHPStan\Php\PhpVersion; |
8: | use PHPStan\TrinaryLogic; |
9: | use PHPStan\Type\Accessory\AccessoryArrayListType; |
10: | use PHPStan\Type\ArrayType; |
11: | use PHPStan\Type\Constant\ConstantArrayType; |
12: | use PHPStan\Type\Constant\ConstantArrayTypeBuilder; |
13: | use PHPStan\Type\Constant\ConstantIntegerType; |
14: | use PHPStan\Type\Constant\ConstantStringType; |
15: | use PHPStan\Type\IntegerRangeType; |
16: | use PHPStan\Type\IntegerType; |
17: | use PHPStan\Type\NullType; |
18: | use PHPStan\Type\Regex\RegexAlternation; |
19: | use PHPStan\Type\Regex\RegexCapturingGroup; |
20: | use PHPStan\Type\Regex\RegexExpressionHelper; |
21: | use PHPStan\Type\Regex\RegexGroupParser; |
22: | use PHPStan\Type\StringType; |
23: | use PHPStan\Type\Type; |
24: | use PHPStan\Type\TypeCombinator; |
25: | use function array_reverse; |
26: | use function count; |
27: | use function in_array; |
28: | use function is_string; |
29: | use const PREG_OFFSET_CAPTURE; |
30: | use const PREG_PATTERN_ORDER; |
31: | use const PREG_SET_ORDER; |
32: | use const PREG_UNMATCHED_AS_NULL; |
33: | |
34: | |
35: | |
36: | |
37: | final class RegexArrayShapeMatcher |
38: | { |
39: | |
40: | |
41: | |
42: | |
43: | public const PREG_UNMATCHED_AS_NULL_ON_72_73 = 2048; |
44: | |
45: | public function __construct( |
46: | private RegexGroupParser $regexGroupParser, |
47: | private RegexExpressionHelper $regexExpressionHelper, |
48: | private PhpVersion $phpVersion, |
49: | ) |
50: | { |
51: | } |
52: | |
53: | public function matchAllExpr(Expr $patternExpr, ?Type $flagsType, TrinaryLogic $wasMatched, Scope $scope): ?Type |
54: | { |
55: | return $this->matchPatternType($this->getPatternType($patternExpr, $scope), $flagsType, $wasMatched, true); |
56: | } |
57: | |
58: | public function matchExpr(Expr $patternExpr, ?Type $flagsType, TrinaryLogic $wasMatched, Scope $scope): ?Type |
59: | { |
60: | return $this->matchPatternType($this->getPatternType($patternExpr, $scope), $flagsType, $wasMatched, false); |
61: | } |
62: | |
63: | private function matchPatternType(Type $patternType, ?Type $flagsType, TrinaryLogic $wasMatched, bool $matchesAll): ?Type |
64: | { |
65: | if ($wasMatched->no()) { |
66: | return new ConstantArrayType([], []); |
67: | } |
68: | |
69: | $constantStrings = $patternType->getConstantStrings(); |
70: | if (count($constantStrings) === 0) { |
71: | return null; |
72: | } |
73: | |
74: | $flags = null; |
75: | if ($flagsType !== null) { |
76: | if (!$flagsType instanceof ConstantIntegerType) { |
77: | return null; |
78: | } |
79: | |
80: | |
81: | $flags = $flagsType->getValue() & (PREG_OFFSET_CAPTURE | PREG_PATTERN_ORDER | PREG_SET_ORDER | PREG_UNMATCHED_AS_NULL | self::PREG_UNMATCHED_AS_NULL_ON_72_73); |
82: | |
83: | |
84: | if ($flags !== $flagsType->getValue()) { |
85: | return null; |
86: | } |
87: | } |
88: | |
89: | $matchedTypes = []; |
90: | foreach ($constantStrings as $constantString) { |
91: | $matched = $this->matchRegex($constantString->getValue(), $flags, $wasMatched, $matchesAll); |
92: | if ($matched === null) { |
93: | return null; |
94: | } |
95: | |
96: | $matchedTypes[] = $matched; |
97: | } |
98: | |
99: | if (count($matchedTypes) === 1) { |
100: | return $matchedTypes[0]; |
101: | } |
102: | |
103: | return TypeCombinator::union(...$matchedTypes); |
104: | } |
105: | |
106: | |
107: | |
108: | |
109: | private function matchRegex(string $regex, ?int $flags, TrinaryLogic $wasMatched, bool $matchesAll): ?Type |
110: | { |
111: | $parseResult = $this->regexGroupParser->parseGroups($regex); |
112: | if ($parseResult === null) { |
113: | |
114: | return null; |
115: | } |
116: | [$groupList, $markVerbs] = $parseResult; |
117: | |
118: | $trailingOptionals = 0; |
119: | foreach (array_reverse($groupList) as $captureGroup) { |
120: | if (!$captureGroup->isOptional()) { |
121: | break; |
122: | } |
123: | $trailingOptionals++; |
124: | } |
125: | |
126: | $onlyOptionalTopLevelGroup = $this->getOnlyOptionalTopLevelGroup($groupList); |
127: | $onlyTopLevelAlternation = $this->getOnlyTopLevelAlternation($groupList); |
128: | $flags ??= 0; |
129: | |
130: | if ( |
131: | !$matchesAll |
132: | && $wasMatched->yes() |
133: | && $onlyOptionalTopLevelGroup !== null |
134: | ) { |
135: | |
136: | |
137: | |
138: | $onlyOptionalTopLevelGroup->forceNonOptional(); |
139: | |
140: | $combiType = $this->buildArrayType( |
141: | $groupList, |
142: | $wasMatched, |
143: | $trailingOptionals, |
144: | $flags, |
145: | $markVerbs, |
146: | $matchesAll, |
147: | ); |
148: | |
149: | if (!$this->containsUnmatchedAsNull($flags, $matchesAll)) { |
150: | |
151: | $combiType = TypeCombinator::union( |
152: | new ConstantArrayType([new ConstantIntegerType(0)], [$this->createSubjectValueType($flags, $matchesAll)], [1], [], TrinaryLogic::createYes()), |
153: | $combiType, |
154: | ); |
155: | } |
156: | |
157: | $onlyOptionalTopLevelGroup->clearOverrides(); |
158: | |
159: | return $combiType; |
160: | } elseif ( |
161: | !$matchesAll |
162: | && $onlyOptionalTopLevelGroup === null |
163: | && $onlyTopLevelAlternation !== null |
164: | && !$wasMatched->no() |
165: | ) { |
166: | |
167: | |
168: | $combiTypes = []; |
169: | $isOptionalAlternation = false; |
170: | foreach ($onlyTopLevelAlternation->getGroupCombinations() as $groupCombo) { |
171: | $comboList = $groupList; |
172: | |
173: | $beforeCurrentCombo = true; |
174: | foreach ($comboList as $groupId => $group) { |
175: | if (in_array($groupId, $groupCombo, true)) { |
176: | $isOptionalAlternation = $group->inOptionalAlternation(); |
177: | $group->forceNonOptional(); |
178: | $beforeCurrentCombo = false; |
179: | } elseif ($beforeCurrentCombo && !$group->resetsGroupCounter()) { |
180: | $group->forceNonOptional(); |
181: | $group->forceType( |
182: | $this->containsUnmatchedAsNull($flags, $matchesAll) ? new NullType() : new ConstantStringType(''), |
183: | ); |
184: | } elseif ( |
185: | $group->getAlternationId() === $onlyTopLevelAlternation->getId() |
186: | && !$this->containsUnmatchedAsNull($flags, $matchesAll) |
187: | ) { |
188: | unset($comboList[$groupId]); |
189: | } |
190: | } |
191: | |
192: | $combiType = $this->buildArrayType( |
193: | $comboList, |
194: | $wasMatched, |
195: | $trailingOptionals, |
196: | $flags, |
197: | $markVerbs, |
198: | $matchesAll, |
199: | ); |
200: | |
201: | $combiTypes[] = $combiType; |
202: | |
203: | foreach ($groupCombo as $groupId) { |
204: | $group = $comboList[$groupId]; |
205: | $group->clearOverrides(); |
206: | } |
207: | } |
208: | |
209: | if ( |
210: | !$this->containsUnmatchedAsNull($flags, $matchesAll) |
211: | && ( |
212: | $onlyTopLevelAlternation->getAlternationsCount() !== count($onlyTopLevelAlternation->getGroupCombinations()) |
213: | || $isOptionalAlternation |
214: | ) |
215: | ) { |
216: | |
217: | $combiTypes[] = new ConstantArrayType([new ConstantIntegerType(0)], [$this->createSubjectValueType($flags, $matchesAll)], [1], [], TrinaryLogic::createYes()); |
218: | } |
219: | |
220: | return TypeCombinator::union(...$combiTypes); |
221: | } |
222: | |
223: | |
224: | |
225: | return $this->buildArrayType( |
226: | $groupList, |
227: | $wasMatched, |
228: | $trailingOptionals, |
229: | $flags, |
230: | $markVerbs, |
231: | $matchesAll, |
232: | ); |
233: | } |
234: | |
235: | |
236: | |
237: | |
238: | private function getOnlyOptionalTopLevelGroup(array $captureGroups): ?RegexCapturingGroup |
239: | { |
240: | $group = null; |
241: | foreach ($captureGroups as $captureGroup) { |
242: | if (!$captureGroup->isTopLevel()) { |
243: | continue; |
244: | } |
245: | |
246: | if (!$captureGroup->isOptional()) { |
247: | return null; |
248: | } |
249: | |
250: | if ($group !== null) { |
251: | return null; |
252: | } |
253: | |
254: | $group = $captureGroup; |
255: | } |
256: | |
257: | return $group; |
258: | } |
259: | |
260: | |
261: | |
262: | |
263: | private function getOnlyTopLevelAlternation(array $captureGroups): ?RegexAlternation |
264: | { |
265: | $alternation = null; |
266: | foreach ($captureGroups as $captureGroup) { |
267: | if (!$captureGroup->isTopLevel()) { |
268: | continue; |
269: | } |
270: | |
271: | if (!$captureGroup->inAlternation()) { |
272: | return null; |
273: | } |
274: | |
275: | if ($captureGroup->inOptionalQuantification()) { |
276: | return null; |
277: | } |
278: | |
279: | if ($alternation === null) { |
280: | $alternation = $captureGroup->getAlternation(); |
281: | } elseif ($alternation->getId() !== $captureGroup->getAlternation()->getId()) { |
282: | return null; |
283: | } |
284: | } |
285: | |
286: | return $alternation; |
287: | } |
288: | |
289: | |
290: | |
291: | |
292: | |
293: | private function buildArrayType( |
294: | array $captureGroups, |
295: | TrinaryLogic $wasMatched, |
296: | int $trailingOptionals, |
297: | int $flags, |
298: | array $markVerbs, |
299: | bool $matchesAll, |
300: | ): Type |
301: | { |
302: | $builder = ConstantArrayTypeBuilder::createEmpty(); |
303: | |
304: | |
305: | $builder->setOffsetValueType( |
306: | $this->getKeyType(0), |
307: | $this->createSubjectValueType($flags, $matchesAll), |
308: | $this->isSubjectOptional($wasMatched, $matchesAll), |
309: | ); |
310: | |
311: | $countGroups = count($captureGroups); |
312: | $i = 0; |
313: | foreach ($captureGroups as $captureGroup) { |
314: | $isTrailingOptional = $i >= $countGroups - $trailingOptionals; |
315: | $isLastGroup = $i === $countGroups - 1; |
316: | $groupValueType = $this->createGroupValueType($captureGroup, $wasMatched, $flags, $isTrailingOptional, $isLastGroup, $matchesAll); |
317: | $optional = $this->isGroupOptional($captureGroup, $wasMatched, $flags, $isTrailingOptional, $matchesAll); |
318: | |
319: | if ($captureGroup->isNamed()) { |
320: | $builder->setOffsetValueType( |
321: | $this->getKeyType($captureGroup->getName()), |
322: | $groupValueType, |
323: | $optional, |
324: | ); |
325: | } |
326: | |
327: | $builder->setOffsetValueType( |
328: | $this->getKeyType($i + 1), |
329: | $groupValueType, |
330: | $optional, |
331: | ); |
332: | |
333: | $i++; |
334: | } |
335: | |
336: | if (count($markVerbs) > 0) { |
337: | $markTypes = []; |
338: | foreach ($markVerbs as $mark) { |
339: | $markTypes[] = new ConstantStringType($mark); |
340: | } |
341: | $builder->setOffsetValueType( |
342: | $this->getKeyType('MARK'), |
343: | TypeCombinator::union(...$markTypes), |
344: | true, |
345: | ); |
346: | } |
347: | |
348: | if ($matchesAll && $this->containsSetOrder($flags)) { |
349: | $arrayType = TypeCombinator::intersect(new ArrayType(new IntegerType(), $builder->getArray()), new AccessoryArrayListType()); |
350: | if (!$wasMatched->yes()) { |
351: | $arrayType = TypeCombinator::union( |
352: | new ConstantArrayType([], []), |
353: | $arrayType, |
354: | ); |
355: | } |
356: | return $arrayType; |
357: | } |
358: | |
359: | return $builder->getArray(); |
360: | } |
361: | |
362: | private function isSubjectOptional(TrinaryLogic $wasMatched, bool $matchesAll): bool |
363: | { |
364: | if ($matchesAll) { |
365: | return false; |
366: | } |
367: | |
368: | return !$wasMatched->yes(); |
369: | } |
370: | |
371: | private function createSubjectValueType(int $flags, bool $matchesAll): Type |
372: | { |
373: | $subjectValueType = TypeCombinator::removeNull($this->getValueType(new StringType(), $flags, $matchesAll)); |
374: | |
375: | if ($matchesAll) { |
376: | if ($this->containsPatternOrder($flags)) { |
377: | $subjectValueType = TypeCombinator::intersect(new ArrayType(new IntegerType(), $subjectValueType), new AccessoryArrayListType()); |
378: | } |
379: | } |
380: | |
381: | return $subjectValueType; |
382: | } |
383: | |
384: | private function isGroupOptional(RegexCapturingGroup $captureGroup, TrinaryLogic $wasMatched, int $flags, bool $isTrailingOptional, bool $matchesAll): bool |
385: | { |
386: | if ($matchesAll) { |
387: | if ($isTrailingOptional && !$this->containsUnmatchedAsNull($flags, $matchesAll) && $this->containsSetOrder($flags)) { |
388: | return true; |
389: | } |
390: | |
391: | return false; |
392: | } |
393: | |
394: | if (!$wasMatched->yes()) { |
395: | $optional = true; |
396: | } else { |
397: | if (!$isTrailingOptional) { |
398: | $optional = false; |
399: | } elseif ($this->containsUnmatchedAsNull($flags, $matchesAll)) { |
400: | $optional = false; |
401: | } else { |
402: | $optional = $captureGroup->isOptional(); |
403: | } |
404: | } |
405: | |
406: | return $optional; |
407: | } |
408: | |
409: | private function createGroupValueType(RegexCapturingGroup $captureGroup, TrinaryLogic $wasMatched, int $flags, bool $isTrailingOptional, bool $isLastGroup, bool $matchesAll): Type |
410: | { |
411: | if ($matchesAll) { |
412: | if ( |
413: | ( |
414: | !$this->containsSetOrder($flags) |
415: | && !$this->containsUnmatchedAsNull($flags, $matchesAll) |
416: | && $captureGroup->isOptional() |
417: | ) |
418: | || |
419: | ( |
420: | $this->containsSetOrder($flags) |
421: | && !$this->containsUnmatchedAsNull($flags, $matchesAll) |
422: | && $captureGroup->isOptional() |
423: | && !$isTrailingOptional |
424: | ) |
425: | ) { |
426: | $groupValueType = $this->getValueType( |
427: | TypeCombinator::union($captureGroup->getType(), new ConstantStringType('')), |
428: | $flags, |
429: | $matchesAll, |
430: | ); |
431: | $groupValueType = TypeCombinator::removeNull($groupValueType); |
432: | } else { |
433: | $groupValueType = $this->getValueType($captureGroup->getType(), $flags, $matchesAll); |
434: | } |
435: | |
436: | if (!$isTrailingOptional && $this->containsUnmatchedAsNull($flags, $matchesAll) && !$captureGroup->isOptional()) { |
437: | $groupValueType = TypeCombinator::removeNull($groupValueType); |
438: | } |
439: | |
440: | if ($this->containsPatternOrder($flags)) { |
441: | $groupValueType = TypeCombinator::intersect(new ArrayType(new IntegerType(), $groupValueType), new AccessoryArrayListType()); |
442: | } |
443: | |
444: | return $groupValueType; |
445: | } |
446: | |
447: | if (!$isLastGroup && !$this->containsUnmatchedAsNull($flags, $matchesAll) && $captureGroup->isOptional()) { |
448: | $groupValueType = $this->getValueType( |
449: | TypeCombinator::union($captureGroup->getType(), new ConstantStringType('')), |
450: | $flags, |
451: | $matchesAll, |
452: | ); |
453: | } else { |
454: | $groupValueType = $this->getValueType($captureGroup->getType(), $flags, $matchesAll); |
455: | } |
456: | |
457: | if ($wasMatched->yes()) { |
458: | if (!$isTrailingOptional && $this->containsUnmatchedAsNull($flags, $matchesAll) && !$captureGroup->isOptional()) { |
459: | $groupValueType = TypeCombinator::removeNull($groupValueType); |
460: | } |
461: | } |
462: | |
463: | return $groupValueType; |
464: | } |
465: | |
466: | private function containsOffsetCapture(int $flags): bool |
467: | { |
468: | return ($flags & PREG_OFFSET_CAPTURE) !== 0; |
469: | } |
470: | |
471: | private function containsPatternOrder(int $flags): bool |
472: | { |
473: | |
474: | return !$this->containsSetOrder($flags); |
475: | } |
476: | |
477: | private function containsSetOrder(int $flags): bool |
478: | { |
479: | return ($flags & PREG_SET_ORDER) !== 0; |
480: | } |
481: | |
482: | private function containsUnmatchedAsNull(int $flags, bool $matchesAll): bool |
483: | { |
484: | if ($matchesAll) { |
485: | |
486: | |
487: | return ($flags & PREG_UNMATCHED_AS_NULL) !== 0; |
488: | } |
489: | |
490: | return ($flags & PREG_UNMATCHED_AS_NULL) !== 0 && (($flags & self::PREG_UNMATCHED_AS_NULL_ON_72_73) !== 0 || $this->phpVersion->supportsPregUnmatchedAsNull()); |
491: | } |
492: | |
493: | private function getKeyType(int|string $key): Type |
494: | { |
495: | if (is_string($key)) { |
496: | return new ConstantStringType($key); |
497: | } |
498: | |
499: | return new ConstantIntegerType($key); |
500: | } |
501: | |
502: | private function getValueType(Type $baseType, int $flags, bool $matchesAll): Type |
503: | { |
504: | $valueType = $baseType; |
505: | |
506: | |
507: | $offsetType = IntegerRangeType::fromInterval(-1, null); |
508: | if ($this->containsUnmatchedAsNull($flags, $matchesAll)) { |
509: | $valueType = TypeCombinator::addNull($valueType); |
510: | } |
511: | |
512: | if ($this->containsOffsetCapture($flags)) { |
513: | $builder = ConstantArrayTypeBuilder::createEmpty(); |
514: | |
515: | $builder->setOffsetValueType( |
516: | new ConstantIntegerType(0), |
517: | $valueType, |
518: | ); |
519: | $builder->setOffsetValueType( |
520: | new ConstantIntegerType(1), |
521: | $offsetType, |
522: | ); |
523: | |
524: | return $builder->getArray(); |
525: | } |
526: | |
527: | return $valueType; |
528: | } |
529: | |
530: | private function getPatternType(Expr $patternExpr, Scope $scope): Type |
531: | { |
532: | if ($patternExpr instanceof Expr\BinaryOp\Concat) { |
533: | return $this->regexExpressionHelper->resolvePatternConcat($patternExpr, $scope); |
534: | } |
535: | |
536: | return $scope->getType($patternExpr); |
537: | } |
538: | |
539: | } |
540: | |