mirror of
https://github.com/doctrine/lexer.git
synced 2026-03-23 22:22:11 +01:00
297 lines
9.7 KiB
PHP
297 lines
9.7 KiB
PHP
<?php
|
|
|
|
declare(strict_types=1);
|
|
|
|
namespace Doctrine\Tests\Common\Lexer;
|
|
|
|
use Doctrine\Common\Lexer\Token;
|
|
use PHPUnit\Framework\TestCase;
|
|
|
|
use function array_map;
|
|
use function assert;
|
|
use function count;
|
|
use function setlocale;
|
|
|
|
use const LC_ALL;
|
|
|
|
class AbstractLexerTest extends TestCase
|
|
{
|
|
private ConcreteLexer $concreteLexer;
|
|
|
|
public function setUp(): void
|
|
{
|
|
$this->concreteLexer = new ConcreteLexer();
|
|
}
|
|
|
|
public function tearDown(): void
|
|
{
|
|
setlocale(LC_ALL, null);
|
|
}
|
|
|
|
/** @psalm-return list<array{string, list<Token<string, string|int>>}> */
|
|
public function dataProvider(): array
|
|
{
|
|
return [
|
|
[
|
|
'price=10',
|
|
[
|
|
new Token('price', 'string', 0),
|
|
new Token('=', 'operator', 5),
|
|
new Token(10, 'int', 6),
|
|
],
|
|
],
|
|
];
|
|
}
|
|
|
|
public function testResetPeek(): void
|
|
{
|
|
$expectedTokens = [
|
|
new Token('price', 'string', 0),
|
|
new Token('=', 'operator', 5),
|
|
new Token(10, 'int', 6),
|
|
];
|
|
|
|
$this->concreteLexer->setInput('price=10');
|
|
|
|
$this->assertEquals($expectedTokens[0], $this->concreteLexer->peek());
|
|
$this->assertEquals($expectedTokens[1], $this->concreteLexer->peek());
|
|
$this->concreteLexer->resetPeek();
|
|
$this->assertEquals($expectedTokens[0], $this->concreteLexer->peek());
|
|
}
|
|
|
|
public function testResetPosition(): void
|
|
{
|
|
$expectedTokens = [
|
|
new Token('price', 'string', 0),
|
|
new Token('=', 'operator', 5),
|
|
new Token(10, 'int', 6),
|
|
];
|
|
|
|
$this->concreteLexer->setInput('price=10');
|
|
$this->assertNull($this->concreteLexer->lookahead);
|
|
|
|
$this->assertTrue($this->concreteLexer->moveNext());
|
|
$this->assertEquals($expectedTokens[0], $this->concreteLexer->lookahead);
|
|
|
|
$this->assertTrue($this->concreteLexer->moveNext());
|
|
$this->assertEquals($expectedTokens[1], $this->concreteLexer->lookahead);
|
|
|
|
$this->concreteLexer->resetPosition(0);
|
|
|
|
$this->assertTrue($this->concreteLexer->moveNext());
|
|
$this->assertEquals($expectedTokens[0], $this->concreteLexer->lookahead);
|
|
}
|
|
|
|
/**
|
|
* @psalm-param list<Token<string, string|int>> $expectedTokens
|
|
*
|
|
* @dataProvider dataProvider
|
|
*/
|
|
public function testMoveNext(string $input, array $expectedTokens): void
|
|
{
|
|
$this->concreteLexer->setInput($input);
|
|
$this->assertNull($this->concreteLexer->lookahead);
|
|
|
|
for ($i = 0; $i < count($expectedTokens); $i++) {
|
|
$this->assertTrue($this->concreteLexer->moveNext());
|
|
$this->assertEquals($expectedTokens[$i], $this->concreteLexer->lookahead);
|
|
}
|
|
|
|
$this->assertFalse($this->concreteLexer->moveNext());
|
|
$this->assertNull($this->concreteLexer->lookahead);
|
|
}
|
|
|
|
public function testSkipUntil(): void
|
|
{
|
|
$this->concreteLexer->setInput('price=10');
|
|
|
|
$this->assertTrue($this->concreteLexer->moveNext());
|
|
$this->concreteLexer->skipUntil('operator');
|
|
|
|
$this->assertEquals(
|
|
new Token('=', 'operator', 5),
|
|
$this->concreteLexer->lookahead,
|
|
);
|
|
}
|
|
|
|
public function testUtf8Mismatch(): void
|
|
{
|
|
$this->concreteLexer->setInput("\xE9=10");
|
|
|
|
$this->assertTrue($this->concreteLexer->moveNext());
|
|
|
|
$this->assertEquals(
|
|
new Token("\xE9=10", 'string', 0),
|
|
$this->concreteLexer->lookahead,
|
|
);
|
|
}
|
|
|
|
/**
|
|
* @psalm-param list<Token<string, string|int>> $expectedTokens
|
|
*
|
|
* @dataProvider dataProvider
|
|
*/
|
|
public function testPeek(string $input, array $expectedTokens): void
|
|
{
|
|
$this->concreteLexer->setInput($input);
|
|
foreach ($expectedTokens as $expectedToken) {
|
|
$actualToken = $this->concreteLexer->peek();
|
|
assert($actualToken !== null);
|
|
$this->assertEquals($expectedToken, $actualToken);
|
|
$this->assertSame($expectedToken->value, $actualToken->value);
|
|
$this->assertSame($expectedToken->type, $actualToken->type);
|
|
$this->assertSame($expectedToken->position, $actualToken->position);
|
|
}
|
|
|
|
$this->assertNull($this->concreteLexer->peek());
|
|
}
|
|
|
|
/**
|
|
* @psalm-param list<Token<string, string|int>> $expectedTokens
|
|
*
|
|
* @dataProvider dataProvider
|
|
*/
|
|
public function testGlimpse(string $input, array $expectedTokens): void
|
|
{
|
|
$this->concreteLexer->setInput($input);
|
|
|
|
foreach ($expectedTokens as $expectedToken) {
|
|
$actualToken = $this->concreteLexer->glimpse();
|
|
assert($actualToken !== null);
|
|
$this->assertEquals($expectedToken, $actualToken);
|
|
$this->assertEquals($expectedToken, $this->concreteLexer->glimpse());
|
|
$this->assertSame($expectedToken->value, $actualToken->value);
|
|
$this->assertSame($expectedToken->type, $actualToken->type);
|
|
$this->assertSame($expectedToken->position, $actualToken->position);
|
|
$this->concreteLexer->moveNext();
|
|
}
|
|
|
|
$this->assertNull($this->concreteLexer->peek());
|
|
}
|
|
|
|
/** @psalm-return list<array{string, int, string}> */
|
|
public function inputUntilPositionDataProvider(): array
|
|
{
|
|
return [
|
|
['price=10', 5, 'price'],
|
|
];
|
|
}
|
|
|
|
/** @dataProvider inputUntilPositionDataProvider */
|
|
public function testGetInputUntilPosition(
|
|
string $input,
|
|
int $position,
|
|
string $expectedInput,
|
|
): void {
|
|
$this->concreteLexer->setInput($input);
|
|
|
|
$this->assertSame($expectedInput, $this->concreteLexer->getInputUntilPosition($position));
|
|
}
|
|
|
|
/**
|
|
* @psalm-param list<Token<string, string|int>> $expectedTokens
|
|
*
|
|
* @dataProvider dataProvider
|
|
*/
|
|
public function testIsNextToken(string $input, array $expectedTokens): void
|
|
{
|
|
$this->concreteLexer->setInput($input);
|
|
|
|
$this->concreteLexer->moveNext();
|
|
for ($i = 0; $i < count($expectedTokens); $i++) {
|
|
assert($expectedTokens[$i]->type !== null);
|
|
$this->assertTrue($this->concreteLexer->isNextToken($expectedTokens[$i]->type));
|
|
$this->concreteLexer->moveNext();
|
|
}
|
|
}
|
|
|
|
/**
|
|
* @psalm-param list<Token<string, string|int>> $expectedTokens
|
|
*
|
|
* @dataProvider dataProvider
|
|
*/
|
|
public function testIsNextTokenAny(string $input, array $expectedTokens): void
|
|
{
|
|
$allTokenTypes = array_map(static function ($token): string {
|
|
assert($token->type !== null);
|
|
|
|
return $token->type;
|
|
}, $expectedTokens);
|
|
|
|
$this->concreteLexer->setInput($input);
|
|
|
|
$this->concreteLexer->moveNext();
|
|
for ($i = 0; $i < count($expectedTokens); $i++) {
|
|
assert($expectedTokens[$i]->type !== null);
|
|
$this->assertTrue($this->concreteLexer->isNextTokenAny([$expectedTokens[$i]->type]));
|
|
$this->assertTrue($this->concreteLexer->isNextTokenAny($allTokenTypes));
|
|
$this->concreteLexer->moveNext();
|
|
}
|
|
}
|
|
|
|
public function testGetLiteral(): void
|
|
{
|
|
$this->assertSame('Doctrine\Tests\Common\Lexer\ConcreteLexer::INT', $this->concreteLexer->getLiteral('int'));
|
|
$this->assertSame('fake_token', $this->concreteLexer->getLiteral('fake_token'));
|
|
}
|
|
|
|
public function testGetLiteralWithEnumLexer(): void
|
|
{
|
|
$enumLexer = new EnumLexer();
|
|
$this->assertSame(
|
|
'Doctrine\Tests\Common\Lexer\TokenType::OPERATOR',
|
|
$enumLexer->getLiteral(TokenType::OPERATOR),
|
|
);
|
|
}
|
|
|
|
public function testIsA(): void
|
|
{
|
|
$this->assertTrue($this->concreteLexer->isA('11', 'int'));
|
|
$this->assertTrue($this->concreteLexer->isA('1.1', 'int'));
|
|
$this->assertTrue($this->concreteLexer->isA('=', 'operator'));
|
|
$this->assertTrue($this->concreteLexer->isA('>', 'operator'));
|
|
$this->assertTrue($this->concreteLexer->isA('<', 'operator'));
|
|
$this->assertTrue($this->concreteLexer->isA('fake_text', 'string'));
|
|
}
|
|
|
|
public function testAddCatchablePatternsToMutableLexer(): void
|
|
{
|
|
$mutableLexer = new MutableLexer();
|
|
$mutableLexer->addCatchablePattern('[a-z]');
|
|
$mutableLexer->setInput('one');
|
|
$token = $mutableLexer->glimpse();
|
|
|
|
$this->assertNotNull($token);
|
|
$this->assertEquals('o', $token->value);
|
|
|
|
$mutableLexer = new MutableLexer();
|
|
$mutableLexer->addCatchablePattern('[a-z]+');
|
|
$mutableLexer->setInput('one');
|
|
$token = $mutableLexer->glimpse();
|
|
|
|
$this->assertNotNull($token);
|
|
$this->assertEquals('one', $token->value);
|
|
}
|
|
|
|
public function testMarkerAnnotationLocaleTr(): void
|
|
{
|
|
setlocale(LC_ALL, 'tr_TR.utf8', 'tr_TR');
|
|
$mutableLexer = new MutableLexer();
|
|
$mutableLexer->addCatchablePattern('[a-z_\\\][a-z0-9_\:\\\]*[a-z_][a-z0-9_]*');
|
|
$mutableLexer->addCatchablePattern('(?:[+-]?[0-9]+(?:[\.][0-9]+)*)(?:[eE][+-]?[0-9]+)?');
|
|
$mutableLexer->addCatchablePattern('"(?:""|[^"])*+"');
|
|
$mutableLexer->setInput('@ODM\Id');
|
|
|
|
self::assertNull($mutableLexer->token);
|
|
self::assertNull($mutableLexer->lookahead);
|
|
self::assertTrue($mutableLexer->moveNext());
|
|
self::assertNull($mutableLexer->token);
|
|
self::assertNotNull($mutableLexer->lookahead);
|
|
self::assertEquals('@', $mutableLexer->lookahead->value);
|
|
self::assertTrue($mutableLexer->moveNext());
|
|
self::assertNotNull($mutableLexer->token);
|
|
self::assertEquals('@', $mutableLexer->token->value);
|
|
self::assertEquals('ODM\Id', $mutableLexer->lookahead->value);
|
|
}
|
|
}
|