class Lexer
Same name in this branch
- 11.1.x vendor/phpstan/phpdoc-parser/src/Lexer/Lexer.php \PHPStan\PhpDocParser\Lexer\Lexer
- 11.1.x vendor/nikic/php-parser/lib/PhpParser/Lexer.php \PhpParser\Lexer
- 11.1.x vendor/twig/twig/src/Lexer.php \Twig\Lexer
Lexer class
Ported from https://github.com/zaach/jsonlint
Hierarchy
- class \Seld\JsonLint\Lexer
Expanded class hierarchy of Lexer
File
-
vendor/
seld/ jsonlint/ src/ Seld/ JsonLint/ Lexer.php, line 19
Namespace
Seld\JsonLintView source
class Lexer {
/** @internal */
const EOF = 1;
/** @internal */
const T_INVALID = -1;
const T_SKIP_WHITESPACE = 0;
const T_ERROR = 2;
/** @internal */
const T_BREAK_LINE = 3;
/** @internal */
const T_COMMENT = 30;
/** @internal */
const T_OPEN_COMMENT = 31;
/** @internal */
const T_CLOSE_COMMENT = 32;
/**
* @phpstan-var array<int<0,17>, string>
* @const
*/
private $rules = array(
0 => '/\\G\\s*\\n\\r?/',
1 => '/\\G\\s+/',
2 => '/\\G-?([0-9]|[1-9][0-9]+)(\\.[0-9]+)?([eE][+-]?[0-9]+)?\\b/',
3 => '{\\G"(?>\\\\["bfnrt/\\\\]|\\\\u[a-fA-F0-9]{4}|[^\\0-\\x1f\\\\"]++)*+"}',
4 => '/\\G\\{/',
5 => '/\\G\\}/',
6 => '/\\G\\[/',
7 => '/\\G\\]/',
8 => '/\\G,/',
9 => '/\\G:/',
10 => '/\\Gtrue\\b/',
11 => '/\\Gfalse\\b/',
12 => '/\\Gnull\\b/',
13 => '/\\G$/',
14 => '/\\G\\/\\//',
15 => '/\\G\\/\\*/',
16 => '/\\G\\*\\//',
17 => '/\\G./',
);
/** @var string */
private $input;
/** @var bool */
private $more;
/** @var bool */
private $done;
/** @var 0|positive-int */
private $offset;
/** @var int */
private $flags;
/** @var string */
public $match;
/** @var 0|positive-int */
public $yylineno;
/** @var 0|positive-int */
public $yyleng;
/** @var string */
public $yytext;
/** @var array{first_line: 0|positive-int, first_column: 0|positive-int, last_line: 0|positive-int, last_column: 0|positive-int} */
public $yylloc;
/**
* @param int $flags
*/
public function __construct($flags = 0) {
$this->flags = $flags;
}
/**
* @return 0|1|4|6|8|10|11|14|17|18|21|22|23|24|30|-1
*/
public function lex() {
while (true) {
$symbol = $this->next();
switch ($symbol) {
case self::T_SKIP_WHITESPACE:
case self::T_BREAK_LINE:
break;
case self::T_COMMENT:
case self::T_OPEN_COMMENT:
if (!($this->flags & JsonParser::ALLOW_COMMENTS)) {
$this->parseError('Lexical error on line ' . ($this->yylineno + 1) . ". Comments are not allowed.\n" . $this->showPosition());
}
$this->skipUntil($symbol === self::T_COMMENT ? self::T_BREAK_LINE : self::T_CLOSE_COMMENT);
if ($this->done) {
// last symbol '/\G$/' before EOF
return 14;
}
break;
case self::T_CLOSE_COMMENT:
$this->parseError('Lexical error on line ' . ($this->yylineno + 1) . ". Unexpected token.\n" . $this->showPosition());
default:
return $symbol;
}
}
}
/**
* @param string $input
* @return $this
*/
public function setInput($input) {
$this->input = $input;
$this->more = false;
$this->done = false;
$this->offset = 0;
$this->yylineno = $this->yyleng = 0;
$this->yytext = $this->match = '';
$this->yylloc = array(
'first_line' => 1,
'first_column' => 0,
'last_line' => 1,
'last_column' => 0,
);
return $this;
}
/**
* @return string
*/
public function showPosition() {
if ($this->yylineno === 0 && $this->offset === 1 && $this->match !== '{') {
return $this->match . '...' . "\n^";
}
$pre = str_replace("\n", '', $this->getPastInput());
$c = str_repeat('-', max(0, \strlen($pre) - 1));
// new Array(pre.length + 1).join("-");
return $pre . str_replace("\n", '', $this->getUpcomingInput()) . "\n" . $c . "^";
}
/**
* @return string
*/
public function getPastInput() {
$pastLength = $this->offset - \strlen($this->match);
return ($pastLength > 20 ? '...' : '') . substr($this->input, max(0, $pastLength - 20), min(20, $pastLength));
}
/**
* @return string
*/
public function getUpcomingInput() {
$next = $this->match;
if (\strlen($next) < 20) {
$next .= substr($this->input, $this->offset, 20 - \strlen($next));
}
return substr($next, 0, 20) . (\strlen($next) > 20 ? '...' : '');
}
/**
* @return string
*/
public function getFullUpcomingInput() {
$next = $this->match;
if (substr($next, 0, 1) === '"' && substr_count($next, '"') === 1) {
$len = \strlen($this->input);
if ($len === $this->offset) {
$strEnd = $len;
}
else {
$strEnd = min(strpos($this->input, '"', $this->offset + 1) ?: $len, strpos($this->input, "\n", $this->offset + 1) ?: $len);
}
$next .= substr($this->input, $this->offset, $strEnd - $this->offset);
}
elseif (\strlen($next) < 20) {
$next .= substr($this->input, $this->offset, 20 - \strlen($next));
}
return $next;
}
/**
* @param string $str
* @return never
*/
protected function parseError($str) {
throw new ParsingException($str);
}
/**
* @param int $token
* @return void
*/
private function skipUntil($token) {
$symbol = $this->next();
while ($symbol !== $token && false === $this->done) {
$symbol = $this->next();
}
}
/**
* @return 0|1|3|4|6|8|10|11|14|17|18|21|22|23|24|30|31|32|-1
*/
private function next() {
if ($this->done) {
return self::EOF;
}
if ($this->offset === \strlen($this->input)) {
$this->done = true;
}
$token = null;
$match = null;
$col = null;
$lines = null;
if (!$this->more) {
$this->yytext = '';
$this->match = '';
}
$rulesLen = count($this->rules);
for ($i = 0; $i < $rulesLen; $i++) {
if (preg_match($this->rules[$i], $this->input, $match, 0, $this->offset)) {
$lines = explode("\n", $match[0]);
array_shift($lines);
$lineCount = \count($lines);
$this->yylineno += $lineCount;
$this->yylloc = array(
'first_line' => $this->yylloc['last_line'],
'last_line' => $this->yylineno + 1,
'first_column' => $this->yylloc['last_column'],
'last_column' => $lineCount > 0 ? \strlen($lines[$lineCount - 1]) : $this->yylloc['last_column'] + \strlen($match[0]),
);
$this->yytext .= $match[0];
$this->match .= $match[0];
$this->yyleng = \strlen($this->yytext);
$this->more = false;
$this->offset += \strlen($match[0]);
return $this->performAction($i);
}
}
if ($this->offset === \strlen($this->input)) {
return self::EOF;
}
$this->parseError('Lexical error on line ' . ($this->yylineno + 1) . ". Unrecognized text.\n" . $this->showPosition());
}
/**
* @param int $rule
* @return 0|3|4|6|8|10|11|14|17|18|21|22|23|24|30|31|32|-1
*/
private function performAction($rule) {
switch ($rule) {
case 0:
/* skip break line */
return self::T_BREAK_LINE;
case 1:
/* skip whitespace */
return self::T_SKIP_WHITESPACE;
case 2:
return 6;
case 3:
$this->yytext = substr($this->yytext, 1, $this->yyleng - 2);
return 4;
case 4:
return 17;
case 5:
return 18;
case 6:
return 23;
case 7:
return 24;
case 8:
return 22;
case 9:
return 21;
case 10:
return 10;
case 11:
return 11;
case 12:
return 8;
case 13:
return 14;
case 14:
return self::T_COMMENT;
case 15:
return self::T_OPEN_COMMENT;
case 16:
return self::T_CLOSE_COMMENT;
case 17:
return self::T_INVALID;
default:
throw new \LogicException('Unsupported rule ' . $rule);
}
}
}
Members
Title Sort descending | Modifiers | Object type | Summary |
---|---|---|---|
Lexer::$done | private | property | @var bool |
Lexer::$flags | private | property | @var int |
Lexer::$input | private | property | @var string |
Lexer::$match | public | property | @var string |
Lexer::$more | private | property | @var bool |
Lexer::$offset | private | property | @var 0|positive-int |
Lexer::$rules | private | property | @phpstan-var array<int<0,17>, string> @const |
Lexer::$yyleng | public | property | @var 0|positive-int |
Lexer::$yylineno | public | property | @var 0|positive-int |
Lexer::$yylloc | public | property | @var array{first_line: 0|positive-int, first_column: 0|positive-int, last_line: 0|positive-int, last_column: 0|positive-int} |
Lexer::$yytext | public | property | @var string |
Lexer::EOF | constant | @internal | |
Lexer::getFullUpcomingInput | public | function | |
Lexer::getPastInput | public | function | |
Lexer::getUpcomingInput | public | function | |
Lexer::lex | public | function | |
Lexer::next | private | function | |
Lexer::parseError | protected | function | |
Lexer::performAction | private | function | |
Lexer::setInput | public | function | |
Lexer::showPosition | public | function | |
Lexer::skipUntil | private | function | |
Lexer::T_BREAK_LINE | constant | @internal | |
Lexer::T_CLOSE_COMMENT | constant | @internal | |
Lexer::T_COMMENT | constant | @internal | |
Lexer::T_ERROR | constant | ||
Lexer::T_INVALID | constant | @internal | |
Lexer::T_OPEN_COMMENT | constant | @internal | |
Lexer::T_SKIP_WHITESPACE | constant | ||
Lexer::__construct | public | function |