/usr/share/php/Nette/Tokenizer/Tokenizer.php is in php-nette 2.4-20160731-1.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 | <?php
/**
* This file is part of the Nette Framework (https://nette.org)
* Copyright (c) 2004 David Grudl (https://davidgrudl.com)
*/
namespace Nette\Utils;
/**
* Simple lexical analyser.
*/
class Tokenizer
{
const VALUE = 0,
OFFSET = 1,
TYPE = 2;
/** @var string */
private $re;
/** @var array|FALSE */
private $types;
/**
* @param array of [(int|string) token type => (string) pattern]
* @param string regular expression flags
*/
public function __construct(array $patterns, $flags = '')
{
$this->re = '~(' . implode(')|(', $patterns) . ')~A' . $flags;
$keys = array_keys($patterns);
$this->types = $keys === range(0, count($patterns) - 1) ? FALSE : $keys;
}
/**
* Tokenizes string.
* @param string
* @return array
* @throws TokenizerException
*/
public function tokenize($input)
{
if ($this->types) {
preg_match_all($this->re, $input, $tokens, PREG_SET_ORDER);
$len = 0;
$count = count($this->types);
foreach ($tokens as & $match) {
$type = NULL;
for ($i = 1; $i <= $count; $i++) {
if (!isset($match[$i])) {
break;
} elseif ($match[$i] != NULL) {
$type = $this->types[$i - 1]; break;
}
}
$match = array(self::VALUE => $match[0], self::OFFSET => $len, self::TYPE => $type);
$len += strlen($match[self::VALUE]);
}
if ($len !== strlen($input)) {
$errorOffset = $len;
}
} else {
$tokens = preg_split($this->re, $input, -1, PREG_SPLIT_NO_EMPTY | PREG_SPLIT_OFFSET_CAPTURE | PREG_SPLIT_DELIM_CAPTURE);
$last = end($tokens);
if ($tokens && !preg_match($this->re, $last[0])) {
$errorOffset = $last[1];
}
}
if (isset($errorOffset)) {
list($line, $col) = $this->getCoordinates($input, $errorOffset);
$token = str_replace("\n", '\n', substr($input, $errorOffset, 10));
throw new TokenizerException("Unexpected '$token' on line $line, column $col.");
}
return $tokens;
}
/**
* Returns position of token in input string.
* @param string
* @param int
* @return array of [line, column]
*/
public static function getCoordinates($text, $offset)
{
$text = substr($text, 0, $offset);
return array(substr_count($text, "\n") + 1, $offset - strrpos("\n" . $text, "\n") + 1);
}
}
|