TextMate-style syntax highlighting in PHP
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.
 
 

393 lines
10 KiB

<?php
/** @license MIT
* Copyright 2021 Dustin Wilson et al.
* See LICENSE and AUTHORS files for details */
declare(strict_types=1);
namespace dW\Highlighter\Scope;
/**
 * Recursive-descent parser that turns a scope selector string into a tree of
 * Matcher objects.
 *
 * The grammar implemented by the methods below is, informally:
 *
 *   selector   := composite ( ',' selector? )?
 *   composite  := expression ( ( '|' | '&' | '-' ) composite )?
 *   expression := '-' ( group | path ) | group | path
 *   group      := ( [LRB] ':' )? '(' selector ')'
 *   path       := ( [LRB] ':' )? scope+
 *   scope      := segment ( '.' segment )*
 *   segment    := [A-Za-z0-9+_]+ [A-Za-z0-9+_-]* | '*'
 *
 * Spaces and tabs are skipped between tokens. Every alternative that fails
 * records what it expected through fail(); only the most recent record is kept
 * and it is what parse() reports when the whole selector cannot be parsed.
 *
 * All parsing state lives in a single static instance that is replaced on
 * every call to parse().
 */
class Parser {
    /** Set to true to print a trace of every parse method as it is entered and left. */
    public static $debug = false;

    /** Input buffer holding the selector and the current read position. */
    protected Data $data;
    /** Sequence number printed at the top of each debug() entry. */
    protected int $debugCount = 1;
    /** Last failure recorded by fail() ('expected' and 'found' keys), or [] if none. */
    protected array $lastExceptionData = [];
    /** State of the parse() call currently in progress. */
    protected static Parser $instance;


    /**
     * @param string $selector The selector text to wrap in a Data buffer.
     */
    protected function __construct(string $selector) {
        $this->data = new Data($selector);
    }


    /**
     * Parses a selector string into a matcher tree.
     *
     * @param string $selector The selector to parse.
     * @return Matcher|false The root matcher, or false when nothing matched and
     *                       no failure was recorded.
     * @throws Exception When no selector could be parsed; carries the most
     *                   recently recorded expected/found pair.
     */
    public static function parse(string $selector): Matcher|false {
        self::$instance = new self($selector);

        $result = false;
        self::parseSpace();
        $s2 = self::parseSelector();
        if ($s2 !== false) {
            self::parseSpace();
            $result = $s2;
        }

        if ($result === false && self::$instance->lastExceptionData !== []) {
            throw new Exception(
                self::$instance->lastExceptionData['expected'],
                self::$instance->lastExceptionData['found']
            );
        }

        return $result;
    }

    /**
     * Parses `expression (op composite)?` where op is one of `|`, `&`, `-`.
     *
     * @return Matcher|false A CompositeMatcher when an operator and right-hand
     *                       side are present, otherwise the bare expression,
     *                       or false when no expression could be parsed.
     */
    protected static function parseComposite(): Matcher|false {
        if (self::$debug === true) {
            self::debug();
        }

        $result = false;
        $position = self::$instance->data->position;

        $s1 = self::parseExpression();
        if ($s1 !== false) {
            self::parseSpace();
            $s3 = self::$instance->data->consumeIf('|&-');
            if (in_array($s3, [ '|', '&', '-' ], true)) {
                self::parseSpace();
                $s5 = self::parseComposite();
                if ($s5 !== false) {
                    $result = new CompositeMatcher($s1, $s3, $s5);
                }
            } else {
                self::fail('|&-');
            }
        }

        // No operator (or no right-hand side): rewind and take the expression alone.
        if ($result === false) {
            self::$instance->data->unconsumeTo($position);
            $result = self::parseExpression();
        }

        if (self::$debug === true) {
            self::debugResult($result);
        }

        return $result;
    }

    /**
     * Parses a single expression: an optionally negated group or path.
     *
     * The read position is rewound before each alternative is attempted so that
     * input consumed by a failed alternative (notably the leading `-`) is not
     * lost to the alternatives that follow.
     *
     * @return Matcher|false A NegateMatcher for `-group` / `-path`, the group or
     *                       path matcher itself otherwise, or false on failure.
     */
    protected static function parseExpression(): Matcher|false {
        if (self::$debug === true) {
            self::debug();
        }

        $result = false;
        $position = self::$instance->data->position;

        $s1 = self::$instance->data->consumeIf('-');
        if ($s1 === '-') {
            self::parseSpace();
            $operandPosition = self::$instance->data->position;

            // Negated group first, then negated path from the same spot.
            $s3 = self::parseGroup();
            if ($s3 === false) {
                self::$instance->data->unconsumeTo($operandPosition);
                $s3 = self::parsePath();
            }

            if ($s3 !== false) {
                self::parseSpace();
                $result = new NegateMatcher($s3);
            }
        } else {
            self::fail('-');
        }

        if ($result === false) {
            // Un-negated alternatives start over from the original position.
            self::$instance->data->unconsumeTo($position);
            $result = self::parseGroup();
            if ($result === false) {
                self::$instance->data->unconsumeTo($position);
                $result = self::parsePath();
            }
        }

        if (self::$debug === true) {
            self::debugResult($result);
        }

        return $result;
    }

    /**
     * Parses a parenthesised selector with an optional `L:`, `R:` or `B:` prefix.
     *
     * On failure the read position is restored to where it was on entry, so a
     * prefix consumed here remains available to whichever alternative the
     * caller tries next.
     *
     * @return Matcher|false A GroupMatcher, or false when the input is not a group.
     */
    protected static function parseGroup(): Matcher|false {
        if (self::$debug === true) {
            self::debug();
        }

        $result = false;
        $prefix = null;
        $position = self::$instance->data->position;

        $s2 = self::$instance->data->consumeIf('LRB');
        if ($s2 === '' || $s2 === false) {
            self::fail('LRB');
        } else {
            $s3 = self::$instance->data->consumeIf(':');
            if ($s3 === ':') {
                $prefix = "$s2$s3";
            } else {
                self::fail(':');
                // A lone L/R/B is not a prefix; give the letter back.
                self::$instance->data->unconsumeTo($position);
            }
        }

        $s2 = self::$instance->data->consumeIf('(');
        if ($s2 === '(') {
            self::parseSpace();
            $s4 = self::parseSelector();
            if ($s4 !== false) {
                self::parseSpace();
                $s6 = self::$instance->data->consumeIf(')');
                if ($s6 === '' || $s6 === false) {
                    self::fail(')');
                } else {
                    $result = new GroupMatcher($prefix, $s4);
                }
            }
        } else {
            self::fail('(');
        }

        if ($result === false) {
            self::$instance->data->unconsumeTo($position);
        }

        if (self::$debug === true) {
            self::debugResult($result);
        }

        return $result;
    }

    /**
     * Parses one or more whitespace-separated scopes with an optional `L:`,
     * `R:` or `B:` prefix.
     *
     * A leading L/R/B that is not followed by `:` is treated as the first
     * character of the scope name rather than being discarded. On failure the
     * read position is restored to where it was on entry.
     *
     * @return Matcher|false A PathMatcher, or false when no scope could be parsed.
     */
    protected static function parsePath(): Matcher|false {
        if (self::$debug === true) {
            self::debug();
        }

        $result = false;
        $prefix = null;
        $position = self::$instance->data->position;

        $s2 = self::$instance->data->consumeIf('LRB');
        if (in_array($s2, [ 'L', 'R', 'B' ], true)) {
            $s3 = self::$instance->data->consumeIf(':');
            if ($s3 === '' || $s3 === false) {
                self::fail(':');
                // Not a prefix after all: the letter belongs to the scope name.
                self::$instance->data->unconsumeTo($position);
            } else {
                $prefix = "$s2$s3";
            }
        } else {
            self::fail('LRB');
        }

        $s2 = self::parseScope();
        if ($s2 !== false) {
            $s3 = [ $s2 ];
            do {
                self::parseSpace();
                $s6 = self::parseScope();
                if ($s6 !== false) {
                    $s3[] = $s6;
                }
            } while ($s6 !== false);

            $result = new PathMatcher($prefix, ...$s3);
        } else {
            self::$instance->data->unconsumeTo($position);
        }

        if (self::$debug === true) {
            self::debugResult($result);
        }

        return $result;
    }

    /**
     * Parses one dot-delimited piece of a scope: either a name or the `*` wildcard.
     *
     * A name starts with one or more of `A-Z a-z 0-9 + _`; the remainder may
     * additionally contain `-`. Surrounding spaces and tabs are consumed.
     *
     * @return SegmentMatcher|TrueMatcher|false A SegmentMatcher for a name, a
     *                                          TrueMatcher for `*`, or false.
     */
    protected static function parseSegment(): SegmentMatcher|TrueMatcher|false {
        if (self::$debug === true) {
            self::debug();
        }

        $result = false;

        self::parseSpace();
        $s2 = self::$instance->data->consumeWhile('ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+_');
        if ($s2 === '' || $s2 === false) {
            $s2 = false;
            self::fail('ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+_');
        }

        if ($s2 !== false) {
            // The tail is optional; an empty tail leaves the name as it is.
            $s3 = self::$instance->data->consumeWhile('ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+_');
            if ($s3 === '' || $s3 === false) {
                self::fail('ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+_');
            } else {
                $s2 .= $s3;
            }

            self::parseSpace();
            $result = new SegmentMatcher($s2);
        }

        if ($result === false) {
            self::parseSpace();
            $s2 = self::$instance->data->consumeIf('*');
            if ($s2 === '*') {
                self::parseSpace();
                $result = new TrueMatcher($s2);
            } else {
                self::fail('*');
            }
        }

        if (self::$debug === true) {
            self::debugResult($result);
        }

        return $result;
    }

    /**
     * Parses a comma-separated list of composites.
     *
     * A trailing comma with nothing parseable after it is tolerated: the
     * composite before it is returned on its own.
     *
     * @return Matcher|false An OrMatcher when two or more alternatives are
     *                       present, a single composite otherwise, or false.
     */
    protected static function parseSelector(): Matcher|false {
        if (self::$debug === true) {
            self::debug();
        }

        $result = false;
        $position = self::$instance->data->position;

        $s1 = self::parseComposite();
        if ($s1 !== false) {
            self::parseSpace();
            $s3 = self::$instance->data->consumeIf(',');
            if ($s3 === ',') {
                self::parseSpace();
                $s5 = self::parseSelector();
                $result = ($s5 === false) ? $s1 : new OrMatcher($s1, $s5);
            } else {
                self::fail(',');
            }
        }

        // No comma: rewind and take the composite alone.
        if ($result === false) {
            self::$instance->data->unconsumeTo($position);
            $result = self::parseComposite();
        }

        if (self::$debug === true) {
            self::debugResult($result);
        }

        return $result;
    }

    /**
     * Parses a scope: one or more segments joined by `.`.
     *
     * @return ScopeMatcher|false A ScopeMatcher built from the parsed segments,
     *                            or false when the first segment is missing.
     */
    protected static function parseScope(): ScopeMatcher|false {
        if (self::$debug === true) {
            self::debug();
        }

        $result = false;

        $s1 = self::parseSegment();
        if ($s1 !== false) {
            $s2 = [ $s1 ];
            do {
                $s3 = false;
                $s4 = self::$instance->data->consumeIf('.');
                if ($s4 === '.') {
                    $s3 = self::parseSegment();
                    if ($s3 !== false) {
                        $s2[] = $s3;
                    }
                } else {
                    self::fail('.');
                }
            } while ($s3 !== false);

            $result = new ScopeMatcher(...$s2);
        }

        if (self::$debug === true) {
            self::debugResult($result);
        }

        return $result;
    }

    /**
     * Consumes a run of spaces and tabs at the current position.
     *
     * @return string|false Whatever Data::consumeWhile() returned; a false
     *                      return is recorded through fail().
     */
    protected static function parseSpace(): string|false {
        if (self::$debug === true) {
            self::debug();
        }

        $result = self::$instance->data->consumeWhile(" \t");
        if ($result === false) {
            self::fail(" \t");
        }

        if (self::$debug === true) {
            self::debugResult($result);
        }

        return $result;
    }


    /**
     * Prints a trace entry for the parse method that called it: a running
     * counter, the chain of calling methods, the read position and the next
     * character.
     *
     * @return void
     */
    protected static function debug() {
        $message = <<<DEBUG
        ------------------------------
        %s
        Method: %s
        Position: %s
        Char: %s
        DEBUG;

        $methodTree = '';
        $backtrace = debug_backtrace();
        // Drop this method's own frame and the outermost frame.
        array_shift($backtrace);
        array_pop($backtrace);
        // Frames are innermost-first, so prepend to get an outermost-first chain.
        foreach ($backtrace as $b) {
            $methodTree = "->{$b['function']}$methodTree";
        }

        printf($message,
            self::$instance->debugCount++,
            ltrim($methodTree, '->'),
            self::$instance->data->position,
            var_export(self::$instance->data->peek(), true)
        );
    }

    /**
     * Prints the result a parse method is about to return, labelled with that
     * method's name.
     *
     * @param mixed $result The value being returned by the calling method.
     * @return void
     */
    protected static function debugResult($result) {
        printf("%s Result: %s\n",
            debug_backtrace()[1]['function'],
            var_export($result, true));
    }

    /**
     * Records what the parser expected at the current position, replacing any
     * previously recorded failure.
     *
     * @param string $expected The character set that would have been accepted.
     * @return void
     */
    protected static function fail(string $expected) {
        self::$instance->lastExceptionData = [
            'expected' => $expected,
            'found' => self::$instance->data->peek()
        ];
    }
}