模式修改

This commit is contained in:
Jerry Yan 2021-01-26 16:53:37 +08:00
parent 5a5f36d67f
commit f3b66aeac3
7 changed files with 95 additions and 96 deletions

View File

@ -11,10 +11,11 @@
## src目录解析 ## src目录解析
- `Grammar` 语法解析器,验证语法及拆分语法 - `AST` 语法树
- `Grammar` 语法器提供Token识别的规则及种类
- `Output` 输出器,将解析的内容输出(并不执行) - `Output` 输出器,将解析的内容输出(并不执行)
- `Lexer` 词法解析器,将语义转换成正常的语法供`Grammar`使用 - `Lexer` 词法分析器,二次解析`Token``Tokenizer`读取使用
- `Reader` 读取器,供`Tokenizer`读取使用 - `Parser` 语法解析器,生成语法树
- `Reader` 读取器,供`Lexer`读取使用
- `Token` 所有的Token - `Token` 所有的Token
- `Token/Factory` Token工厂生成Token用的
- `Tokenizer` 转换成Token用的 - `Tokenizer` 转换成Token用的

View File

@ -1,12 +1,12 @@
<?php <?php
/** /**
* @filename DefaultFactory.php * @filename DefaultGrammar.php
* @author Jerry Yan <792602257@qq.com> * @author Jerry Yan <792602257@qq.com>
* @date 2020/12/17 14:48 * @date 2020/12/17 14:13
*/ */
namespace JerryYan\DSL\Token\Factory; namespace JerryYan\DSL\Grammar;
use JerryYan\DSL\Token\Token; use JerryYan\DSL\Token\Token;
@ -25,9 +25,9 @@ use JerryYan\DSL\Token\TokenNumber;
use JerryYan\DSL\Token\TokenUseVariable; use JerryYan\DSL\Token\TokenUseVariable;
use JerryYan\DSL\Token\TokenVariable; use JerryYan\DSL\Token\TokenVariable;
class DefaultFactory extends FactoryInterface class DefaultGrammar implements GrammarInterface
{ {
protected $tokenMap = [ protected $tokens = [
Token::FAKE => TokenFake::class, Token::FAKE => TokenFake::class,
Token::CURRY => TokenCurry::class, Token::CURRY => TokenCurry::class,
Token::LOGIC_AND => TokenLogicAnd::class, Token::LOGIC_AND => TokenLogicAnd::class,
@ -44,5 +44,21 @@ class DefaultFactory extends FactoryInterface
Token::USE_VARIABLE => TokenUseVariable::class, Token::USE_VARIABLE => TokenUseVariable::class,
]; ];
protected $undefinedTokenClass = TokenVariable::class; protected $undefinedTokenType = TokenVariable::class;
/**
* @inheritDoc
*/
public function getTokenTypes(): array
{
return $this->tokens;
}
/**
* @inheritDoc
*/
public function getUndefinedTokenType(): string
{
return $this->undefinedTokenType;
}
} }

View File

@ -1,15 +0,0 @@
<?php
/**
* @filename Grammar.php
* @author Jerry Yan <792602257@qq.com>
* @date 2020/12/17 14:13
*/
namespace JerryYan\DSL\Grammar;
class Grammar extends GrammarInterface
{
}

View File

@ -9,7 +9,19 @@
namespace JerryYan\DSL\Grammar; namespace JerryYan\DSL\Grammar;
abstract class GrammarInterface interface GrammarInterface
{ {
/**
* @return array<string, class-string>
* @author Jerry Yan <792602257@qq.com>
* @date 2021/1/26 16:27
*/
public function getTokenTypes(): array;
/**
* @return class-string
* @author Jerry Yan <792602257@qq.com>
* @date 2021/1/26 16:27
*/
public function getUndefinedTokenType(): string;
} }

View File

@ -1,62 +0,0 @@
<?php
/**
* @filename FactoryInterface.php
* @author Jerry Yan <792602257@qq.com>
* @date 2021/1/22 13:42
*/
namespace JerryYan\DSL\Token\Factory;
use JerryYan\DSL\Token\TokenInterface;
use JerryYan\DSL\Token\TokenUndefined;
abstract class FactoryInterface
{
/** @var array<string, class-string<TokenInterface>> Token类型及映射类 */
protected $tokenMap = [];
/** @var array<string, class-string<TokenInterface>> Token别名映射 */
protected $tokenNameMap = [];
/** @var array<string, class-string<TokenInterface>> Token别名映射 */
protected $regexNameMap = [];
/** @var class-string<TokenInterface> 默认Token类 */
protected $undefinedTokenClass = TokenUndefined::class;
public function __construct()
{
/**
* @var string $key
* @var TokenInterface $token
*/
foreach ($this->tokenMap as $key=>$token) {
foreach ($token::$alias as $name) {
$this->tokenNameMap[$name] = $key;
}
foreach ($token::$regexAlias as $name) {
$this->regexNameMap[$name] = $key;
}
}
}
public function getTokenByName(string $name): TokenInterface
{
$originalName = $name;
if (isset($this->tokenNameMap[$name])) {
$name = $this->tokenNameMap[$name];
} else {
foreach ($this->regexNameMap as $regex => $newName) {
if (preg_match($regex, $name) === 1) {
$name = $newName; break;
}
}
}
if (!isset($this->tokenMap[$name])) {
return new $this->undefinedTokenClass($originalName);
} else {
return new $this->tokenMap[$name]($originalName);
}
}
}

View File

@ -9,17 +9,37 @@
namespace JerryYan\DSL\Tokenizer; namespace JerryYan\DSL\Tokenizer;
use JerryYan\DSL\Grammar\GrammarInterface;
use JerryYan\DSL\Reader\ReaderInterface; use JerryYan\DSL\Reader\ReaderInterface;
use JerryYan\DSL\Token\Factory\FactoryInterface;
use JerryYan\DSL\Token\TokenInterface; use JerryYan\DSL\Token\TokenInterface;
class Tokenizer extends TokenizerInterface class Tokenizer extends TokenizerInterface
{ {
/** @var FactoryInterface token工厂 */ /** @var array<string, class-string<TokenInterface>> Token类型及映射类 */
protected $tokenFactory; protected $tokenMapping = [];
public function __construct(FactoryInterface $tokenFactory) /** @var array<string, class-string<TokenInterface>> Token别名映射 */
protected $tokenNameMapping = [];
/** @var array<string, class-string<TokenInterface>> Token别名映射 */
protected $regexNameMapping = [];
/** @var GrammarInterface 语法器 */
protected $grammar;
public function __construct(GrammarInterface $grammar)
{ {
$this->tokenFactory = $tokenFactory; $this->grammar = $grammar;
/**
* @var string $key
* @var TokenInterface $token
*/
foreach ($grammar->getTokenTypes() as $key=>$token) {
$this->tokenMapping[$key] = $token;
foreach ($token::$alias as $name) {
$this->tokenNameMapping[$name] = $key;
}
foreach ($token::$regexAlias as $name) {
$this->regexNameMapping[$name] = $key;
}
}
} }
/** /**
@ -33,11 +53,38 @@ class Tokenizer extends TokenizerInterface
do do
{ {
$currentTokenName = $reader->getCurrentToken(); $currentTokenName = $reader->getCurrentToken();
$currentToken = $this->tokenFactory->getTokenByName($currentTokenName); $currentToken = $this->getTokenByName($currentTokenName);
$currentToken->setPrevToken($lastToken); $currentToken->setPrevToken($lastToken);
if ($lastToken !== NULL) $lastToken->setNextToken($currentToken); if ($lastToken !== NULL) $lastToken->setNextToken($currentToken);
$lastToken = $currentToken; $lastToken = $currentToken;
}while($reader->moveToNextToken()); }while($reader->moveToNextToken());
return $lastToken->getFirstToken(); return $lastToken->getFirstToken();
} }
/**
* 根据文字获取Token
* @param string $name
* @return TokenInterface
* @author Jerry Yan <792602257@qq.com>
* @date 2021/1/26 16:41
*/
protected function getTokenByName(string $name): TokenInterface
{
$originalName = $name;
if (isset($this->tokenNameMapping[$name])) {
$name = $this->tokenNameMapping[$name];
} else {
foreach ($this->regexNameMapping as $regex => $newName) {
if (preg_match($regex, $name) === 1) {
$name = $newName; break;
}
}
}
if (!isset($this->tokenMapping[$name])) {
$undefinedType = $this->grammar->getUndefinedTokenType();
return new $undefinedType($originalName);
} else {
return new $this->tokenMapping[$name]($originalName);
}
}
} }

View File

@ -7,8 +7,8 @@
namespace JerryYan\DSL\Test\Tokenizer; namespace JerryYan\DSL\Test\Tokenizer;
use JerryYan\DSL\Grammar\DefaultGrammar;
use JerryYan\DSL\Reader\StringReader; use JerryYan\DSL\Reader\StringReader;
use JerryYan\DSL\Token\Factory\DefaultFactory;
use JerryYan\DSL\Token\TokenCurry; use JerryYan\DSL\Token\TokenCurry;
use JerryYan\DSL\Token\TokenLogicAnd; use JerryYan\DSL\Token\TokenLogicAnd;
use JerryYan\DSL\Token\TokenInterface; use JerryYan\DSL\Token\TokenInterface;
@ -43,7 +43,7 @@ class TokenizerTest extends TestCase
]; ];
protected function setUp(): void protected function setUp(): void
{ {
$this->tokenizer = new Tokenizer(new DefaultFactory()); $this->tokenizer = new Tokenizer(new DefaultGrammar());
$this->reader = new StringReader($this->text); $this->reader = new StringReader($this->text);
} }