2008-04-08 06:17:58 +00:00
|
|
|
<?php
|
|
|
|
|
|
|
|
/**
|
2012-09-27 09:34:00 +12:00
|
|
|
* A tokenised regular expression is a parser, similar to a regular expression, that acts on tokens rather than
|
|
|
|
* characters. This is a crucial component of the ManifestBuilder.
|
2014-08-15 18:53:05 +12:00
|
|
|
*
|
2012-04-12 18:02:46 +12:00
|
|
|
* @package framework
|
2008-06-15 13:33:53 +00:00
|
|
|
* @subpackage core
|
2014-08-15 18:53:05 +12:00
|
|
|
*/
|
2011-02-17 18:05:44 +11:00
|
|
|
class TokenisedRegularExpression {
|
2008-04-08 06:17:58 +00:00
|
|
|
/**
|
|
|
|
* The regular expression definition
|
|
|
|
*/
|
|
|
|
protected $expression;
|
2014-08-15 18:53:05 +12:00
|
|
|
|
2016-05-24 10:30:10 +01:00
|
|
|
/**
|
|
|
|
* The first expression to match
|
|
|
|
*/
|
|
|
|
protected $firstMatch;
|
|
|
|
|
2012-09-19 12:07:39 +02:00
|
|
|
public function __construct($expression) {
|
2008-04-08 06:17:58 +00:00
|
|
|
$this->expression = $expression;
|
2016-05-24 10:30:10 +01:00
|
|
|
$this->firstMatch = is_array($expression[0]) ? $expression[0][0] : $expression[0];
|
2008-04-08 06:17:58 +00:00
|
|
|
}
|
2014-08-15 18:53:05 +12:00
|
|
|
|
2012-09-19 12:07:39 +02:00
|
|
|
public function findAll($tokens) {
|
2008-04-08 06:17:58 +00:00
|
|
|
$tokenTypes = array();
|
|
|
|
foreach($tokens as $i => $token) {
|
|
|
|
if(is_array($token)) {
|
2016-05-24 10:30:10 +01:00
|
|
|
$tokenType = $token[0];
|
2008-04-08 06:17:58 +00:00
|
|
|
} else {
|
2016-05-24 10:30:10 +01:00
|
|
|
$tokenType = $token;
|
2008-04-08 06:17:58 +00:00
|
|
|
// Pre-process string tokens for matchFrom()
|
|
|
|
$tokens[$i] = array($token, $token);
|
|
|
|
}
|
2016-05-24 10:30:10 +01:00
|
|
|
|
|
|
|
if ($tokenType == $this->firstMatch) {
|
|
|
|
$tokenTypes[$i] = $tokenType;
|
|
|
|
}
|
2008-04-08 06:17:58 +00:00
|
|
|
}
|
2011-12-22 15:33:11 +13:00
|
|
|
|
2008-04-08 06:17:58 +00:00
|
|
|
$allMatches = array();
|
2016-05-24 10:30:10 +01:00
|
|
|
foreach($tokenTypes as $startKey => $dud) {
|
2008-04-08 06:17:58 +00:00
|
|
|
$matches = array();
|
|
|
|
if($this->matchFrom($startKey, 0, $tokens, $matches)) {
|
|
|
|
$allMatches[] = $matches;
|
|
|
|
}
|
|
|
|
}
|
2016-05-24 10:30:10 +01:00
|
|
|
|
2008-04-08 06:17:58 +00:00
|
|
|
return $allMatches;
|
|
|
|
}
|
2014-08-15 18:53:05 +12:00
|
|
|
|
2012-09-19 12:07:39 +02:00
|
|
|
public function matchFrom($tokenPos, $expressionPos, &$tokens, &$matches) {
|
2008-04-08 06:17:58 +00:00
|
|
|
$expressionRule = $this->expression[$expressionPos];
|
|
|
|
$expectation = is_array($expressionRule) ? $expressionRule[0] : $expressionRule;
|
|
|
|
if(!is_array($expressionRule)) $expressionRule = array();
|
2014-08-15 18:53:05 +12:00
|
|
|
|
2008-04-08 06:17:58 +00:00
|
|
|
if($expectation == $tokens[$tokenPos][0]) {
|
|
|
|
if(isset($expressionRule['save_to'])) {
|
|
|
|
// Append to an array
|
2012-09-27 09:34:00 +12:00
|
|
|
if(substr($expressionRule['save_to'],-2) == '[]') {
|
|
|
|
$matches[substr($expressionRule['save_to'],0,-2)][] = $tokens[$tokenPos][1];
|
|
|
|
}
|
2008-04-08 06:17:58 +00:00
|
|
|
// Regular variable setting
|
|
|
|
else $matches[$expressionRule['save_to']] = $tokens[$tokenPos][1];
|
|
|
|
}
|
2014-08-15 18:53:05 +12:00
|
|
|
|
2008-04-08 06:17:58 +00:00
|
|
|
// End of the expression
|
|
|
|
if(!isset($this->expression[$expressionPos+1])) {
|
|
|
|
return true;
|
2014-08-15 18:53:05 +12:00
|
|
|
|
2008-04-08 06:17:58 +00:00
|
|
|
// Process next step as normal
|
|
|
|
} else if($this->matchFrom($tokenPos+1, $expressionPos+1, $tokens, $matches)) {
|
|
|
|
return true;
|
|
|
|
|
|
|
|
// This step is optional
|
2014-08-15 18:53:05 +12:00
|
|
|
} else if(isset($expressionRule['optional'])
|
2012-09-27 09:34:00 +12:00
|
|
|
&& $this->matchFrom($tokenPos, $expressionPos+1, $tokens, $matches)) {
|
2008-04-08 06:17:58 +00:00
|
|
|
return true;
|
|
|
|
|
|
|
|
// Process jumps
|
|
|
|
} else if(isset($expressionRule['can_jump_to'])) {
|
|
|
|
if(is_array($expressionRule['can_jump_to'])) foreach($expressionRule['can_jump_to'] as $canJumpTo) {
|
|
|
|
// can_jump_to & optional both set
|
2014-08-15 18:53:05 +12:00
|
|
|
if(isset($expressionRule['optional'])
|
2012-09-27 09:34:00 +12:00
|
|
|
&& $this->matchFrom($tokenPos, $canJumpTo, $tokens, $matches)) {
|
2008-04-08 06:17:58 +00:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
// can_jump_to set (optional may or may not be set)
|
|
|
|
if($this->matchFrom($tokenPos+1, $canJumpTo, $tokens, $matches)) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
} else {
|
|
|
|
// can_jump_to & optional both set
|
2012-09-27 09:34:00 +12:00
|
|
|
if(isset($expressionRule['optional'])
|
|
|
|
&& $this->matchFrom($tokenPos, $expressionRule['can_jump_to'], $tokens, $matches)) {
|
2008-04-08 06:17:58 +00:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
// can_jump_to set (optional may or may not be set)
|
|
|
|
if($this->matchFrom($tokenPos+1, $expressionRule['can_jump_to'], $tokens, $matches)) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
} else if(isset($expressionRule['optional'])) {
|
2012-09-27 09:34:00 +12:00
|
|
|
if(isset($this->expression[$expressionPos+1])) {
|
|
|
|
return $this->matchFrom($tokenPos, $expressionPos+1, $tokens, $matches);
|
|
|
|
}
|
2008-04-08 06:17:58 +00:00
|
|
|
else return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
2014-08-15 18:53:05 +12:00
|
|
|
|
2008-04-08 06:17:58 +00:00
|
|
|
}
|
2012-03-24 16:04:52 +13:00
|
|
|
}
|