仓酷云
标题:
PHP网站制作之分享我写的PHP文法剖析的源码
[打印本页]
作者:
再现理想
时间:
2015-2-3 23:30
标题:
PHP网站制作之分享我写的PHP文法剖析的源码
说说这一个月左右的学习情况和心得吧!我个人认为,既然决定了去做一件事,那就要以认真的态度去对待!既然决定来学习了,那不管当初是抱着怎样的心态来到这个培训班的,都要让自己认真的投入到学习中。 比来测验考试做了文法剖析的东东,成绩较多。
请提建议。代码放不下,分两页。
下载地址 http://download.csdn.net/detail/xuzuning/4529066
PHP code
include 'ttrie.php'; class Rule extends TTrie { public $rule = array(); public $savematch = 0; function __construct($s='') { $this->set( array( ' ' => 'Separated', "\r\n" => 'set_rule', "\n" => 'set_rule', "\t" => 'Separated', '->' => 'Separated', '→' => 'Separated', '' => 'set_parallel_rule', )); $this->match($s); if($this->rule[0][0] == $this->rule[0][1]) { if(count($this->rule[0]) == 2) $this->rule[0][0] .= "'"; else array_unshift($this->rule, array($this->rule[0][0]."'", $this->rule[0][0])); }else { $c = $this->rule[0][0]; $n = 0; foreach($this->rule as $r) if($r[0] == $c) $n++; if($n > 1) array_unshift($this->rule, array($this->rule[0][0]."'", $this->rule[0][0])); } } function Separated() { } function set_rule() { $this->rule[] = $this->buffer; $this->buffer = array(); } function set_parallel_rule() { $t = $this->buffer[0]; $this->set_rule(); $this->buffer[] = $t; } } class Grammar { var $closure = array(); var $first = array(); var $follow = array(); var $rule = array(); var $identifier = array(); var $leay = array(); var $forecast = array(); var $stack = array(); var $ll = 'LL(0)'; var $lr = 'LR(0)'; function __construct($s='') { $p = new Rule($s); $this->rule = $p->rule; $this->set_grammar(); } function set_grammar() { foreach($this->rule as $rule) { if(! in_array($rule[0], $this->identifier)) $this->identifier[] = $rule[0]; } foreach($this->rule as $rule) { foreach($rule as $v) if(! in_array($v, $this->identifier) && ! in_array($v, $this->leay)) $this->leay[] = $v; } $this->set_first(); $this->set_follow(); $this->set_closure(); $this->set_select(); $this->set_forecast(); } function set_first() { foreach($this->rule as $rule) $this->first[$rule[0]] = array(); //直吸收
取 形如U->a…的发生
式(个中
a是终结符),把a支出
到First(U)中 foreach($this->rule as $v) { if(in_array($v[1], $this->leay)) $this->first[$v[0]][] = $v[1]; } //重复
传递 形入U->P1P2P3…Pn的发生
式(个中
P长短
终结符),应先把First(P1)中的全体
内容传送到First(U)中,假如
P1中有ε,把First(P2)中的内容传送到First(U)中,类推直到Pi中无ε do { $t = serialize($this->first); foreach($this->rule as $rule) { for($i=1; $i<count($rule); $i++) { $v = $rule[$i]; if(in_array($v, $this->identifier)) { $this->first[$rule[0]] = array_unique(array_merge($this->first[$rule[0]], $this->first[$v])); if(! in_array('#', $this->first[$v])) break; }else break; } } }while($t != serialize($this->first)); } function set_follow() { foreach($this->rule as $rule) $this->follow[$rule[0]] = array(); //直吸收
取 形如 …Ua… 的,把a直吸收
入到Follow(U)中 foreach($this->rule as $rule) { for($i=1; $i<count($rule)-1; $i++) { if(in_array($rule[$i], $this->identifier) && in_array($rule[$i+1], $this->leay)) $this->follow[$rule[$i]][] = $rule[$i+1]; } if(in_array($rule[$i], $this->identifier)) $this->follow[$rule[$i]][] = '#'; } foreach($this->follow as &$v) if(! $v) $v[] = '#'; //直吸收
取 形如 …UP…(P长短
终结符)的,把First(P)中非ε支出
到Follow(U)中 foreach($this->rule as $rule) { for($i=1; $i<count($rule)-1; $i++) { if(in_array($rule[$i], $this->identifier) && in_array($rule[$i+1], $this->identifier)) { $this->follow[$rule[$i]] = array_unique(array_merge($this->follow[$rule[$i]], array_diff($this->first[$rule[$i+1]], array('#')))); } } } //重复
传递 形如U->aP的(P长短
终结符)或U->aPQ(P,Q为非终结符且Q中含ε),应把Follow(U)中的全体
内容传送到Follow(P)中 do { $t = serialize($this->follow); foreach($this->rule as $rule) { $s = $rule[0]; $d = end($rule); if(in_array($d, $this->leay)) continue; $p = prev($rule); if(in_array($p, $this->leay)) $this->follow[$d] = array_unique(array_merge($this->follow[$d], $this->follow[$s])); elseif(in_array('#', $this->follow[$d])) $this->follow[$p] = array_unique(array_merge($this->follow[$p], $this->follow[$s])); } }while($t != serialize($this->follow)); } function set_closure() { $shift = array(); $this->closure[0][] = array('offs' => 1, 'rule' => 0); for($i=0 ; $i < count($this->closure); $i++) { $cnt = count($this->closure); //机关
闭包 closure $ex = array(); $j = 0; $tmp = array(); do { $size = count($this->closure[$i]); for($j=0; $j<count($this->closure[$i]); $j++) { $dfa = $this->closure[$i][$j]; $rule = $this->rule[$dfa['rule']]; if(isset($rule[$dfa['offs']])) { $ch = $ex[] = $rule[$dfa['offs']]; } foreach($this->rule as $r=>$rule) { if(in_array($rule[0], $ex)) { $t = array('offs' => 1, 'rule' => $r); if(!isset($tmp[$r][1])) $this->closure[$i][] = $t; $tmp[$r][1] = 1; } } } }while(count($this->closure[$i]) != $size); //直到不再增大 //判别
形态
转向 go $out = array(); foreach($this->closure[$i] as $k=>$dfa) { $rule = $this->rule[$dfa['rule']]; if(isset($rule[$dfa['offs']])) { $t = "$dfa[rule],$dfa[offs]"; $ch = $rule[$dfa['offs']]; $this->closure[$i][$k]['char'] = $ch; if(isset($out[$ch])) $shift[$t] = $out[$ch]; if(isset($shift[$t])) { $this->closure[$i][$k]['target'] = $shift[$t]; $dfa['offs']++; if(!$this->in_closure($dfa, $this->closure[$shift[$t]])) $this->closure[$shift[$t]][] = $dfa; } else { $cnt = count($this->closure); $this->closure[$i][$k]['target'] = $cnt; $shift[$t] = $cnt; $dfa['offs']++; $this->closure[count($this->closure)][] = $dfa; $out[$ch] = $cnt; } } } //机关
形态
转换表 foreach($this->closure[$i] as $k=>$dfa) { if(isset($dfa['target'])) { $v = $dfa['char']; if(in_array($v, $this->identifier)) $this->goto[$i][$v] = $dfa['target']; else { $this->action[$i][$v][] = "S$dfa[target]"; $this->request[$i][$v] = $dfa['rule']; } } else { $ch = $this->rule[$dfa['rule']][0]; foreach($this->follow[$ch] as $v) { $this->action[$i][$v][] = "r$dfa[rule]"; $this->request[$i][$v] = $dfa['rule']; } } } foreach($this->action[$i] as $c=>$v) { $v = array_unique($v); if(count($v) > 1) $this->lr = 'SLR(1)'; $this->action[$i][$c] = $v; } } } function in_closure($t, $s) { foreach($s as $r) if($t['offs'] == $r['offs'] && $t['rule'] == $r['rule']) return true; return false; return in_array(serialize($t), array_map('serialize', $s)); } function set_select() { foreach($this->rule as $i=>$rule) { $y = array($rule[1]); if(in_array($y[0], $this->leay)) { if($y[0] != '#') { $this->select[$i] = $y; continue; } }else $y = $this->first[$rule[1]]; $x = $this->follow[$rule[0]]; //SELECT(X->Y)=(FIRST(Y)-{ε})并FOLLOW(X) $this->select[$i] = array_unique( array_merge(array_diff($y, array('#')), $x) ); } } /** * 机关
展望
剖析
表 **/ function set_forecast() { foreach($this->select as $i=>$r) { $c = $this->rule[$i][0]; $v = array_reverse(array_slice($this->rule[$i], 1)); foreach($r as $k) { $this->forecast[$c][$k][] = $v; } } //反省
抵触
foreach($this->forecast as $c=>$r) { foreach($r as $k) { if(count($k) > 1) { $this->ll = 'LL(1)'; } } } }
复制代码
续
PHP code
复制代码
function ll_start($s) { $t = array(); foreach($this->rule as $rule) if($rule[0] == $rule[1]) $t[] = $rule; if($t) { foreach($t as $rule) printf('<tr><td colspan=4>%s 存在左递归</td></tr>', preg_replace('/ /', ' → ', join(' ', $rule), 1)); return; } $stack = array('#', key($this->forecast)); $i = 0; $step = 1; $timeout = 10 * strlen($s); while($stack && $i < strlen($s) && $timeout--) { $r = end($stack); if($r == $s{$i}) { $msg = $r == '#' ? '胜利
' : "$r 婚配
"; }elseif(isset($this->forecast[$r][$s{$i}])) $msg = $r . ' → ' . join(' ', array_reverse($this->forecast[$r][$s{$i}][0])); else $msg = '毛病
'; printf("<tr><td>%d</td><td>%s</td><td>%s</td><td>%s</td></tr>", $step++, substr(join('', $stack), -50), substr($s, $i), $msg); if($r == $s{$i}) { array_pop($stack); $i++; }elseif(isset($this->forecast[$r][$s{$i}])) { array_pop($stack); if(current($this->forecast[$r][$s{$i}][0]) != '#') $stack = array_merge($stack, $this->forecast[$r][$s{$i}][0]); }else break; } } function lr_start($s) { $State = array(0); //形态
栈 $Symbol = array('#'); //符号栈 $i = 0; $step = 1; $timeout = 10 * strlen($s); while($i < strlen($s) && $timeout--) { $ch = $s{$i}; $sp = end($State); $msg = substr($s, $i); if(isset($this->action[$sp][$ch]) && $this->action[$sp][$ch][0] == 'r0') $msg = 'acc'; if(isset($this->request[$sp][$ch])) $request = preg_replace('/ /', ' → ', join(' ', $this->rule[$this->request[$sp][$ch]]), 1); else $request = 'error'; printf("<tr><th>%d</td><td>%s</td><td>%s</td><td>%s</td><td>%s</td></tr>", $step++, substr(join('', $State), -50), join('', $Symbol), $msg, $request); if(isset($this->action[$sp][$ch]) isset($this->goto[$sp][$ch])) { $t = isset($this->action[$sp][$ch]) ? $this->action[$sp][$ch][0] : $this->goto[$sp][$ch]; $n = substr($t, 1) + 0; if($t{0} == 'r') { for($j=0; $j<count($this->rule[$n])-1; $j++) { array_pop($State); array_pop($Symbol); } if($n == 0) break; $c = $Symbol[] = $this->rule[$n][0]; $State[] = $this->goto[end($State)][$c]; }elseif($t{0} == 'S') { $State[] = $n; $Symbol[] = $ch; $i++; }else ; }else break; } } function report($in='') { if($in) $in = trim($in, '#') . '#'; echo '<style>table {font-size:10pt</style>'; echo '<table ><tr><td><b>文法</b></td></tr>'; foreach($this->rule as $rule) { echo '<tr><td>'; echo preg_replace('/ /', ' → ', join(' ', $rule), 1); echo '</td></tr>'; } echo '</table>'; $identifier = $this->identifier; echo '<table><tr><td><b>标识符</b></td>'; echo '<td>' . join(' ', $identifier) . '</td></tr>'; echo '</table>'; $leay = array_diff($this->leay, array('#')); $leay[] = '#'; echo '<table><tr><td><b>终结符</b></td>'; echo '<td>' . join(' ', $leay) . '</td></tr>'; echo '</table>'; echo '<table width=60% border=1><tr><th>标识符</th><th>推出空</th><th>FIRST集</th><th>FOLLOW集</th></tr>'; foreach($identifier as $ch) { echo '<tr><td>' . $ch . '</td>'; echo '<td>' . (in_array('#', $this->first[$ch]) ? 'True' : 'false') . '</td>'; echo '<td>' . join(' ', $this->first[$ch]) . '</td>'; echo '<td>' . join(' ', $this->follow[$ch]) . '</td>'; echo '</tr>'; } echo '</table>'; echo '<table width=100%><tr><td> </td></tr><tr><th>' . $this->ll . '文法剖析
</th></tr></table>'; echo '<table width=60% border=1><tr><th>发生
式</th><th>Select集</th></tr>'; foreach($this->rule as $i=>$rule) { echo '<tr>'; echo '<td>' . preg_replace('/ /', ' → ', join(' ', $rule), 1) . '</td>'; echo '<td>' . join(' ', $this->select[$i]) . '</td>'; echo '</tr>'; } echo '</table>'; $forecast = $this->forecast; echo '<table width=60%><tr><td><b>展望
剖析
表</b></td></tr>'; echo '<tr><td><table width=100% border=1>'; echo '<tr><th> </th><th>' . join('</th><th>', $leay) . '</th></tr>'; foreach($identifier as $ch) { echo '<tr><td>' . $ch . '</td>'; foreach($leay as $v) { $s = ''; if(isset($forecast[$ch][$v])) { foreach($forecast[$ch][$v] as $t) { if($s) $s .= '<br />'; $s .= $ch . ' → '. join(' ', array_reverse($t)); } if(count($forecast[$ch][$v]) > 1) $s = "<font color=red>$s</font>"; }else $s .= ' '; echo '<td>' . $s . '</td>'; } echo '<tr>'; } echo '</table></td></tr>'; echo '</table>'; if($in) { echo '<table><tr><th>测试字符串</th>'; echo '<td>' . trim($in, '#') . '</td></tr></table>'; echo '<table width=100% border=1>'; echo '<tr><th>步调
</th><th>剖析
栈</th><th>残剩
字符</th><th>生成式或婚配
</th></tr>'; $this->ll_start($in); echo '</table>'; } echo '<table width=100%><tr><td> </td></tr>'; echo '<tr><th>' . $this->lr . '文法剖析
<th></tr></table>'; echo '<table><tr><th>形态
转移表</th></tr></table>'; echo '<table width=100% border=1>'; echo '<tr><th rowspan=2>形态
</th><th colspan=' . count($leay) . '>Action</th><th colspan=' . count($identifier) . '>Goto</th><th rowspan=2>DFA</th></tr>'; echo '<tr><th>' . join('</th><th>', $leay) . '</th><th>'. join('</th><th>', $identifier) . '</th></tr>'; foreach($this->action as $i=>$item) { echo "<tr><td>$i</td>"; foreach($leay as $v) { $s = isset($item[$v]) ? join(',', $item[$v]) : ' '; if(strpos($s, ',')) $s = "<font color=red>$s</font>"; echo "<td>$s</td>"; } foreach($identifier as $v) { $s = isset($this->goto[$i][$v]) ? $this->goto[$i][$v] : ' '; echo "<td>$s</td>"; } echo '<td>' . $this->showDFA($i) .'</td>'; echo '</tr>'; } echo '</table>'; if($in) { echo '<table><tr><th>测试字符串</th>'; echo '<td>' . trim($in, '#') . '</td></tr></table>'; echo '<table width=100% border=1>'; echo '<tr><th>步调
</th><th>形态
栈</th><th>符号栈</th><th>残剩
字符</th><th>生成式</th></tr>'; $this->lr_start($in); echo '</table>'; } } function showDFA($i) { $res = array(); foreach($this->closure[$i] as $dfa) { $rule = $this->rule[$dfa['rule']]; array_splice($rule, $dfa['offs'], 0, '·'); array_splice($rule, 1, 0, '→'); if(isset($dfa['target'])) $rule[] = " [$dfa[target]]"; $res[] = join('', $rule); } return join('; ', $res); } } for($i=1; $i<=count(glob('*.txt')); $i++) echo " <a href=?id=$i>$i</a>"; $n = current($_GET) or $n = 1; $S = ''; include "$n.txt"; $p = new grammar($G); $p->report($S);
复制代码
ttrie.php
PHP code
<?php class TTrie { protected $buffer = array(); protected $dict = array( array() ); protected $input = 0; //字符串以后
偏移 protected $backtracking = 0; //字符串回溯地位
public $debug = 0; public $savematch = 1; function set($word, $action='') { if(is_array($word)) { foreach($word as $k=>$v) $this->set($k, $v); return; } $p = count($this->dict); $cur = 0; //以后
节点号 foreach(str_split($word) as $c) { if (isset($this->dict[$cur][$c])) { //已存在就下移 $cur = $this->dict[$cur][$c]; continue; } $this->dict[$p]= array(); //创立
新节点 $this->dict[$cur][$c] = $p; //在父节点纪录
子节点号 $cur = $p; //把以后
节点设为新拔出
的 $p++; } $this->dict[$cur]['acc'] = $action; //一个词停止
,标志
叶子节点 } function match($s) { $ret = array(); $cur = 0; //以后
节点,初始为根节点 $i =& $this->input; //字符串以后
偏移 $p =& $this->backtracking; //字符串回溯地位
$s .= "\0"; //附加停止
符 $len = strlen($s); $buf = ''; while($i < $len) { $c = $s{$i}; if(isset($this->dict[$cur][$c])) { //假如
存在 $cur = $this->dict[$cur][$c]; //转到对应的地位
if(isset($this->dict[$cur][$s[$i+1]])) {//反省
下一个字符是不是
也能婚配
,长度优先 $i++; continue; } if(isset($this->dict[$cur]['acc'])) { //是叶子节点,单词婚配
! if($buf) { $this->buffer[] = $buf; $buf = ''; } if($this->savematch) $this->buffer[] = substr($s, $p, $i - $p + 1); //掏出
婚配
地位
和婚配
的词 $ar = explode(',', $this->dict[$cur]['acc']); call_user_func_array( array($this, array_shift($ar)), $ar ); $p = $i + 1; //设置下一个回溯地位
$cur = 0; //重置以后
节点为根节点 } } else { //不婚配
$buf .= $s{$p}; //substr($s, $p, $i - $p + 1); //保留
未婚配
地位
和未婚配
的内容 $cur = 0; //重置以后
节点为根节点 $i = $p; //把以后
偏移设为回溯地位
$p = $i + 1; //设置下一个回溯地位
} $i++; //下一个字符 } if(trim($buf, "\0")) $this->buffer[] = trim($buf, "\0"); } function __call($method, $param) { if($this->debug) printf("偏移:%d 回溯:%d\n", $this->input, $this->backtracking); } }
复制代码
我的这套线路可能跟许多学习PHP的爱好者不谋而合,这也算是一个循序渐进的学习过程,不过新手不要看到上面的概括就以为学习蛮简单的,默默在此不得不对您稍微泼一下冷水,任何东西其实都不简单。
作者:
飘飘悠悠
时间:
2015-2-4 00:06
当然这种网站的会员费就几十块钱。
作者:
若天明
时间:
2015-2-9 07:53
曾经犯过一个很低级的错误,我在文件命名的时候用了一个横线\\\\\\\'-\\\\\\\' 号,结果找了好几个小时的错误,事实是命名的时候 是不能用横线 \\\\\\\'-\\\\\\\' 的,应该用的是下划线 \\\\\\\'_\\\\\\\' ;
作者:
灵魂腐蚀
时间:
2015-2-27 04:41
环境搭建好,当你看见你的浏览器输出“it works\\\\\\\"时你一定是喜悦的。在你解决问题的时候,我强烈建议多读php手册。
作者:
深爱那片海
时间:
2015-3-1 19:41
写的比较杂,因为我也是个新手,不当至于大家多多指正。
作者:
简单生活
时间:
2015-3-2 14:22
首先我是坚决反对新手上来就用框架的,因为对底层的东西一点都不了解,造成知识上的真空,会对以后的发展不利。我的观点上手了解下框架就好,代码还是手写。当然啦如果是位别的编程语言的高手的话,这个就另当别论啦。
作者:
莫相离
时间:
2015-3-3 16:43
做为1门年轻的语言,php一直很努力。
作者:
透明
时间:
2015-3-11 01:37
php里的数组为空的时候是不能拿来遍历的;(这个有点低级啊,不过我刚被这个边界问题墨迹了好长一会)
作者:
只想知道
时间:
2015-3-11 09:15
首先我是坚决反对新手上来就用框架的,因为对底层的东西一点都不了解,造成知识上的真空,会对以后的发展不利。我的观点上手了解下框架就好,代码还是手写。当然啦如果是位别的编程语言的高手的话,这个就另当别论啦。
作者:
因胸联盟
时间:
2015-3-13 04:09
如果你已经到这种程度了,那么你已经可以做我的老师了。其实php也分很多的区域,
作者:
金色的骷髅
时间:
2015-3-20 12:19
当留言板完成的时候,下步可以把做1个单人的blog程序,做为目标,
作者:
admin
时间:
2015-3-23 18:14
曾经犯过一个很低级的错误,我在文件命名的时候用了一个横线\\\\\\\'-\\\\\\\' 号,结果找了好几个小时的错误,事实是命名的时候 是不能用横线 \\\\\\\'-\\\\\\\' 的,应该用的是下划线 \\\\\\\'_\\\\\\\' ;
作者:
蒙在股里
时间:
2015-4-1 21:11
爱上php,他也会爱上你。
作者:
谁可相欹
时间:
2015-4-4 02:01
当然这种网站的会员费就几十块钱。
作者:
老尸
时间:
2015-4-6 20:22
我学习了一段时间后,我发现效果并不好(估计是我自身的问题)。因为一个人的精力总是有限的,同时学习这么多,会导致每个的学习时间都得不到保证。
作者:
飘灵儿
时间:
2015-4-11 05:10
兴趣是最好的老师,百度是最好的词典。
作者:
爱飞
时间:
2015-4-15 06:56
找到的的资料很多都是在论坛里的,需要注册,所以我一般没到一个论坛都注册一个id,所有的id都注册成一样的,这样下次再进来的时候就不用重复注册啦。当然有些论坛的某些资料是需要的付费的。
作者:
小妖女
时间:
2015-4-16 16:09
有位前辈曾经跟我说过,phper 至少要掌握200个函数 编起程序来才能顺畅点,那些不熟悉的函数记不住也要一拿手册就能找到。所以建议新手们没事就看看php的手册(至少array函数和string函数是要记牢的)。
作者:
山那边是海
时间:
2015-4-18 06:05
基础有没有对学习php没有太大区别,关键是兴趣。
欢迎光临 仓酷云 (http://ckuyun.com/)
Powered by Discuz! X3.2