| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700 |
- <?php
- namespace App\Http\Api;
- use Illuminate\Support\Str;
- use mustache\mustache;
- use App\Models\DhammaTerm;
- use App\Models\PaliText;
- use App\Models\Channel;
- use App\Http\Controllers\CorpusController;
- use Illuminate\Support\Facades\Cache;
- use App\Tools\RedisClusters;
- use Illuminate\Support\Facades\Log;
- use App\Tools\Markdown;
- define("STACK_DEEP", 8);
- class MdRender
- {
- /**
- * 文字渲染模式
- * read 阅读模式
- * edit 编辑模式
- */
- protected $options = [
- 'mode' => 'read',
- 'channelType' => 'translation',
- 'contentType' => "markdown",
- 'format' => 'react',
- 'debug' => [],
- 'studioId' => null,
- 'lang' => 'zh-Hans',
- 'footnote' => false,
- 'paragraph' => false,
- ];
- public function __construct($options = [])
- {
- foreach ($options as $key => $value) {
- $this->options[$key] = $value;
- }
- }
- /**
- * 将句子模版组成的段落复制一份,为了实现巴汉逐段对读
- */
- private function preprocessingForParagraph($input)
- {
- if (!$this->options['paragraph']) {
- return $input;
- }
- $paragraphs = explode("\n\n", $input);
- $output = [];
- foreach ($paragraphs as $key => $paragraph) {
- # 判断是否是纯粹的句子模版
- $pattern = "/\{\{sent\|id=([0-9].+?)\}\}/";
- $replacement = '';
- $space = preg_replace($pattern, $replacement, $paragraph);
- $space = str_replace('>', '', $space);
- if (empty(trim($space))) {
- $output[] = str_replace('}}', '|text=origin}}', $paragraph);
- $output[] = str_replace('}}', '|text=translation}}', $paragraph);
- } else {
- $output[] = $paragraph;
- }
- }
- return implode("\n\n", $output);
- }
- /**
- * 按照{{}}把字符串切分成三个部分。模版之前的,模版,和模版之后的
- */
- private function tplSplit($tpl)
- {
- $before = strpos($tpl, '{{');
- if ($before === FALSE) {
- //未找到
- return ['data' => [$tpl, '', ''], 'error' => 0];
- } else {
- $pointer = $before;
- $stack = array();
- $stack[] = $pointer;
- $after = substr($tpl, $pointer + 2);
- while (!empty($after) && count($stack) > 0 && count($stack) < STACK_DEEP) {
- $nextBegin = strpos($after, "{{");
- $nextEnd = strpos($after, "}}");
- if ($nextBegin !== FALSE) {
- if ($nextBegin < $nextEnd) {
- //有嵌套找到最后一个}}
- $pointer = $pointer + 2 + $nextBegin;
- $stack[] = $pointer;
- $after = substr($tpl, $pointer + 2);
- } else if ($nextEnd !== FALSE) {
- //无嵌套有结束
- $pointer = $pointer + 2 + $nextEnd;
- array_pop($stack);
- $after = substr($tpl, $pointer + 2);
- } else {
- //无结束符 没找到
- break;
- }
- } else if ($nextEnd !== FALSE) {
- $pointer = $pointer + 2 + $nextEnd;
- array_pop($stack);
- $after = substr($tpl, $pointer + 2);
- } else {
- //没找到
- break;
- }
- }
- if (count($stack) > 0) {
- if (count($stack) === STACK_DEEP) {
- return ['data' => [$tpl, '', ''], 'error' => 2];
- } else {
- //未关闭
- return ['data' => [$tpl, '', ''], 'error' => 1];
- }
- } else {
- return [
- 'data' =>
- [
- substr($tpl, 0, $before),
- substr($tpl, $before, $pointer - $before + 2),
- substr($tpl, $pointer + 2)
- ],
- 'error' => 0
- ];
- }
- }
- }
- private function wiki2xml(string $wiki, $channelId = []): string
- {
- /**
- * 渲染markdown里面的模版
- */
- $remain = $wiki;
- $buffer = array();
- do {
- $arrWiki = $this->tplSplit($remain);
- $buffer[] = $arrWiki['data'][0];
- $tpl = $arrWiki['data'][1];
- if (!empty($tpl)) {
- /**
- * 处理模版 提取参数
- */
- $tpl = str_replace("|\n", "|", $tpl);
- $pattern = "/\{\{(.+?)\|/";
- $replacement = '<MdTpl class="tpl" name="$1"><param>';
- $tpl = preg_replace($pattern, $replacement, $tpl);
- $tpl = str_replace("}}", "</param></MdTpl>", $tpl);
- $tpl = str_replace("|", "</param><param>", $tpl);
- /**
- * 替换变量名
- */
- $pattern = "/<param>([a-z]+?)=/";
- $replacement = '<param name="$1">';
- $tpl = preg_replace($pattern, $replacement, $tpl);
- //tpl to react
- $tpl = str_replace('<param', '<span class="param"', $tpl);
- $tpl = str_replace('</param>', '</span>', $tpl);
- $tpl = $this->xml2tpl($tpl, $channelId);
- $buffer[] = $tpl;
- }
- $remain = $arrWiki['data'][2];
- } while (!empty($remain));
- $html = implode('', $buffer);
- return $html;
- }
- private function xmlQueryId(string $xml, string $id): string
- {
- try {
- $dom = simplexml_load_string($xml);
- } catch (\Exception $e) {
- Log::error($e);
- return "<div></div>";
- }
- $tpl_list = $dom->xpath('//MdTpl');
- foreach ($tpl_list as $key => $tpl) {
- foreach ($tpl->children() as $param) {
- # 处理每个参数
- if ($param->getName() === "param") {
- foreach ($param->attributes() as $pa => $pa_value) {
- $pValue = $pa_value->__toString();
- if ($pa === "name" && $pValue === "id") {
- if ($param->__toString() === $id) {
- return $tpl->asXML();
- }
- }
- }
- }
- }
- }
- return "<div></div>";
- }
- public static function take_sentence(string $xml): array
- {
- $output = [];
- try {
- $dom = simplexml_load_string($xml);
- } catch (\Exception $e) {
- Log::error($e);
- return $output;
- }
- $tpl_list = $dom->xpath('//MdTpl');
- foreach ($tpl_list as $key => $tpl) {
- foreach ($tpl->attributes() as $a => $a_value) {
- if ($a === "name") {
- if ($a_value->__toString() === "sent") {
- foreach ($tpl->children() as $param) {
- # 处理每个参数
- if ($param->getName() === "param") {
- $sent = $param->__toString();
- if (!empty($sent)) {
- $output[] = $sent;
- break;
- }
- }
- }
- }
- }
- }
- }
- return $output;
- }
- private function xml2tpl(string $xml, $channelId = []): string
- {
- /**
- * 解析xml
- * 获取模版参数
- * 生成react 组件参数
- */
- try {
- //$dom = simplexml_load_string($xml);
- $doc = new \DOMDocument();
- $xml = str_replace('MdTpl', 'dfn', $xml);
- $xml = mb_convert_encoding($xml, 'HTML-ENTITIES', "UTF-8");
- $ok = $doc->loadHTML($xml, LIBXML_NOERROR | LIBXML_HTML_NOIMPLIED | LIBXML_HTML_NODEFDTD);
- } catch (\Exception $e) {
- Log::error($e);
- Log::error($xml);
- return "<span>xml解析错误{$e}</span>";
- }
- if (!$ok) {
- return "<span>xml解析错误</span>";
- }
- /*
- if(!$dom){
- Log::error($xml);
- return "<span>xml解析错误</span>";
- }
- */
- $tpl_list = $doc->getElementsByTagName('dfn');
- foreach ($tpl_list as $key => $tpl) {
- /**
- * 遍历 MdTpl 处理参数
- */
- $props = [];
- $tpl_name = '';
- foreach ($tpl->attributes as $a => $a_value) {
- if ($a_value->nodeName === "name") {
- $tpl_name = $a_value->nodeValue;
- break;
- }
- }
- $param_id = 0;
- $child = $tpl->firstChild;
- while ($child) {
- # 处理每个参数
- if ($child->nodeName === "span") {
- $param_id++;
- $paramName = "";
- foreach ($child->attributes as $pa => $pa_value) {
- if ($pa_value->nodeName === "name") {
- $nodeText = $pa_value->nodeValue;
- $props["{$nodeText}"] = $child->nodeValue;
- $paramName = $pa_value;
- }
- }
- if (empty($paramName)) {
- foreach ($child->childNodes as $param_child) {
- # code...
- if ($param_child->nodeType === 3) {
- $props["{$param_id}"] = $param_child->nodeValue;
- }
- }
- }
- }
- $child = $child->nextSibling;
- }
- /**
- * 生成模版参数
- *
- */
- //TODO 判断$channelId里面的是否都是uuid
- $channelInfo = [];
- foreach ($channelId as $key => $id) {
- $channelInfo[] = Channel::where('uid', $id)->first();
- }
- $tplRender = new TemplateRender(
- $props,
- $channelInfo,
- $this->options['mode'],
- $this->options['format'],
- $this->options['studioId'],
- $this->options['debug'],
- $this->options['lang'],
- );
- $tplRender->options($this->options);
- $tplProps = $tplRender->render($tpl_name);
- if ($this->options['format'] === 'react' && $tplProps) {
- $props = $doc->createAttribute("props");
- $props->nodeValue = $tplProps['props'];
- $tpl->appendChild($props);
- $attTpl = $doc->createAttribute("tpl");
- $attTpl->nodeValue = $tplProps['tpl'];
- $tpl->appendChild($attTpl);
- $htmlElement = $doc->createElement($tplProps['tag']);
- $htmlElement->nodeValue = $tplProps['html'];
- $tpl->appendChild($htmlElement);
- }
- }
- $html = $doc->saveHTML();
- $html = str_replace(['<dfn', '</dfn>'], ['<MdTpl', '</MdTpl>'], $html);
- switch ($this->options['format']) {
- case 'react':
- return trim($html);
- break;
- case 'unity':
- if ($tplProps) {
- return "{{" . "{$tplProps['tpl']}|{$tplProps['props']}" . "}}";
- } else {
- return '';
- }
- break;
- case 'html':
- if (isset($tplProps)) {
- if (is_array($tplProps)) {
- return '';
- } else {
- return $tplProps;
- }
- } else {
- Log::error('tplProps undefine');
- return '';
- }
- break;
- case 'tex':
- if (isset($tplProps)) {
- if (is_array($tplProps)) {
- return '';
- } else {
- return $tplProps;
- }
- } else {
- Log::error('tplProps undefine');
- return '';
- }
- break;
- default:
- /**text simple markdown */
- if (isset($tplProps)) {
- if (is_array($tplProps)) {
- return '';
- } else {
- return $tplProps;
- }
- } else {
- Log::error('tplProps undefine');
- return '';
- }
- break;
- }
- }
- /**
- * 将markdown文件中的模版转换为标准的wiki模版
- */
- private function markdown2wiki(string $markdown): string
- {
- //$markdown = mb_convert_encoding($markdown,'UTF-8','UTF-8');
- $markdown = iconv('UTF-8', 'UTF-8//IGNORE', $markdown);
- /**
- * nissaya
- * aaa=bbb\n
- * {{nissaya|aaa|bbb}}
- */
- if ($this->options['channelType'] === 'nissaya') {
- if ($this->options['contentType'] === "json") {
- $json = json_decode($markdown);
- $nissayaWord = [];
- if (is_array($json)) {
- foreach ($json as $word) {
- if (count($word->sn) === 1) {
- //只输出第一层级
- $str = "{{nissaya|";
- if (isset($word->word->value)) {
- $str .= $word->word->value;
- }
- $str .= "|";
- if (isset($word->meaning->value)) {
- $str .= $word->meaning->value;
- }
- $str .= "}}";
- $nissayaWord[] = $str;
- }
- }
- } else {
- Log::error('json data is not array', ['data' => $markdown]);
- }
- $markdown = implode('', $nissayaWord);
- } else if ($this->options['contentType'] === "markdown") {
- $lines = explode("\n", $markdown);
- $newLines = array();
- foreach ($lines as $line) {
- if (strstr($line, '=') === FALSE) {
- $newLines[] = $line;
- } else {
- $nissaya = explode('=', $line);
- $meaning = array_slice($nissaya, 1);
- $meaning = implode('=', $meaning);
- $newLines[] = "{{nissaya|{$nissaya[0]}|{$meaning}}}";
- }
- }
- $markdown = implode("\n", $newLines);
- }
- }
- //$markdown = preg_replace("/\n\n/","<div></div>",$markdown);
- /**
- * 处理 mermaid
- */
- if (strpos($markdown, "```mermaid") !== false) {
- $lines = explode("\n", $markdown);
- $newLines = array();
- $mermaidBegin = false;
- $mermaidString = array();
- foreach ($lines as $line) {
- if ($line === "```mermaid") {
- $mermaidBegin = true;
- $mermaidString = [];
- continue;
- }
- if ($mermaidBegin) {
- if ($line === "```") {
- $newLines[] = "{{mermaid|" . base64_encode(\json_encode($mermaidString)) . "}}";
- $mermaidBegin = false;
- } else {
- $mermaidString[] = $line;
- }
- } else {
- $newLines[] = $line;
- }
- }
- $markdown = implode("\n", $newLines);
- }
- /**
- * 替换换行符
- * react 无法处理 <br> 替换为<div></div>代替换行符作用
- */
- //$markdown = str_replace('<br>','<div></div>',$markdown);
- /**
- * markdown -> html
- */
- /*
- $html = MdRender::fixHtml($html);
- */
- #替换术语
- $pattern = "/\[\[(.+?)\]\]/";
- $replacement = '{{term|$1}}';
- $markdown = preg_replace($pattern, $replacement, $markdown);
- #替换句子模版
- $pattern = "/\{\{([0-9].+?)\}\}/";
- $replacement = '{{sent|id=$1}}';
- $markdown = preg_replace($pattern, $replacement, $markdown);
- /**
- * 替换多行注释
- * ```
- * bla
- * bla
- * ```
- * {{note|
- * bla
- * bla
- * }}
- */
- if (strpos($markdown, "```\n") !== false) {
- $lines = explode("\n", $markdown);
- $newLines = array();
- $noteBegin = false;
- $noteString = array();
- foreach ($lines as $line) {
- if ($noteBegin) {
- if ($line === "```") {
- $newLines[] = "}}";
- $noteBegin = false;
- } else {
- $newLines[] = $line;
- }
- } else {
- if ($line === "```") {
- $noteBegin = true;
- $newLines[] = "{{note|";
- continue;
- } else {
- $newLines[] = $line;
- }
- }
- }
- if ($noteBegin) {
- $newLines[] = "}}";
- }
- $markdown = implode("\n", $newLines);
- }
- /**
- * 替换单行注释
- * `bla bla`
- * {{note|bla}}
- */
- $pattern = "/`(.+?)`/";
- $replacement = '{{note|$1}}';
- $markdown = preg_replace($pattern, $replacement, $markdown);
- return $markdown;
- }
- private function markdownToHtml($markdown)
- {
- $markdown = str_replace('MdTpl', 'mdtpl', $markdown);
- $markdown = str_replace(['<param', '</param>'], ['<span', '</span>'], $markdown);
- $html = Markdown::render($markdown);
- if ($this->options['format'] === 'react') {
- $html = $this->fixHtml($html);
- }
- $html = str_replace('<hr>', '<hr />', $html);
- //给H1-6 添加uuid
- for ($i = 1; $i < 7; $i++) {
- if (strpos($html, "<h{$i}>") === false) {
- continue;
- }
- $output = array();
- $input = $html;
- $hPos = strpos($input, "<h{$i}>");
- while ($hPos !== false) {
- $output[] = substr($input, 0, $hPos);
- $output[] = "<h{$i} id='" . Str::uuid() . "'>";
- $input = substr($input, $hPos + 4);
- $hPos = strpos($input, "<h{$i}>");
- }
- $output[] = $input;
- $html = implode('', $output);
- }
- $html = str_replace('mdtpl', 'MdTpl', $html);
- return $html;
- }
- private function fixHtml($html)
- {
- $doc = new \DOMDocument();
- libxml_use_internal_errors(true);
- $html = mb_convert_encoding($html, 'HTML-ENTITIES', "UTF-8");
- $doc->loadHTML('<span>' . $html . '</span>', LIBXML_NOERROR | LIBXML_HTML_NOIMPLIED | LIBXML_HTML_NODEFDTD);
- $fixed = $doc->saveHTML();
- $fixed = mb_convert_encoding($fixed, "UTF-8", 'HTML-ENTITIES');
- return $fixed;
- }
- public static function init()
- {
- $GLOBALS["MdRenderStack"] = 0;
- }
- public function convert($markdown, $channelId = [], $queryId = null)
- {
- if (isset($GLOBALS["MdRenderStack"]) && is_numeric($GLOBALS["MdRenderStack"])) {
- $GLOBALS["MdRenderStack"]++;
- } else {
- $GLOBALS["MdRenderStack"] = 1;
- }
- if ($GLOBALS["MdRenderStack"] < 3) {
- $output = $this->_convert($markdown, $channelId, $queryId);
- } else {
- $output = $markdown;
- }
- $GLOBALS["MdRenderStack"]--;
- return $output;
- }
- private function _convert($markdown, $channelId = [], $queryId = null)
- {
- if (empty($markdown)) {
- switch ($this->options['format']) {
- case 'react':
- return "<span></span>";
- break;
- default:
- return "";
- break;
- }
- }
- $wiki = $this->markdown2wiki($markdown);
- $wiki = $this->preprocessingForParagraph($wiki);
- $markdownWithTpl = $this->wiki2xml($wiki, $channelId);
- if (!is_null($queryId)) {
- $html = $this->xmlQueryId($markdownWithTpl, $queryId);
- }
- $html = $this->markdownToHtml($markdownWithTpl);
- //后期处理
- $output = '';
- switch ($this->options['format']) {
- case 'react':
- //生成可展开组件
- $html = str_replace("<div/>", "<div></div>", $html);
- $pattern = '/<li><div>(.+?)<\/div><\/li>/';
- $replacement = '<li><MdTpl name="toggle" tpl="toggle" props=""><div>$1</div></MdTpl></li>';
- $output = preg_replace($pattern, $replacement, $html);
- break;
- case 'text':
- case 'simple':
- case 'prompt':
- $html = strip_tags($html);
- $output = htmlspecialchars_decode($html, ENT_QUOTES);
- //$output = html_entity_decode($html);
- break;
- case 'tex':
- $html = strip_tags($html);
- $output = htmlspecialchars_decode($html, ENT_QUOTES);
- //$output = html_entity_decode($html);
- break;
- case 'unity':
- $html = str_replace(['<strong>', '</strong>', '<em>', '</em>'], ['[%b%]', '[%/b%]', '[%i%]', '[%/i%]'], $html);
- $html = strip_tags($html);
- $html = str_replace(['[%b%]', '[%/b%]', '[%i%]', '[%/i%]'], ['<b>', '</b>', '<i>', '</i>'], $html);
- $output = htmlspecialchars_decode($html, ENT_QUOTES);
- break;
- case 'html':
- $output = htmlspecialchars_decode($html, ENT_QUOTES);
- //处理脚注
- if ($this->options['footnote'] && isset($GLOBALS['note']) && count($GLOBALS['note']) > 0) {
- $output .= '<div><h1>endnote</h1>';
- foreach ($GLOBALS['note'] as $footnote) {
- $output .= '<p><a name="footnote-' . $footnote['sn'] . '">[' . $footnote['sn'] . ']</a> ' . $footnote['content'] . '</p>';
- }
- $output .= '</div>';
- unset($GLOBALS['note']);
- }
- //处理图片链接
- $output = str_replace('<img src="', '<img src="' . config('app.url'), $output);
- break;
- case 'markdown':
- //处理脚注
- $footnotes = array();
- if ($this->options['footnote'] && isset($GLOBALS['note']) && count($GLOBALS['note']) > 0) {
- foreach ($GLOBALS['note'] as $footnote) {
- $footnotes[] = '[^' . $footnote['sn'] . ']: ' . $footnote['content'];
- }
- unset($GLOBALS['note']);
- }
- //处理图片链接
- $output = str_replace('/attachments/', config('app.url') . "/attachments/", $markdownWithTpl);
- $output = $output . "\n\n" . implode("\n\n", $footnotes);
- break;
- }
- return $output;
- }
- /**
- * string[] $channelId
- */
- public static function render($markdown, $channelId, $queryId = null, $mode = 'read', $channelType = 'translation', $contentType = "markdown", $format = 'react')
- {
- $mdRender = new MdRender(
- [
- 'mode' => $mode,
- 'channelType' => $channelType,
- 'contentType' => $contentType,
- 'format' => $format
- ]
- );
- $output = $mdRender->convert($markdown, $channelId, $queryId);
- return $output;
- }
- }
|