AiTranslateService.php 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632
  1. <?php
  2. namespace App\Services;
  3. use Illuminate\Support\Facades\Log;
  4. use Illuminate\Support\Facades\Http;
  5. use Illuminate\Http\Client\RequestException;
  6. use App\Tools\RedisClusters;
  7. use App\Models\Task;
  8. use App\Models\PaliText;
  9. use App\Models\PaliSentence;
  10. use App\Models\AiModel;
  11. use App\Models\Sentence;
  12. use App\Http\Api\ChannelApi;
  13. use App\Http\Controllers\AuthController;
  14. use App\Http\Api\MdRender;
  15. use App\Jobs\ProcessAITranslateJob;
  16. class DatabaseException extends \Exception {}
  17. class AiTranslateService
  18. {
  19. private $queue = 'ai_translate';
  20. private $modelToken = null;
  21. private $task = null;
  22. protected $mq;
  23. private $apiTimeout = 100;
  24. private $llmTimeout = 300;
  25. private $taskTopicId;
  26. public function __construct(RabbitMQService $mq)
  27. {
  28. $this->mq = $mq;
  29. }
  30. /**
  31. * @param string $messageId
  32. * @param array $translateData
  33. */
  34. public function processTranslate(string $messageId, array $messages, ProcessAITranslateJob $job): bool
  35. {
  36. if (!is_array($messages) || count($messages) === 0) {
  37. Log::error('message is not array');
  38. return false;
  39. }
  40. $first = $messages[0];
  41. $this->task = $first->task->info;
  42. $taskId = $this->task->id;
  43. RedisClusters::put("/task/{$taskId}/message_id", $messageId);
  44. $pointerKey = "/task/{$taskId}/pointer";
  45. $pointer = 0;
  46. if (RedisClusters::has($pointerKey)) {
  47. //回到上次中断的点
  48. $pointer = RedisClusters::get($pointerKey);
  49. Log::info("last break point {$pointer}");
  50. }
  51. //获取model token
  52. $this->modelToken = $first->model->token;
  53. Log::debug($this->queue . ' ai assistant token', ['token' => $this->modelToken]);
  54. $this->setTaskStatus($this->task->id, 'running');
  55. // 设置task discussion topic
  56. $this->taskTopicId = $this->taskDiscussion(
  57. $this->task->id,
  58. 'task',
  59. $this->task->title,
  60. $this->task->category,
  61. null
  62. );
  63. for ($i = $pointer; $i < count($messages); $i++) {
  64. // 获取当前内存使用量
  65. Log::debug("memory usage: " . memory_get_usage(true) / 1024 / 1024 . " MB");
  66. // 获取峰值内存使用量
  67. Log::debug("memory peak usage: " . memory_get_peak_usage(true) / 1024 / 1024 . " MB");
  68. if ($job->isStop()) {
  69. Log::info("收到退出信号 pointer={$i}");
  70. return false;
  71. }
  72. if (\App\Tools\Tools::isStop()) {
  73. //检测到停止标记
  74. return false;
  75. }
  76. //$this->mq->publishMessage('heartbeat_queue', ['delivery_mode' => 2]);
  77. RedisClusters::put($pointerKey, $i);
  78. $message = $messages[$i];
  79. $taskDiscussionContent = [];
  80. //推理
  81. try {
  82. $responseLLM = $this->requestLLM($message);
  83. $taskDiscussionContent[] = '- LLM request successful';
  84. } catch (RequestException $e) {
  85. throw $e;
  86. }
  87. if ($this->task->category === 'translate') {
  88. //写入句子库
  89. $message->sentence->content = $responseLLM['content'];
  90. try {
  91. $this->saveSentence($message->sentence);
  92. } catch (\Exception $e) {
  93. Log::error('sentence', ['message' => $e]);
  94. continue;
  95. }
  96. }
  97. if ($this->task->category === 'suggest') {
  98. //写入pr
  99. try {
  100. $this->savePr($message->sentence, $responseLLM['content']);
  101. } catch (\Exception $e) {
  102. Log::error('sentence', ['message' => $e]);
  103. continue;
  104. }
  105. }
  106. #获取句子id
  107. $sUid = $this->getSentenceId($message->sentence);
  108. //写入句子 discussion
  109. $topicId = $this->taskDiscussion(
  110. $sUid,
  111. 'sentence',
  112. $this->task->title,
  113. $this->task->category,
  114. null
  115. );
  116. if ($topicId) {
  117. Log::info($this->queue . ' discussion create topic successful');
  118. $data['parent'] = $topicId;
  119. unset($data['title']);
  120. $topicChildren = [];
  121. //提示词
  122. $topicChildren[] = $message->prompt;
  123. //任务结果
  124. $topicChildren[] = $responseLLM['content'];
  125. //推理过程写入discussion
  126. if (
  127. isset($responseLLM['reasoningContent']) &&
  128. !empty($responseLLM['reasoningContent'])
  129. ) {
  130. $topicChildren[] = $responseLLM['reasoningContent'];
  131. }
  132. foreach ($topicChildren as $content) {
  133. Log::debug($this->queue . ' discussion child request', ['data' => $data]);
  134. $dId = $this->taskDiscussion($sUid, 'sentence', $this->task->title, $content, $topicId);
  135. if ($dId) {
  136. Log::info($this->queue . ' discussion child successful');
  137. }
  138. }
  139. } else {
  140. Log::error($this->queue . ' discussion create topic response is null');
  141. }
  142. //修改task 完成度
  143. $progress = $this->setTaskProgress($message->task->progress);
  144. $taskDiscussionContent[] = "- progress=" . $progress;
  145. //写入task discussion
  146. if ($this->taskTopicId) {
  147. $content = implode('\n', $taskDiscussionContent);
  148. $dId = $this->taskDiscussion(
  149. $this->task->id,
  150. 'task',
  151. $this->task->title,
  152. $content,
  153. $this->taskTopicId
  154. );
  155. } else {
  156. Log::error('no task discussion root');
  157. }
  158. }
  159. //任务完成 修改任务状态为 done
  160. if ($i === count($messages)) {
  161. $this->setTaskStatus($this->task->id, 'done');
  162. }
  163. RedisClusters::forget($pointerKey);
  164. Log::info('ai translate task complete');
  165. return true;
  166. }
  167. private function setTaskStatus($taskId, $status)
  168. {
  169. $url = config('app.url') . '/api/v2/task-status/' . $taskId;
  170. $data = [
  171. 'status' => $status,
  172. ];
  173. Log::debug('ai_translate task status request', ['url' => $url, 'data' => $data]);
  174. $response = Http::timeout($this->apiTimeout)->withToken($this->modelToken)->patch($url, $data);
  175. //判断状态码
  176. if ($response->failed()) {
  177. Log::error('ai_translate task status error', ['data' => $response->json()]);
  178. } else {
  179. Log::info('ai_translate task status done');
  180. }
  181. }
  182. private function saveModelLog($token, $data)
  183. {
  184. $url = config('app.url') . '/api/v2/model-log';
  185. $response = Http::timeout($this->apiTimeout)->withToken($token)->post($url, $data);
  186. if ($response->failed()) {
  187. Log::error('ai-translate model log create failed', ['data' => $response->json()]);
  188. return false;
  189. }
  190. return true;
  191. }
  192. private function taskDiscussion($resId, $resType, $title, $content, $parentId = null)
  193. {
  194. $url = config('app.url') . '/api/v2/discussion';
  195. $taskDiscussionData = [
  196. 'res_id' => $resId,
  197. 'res_type' => $resType,
  198. 'content' => $content,
  199. 'content_type' => 'markdown',
  200. 'type' => 'discussion',
  201. 'notification' => false,
  202. ];
  203. if ($parentId) {
  204. $taskDiscussionData['parent'] = $parentId;
  205. } else {
  206. $taskDiscussionData['title'] = $title;
  207. }
  208. Log::debug($this->queue . ' discussion create', ['url' => $url, 'data' => json_encode($taskDiscussionData)]);
  209. $response = Http::timeout($this->apiTimeout)
  210. ->withToken($this->modelToken)
  211. ->post($url, $taskDiscussionData);
  212. if ($response->failed()) {
  213. Log::error($this->queue . ' discussion create error', ['data' => $response->json()]);
  214. return false;
  215. }
  216. Log::debug($this->queue . ' discussion create', ['data' => json_encode($response->json())]);
  217. if (isset($response->json()['data']['id'])) {
  218. return $response->json()['data']['id'];
  219. }
  220. return false;
  221. }
  222. private function requestLLM($message)
  223. {
  224. $param = [
  225. "model" => $message->model->model,
  226. "messages" => [
  227. ["role" => "system", "content" => $message->model->system_prompt ?? ''],
  228. ["role" => "user", "content" => $message->prompt],
  229. ],
  230. "temperature" => 0.7,
  231. "stream" => false
  232. ];
  233. Log::info($this->queue . ' LLM request' . $message->model->url . ' model:' . $param['model']);
  234. Log::debug($this->queue . ' LLM api request', [
  235. 'url' => $message->model->url,
  236. 'data' => json_encode($param),
  237. ]);
  238. //写入 model log
  239. $modelLogData = [
  240. 'model_id' => $message->model->uid,
  241. 'request_at' => now(),
  242. 'request_data' => json_encode($param, JSON_UNESCAPED_UNICODE),
  243. ];
  244. //失败重试
  245. $maxRetries = 3;
  246. $attempt = 0;
  247. try {
  248. while ($attempt < $maxRetries) {
  249. try {
  250. $response = Http::withToken($message->model->key)
  251. ->timeout($this->llmTimeout)
  252. ->post($message->model->url, $param);
  253. // 如果状态码是 4xx 或 5xx,会自动抛出 RequestException
  254. $response->throw();
  255. Log::info($this->queue . ' LLM request successful');
  256. $modelLogData['request_headers'] = json_encode($response->handlerStats(), JSON_UNESCAPED_UNICODE);
  257. $modelLogData['response_headers'] = json_encode($response->headers(), JSON_UNESCAPED_UNICODE);
  258. $modelLogData['status'] = $response->status();
  259. $modelLogData['response_data'] = json_encode($response->json(), JSON_UNESCAPED_UNICODE);
  260. self::saveModelLog($this->modelToken, $modelLogData);
  261. break; // 跳出 while 循环
  262. } catch (RequestException $e) {
  263. $attempt++;
  264. $status = $e->response->status();
  265. // 某些错误不需要重试
  266. if (in_array($status, [400, 401, 403, 404, 422])) {
  267. Log::warning("客户端错误,不重试: {$status}\n");
  268. throw $e; // 重新抛出异常
  269. }
  270. // 服务器错误或网络错误可以重试
  271. if ($attempt < $maxRetries) {
  272. $delay = pow(2, $attempt); // 指数退避
  273. Log::warning("请求失败(第 {$attempt} 次),{$delay} 秒后重试...\n");
  274. sleep($delay);
  275. } else {
  276. Log::error("达到最大重试次数,请求最终失败\n");
  277. throw $e;
  278. }
  279. }
  280. }
  281. } catch (RequestException $e) {
  282. Log::error($this->queue . ' LLM request exception: ' . $e->getMessage());
  283. $failResponse = $e->response;
  284. $modelLogData['request_headers'] = json_encode($failResponse->handlerStats(), JSON_UNESCAPED_UNICODE);
  285. $modelLogData['response_headers'] = json_encode($failResponse->headers(), JSON_UNESCAPED_UNICODE);
  286. $modelLogData['status'] = $failResponse->status();
  287. $modelLogData['response_data'] = $response->body();
  288. $modelLogData['success'] = false;
  289. self::saveModelLog($this->modelToken, $modelLogData);
  290. throw $e;
  291. }
  292. Log::info($this->queue . ' model log saved');
  293. $aiData = $response->json();
  294. Log::debug($this->queue . ' LLM http response', ['data' => $response->json()]);
  295. $responseContent = $aiData['choices'][0]['message']['content'];
  296. if (isset($aiData['choices'][0]['message']['reasoning_content'])) {
  297. $reasoningContent = $aiData['choices'][0]['message']['reasoning_content'];
  298. }
  299. $output = ['content' => $responseContent];
  300. Log::debug($this->queue . ' LLM response content=' . $responseContent);
  301. if (empty($reasoningContent)) {
  302. Log::debug($this->queue . ' no reasoningContent');
  303. } else {
  304. Log::debug($this->queue . ' reasoning=' . $reasoningContent);
  305. $output['reasoningContent'] = $reasoningContent;
  306. }
  307. return $output;
  308. }
  309. /**
  310. * 写入句子库
  311. */
  312. private function saveSentence($sentence)
  313. {
  314. $url = config('app.url') . '/api/v2/sentence';
  315. Log::info($this->queue . " sentence update {$url}");
  316. $response = Http::timeout($this->apiTimeout)->withToken($this->modelToken)->post($url, [
  317. 'sentences' => [$sentence],
  318. ]);
  319. if ($response->failed()) {
  320. Log::error($this->queue . ' sentence update failed', [
  321. 'url' => $url,
  322. 'data' => $response->json(),
  323. ]);
  324. throw new DatabaseException("sentence 数据库写入错误");
  325. }
  326. $count = $response->json()['data']['count'];
  327. Log::info("{$this->queue} sentence update {$count} successful");
  328. }
  329. private function savePr($sentence, $content)
  330. {
  331. $url = config('app.url') . '/api/v2/sentpr';
  332. Log::info($this->queue . " sentence update {$url}");
  333. $response = Http::timeout($this->apiTimeout)->withToken($this->modelToken)->post($url, [
  334. 'book' => $sentence->book_id,
  335. 'para' => $sentence->paragraph,
  336. 'begin' => $sentence->word_start,
  337. 'end' => $sentence->word_end,
  338. 'channel' => $sentence->channel_uid,
  339. 'text' => $content,
  340. 'notification' => false,
  341. 'webhook' => false,
  342. ]);
  343. if ($response->failed()) {
  344. Log::error($this->queue . ' sentence update failed', [
  345. 'url' => $url,
  346. 'data' => $response->json(),
  347. ]);
  348. throw new DatabaseException("pr 数据库写入错误");
  349. }
  350. if ($response->json()['ok']) {
  351. Log::info("{$this->queue} sentence suggest update successful");
  352. } else {
  353. Log::error("{$this->queue} sentence suggest update failed", [
  354. 'url' => $url,
  355. 'data' => $response->json(),
  356. ]);
  357. }
  358. }
  359. private function getSentenceId($sentence)
  360. {
  361. $url = config('app.url') . '/api/v2/sentence-info/aa';
  362. Log::info('ai translate', ['url' => $url]);
  363. $response = Http::timeout($this->apiTimeout)->withToken($this->modelToken)->get($url, [
  364. 'book' => $sentence->book_id,
  365. 'par' => $sentence->paragraph,
  366. 'start' => $sentence->word_start,
  367. 'end' => $sentence->word_end,
  368. 'channel' => $sentence->channel_uid
  369. ]);
  370. if (!$response->json()['ok']) {
  371. Log::error($this->queue . ' sentence id error', ['data' => $response->json()]);
  372. return false;
  373. }
  374. $sUid = $response->json()['data']['id'];
  375. Log::debug("sentence id={$sUid}");
  376. return $sUid;
  377. }
  378. private function setTaskProgress($current)
  379. {
  380. $taskProgress = $current;
  381. if ($taskProgress->total > 0) {
  382. $progress = (int)($taskProgress->current * 100 / $taskProgress->total);
  383. } else {
  384. $progress = 100;
  385. Log::error($this->queue . ' progress total is zero', ['task_id' => $this->task->id]);
  386. }
  387. $url = config('app.url') . '/api/v2/task/' . $this->task->id;
  388. $data = [
  389. 'progress' => $progress,
  390. ];
  391. Log::debug($this->queue . ' task progress request', ['url' => $url, 'data' => $data]);
  392. $response = Http::timeout($this->apiTimeout)->withToken($this->modelToken)->patch($url, $data);
  393. if ($response->failed()) {
  394. Log::error($this->queue . ' task progress error', ['data' => $response->json()]);
  395. } else {
  396. Log::info($this->queue . ' task progress successful progress=' . $response->json()['data']['progress']);
  397. }
  398. return $progress;
  399. }
  400. public function handleFailedTranslate(string $messageId, array $translateData, \Exception $exception): void
  401. {
  402. try {
  403. // 彻底失败时的业务逻辑
  404. // 设置task为失败状态
  405. $this->setTaskStatus($this->task->id, 'stop');
  406. //将故障信息写入task discussion
  407. if ($this->taskTopicId) {
  408. $dId = $this->taskDiscussion(
  409. $this->task->id,
  410. 'task',
  411. $this->task->title,
  412. "**处理失败ai任务时出错** 请重启任务 message id={$messageId} 错误信息:" . $exception->getMessage(),
  413. $this->taskTopicId
  414. );
  415. }
  416. } catch (\Exception $e) {
  417. Log::error('处理失败ai任务时出错', ['error' => $e->getMessage()]);
  418. }
  419. }
  420. /**
  421. * 读取task信息,将任务拆解为单句小任务
  422. *
  423. * @param string $taskId 任务uuid
  424. * @return array 拆解后的提示词数组
  425. */
  426. public function makeByTask(string $taskId, $aiAssistantId, bool $send = true)
  427. {
  428. $task = Task::findOrFail($taskId);
  429. $description = $task->description;
  430. $rows = explode("\n", $description);
  431. $params = [];
  432. foreach ($rows as $key => $row) {
  433. if (strpos($row, '=') !== false) {
  434. $param = explode('=', trim($row, '|'));
  435. $params[$param[0]] = $param[1];
  436. }
  437. }
  438. if (!isset($params['type'])) {
  439. Log::error('no $params.type');
  440. return false;
  441. }
  442. //get sentences in article
  443. $sentences = array();
  444. $totalLen = 0;
  445. switch ($params['type']) {
  446. case 'sentence':
  447. if (!isset($params['id'])) {
  448. Log::error('no $params.id');
  449. return false;
  450. }
  451. $sentences[] = explode('-', $params['id']);
  452. break;
  453. case 'para':
  454. if (!isset($params['book']) || !isset($params['paragraphs'])) {
  455. Log::error('no $params.book or paragraphs');
  456. return false;
  457. }
  458. $sent = PaliSentence::where('book', $params['book'])
  459. ->where('paragraph', $params['paragraphs'])->orderBy('word_begin')->get();
  460. foreach ($sent as $key => $value) {
  461. $sentences[] = [
  462. 'id' => [
  463. $value->book,
  464. $value->paragraph,
  465. $value->word_begin,
  466. $value->word_end,
  467. ],
  468. 'strlen' => $value->length
  469. ];
  470. $totalLen += $value->length;
  471. }
  472. break;
  473. case 'chapter':
  474. if (!isset($params['book']) || !isset($params['paragraphs'])) {
  475. Log::error('no $params.book or paragraphs');
  476. return false;
  477. }
  478. $chapterLen = PaliText::where('book', $params['book'])
  479. ->where('paragraph', $params['paragraphs'])->value('chapter_len');
  480. $sent = PaliSentence::where('book', $params['book'])
  481. ->whereBetween('paragraph', [$params['paragraphs'], $params['paragraphs'] + $chapterLen - 1])
  482. ->orderBy('paragraph')
  483. ->orderBy('word_begin')->get();
  484. foreach ($sent as $key => $value) {
  485. $sentences[] = [
  486. 'id' => [
  487. $value->book,
  488. $value->paragraph,
  489. $value->word_begin,
  490. $value->word_end,
  491. ],
  492. 'strlen' => $value->length
  493. ];
  494. $totalLen += $value->length;
  495. }
  496. break;
  497. default:
  498. return false;
  499. break;
  500. }
  501. //render prompt
  502. $mdRender = new MdRender([
  503. 'format' => 'prompt',
  504. 'footnote' => false,
  505. 'paragraph' => false,
  506. ]);
  507. $m = new \Mustache_Engine(array(
  508. 'entity_flags' => ENT_QUOTES,
  509. 'escape' => function ($value) {
  510. return $value;
  511. }
  512. ));
  513. # ai model
  514. $aiModel = AiModel::findOrFail($aiAssistantId);
  515. $modelToken = AuthController::getUserToken($aiModel->uid);
  516. $aiModel['token'] = $modelToken;
  517. $sumLen = 0;
  518. $mqData = [];
  519. foreach ($sentences as $key => $sentence) {
  520. $sumLen += $sentence['strlen'];
  521. $sid = implode('-', $sentence['id']);
  522. Log::debug($sid);
  523. $sentChannelInfo = explode('@', $params['channel']);
  524. $channelId = $sentChannelInfo[0];
  525. $data = [];
  526. $data['origin'] = '{{' . $sid . '}}';
  527. $data['translation'] = '{{sent|id=' . $sid;
  528. $data['translation'] .= '|channel=' . $channelId;
  529. $data['translation'] .= '|text=translation}}';
  530. if (isset($params['nissaya']) && !empty($params['nissaya'])) {
  531. $nissayaChannel = explode('@', $params['nissaya']);
  532. $channelInfo = ChannelApi::getById($nissayaChannel[0]);
  533. if ($channelInfo) {
  534. //查看句子是否存在
  535. $nissayaSent = Sentence::where('book_id', $sentence['id'][0])
  536. ->where('paragraph', $sentence['id'][1])
  537. ->where('word_start', $sentence['id'][2])
  538. ->where('word_end', $sentence['id'][3])
  539. ->where('channel_uid', $nissayaChannel[0])->first();
  540. if ($nissayaSent && !empty($nissayaSent->content)) {
  541. $nissayaData = [];
  542. $nissayaData['channel'] = $channelInfo;
  543. $nissayaData['data'] = '{{sent|id=' . $sid;
  544. $nissayaData['data'] .= '|channel=' . $nissayaChannel[0];
  545. $nissayaData['data'] .= '|text=translation}}';
  546. $data['nissaya'] = $nissayaData;
  547. }
  548. }
  549. }
  550. $content = $m->render($description, $data);
  551. $prompt = $mdRender->convert($content, []);
  552. //gen mq
  553. $aiMqData = [
  554. 'model' => $aiModel,
  555. 'task' => [
  556. 'info' => $task,
  557. 'progress' => [
  558. 'current' => $sumLen,
  559. 'total' => $totalLen
  560. ],
  561. ],
  562. 'prompt' => $prompt,
  563. 'sentence' => [
  564. 'book_id' => $sentence['id'][0],
  565. 'paragraph' => $sentence['id'][1],
  566. 'word_start' => $sentence['id'][2],
  567. 'word_end' => $sentence['id'][3],
  568. 'channel_uid' => $channelId,
  569. 'content' => $prompt,
  570. 'content_type' => 'markdown',
  571. 'access_token' => $sentChannelInfo[1] ?? $params['token'],
  572. ],
  573. ];
  574. array_push($mqData, $aiMqData);
  575. }
  576. if ($send) {
  577. $this->mq->publishMessage('ai_translate', $mqData);
  578. }
  579. return $mqData;
  580. }
  581. }