gx

lyh
app/Http/Controllers/Bside/Setting/ProofreadingController.php
--- a/app/Http/Controllers/Bside/Setting/ProofreadingController.php
查看文件 @9e50d73
+++ b/app/Http/Controllers/Bside/Setting/ProofreadingController.php
查看文件 @9e50d73
@@ -29,6 +29,8 @@ class ProofreadingController extends BaseController
         $list = $proofreadingModel->list(['url'=>$this->param['url'],'language_id'=>$this->param['language_id'],'type'=>1],'text',['text','translate']);
         // Fetch all text content found at the current URL
         $new_list = $this->getUrlRead($this->param['url']);
+         var_dump($new_list);
+         die();
         if(empty($list)){
             $data = [];
             $translate_list = Translate::tran($new_list, $countryInfo['alias']);
@@ -50,10 +52,6 @@ class ProofreadingController extends BaseController
             ];
         }
         $arr2 = array_diff($new_list, $old_list);
-         var_dump($new_list);
-         var_dump($old_list);
-         var_dump($arr2);
-         die();
         if(!empty($arr2)){
             $translate_list = Translate::tran($arr2, $countryInfo['alias']);
             foreach ($arr2 as $k1=>$v1){
@@ -160,17 +158,21 @@ class ProofreadingController extends BaseController
         $strippedContent = preg_replace($pattern, '', $strippedContent); // 删除 `<link>` 标签
         $pattern = '/<footer\b[^>]*>(.*?)<\/footer>/s'; // Regex matching a <footer> element together with its content
         $strippedContent = preg_replace($pattern, '', $strippedContent); // Remove <footer> elements and their content
-         $pattern = '/>([^<]+)</'; // 定义匹配中间内容不是标签的正则表达式
-         $matches = array();
-         preg_match_all($pattern, $strippedContent, $matches);
-         $textContentArray = array_filter($matches[1], function($item) {
-             $item = str_replace("\n", "", $item);
-             return !empty(trim($item));
-         });
-         $textContentArray = array_values($textContentArray);
-         $uniqueArray = array_unique($textContentArray);
-         $textContentArray = array_values($uniqueArray);
-         return $textContentArray;
+ //        $pattern = '/>([^<]+)</'; // 定义匹配中间内容不是标签的正则表达式
+ //        $matches = array();
+ //        preg_match_all($pattern, $strippedContent, $matches);
+ //        $textContentArray = array_filter($matches[1], function($item) {
+ //            $item = str_replace("\n", "", $item);
+ //            return !empty(trim($item));
+ //        });
+         $pattern = '/<(\w+)[^>]*>(.*?)<\/\1>/s'; // Define the regular expression pattern
+         preg_match_all($pattern, $strippedContent, $matches); // Match all tags and their content
+ 
+         $tagContentArray = $matches[2]; // Extract the content part from the matches array
+ //        $textContentArray = array_values($textContentArray);
+ //        $uniqueArray = array_unique($textContentArray);
+ //        $textContentArray = array_values($uniqueArray);
+         return $tagContentArray;
     }
 
     /**