ViolationStoreDataJobs.php 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300
  1. <?php
  2. namespace App\Jobs\Manager\Process;
  3. use Illuminate\Bus\Queueable;
  4. use Illuminate\Contracts\Queue\ShouldBeUnique;
  5. use Illuminate\Contracts\Queue\ShouldQueue;
  6. use Illuminate\Foundation\Bus\Dispatchable;
  7. use Illuminate\Queue\InteractsWithQueue;
  8. use Illuminate\Queue\SerializesModels;
  9. use App\Facades\Servers\Logs\Log;
  10. use App\Models\Manager\Process\ViolationStore as ViolationStoreModel;
  11. use App\Models\Manager\Personnel\Employee as EmployeeModel;
  12. use App\Models\Api\Process\ExecuteLog as ExecuteLogModel;
  13. use App\Models\Manager\Process\ScrapeData as ScrapeDataModel;
  14. use App\Models\Manager\WashConfig\ViolationCompanyMember as ViolationCompanyMemberModel;
  15. use App\Models\Manager\Citys as CitysModel;
  16. use App\Models\Manager\Personnel\EmployeePlatform as EmployeePlatformModel;
  17. use App\Models\Manager\Personnel\EmployeeArea as EmployeeAreaModel;
  18. use Illuminate\Support\Facades\DB;
  19. use Illuminate\Support\Carbon;
  /**
   * Data cleansing: queued job that cleans scraped rows of a violating store.
   *
   * One run handles a single page of recently scraped rows for one store name:
   * it normalises region and link information, hands every row to
   * ViolationStoreModel::addViolationStore(), and then dispatches itself for the
   * next page. The chain stops when a page comes back empty.
   *
   * @author 唐远望
   * @version 1.0
   * @date 2025-12-11
   */
  class ViolationStoreDataJobs implements ShouldQueue
  {
      use Dispatchable, InteractsWithQueue, Queueable, SerializesModels;

      /** @var int Maximum number of attempts for this job. */
      public $tries = 3;

      /** @var int Timeout in seconds (600 s = 10 minutes). */
      public $timeout = 600;

      /** @var array Task parameters; the keys that are read are listed on getViolationStoreData(). */
      protected $message_data;

      /**
       * Region rows (id, name) keyed by level, loaded lazily and kept for the
       * duration of one job run so the lists are not re-queried for every row.
       *
       * @var array
       */
      private $region_rows = [];

      /**
       * Create a new job instance.
       *
       * @param array $message_data Task parameters (see getViolationStoreData()).
       * @return void
       */
      public function __construct(array $message_data)
      {
          $this->message_data = $message_data;
      }

      /**
       * Execute the job.
       *
       * Exceptions are logged and swallowed, so a broken page does not fail the job.
       * NOTE(review): because of that, the queue never sees these exceptions, which
       * means $tries and failed() only come into play for throwables that are not
       * \Exception (or for timeouts), and a failed page also ends the page chain
       * without touching the execute log. Confirm this best-effort behaviour is intended.
       *
       * @return void
       */
      public function handle()
      {
          try {
              $this->getViolationStoreData($this->message_data);
          } catch (\Exception $e) {
              Log::info('job_error', '数据清洗-违规店铺清洗数据队列失败', ['data' => $this->message_data, 'error' => $e->getMessage()]);
          }
      }

      /**
       * Clean one page of scraped rows and queue the next page.
       *
       * Keys read from $message_data:
       *  - platform                   comma separated platform ids; '0' or empty means "no platform filter"
       *  - executeLog_id              id of the execute-log row updated when the last store page is done
       *  - store_name                 store name the scraped rows are filtered by
       *  - specify_responsible_person 0 = assign responsible persons, 1 = do not
       *  - limit                      page size (default 50)
       *  - page                       page number (default 1)
       *  - company_id                 brand company id (default 0)
       *  - item_totle_page            total number of store pages of the cleansing run
       *  - item_now_page              current store page of the cleansing run
       *  - employee_ids               comma separated (or array of) candidate employee ids
       *  - window_start_time          optional unix timestamp; lower bound of insert_time.
       *                               Set automatically for follow-up pages.
       *
       * @param array $message_data
       * @return true|null true when the requested page is empty, null after a page was processed
       */
      public function getViolationStoreData($message_data)
      {
          $CitysModel = new CitysModel();
          $EmployeeModel = new EmployeeModel();
          $ViolationStoreModel = new ViolationStoreModel();

          $platform = $message_data['platform'];
          $executeLog_id = $message_data['executeLog_id'];
          $store_name = $message_data['store_name'];
          $specify_responsible_person = $message_data['specify_responsible_person'];
          $limit = $message_data['limit'] ?? 50;
          $page = $message_data['page'] ?? 1;
          $company_id = $message_data['company_id'] ?? 0;
          $item_totle_page = $message_data['item_totle_page'];
          $item_now_page = $message_data['item_now_page'];
          $employee_ids = $message_data['employee_ids'] ?? '';

          // The first page looks back five minutes. Follow-up pages reuse that same
          // lower bound: recomputing it per page would let early rows drop out of
          // the window and shift every later page.
          $end_time = time();
          $start_time = isset($message_data['window_start_time'])
              ? (int) $message_data['window_start_time']
              : $end_time - 60 * 5;

          $query = (new ScrapeDataModel())
              ->where('store_name', $store_name)
              ->where([
                  ['insert_time', '>=', date('Y-m-d H:i:s', $start_time)],
                  ['insert_time', '<=', date('Y-m-d H:i:s', $end_time)],
              ]);
          if ($platform != '0' && !empty($platform)) {
              $query = $query->whereIn('platform_id', is_array($platform) ? $platform : explode(',', $platform));
          }

          // A stable order is required for page-by-page processing.
          // Assumes ids grow with insertion order, so late rows land on later pages — TODO confirm.
          $product_datas = $query->orderBy('id')->paginate($limit, ['*'], 'page', $page)->toArray()['data'];

          if (empty($product_datas)) {
              // Nothing left for this store; once the last store page is reached the
              // execute log is updated (status 0 presumably means "finished" — verify).
              if ($executeLog_id && $item_now_page >= $item_totle_page) {
                  (new ExecuteLogModel())->where('id', $executeLog_id)->update(['status' => 0, 'update_time' => time()]);
              }
              return true;
          }

          // The responsible persons depend only on the company and the candidate ids,
          // never on the scraped row, so they are resolved once per page.
          $responsible = [
              'first_responsible_person' => '',
              'responsible_person' => '',
              'source_responsible_person' => '',
          ];
          if ($specify_responsible_person == 0) {
              $responsible = $this->resolveResponsiblePersons($EmployeeModel, $company_id, $employee_ids);
          }

          foreach ($product_datas as $product_data) {
              $row = $this->buildViolationStoreRow($product_data, $company_id, $CitysModel);
              $ViolationStoreModel->addViolationStore(array_merge($row, $responsible));
          }

          // Continue with the next page.
          $message_data['page'] = $page + 1;
          $message_data['limit'] = $limit;
          $message_data['window_start_time'] = $start_time;
          self::dispatch($message_data)->delay(now()->addSeconds(1));
      }

      /**
       * Build the row passed to addViolationStore() from one scraped row.
       *
       * The three responsible-person fields are returned empty; the caller fills them in.
       *
       * @param array $product_data One scraped row as an array.
       * @param mixed $company_id   Brand company id.
       * @param CitysModel $CitysModel Region model used for the lookups.
       * @return array
       */
      private function buildViolationStoreRow(array $product_data, $company_id, CitysModel $CitysModel)
      {
          $region = $this->resolveRegion($product_data, $CitysModel);

          // Keep only the first http(s) URL when the field carries extra text around it.
          $link_url = $product_data['link_url'];
          if (preg_match('/https?:\/\/[^\s\'"<>]+/i', (string) $link_url, $matches)) {
              $link_url = $matches[0];
          }

          // The anonymous store name wins over the plain one whenever it is filled in.
          $store_name = $product_data['store_name'];
          $anonymous_store_name = $product_data['anonymous_store_name'] ?? '';
          if ((string) $anonymous_store_name !== '') {
              $store_name = $anonymous_store_name;
          }

          return [
              'company_id' => $company_id,
              'source_id' => $product_data['id'],
              'platform' => $product_data['platform_id'],
              'company_name' => $product_data['company_name'],
              'link_url' => $link_url,
              'store_name' => $store_name,
              'social_credit_code' => $product_data['qualification_number'],
              'province_id' => $region['province_id'],
              'province_name' => $region['province_name'],
              'city_id' => $region['city_id'],
              'city_name' => $region['city_name'],
              'area_info' => $region['area_info'],
              'company_category_name' => '',
              'first_responsible_person' => '',
              'responsible_person' => '',
              'source_responsible_person' => '',
              'scrape_date' => $product_data['scrape_date'],
              'collection_time' => strtotime($product_data['insert_time']),
          ];
      }

      /**
       * Work out province/city ids and names (business-licence region) for a scraped row.
       *
       * Names present on the row are normalised and looked up in the region table;
       * when a name is missing, the free-text area_info is scanned for a known region name.
       * Ids already present on the row are kept when no lookup succeeds.
       *
       * @param array $product_data One scraped row as an array.
       * @param CitysModel $CitysModel Region model used for the lookups.
       * @return array Keys: province_id, province_name, city_id, city_name, area_info.
       */
      private function resolveRegion(array $product_data, CitysModel $CitysModel)
      {
          $area_info = $product_data['area_info'] ?? null;
          $area_text = (string) $area_info;
          $province_id = $product_data['province_id'] ?? null;
          $city_id = $product_data['city_id'] ?? null;

          // ---- province ----
          $province_name = $this->normalizeProvinceName($product_data['province_name'] ?? '');
          if ($province_name !== '') {
              $found_id = $this->findRegionId($CitysModel, $province_name, '1');
              if (!empty($found_id)) {
                  $province_id = $found_id;
              } else {
                  // Name could not be mapped to a province id: store it as "unknown".
                  $province_name = '未知';
              }
          } else {
              $match = $this->matchRegionInText($CitysModel, '1', $area_text);
              if ($match !== null) {
                  $province_id = $match['id'];
                  $province_name = $match['name'];
              }
          }

          // ---- city ----
          $city_name = trim((string) ($product_data['city_name'] ?? ''));
          if ($city_name !== '') {
              // County names are looked up untouched and kept even without a match;
              // every other name gets the "市" suffix when it is missing.
              $is_county = strpos($city_name, '县') !== false;
              if (!$is_county && strpos($city_name, '市') === false) {
                  $city_name .= '市';
              }
              $found_id = $this->findRegionId($CitysModel, $city_name, '2');
              if (!empty($found_id)) {
                  $city_id = $found_id;
              } elseif (!$is_county) {
                  $city_name = '未知';
              }
          } elseif (trim($area_text) !== '') {
              $match = $this->matchRegionInText($CitysModel, '2', $area_text);
              if ($match !== null) {
                  $city_id = $match['id'];
                  $city_name = $match['name'];
              }
          }

          // ---- derive the province from the city when only the city is known ----
          if (!empty($city_id) && empty($province_id)) {
              $parent_id = $CitysModel->where([['id', '=', $city_id], ['level', '=', '2']])->value('pid');
              if (!empty($parent_id)) {
                  $province_id = $parent_id;
                  $parent_name = $CitysModel->where([['id', '=', $parent_id], ['level', '=', '1']])->value('name');
                  if ((string) $parent_name !== '') {
                      $province_name = $parent_name;
                  }
              }
          }

          // ---- fall back to "province + city" when no free-text area is available ----
          if (trim($area_text) === '' && trim((string) $city_name) !== '' && trim((string) $province_name) !== '') {
              $area_info = $province_name . $city_name;
          }

          return [
              'province_id' => $province_id,
              'province_name' => $province_name,
              'city_id' => $city_id,
              'city_name' => $city_name,
              'area_info' => $area_info,
          ];
      }

      /**
       * Bring a scraped province name into the spelling used for the region lookup.
       *
       * Municipalities lose their "市" suffix, short names of autonomous regions are
       * expanded, and any other non-empty name without "省" gets "省" appended.
       *
       * @param mixed $province_name Raw province name (may be null).
       * @return string Normalised name, or '' when the input is blank.
       */
      private function normalizeProvinceName($province_name)
      {
          $province_name = trim((string) $province_name);
          if ($province_name === '') {
              return '';
          }

          $known_names = [
              '北京市' => '北京',
              '天津市' => '天津',
              '上海市' => '上海',
              '重庆市' => '重庆',
              '北京' => '北京',
              '天津' => '天津',
              '上海' => '上海',
              '重庆' => '重庆',
              '内蒙古' => '内蒙古自治区',
              '广西' => '广西壮族自治区',
              '西藏' => '西藏自治区',
              '新疆' => '新疆维吾尔自治区',
              '宁夏' => '宁夏回族自治区',
              '内蒙古自治区' => '内蒙古自治区',
              '广西壮族自治区' => '广西壮族自治区',
              '西藏自治区' => '西藏自治区',
              '新疆维吾尔自治区' => '新疆维吾尔自治区',
              '宁夏回族自治区' => '宁夏回族自治区',
          ];
          if (isset($known_names[$province_name])) {
              return $known_names[$province_name];
          }

          return strpos($province_name, '省') === false ? $province_name . '省' : $province_name;
      }

      /**
       * Look up the id of a region by exact name and level.
       *
       * @param CitysModel $CitysModel
       * @param string $name
       * @param string $level '1' = province level, '2' = city level
       * @return mixed The id, or null when no row matches.
       */
      private function findRegionId(CitysModel $CitysModel, $name, $level)
      {
          return $CitysModel->where([['name', '=', $name], ['level', '=', $level]])->value('id');
      }

      /**
       * Find the first region of the given level whose name occurs inside a free text.
       *
       * The region list of a level is loaded once and reused for the rest of the run.
       *
       * @param CitysModel $CitysModel
       * @param string $level '1' = province level, '2' = city level
       * @param string $text Text to scan (e.g. area_info).
       * @return array|null ['id' => ..., 'name' => ...] of the first match, or null.
       */
      private function matchRegionInText(CitysModel $CitysModel, $level, $text)
      {
          if ($text === '') {
              return null;
          }
          if (!isset($this->region_rows[$level])) {
              $this->region_rows[$level] = $CitysModel->where([['level', '=', $level]])->select(['id', 'name'])->get()->toArray();
          }
          foreach ($this->region_rows[$level] as $region) {
              $region_name = (string) $region['name'];
              // An empty needle would match every text (PHP 8) or raise a warning (PHP 7).
              if ($region_name !== '' && strpos($text, $region_name) !== false) {
                  return ['id' => $region['id'], 'name' => $region_name];
              }
          }
          return null;
      }

      /**
       * Resolve the responsible-person fields from the candidate employee ids.
       *
       * NOTE(review): source_responsible_person is wrapped in commas (",1,2,") only
       * when both groups are non-empty and is a plain id list otherwise. That
       * asymmetry is kept from the previous implementation; confirm what readers
       * of the column expect.
       *
       * @param EmployeeModel $EmployeeModel
       * @param mixed $company_id
       * @param string|array $employee_ids Comma separated ids or an array of ids.
       * @return array Keys: first_responsible_person, responsible_person, source_responsible_person.
       */
      private function resolveResponsiblePersons(EmployeeModel $EmployeeModel, $company_id, $employee_ids)
      {
          $candidates = is_array($employee_ids) ? $employee_ids : explode(',', (string) $employee_ids);
          // explode() on an empty string yields [''], so blank entries are dropped.
          $candidates = array_values(array_filter(array_map('trim', $candidates), function ($id) {
              return $id !== '';
          }));

          $first_responsible_person = '';
          $responsible_person = '';
          if (!empty($candidates)) {
              // duty_type: 1 = first responsible person, 2 = responsible person
              $first_responsible_person = $this->findEmployeeIdsByDuty($EmployeeModel, $company_id, $candidates, 1);
              $responsible_person = $this->findEmployeeIdsByDuty($EmployeeModel, $company_id, $candidates, 2);
          }

          if ($first_responsible_person !== '' && $responsible_person !== '') {
              $merged = array_unique(array_merge(
                  explode(',', $first_responsible_person),
                  explode(',', $responsible_person)
              ));
              $source_responsible_person = ',' . implode(',', $merged) . ',';
          } elseif ($first_responsible_person !== '') {
              $source_responsible_person = $first_responsible_person;
          } else {
              $source_responsible_person = $responsible_person;
          }

          return [
              'first_responsible_person' => $first_responsible_person,
              'responsible_person' => $responsible_person,
              'source_responsible_person' => $source_responsible_person,
          ];
      }

      /**
       * Ids of the company's employees (status 0) among the candidates that hold the given duty type.
       *
       * whereIn() is used for the id list: passing ['id', 'in', [...]] to where()
       * is not an "IN" condition in the Laravel query builder.
       *
       * @param EmployeeModel $EmployeeModel
       * @param mixed $company_id
       * @param array $employee_id_list Non-empty list of candidate ids.
       * @param int $duty_type 1 = first responsible person, 2 = responsible person
       * @return string Comma separated ids, '' when nobody matches.
       */
      private function findEmployeeIdsByDuty(EmployeeModel $EmployeeModel, $company_id, array $employee_id_list, $duty_type)
      {
          return $EmployeeModel
              ->where([
                  ['company_id', '=', $company_id],
                  ['status', '=', 0],
                  ['duty_type', '=', $duty_type],
              ])
              ->whereIn('id', $employee_id_list)
              ->pluck('id')
              ->implode(',');
      }

      /**
       * Log a job that failed for good.
       *
       * @param \Throwable $exception The throwable passed in for the failure.
       * @return void
       */
      public function failed(\Throwable $exception)
      {
          Log::info('job_error', '数据清洗-违规店铺清洗数据队列完全失败', ['data' => $this->message_data, 'error' => $exception->getMessage()]);
      }
  }