Explorar o código

fix: 修复灰豚rpa没有数据卡住的问题

wuwenyi hai 6 meses
pai
achega
f7b242f0d4
Modificáronse 2 ficheiros con 8 adicións e 4 borrados
  1. +7 -3
      huitun/__init__.py
  2. +1 -1
      xhs/__init__.py

+ 7 - 3
huitun/__init__.py

@@ -51,11 +51,15 @@ class HuiTunBrowser(BaseBrowser):
             self.page.wait_for_timeout(500)
             self.page.on('response', self.search_note_handler)
             self.page.get_by_text('近3天', exact=True).click()
-            while size is None or len(self.list_result) < size:
-                logging.info('继续搜索用户主页')
+            # 限定一个上限
+            page_num = int(2 * size / 10)
+            for i in range(page_num):
+                if size is not None and len(self.list_result) >= size:
+                    break
+                logging.info('继续搜索灰豚')
                 self.page.evaluate("window.scrollTo(0, document.body.scrollHeight)")
                 self.page.wait_for_timeout(2000)
-                logging.info('搜索用户主页图文结果数:%s', len(self.list_result))
+                logging.info('搜索灰豚结果数:%s', len(self.list_result))
                 if not self.has_more:
                     break
             return self.list_result

+ 1 - 1
xhs/__init__.py

@@ -82,7 +82,7 @@ class XhsBrowser(BaseBrowser):
                 huitun_note['authorInfo'] = note_info.get('user')
                 if note_info.get('imageList'):
                     huitun_note['imageList'] = [img.get('urlDefault') for img in note_info.get('imageList')]
-                sleep(4)
+                self.page.wait_for_timeout(4000)
             except Exception as e:
                 utils.logger.error(f"爬取小红书异常 {e}")