Browse Source

feat: 每次爬取都判断是否有校验

wuwenyi 6 months ago
parent
commit
4168ff3c18
1 changed file with 2 additions and 1 deletion
  1. 2 1
      xhs/__init__.py

+ 2 - 1
xhs/__init__.py

@@ -82,12 +82,13 @@ class XhsBrowser(BaseBrowser):
                 huitun_note['authorInfo'] = note_info.get('user')
                 if note_info.get('imageList'):
                     huitun_note['imageList'] = [img.get('urlDefault') for img in note_info.get('imageList')]
-                sleep(2)
+                sleep(4)
             except Exception as e:
                 utils.logger.error(f"爬取小红书异常 {e}")
 
     def get_note(self, note_id: str):
         """Open a note's explore page in the browser and return its embedded note data.

         Args:
             note_id: Identifier of the note; used both in the page URL and as
                 the key into the page's ``noteDetailMap``.

         Returns:
             The value ``json.loads`` decodes from the JSON string of
             ``window.__INITIAL_STATE__.note.noteDetailMap[note_id].note``.

         NOTE(review): when ``window.__INITIAL_STATE__`` is falsy the evaluated
         expression yields that falsy value instead of a JSON string, so
         ``json.loads`` will presumably raise -- confirm how callers handle it.
         """
         # note = self.xhs_client.get_note_by_id(note_id=note_id)
         # Navigate to the note page; only wait for the 'domcontentloaded' event.
         self.page.goto(f'{XHS_URL}/explore/{note_id}', wait_until='domcontentloaded')
         # Run the rotate_ident handler after every navigation (presumably deals
         # with a verification challenge on the page -- TODO confirm).
+        self.rotate_ident.handle_rotate()
         # Serialize the note object inside the page; the `&&` guard short-circuits
         # when __INITIAL_STATE__ is missing.
         data = self.page.evaluate('noteId => window.__INITIAL_STATE__ && JSON.stringify(window.__INITIAL_STATE__.note.noteDetailMap[noteId].note)', note_id)
         return json.loads(data)