naibo 2 年之前
父节点
当前提交
d4d695c747
共有 2 个文件被更改,包括 5 次插入和 2 次删除
  1. +4 -1
      .temp_to_pub/EasySpider_windows_x64/Code/easyspider_executestage.py
  2. +1 -1
      .temp_to_pub/compress.py

+ 4 - 1
.temp_to_pub/EasySpider_windows_x64/Code/easyspider_executestage.py

@@ -1144,7 +1144,10 @@ class BrowserThread(Thread):
 
     # 提取数据事件
     def getData(self, para, loopElement, isInLoop=True, parentPath="", index=0):
-        pageHTML = etree.HTML(self.browser.page_source)
+        try:
+            pageHTML = etree.HTML(self.browser.page_source)
+        except:
+            pageHTML = ""
         if loopElement != "":  # 只在数据在循环中提取时才需要获取循环元素
             try:
                 loopElementOuterHTML = loopElement.get_attribute('outerHTML')

+ 1 - 1
.temp_to_pub/compress.py

@@ -65,7 +65,7 @@ if __name__ == "__main__":
             os.remove("./EasySpider_windows_x64/mysql_config.json")
         os.mkdir("./EasySpider_windows_x64/Data")
         os.mkdir("./EasySpider_windows_x64/execution_instances")
-        # compress_folder_to_7z_split("./EasySpider_windows_x64", file_name)
+        compress_folder_to_7z_split("./EasySpider_windows_x64", file_name)
         print(f"Compress {file_name} Split successfully!")
         compress_folder_to_7z("./EasySpider_windows_x64", file_name)
         print(f"Compress {file_name} successfully!")