提交boss

c5426fd1 · jimmy · 31996e88 · c5426fd1 · c5426fd1 · c5426fd1
Commit c5426fd1 authored Aug 31, 2023 by jimmy
Show whitespace changes
Inline Side-by-side

Showing 3 changed files with 3 additions and 1 deletion

crawler.py +1 -1

crawler_baidu.py +1 -0

crawler_boss.py +1 -0

No files found.
--- a/crawler.py
+++ b/crawler.py
@@ -31,7 +31,7 @@ def SaveCompanyData(name,types,intro):
    }
    json_data = json.dumps(post_data)
    response = requests.post(cyaml.data[cyaml.data["env"]]["url"]+cyaml.data["php-api"]["getcompany"], data=json_data, headers={"Content-Type": "application/json"})
+    # Log("保存数据时候的返回：" + response.text)
    # 检查响应状态码
    if response.status_code == 200:
        response_data = response.json()

--- a/crawler_baidu.py
+++ b/crawler_baidu.py
@@ -17,6 +17,7 @@ def GetBaiduCompany(playwright: Playwright) -> int:
    page = context.new_page()
    #获取需要爬取数据的公司
    name,url = crawler.GetCompany(1)
+    crawler.Log(name + "-百度开始请求数据：" + url)
    if url!="":
        page.goto(url)
        all = page.locator(".lemma-summary").all_text_contents()

--- a/crawler_boss.py
+++ b/crawler_boss.py
@@ -6,6 +6,7 @@ import cyaml
 def spider_company(page):
    company_nameO, url = crawler.GetCompany(2)
+    crawler.Log(company_nameO + "-boss开始请求数据：" + url)
    if url != "":
        page.goto(url)
        page.wait_for_timeout(3000)