Commit c5426fd1 authored by jimmy

提交boss

parent 31996e88
...@@ -31,7 +31,7 @@ def SaveCompanyData(name,types,intro): ...@@ -31,7 +31,7 @@ def SaveCompanyData(name,types,intro):
} }
json_data = json.dumps(post_data) json_data = json.dumps(post_data)
response = requests.post(cyaml.data[cyaml.data["env"]]["url"]+cyaml.data["php-api"]["getcompany"], data=json_data, headers={"Content-Type": "application/json"}) response = requests.post(cyaml.data[cyaml.data["env"]]["url"]+cyaml.data["php-api"]["getcompany"], data=json_data, headers={"Content-Type": "application/json"})
# Log("保存数据时候的返回:" + response)
# 检查响应状态码 # 检查响应状态码
if response.status_code == 200: if response.status_code == 200:
response_data = response.json() response_data = response.json()
......
...@@ -17,6 +17,7 @@ def GetBaiduCompany(playwright: Playwright) -> int: ...@@ -17,6 +17,7 @@ def GetBaiduCompany(playwright: Playwright) -> int:
page = context.new_page() page = context.new_page()
#获取需要爬取数据的公司 #获取需要爬取数据的公司
name,url = crawler.GetCompany(1) name,url = crawler.GetCompany(1)
crawler.Log(name + "-百度开始请求数据:" + url)
if url!="": if url!="":
page.goto(url) page.goto(url)
all = page.locator(".lemma-summary").all_text_contents() all = page.locator(".lemma-summary").all_text_contents()
......
...@@ -6,6 +6,7 @@ import cyaml ...@@ -6,6 +6,7 @@ import cyaml
def spider_company(page): def spider_company(page):
company_nameO, url = crawler.GetCompany(2) company_nameO, url = crawler.GetCompany(2)
crawler.Log(company_nameO + "-boss开始请求数据:" + url)
if url != "": if url != "":
page.goto(url) page.goto(url)
page.wait_for_timeout(3000) page.wait_for_timeout(3000)
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment