-
Notifications
You must be signed in to change notification settings - Fork 10
/
Copy pathheadless.py
42 lines (33 loc) · 1.13 KB
/
headless.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
"""Controls headless Chrome."""
import json
import urllib.parse

import pyppeteer
async def search_users(search_term: str, max_result_num=5):
    """Search users on zhihu with the given search term.

    This function has to be async because pyppeteer only supports async usage.

    Args:
        search_term: Text to search for. It is percent-encoded before being
            placed in the request URL, so spaces and reserved characters
            such as ``&`` or ``#`` are sent as part of the query.
        max_result_num: Maximum number of users to return. A value of zero
            or less yields an empty list.

    Returns:
        A list of dicts, in the order the API returned them, each with the
        keys ``"name"`` (with ``<em>``/``</em>`` markers removed),
        ``"url_token"`` and ``"avatar_url"``.

    Raises:
        json.JSONDecodeError: If the text of the page's ``<pre>`` element is
            not valid JSON.
        KeyError: If the response lacks ``"data"``, or an entry lacks
            ``"object"`` or one of the expected user fields.
    """
    # Encode everything (safe="") so characters like "&", "#", "/" or spaces
    # in the search term cannot alter the structure of the query string.
    encoded_term = urllib.parse.quote(search_term, safe="")
    url = f"https://www.zhihu.com/api/v4/search_v3?t=people&q={encoded_term}"

    browser = await pyppeteer.launch()
    try:
        page = await browser.newPage()
        await page.goto(url)
        await page.waitForSelector("pre")
        # textContent returns the raw text of the element; innerHTML would
        # return HTML-serialized text in which "&", "<" and ">" are replaced
        # by entities, corrupting the JSON string values.
        raw_json = await page.evaluate(
            """
            () => {
                return document.querySelector("pre").textContent;
            }
            """
        )
    finally:
        # Always shut the browser down, even when navigation or evaluation
        # fails, so no headless Chrome process is left behind.
        await browser.close()

    search_results = json.loads(raw_json)

    users_info = []
    for result in search_results["data"]:
        if len(users_info) >= max_result_num:
            break
        user_object = result["object"]
        users_info.append(
            {
                # The name carries <em> markers around the matched text;
                # strip them to get the plain display name.
                "name": user_object["name"].replace("<em>", "").replace("</em>", ""),
                "url_token": user_object["url_token"],
                "avatar_url": user_object["avatar_url"],
            }
        )
    return users_info