(root_url, page_url_list)
| 26 | return url_part_list |
| 27 | |
async def get_all_info_page_url(root_url, page_url_list):
    """Collect the absolute info-page URLs found on every listing page.

    Each URL in ``page_url_list`` is handed to ``get_info_page_url`` together
    with one shared ``aiohttp.ClientSession``. Every URL part those calls
    return is prefixed with ``root_url``.

    Args:
        root_url: Prefix prepended to each returned URL part.
        page_url_list: Iterable of page URLs to process.

    Returns:
        A list of ``root_url + url_part`` strings, ordered like
        ``page_url_list``. An empty input yields an empty list.

    Raises:
        Whatever ``get_info_page_url`` raises for a page; the first such
        exception propagates to the caller.
    """
    page_urls = list(page_url_list)
    if not page_urls:
        # Nothing to fetch: skip opening a session (asyncio.wait used to
        # raise ValueError on an empty task set here).
        return []

    # Limit the number of coroutines running get_info_page_url at once.
    # The semaphore has to be acquired per task; holding it once around
    # the whole fan-out does not limit anything.
    semaphore = asyncio.Semaphore(50)

    async def fetch_limited(url, session):
        async with semaphore:
            return await get_info_page_url(url, session)

    async with aiohttp.ClientSession() as session:
        # gather() accepts coroutines directly (asyncio.wait no longer does
        # on Python 3.11+) and returns results in input order.
        results = await asyncio.gather(
            *(fetch_limited(url, session) for url in page_urls)
        )

    return [
        root_url + url_part
        for url_parts in results
        for url_part in url_parts
    ]
| 39 | |
| 40 | |
| 41 | def get_data(url): |
no test coverage detected