Home > Backend Development > Python Tutorial > How to use aiohttp in Python

How to use aiohttp in Python

WBOY · Reposted: 2023-05-11 09:22:05 · 2232 views

1. Definition

aiohttp is an asynchronous HTTP networking library built on asyncio. It provides both a server and a client.

2. Basic usage

import aiohttp
import asyncio


async def fetch(session, url):
    """Download ``url`` through ``session`` and return ``(body_text, status)``."""
    # session.get() is used as an asynchronous context manager, so the
    # response is released when the block exits.
    async with session.get(url) as resp:
        # resp.text() is a coroutine and must be awaited to obtain the body.
        body = await resp.text()
        return body, resp.status


async def main():
    """Fetch the demo page and print the first 100 characters and the status."""
    # ClientSession is an asynchronous context manager; leaving the block
    # closes the session.
    async with aiohttp.ClientSession() as session:
        html, status = await fetch(session, 'https://cuiqingcai.com')
        print(f'html: {html[:100]}...')
        print(f'status: {status}')


if __name__ == '__main__':
    # asyncio.run() (Python 3.7+) creates the event loop, runs main() to
    # completion and closes the loop, so no explicit loop handling is needed.
    asyncio.run(main())

3. Request types

# Besides get(), ClientSession offers one method per HTTP verb. Like get(),
# each call is meant to be used with `async with` inside a coroutine.
session.post('http://httpbin.org/post', data=b'data')
session.put('http://httpbin.org/put', data=b'data')
session.delete('http://httpbin.org/delete')
session.head('http://httpbin.org/get')
session.options('http://httpbin.org/get')
session.patch('http://httpbin.org/patch', data=b'data')

4. Response fields

print(&#39;status:&#39;, response.status) # 状态码
print(&#39;headers:&#39;, response.headers)# 响应头
print(&#39;body:&#39;, await response.text())# 响应体
print(&#39;bytes:&#39;, await response.read())# 响应体二进制内容
print(&#39;json:&#39;, await response.json())# 响应体json数据

5. Timeout setting

import aiohttp
import asyncio
async def main():
    """Request httpbin with a one-second total timeout and print the status."""
    # Set a timeout of 1 second for the whole request.
    timeout = aiohttp.ClientTimeout(total=1)
    # The timeout is configured on the session, so it applies to the
    # request issued through it below.
    async with aiohttp.ClientSession(timeout=timeout) as session:
        async with session.get('https://httpbin.org/get') as response:
            print('status:', response.status)
if __name__ == '__main__':
    # asyncio.run() (Python 3.7+) replaces the deprecated
    # get_event_loop().run_until_complete() start-up idiom.
    asyncio.run(main())

6. Concurrency limit

import asyncio
import aiohttp
# Maximum number of requests allowed to run at the same time.
CONCURRENCY = 5
# Acquired by every scrape_api() call to enforce the limit above.
semaphore = asyncio.Semaphore(CONCURRENCY)
URL = 'https://www.baidu.com'

# Shared client session; assigned by main() before any request is issued.
session = None
async def scrape_api():
    """Fetch URL while holding the shared semaphore and return the body text."""
    # Only CONCURRENCY coroutines can be inside this block at once; the rest
    # wait here until a slot is released.
    async with semaphore:
        print('scraping', URL)
        async with session.get(URL) as response:
            # One-second pause while the semaphore slot is still held.
            await asyncio.sleep(1)
            return await response.text()
    
async def main():
    """Open the shared session and run 10000 scrape_api() calls concurrently."""
    global session
    # Binding the global through `async with` closes the session when the
    # block is left; the original never closed it.
    async with aiohttp.ClientSession() as session:
        scrape_index_tasks = [asyncio.ensure_future(scrape_api()) for _ in range(10000)]
        await asyncio.gather(*scrape_index_tasks)
if __name__ == '__main__':
    # asyncio.run() replaces the deprecated
    # get_event_loop().run_until_complete() idiom.
    # NOTE: the module-level Semaphore relies on Python 3.10+, where asyncio
    # primitives bind to the running loop lazily; on older versions create
    # the semaphore inside main() instead.
    asyncio.run(main())

7. Practical application

import asyncio
import aiohttp
import logging
import json
# Log timestamp, level and message for every record at INFO and above.
logging.basicConfig(level=logging.INFO,
                    format='%(asctime)s - %(levelname)s: %(message)s')
# Index endpoint; {offset} is filled in per page by scrape_index().
INDEX_URL = 'https://dynamic5.scrape.center/api/book/?limit=18&offset={offset}'
DETAIL_URL = 'https://dynamic5.scrape.center/api/book/{id}'
# Used by scrape_index() to turn a page number into an offset.
PAGE_SIZE = 18
# Number of index pages requested by main().
PAGE_NUMBER = 100
# Maximum number of requests allowed to run at the same time.
CONCURRENCY = 5

semaphore = asyncio.Semaphore(CONCURRENCY)
# Shared client session; assigned by main() before any request is issued.
session = None

async def scrape_api(url):
    """Fetch ``url`` under the shared semaphore and return its parsed JSON.

    Returns None when the request raises aiohttp.ClientError; the error is
    logged with its traceback instead of being propagated.
    """
    async with semaphore:
        try:
            logging.info('scraping %s', url)
            async with session.get(url) as response:
                return await response.json()
        except aiohttp.ClientError:
            logging.error('error occurred while scraping %s', url, exc_info=True)
            # Explicit so callers can see that a failed page yields None.
            return None

async def scrape_index(page):
    """Scrape the index page numbered ``page`` and return scrape_api()'s result."""
    # Page 1 maps to offset 0, page 2 to PAGE_SIZE, and so on.
    offset = (page - 1) * PAGE_SIZE
    index_url = INDEX_URL.format(offset=offset)
    result = await scrape_api(index_url)
    return result

async def main():
    """Scrape every index page concurrently and log the collected results."""
    global session
    # Binding the global through `async with` closes the session when the
    # block is left; the original never closed it.
    async with aiohttp.ClientSession() as session:
        scrape_index_tasks = [asyncio.ensure_future(scrape_index(page)) for page in range(1, PAGE_NUMBER + 1)]
        results = await asyncio.gather(*scrape_index_tasks)
    # Pages whose request failed appear as null: scrape_api() returns None
    # after logging a ClientError.
    logging.info('results %s', json.dumps(results, ensure_ascii=False, indent=2))
   

if __name__ == '__main__':
    # asyncio.run() replaces the deprecated
    # get_event_loop().run_until_complete() idiom.
    # NOTE: the module-level Semaphore relies on Python 3.10+, where asyncio
    # primitives bind to the running loop lazily; on older versions create
    # the semaphore inside main() instead.
    asyncio.run(main())

The above is the detailed content of How to use aiohttp in Python. For more information, please follow other related articles on the PHP Chinese website!

Python 并发异步 http

Statement：

This article is reproduced from yisu.com. If there is any infringement, please contact admin@php.cn to have it removed.

Previous article: How to implement lottery system in Python | Next article: How to implement lottery system in Python

See more