可以使用正则表达式或CSS Selector来定位并提取需要的信息,例如App名称、开发者、评分等。具体示例代码如下:
使用正则表达式(先用 BeautifulSoup 的 find 定位元素,再用正则表达式提取评分):
import re

import requests
from bs4 import BeautifulSoup

# Example: fetch an App Store product page and extract the app name,
# developer, rating and description. Elements are located with
# BeautifulSoup `find`; a regular expression is used only for the rating.
url = 'https://apps.apple.com/us/app/tiktok-make-your-day/id1235601864'

# requests applies no timeout by default, so set one to avoid hanging
# forever, and fail fast on HTTP errors instead of parsing an error page.
response = requests.get(url, timeout=10)
response.raise_for_status()
soup = BeautifulSoup(response.content, 'html.parser')

# NOTE: find() returns None when an element is missing (for example if the
# page markup changes), in which case .get_text() raises AttributeError.
app_name = soup.find('h1', {'class': 'product-header__title'}).get_text()
developer = soup.find('a', {'class': 'link'}).get_text()
# The dot is escaped so that only a literal decimal point matches
# (an unescaped `.` would match any character between the two digits).
rating = re.findall(
    r'(\d\.\d)',
    str(soup.find('div', {'class': 'we-customer-ratings__averages__display'})),
)
description = soup.find('div', {'class': 'section__description'}).find('p').get_text()

print('App名称:', app_name)
print('开发者:', developer)
# findall() returns an empty list when no rating is found; avoid IndexError.
print('评分:', rating[0] if rating else 'N/A')
print('简介:', description)
使用CSS Selector:
import requests
from bs4 import BeautifulSoup

# Example: fetch an App Store product page and extract the app name,
# developer, rating and description using CSS selectors (`select_one`).
url = 'https://apps.apple.com/us/app/tiktok-make-your-day/id1235601864'

# requests applies no timeout by default, so set one to avoid hanging
# forever, and fail fast on HTTP errors instead of parsing an error page.
response = requests.get(url, timeout=10)
response.raise_for_status()
soup = BeautifulSoup(response.content, 'html.parser')

# NOTE: select_one() returns None when nothing matches the selector (for
# example if the page markup changes), in which case .get_text() raises
# AttributeError.
app_name = soup.select_one('h1.product-header__title').get_text()
developer = soup.select_one('a.link').get_text()
# The rating text is taken from the direct child <div> of the ratings
# container and stripped of surrounding whitespace.
rating = soup.select_one('div.we-customer-ratings__averages__display > div').get_text().strip()
description = soup.select_one('div.section__description > p').get_text()

print('App名称:', app_name)
print('开发者:', developer)
print('评分:', rating)
print('简介:', description)