Python 如何找到第一级的后代?
请帮助修复脚本Python 如何找到第一级的后代?,python,python-3.x,beautifulsoup,Python,Python 3.x,Beautifulsoup,请帮助修复脚本 import pprint import requests import bs4 def get_catalog(url): req = requests.get(url) if req.status_code != requests.codes.ok: print('Error: ', req.status_code) else: soup = bs4.BeautifulSoup(req.text)
import pprint
import requests
import bs4
def get_catalog(url):
req = requests.get(url)
if req.status_code != requests.codes.ok:
print('Error: ', req.status_code)
else:
soup = bs4.BeautifulSoup(req.text)
#print(soup)
catalogMenu = soup.find('section', {'class': 'catalog'})
catalogMenuList = catalogMenu.find('ul', {'class': 'topnav'})
#print(catalogMenuList)
return catalogMenuList
def parse_catalog_categories(catalogMenuList):
catalogNames = []
#li = catalogMenuList.findNext('li', limit=1) #?????????????????
pprint.pprint(li)
if __name__ == "__main__":
url = 'http://first-store.ru/'
catalogMenuList = get_catalog(url)
if not catalogMenuList:
print('Get catalog error')
else:
parse_catalog_categories(catalogMenuList)
问题是我找不到li
第一级嵌套的所有后代。即:
iphone, ipad, ipod, imac, etc...
但不是:
iphone, iphone 5s, iphone 5s VIP, iphone 5c, .....
尝试将
recursive=False
设置为仅在标记的直接子级中搜索:
items = catalogMenuList.find_all('li', recursive=False)
请在问题中加入相关的输入/输出。特别是,您能否显示一个包含
项的小html片段以及相应的预期输出?