fork download
  1. # Extract the content of the page
  2. def get_page_data(html):
  3. soup = BeautifulSoup(html, 'lxml')
  4.  
  5. try:
  6. name = soup.find('h1').text.strip()
  7. except:
  8. name = ''
  9.  
  10. try:
  11. article = soup.find_all('span').text.strip()
  12. except:
  13. article = ''
  14.  
  15. try:
  16. komplekt = soup.find_all('strong').text.strip()
  17. except:
  18. komplekt = ''
  19.  
  20. try:
  21. composition = soup.find_all('p').text.strip()
  22. except:
  23. composition = ''
  24.  
  25. try:
  26. characteristics = soup.find('ul').find_all('li').text.strip()
  27. except:
  28. characteristics = ''
  29.  
  30.  
  31. data = {'name': name,
  32. 'article': article,
  33. 'komplekt': komplekt,
  34. 'composition': composition,
  35. 'characteristics': characteristics}
  36. print(data)
  37. return data
Success #stdin #stdout 0.02s 9308KB
stdin
Standard input is empty
stdout
Standard output is empty