parsescp.py 322 B

1234567891011121314
import re
import sys

import bs4
  4. scp = sys.stdin.read()
  5. b = bs4.BeautifulSoup(scp)
  6. mainpage = b.find({"div":{"id":"page-content"}})
  7. splitted = mainpage.getText().split(" ")[1]
  8. r = re.compile(r'rating.*\d*')
  9. matches = r.findall(splitted)
  10. splitted = splitted.replace(matches[0],"")
  11. print(splitted)