json
re
requests
bs4 BeautifulSoup
(url):
response = requests.get(url)
response.encoding = soup = BeautifulSoup(response.text, )
content = soup.find_all()
data = []
para content:
text = para.get_text(=)
text: data.append(text)
data_str = .join(data)
data_str
(data_str):
pattern = re.compile(, re.DOTALL)
lawarticles = {}
match pattern.finditer(data_str):
articlenumber = match.group()
articlecontent = match.group().replace(+ articlenumber + , ).strip()
lawarticles[articlenumber] = articlecontent
jsonstr = json.dumps(lawarticles, =, =)
jsonstr
__name__ == :
url = data_str = fetch_and_parse(url)
json_str = extract_law_articles(data_str)
(json_str)