" not in str(content): parm = True html = pq(content, parser="html") a = [] if html.children(): for line in html.children().items(): if str(line).startswith("", "\n").replace("
", "\n").replace("
", "\n") + "\n") else: if "
" in str(line) or "
" in str(line) or "
" in str(line): line = str(line).replace("
", "###").replace("
", "###").replace("
", "###") line = pq(line) new_line = list(map(lambda x: str(x) + "\n", line.text().split("###"))) a.extend(new_line) else: if line.text().strip(): a.append(line.text() + "\n") elif str(line).startswith("

"): line = re.sub(r'', "", str(line.html())) b = line.replace('

', ""). \ replace("
", "\n"). \ replace("
", "\n"). \ replace("
", "\n"). \ replace('

', "\n").\ replace('

', "\n") b_list = b.split("\n") # b_list = list(filter(lambda x: str(x), b_list)) b_list = list(filter(filter_data, b_list)) b_list = list(map(lambda x: str(x) + "\n", b_list)) a.extend(b_list) elif str(line).startswith("', "", str(content)) content = re.sub(r'', "", str(content)) content = str(content).replace("", "") content = str(content).replace('

', "\n") parm = False if "

" not in str(content): parm = True html = pq(content, parser="html") a = [] if html.children(): for line in html.children().items(): if str(line).startswith("", "\n").replace("
", "\n").replace("
", "\n") + "\n") else: line = replace_k(line) if "
" in str(line) or "
" in str(line) or "
" in str(line): line = str(line).replace("
", "###").replace("
", "###").replace("
", "###") line = pq(line) new_line = list(map(lambda x: str(x).replace("+", "\xa0") + "\n", line.text().split("###"))) a.extend(new_line) else: if line.text().strip(): a.append(line.text().replace("+", "\xa0") + "\n") elif str(line).startswith("

"): line = re.sub(r'', "", str(line.html())) b = line.replace('

', ""). \ replace("
", "\n"). \ replace("
", "\n"). \ replace("
", "\n"). \ replace('

', "\n"). \ replace('

', "\n") b_list = b.split("\n") # b_list = list(filter(lambda x: str(x), b_list)) b_list = list(filter(filter_data, b_list)) b_list = list(map(lambda x: str(x) + "\n", b_list)) a.extend(b_list) elif str(line).startswith(" Amelia Earhart was borm in 1897 in Kansas She and her younger sister Muriel were very active. They

rode horses, played baseball and basketball.

In 1916 Amelia completed high school and then prepared to enter