diff --git a/clear_html.py b/clear_html.py new file mode 100644 index 0000000..609ab12 --- /dev/null +++ b/clear_html.py @@ -0,0 +1,18 @@ +with open('test', 'r') as f: + l = f.readlines() + f.close() + +ll = l[0].split('title="') + +lt = [] +for x in ll: + buffer = '' + cc = 0 + while x[cc] != '"': + buffer += x[cc] + cc += 1 + lt.append(buffer) + +lt.remove('