diff options
Diffstat (limited to 'day1/task4')
| -rw-r--r-- | day1/task4/task4.py | 25 | ||||
| -rw-r--r-- | day1/task4/task4_data.html | 13 |
2 files changed, 38 insertions, 0 deletions
"""Day 1, task 4: write two cleaned-up copies of ``task4_data.html``.

Run from the directory that contains ``task4_data.html``.  The script
creates a sibling directory ``../htmls`` and writes into it:

* ``ascii_cleared.html`` -- the input with every character that is not in
  ``string.printable`` removed;
* ``body_cleared.html`` -- the input with the ``<BODY>...</BODY>`` section
  collapsed onto a single line (newlines inside it removed).  This file is
  built from the original, unfiltered text.
"""
import os
import re
import string

INPUT_NAME = 'task4_data.html'
OUTPUT_DIR = 'htmls'

# A set gives O(1) membership tests; ``string.printable`` itself is a str,
# so ``in`` on it is a linear scan per character.
_PRINTABLE = frozenset(string.printable)

# DOTALL lets ``.`` match newlines, replacing the slower ``(.|\n)`` spelling.
# The match is non-greedy so each BODY section is handled on its own.
_BODY_RE = re.compile(r'<BODY>.*?</BODY>', re.DOTALL)


def strip_non_printable(text):
    """Return *text* without characters outside ``string.printable``."""
    return ''.join(char for char in text if char in _PRINTABLE)


def inline_body(text):
    """Return *text* with newlines removed inside each ``<BODY>...</BODY>``.

    Text outside the BODY section is returned unchanged; if there is no
    BODY section the input comes back as is.
    """
    return _BODY_RE.sub(lambda match: match.group(0).replace('\n', ''), text)


def main():
    """Read the input file and write both cleaned copies to ``../htmls``."""
    # The fixture contains Cyrillic text, so decode explicitly instead of
    # relying on the platform's default encoding.
    with open(INPUT_NAME, encoding='utf-8') as f:
        data = f.read()

    # Not sure why, but the assignment says to do it this way.
    os.chdir('..')
    # exist_ok keeps a second run from failing with FileExistsError.
    os.makedirs(OUTPUT_DIR, exist_ok=True)
    os.chdir(OUTPUT_DIR)

    with open('ascii_cleared.html', 'w', encoding='utf-8') as f:
        f.write(strip_non_printable(data))

    with open('body_cleared.html', 'w', encoding='utf-8') as f:
        f.write(inline_body(data))


if __name__ == '__main__':
    main()


# Companion input file added by the same change, day1/task4/task4_data.html
# (indentation reconstructed):
#
# <!DOCTYPE html PUBLIC "-//IETF//DTD HTML 2.0//EN">
# <HTML>
#    <HEAD>
#       <TITLE>
#          A Small Hello. Это по идеи заголовок.
#       </TITLE>
#    </HEAD>
# <BODY>
#    <H1>Hi я интерактивная страница</H1>
#    <P>I want to be inline, in my source code</P>
#    <P>This is very minimal "hello world" HTML document.</P>
# </BODY>
# </HTML>