summaryrefslogtreecommitdiff
path: root/day1/task4/task4.py
diff options
context:
space:
mode:
authorАндрей Гущин <saintruler@gmail.com>2019-03-15 19:32:22 +0300
committerАндрей Гущин <saintruler@gmail.com>2019-03-15 19:32:22 +0300
commit77ad522100a55724844dd9acd693a8d51b9e7ea3 (patch)
treea1b7e8590159805a43ba725dc31e580c8c8194f4 /day1/task4/task4.py
parent3c461a4190135e070b50cfad12da2532095392fe (diff)
parent5e4ba61600e76d6abab144767312fdf19663f373 (diff)
Merge branch 'day1_task4' into 'master'
Day 1 Task 4 See merge request saintruler/trainee!4
Diffstat (limited to 'day1/task4/task4.py')
-rw-r--r--day1/task4/task4.py60
1 files changed, 60 insertions, 0 deletions
diff --git a/day1/task4/task4.py b/day1/task4/task4.py
new file mode 100644
index 0000000..2583cb4
--- /dev/null
+++ b/day1/task4/task4.py
@@ -0,0 +1,60 @@
+import string
+import re
+import os
+
+
+html_path = os.path.join(os.getcwd(), 'task4_data.html')
+
+folder_path = ''
+
+# Не знаю зачем, но в задании так написано
+try:
+ os.mkdir('../htmls')
+ folder_path = '../htmls'
+except PermissionError:
+ print('Директория на уровень выше не доступна для записи.')
+ print('Создаем папку в текущей директории...')
+ try:
+ os.mkdir('htmls')
+ folder_path = 'htmls'
+ except PermissionError:
+ print('Текущая директория не доступна для записи. Завершаем работу...')
+ quit()
+
+try:
+ html_file = open(html_path)
+ os.chdir(folder_path)
+ ascii_file = open('ascii_cleared.html', 'w', encoding='utf-8')
+ body_file = open('body_cleared.html', 'w', encoding='utf-8')
+
+except FileNotFoundError as e:
+ exception_path = str(e).strip('[Errno 2] No such file or directory:')[1:-1]
+ print(f'"{exception_path}" не существует')
+
+except PermissionError as e:
+ exception_path = str(e).strip('[Errno 13] Permission denied:')[1:-1]
+ print(f'Файл "{exception_path}" не доступен для чтения/записи')
+
+except IsADirectoryError as e:
+ exception_path = str(e).strip('[Errno 21] Is a directory:')[1:-1]
+ print(f'"{exception_path}" является директорией')
+
+else:
+ data = html_file.read()
+
+ cleared_data = ''.join(filter(lambda char: char in string.printable, data))
+ ascii_file.write(cleared_data)
+
+ ###################
+
+ body_cleared = re.sub(
+ r'<BODY>(.|\n)*?</BODY>',
+ lambda match: match.string[match.start(): match.end()].replace('\n', ''),
+ data
+ )
+
+ body_file.write(body_cleared)
+
+ html_file.close()
+ ascii_file.close()
+ body_file.close()