article_match = re.search(r'(

)(.*?)(

)', content, re.DOTALL) if not article_match: # Если тег

не найден, пропускаем файл print(f"Ошибка: в файле {filename} не найден тег

") return False # Извлекаем части before_article = content[:article_match.start(1)] article_open = article_match.group(1) article_content = article_match.group(2) article_close = article_match.group(3) after_article = content[article_match.end(3):] # Сохраняем оригинальное содержимое статьи для сравнения original_article_content = article_content # Сохраняем alt атрибуты и code теги перед обработкой protected_content, saved_alts = save_alt_attributes(article_content) protected_content, saved_codes = save_code_content(protected_content, filename) # Применяем типографические улучшения только к содержимому статьи processed_article_content = prettify_prepositions(protected_content) # Восстанавливаем code теги и alt атрибуты processed_article_content = restore_code_content(processed_article_content, saved_codes) processed_article_content = restore_alt_attributes(processed_article_content, saved_alts) # Проверяем, были ли изменения в содержимом статьи if processed_article_content == original_article_content: return False # Статья не изменена # Восстанавливаем полный контент с обработанной статьей new_content = before_article + article_open + processed_article_content + article_close + after_article # Сохраняем результат обратно в файл try: with open(filepath, "w", encoding="utf-8") as f: f.write(new_content) print(f"Изменен файл: {filename}") return True except IOError as e: print(f"Ошибка записи файла {filepath}: {e}") return False def process_year_directory(year_dir): """Обработать все посты в каталоге года""" # Ищем все HTML файлы в каталоге, исключая index.html pattern = os.path.join(year_dir, "*.html") html_files = [f for f in glob.glob(pattern) if not f.endswith("index.html")] if not html_files: return 0, 0 # (обработано, изменено) read_count = 0 modified_count = 0 for filepath in sorted(html_files): read_count += 1 if process_post_file(filepath): modified_count += 1 return read_count, modified_count def main(): """Основная функция""" args = parse_arguments() if args.all: # Режим обработки всех файлов print("Начинаем типографические улучшения постов блога") # Находим каталоги с годами year_dirs = find_year_directories() if not year_dirs: print("Не найдено каталогов с годами") return print(f"Найдены каталоги с годами: {', '.join(year_dirs)}") total_read = 0 total_modified = 0 # Обрабатываем каждый каталог с годом for year_dir in year_dirs: read_count, modified_count = process_year_directory(year_dir) total_read += read_count total_modified += modified_count print(f"\n--- Завершено ---") print(f"Всего прочитано {total_read} файлов, изменено {total_modified} файлов.") elif args.file: # Режим обработки одного файла filepath = args.file # Проверяем, существует ли файл if not os.path.exists(filepath): print(f"Ошибка: файл {filepath} не найден") return # Проверяем, что это HTML файл if not filepath.endswith('.html'): print(f"Ошибка: файл {filepath} не является HTML файлом") return print(f"Обрабатываем файл: {filepath}") # Обрабатываем файл if process_post_file(filepath): print(f"Файл {filepath} был изменен") else: print(f"Файл {filepath} не требует изменений") if __name__ == "__main__": main()