sa6anw.se/clean_language_blocks.py

38 lines
1.1 KiB
Python

import os
import re
import shutil
SOURCE_DIR = "docs"
ENGLISH_DIR = "docs_en"
# Kopiera alla filer från docs/ till docs_en/
if os.path.exists(ENGLISH_DIR):
shutil.rmtree(ENGLISH_DIR)
shutil.copytree(SOURCE_DIR, ENGLISH_DIR)
def clean_file(path, keep_lang):
with open(path, "r", encoding="utf-8") as f:
content = f.read()
# Ta bort språkblock som inte ska vara kvar
if keep_lang == "sv":
content = re.sub(r":::\s*en\n.*?\n:::", "", content, flags=re.DOTALL)
elif keep_lang == "en":
content = re.sub(r":::\s*sv\n.*?\n:::", "", content, flags=re.DOTALL)
# Ta bort alla ::: lang-taggar
content = re.sub(r":::\s*(sv|en)", "", content)
content = re.sub(r":::", "", content)
with open(path, "w", encoding="utf-8") as f:
f.write(content.strip() + "\n")
# Rensa svenska versioner
for filename in os.listdir(SOURCE_DIR):
if filename.endswith(".md"):
clean_file(os.path.join(SOURCE_DIR, filename), keep_lang="sv")
# Rensa engelska versioner
for filename in os.listdir(ENGLISH_DIR):
if filename.endswith(".md"):
clean_file(os.path.join(ENGLISH_DIR, filename), keep_lang="en")