orgmode-to-gemini-blog/build_indexes.py

import argparse
import datetime
import os
import re
import shutil

from enrich_html import enrich_one_file
from website_config import configs_sites, global_config

# from enrich_html import static_page_path
# génère l'index gemini et html des articles rangés par langue

parser = argparse.ArgumentParser(description="Générer un site Web à partir de fichiers HTML.")
parser.add_argument("source", help="Le chemin vers le dossier contenant les fichiers HTML.")
args = parser.parse_args()

# Variables personnalisables
DOSSIER_SOURCE = 'sources/' + args.source  # Nom du dossier contenant les fichiers Markdown
FICHIER_INDEX = 'index_' + args.source  # Nom du fichier d'index à générer
TITRE_INDEX = f""
source_files_extension = "org"

config_title = configs_sites[args.source]['BLOG_TITLE']

# Expression régulière pour extraire la date et le slug du nom de fichier org
regex = r"^(\d{14})(-[a-zA-Z0-9_-]+)\.gmi$"
regex_orgroam = r"^(\d{14})_([a-zA-Z0-9_-]+)\.gmi$"

use_article_file_for_name = (not global_config["slug_with_year"])
website_name = args.source


def trouver_nom_article(fichier_org, format="html"):
    # print('fichier_org, ', fichier_org)
    with open(fichier_org, 'r') as file:
        lignes = file.readlines()

    nom_article = ''

    # print('trouver_nom_article format',format)
    # Expressions régulières pour trouver les titres de niveau 1 et 2
    if format == 'html':
        titre_niveau_1 = r'<h1\s+(?:id|data-created)="[^"]*">(.*?)</h1>'
        titre_niveau_2 = r'^\<h2.*?\>(.+)\<\/h2\>$'
    else:
        titre_niveau_1 = r'^\*+ (.+)$'
        titre_niveau_2 = r'^\*\*+ (.+)$'

    # Itérer sur les lignes du fichier
    for ligne in lignes:
        # Rechercher un titre de niveau 1
        titre_niveau_1_match = re.match(titre_niveau_1, ligne)
        if titre_niveau_1_match:
            titre_niveau_1_texte = titre_niveau_1_match.group(1)
            if titre_niveau_1_texte.lower() != "article" and titre_niveau_1_texte.lower() != "liens":
                nom_article = titre_niveau_1_texte
                break
            else:
                # Si le premier titre de niveau 1 est "Article", rechercher le premier titre de niveau 2
                titre_niveau_2_match = re.match(titre_niveau_2, ligne)
                if titre_niveau_2_match:
                    nom_article = titre_niveau_2_match.group(1)
                    break
    # print(f"Nom de l'article : {nom_article}")

    return nom_article.replace(args.source + '_', '').replace('_', ' ')


def find_year_and_slug(fichier):
    fichier = fichier.replace('..', '.')
    # print(f" ------------ build_indexes: find in {fichier} -------------")
    slug = fichier.replace('.gmi', '')
    annee = '2024'
    date_str = '2024-00-00'
    date = '2024-00-00'
    match = re.match(regex_orgroam, fichier)

    if match:
        date_str = match.group(1)
        annee = date_str[:4]
        slug = match.group(2)

    match = re.match(regex, fichier)
    if match:
        date_str = match.group(1)
        # Convertir la date en objet datetime
        if "-" in date_str:
            date = datetime.datetime.strptime(date_str, "%Y-%m-%d")
        else:
            date = datetime.datetime.strptime(date_str, "%Y%m%d%H%M%S")
        date_string_replaced = str(date).replace(' 00:00:00', '')
        slug = fichier.replace('.gmi', '')
        slug = slug.replace(date_string_replaced, '')
        slug = enlever_premier_tiret_ou_underscore(slug)

        annee = str(date.year).replace(' 00:00:00', '')
    # else:
    #     print('ERREUR aucun slug trouvé')

    # print(f" ------------ build_indexes:  ")
    # print(f" ------------ build_indexes: Fichier: {fichier}")
    # print(f" ------------ build_indexes: année: {annee}")
    # print(f" ------------ build_indexes: str(date): {str(date)}")
    # print(f" ------------ build_indexes: slug: {slug}")
    # print(f" ------------ build_indexes: chemin: {annee}/{slug}/")
    return [date_str, annee, slug]


def enlever_premier_tiret_ou_underscore(chaîne):
    if chaîne.startswith('-') or chaîne.startswith('_'):
        chaîne = chaîne[1:]
    return chaîne


# création des dossiers intermédiaires s'il y en a
# déplace le fichier dans le dossier spécifié
def create_path_folders_and_move_file(path, file):
    os.makedirs(os.path.dirname(path), exist_ok=True)

    shutil.move(file, path)


def get_files_list_of_folder(folder_path):
    # Vérifie si le dossier existe
    if not os.path.exists(folder_path):
        print(f" ------------ build_indexes: Erreur : Le dossier '{folder_path}' n'existe pas.")
        return
    # print('----------- get_files_list_of_folder: folder_path : ', folder_path)
    # Liste les fichiers articles, trie par nom décroissant
    try:
        fichiers_md = sorted([f.replace('.' + source_files_extension, '.gmi') for f in os.listdir(folder_path) if
                              f.endswith(source_files_extension)], reverse=True)
        print('fichiers trouvés:', len(fichiers_md))
        return fichiers_md
    except OSError as e:
        print(f" ------------ build_indexes: Erreur lors de la lecture du dossier : {e}")
        return


# transformer le nom du fichier orgmode en une création de dossier de l'année, et un sous dossier du nom du slug dans le nom de fichier, contenant un seul fichier d'index afin de faire de l'url rewrite en dur.
# le nom de fichier org commence par une date YYYY-MM-DD ou bien YYYYMMDDHHmmss, est suivie d'un slug, et finit par l'extension .org

def generer_index(dossier_source, fichier_index):
    # Chemin absolu du dossier parent (pour sauver le fichier d'index)
    dossier_parent = os.path.dirname(os.path.abspath(__file__))

    # Chemin complet du dossier contenant les Markdown
    chemin_dossier_source = os.path.join(dossier_parent, dossier_source)

    files_static = get_files_list_of_folder(chemin_dossier_source + '/')
    files_fr = get_files_list_of_folder(chemin_dossier_source + '/lang_fr')
    files_en = get_files_list_of_folder(chemin_dossier_source + '/lang_en')

    # Chemin complet pour le fichier d'index
    chemin_fichier_index_gemini = os.path.join(dossier_parent, 'gemini-capsules', args.source, 'index.gmi')
    chemin_fichier_index_html = os.path.join(dossier_parent, 'html-websites', args.source, 'index.html')

    print('\n index html: ', chemin_fichier_index_html)
    # Génère le contenu du fichier d'index
    contenu_index_gmi = f"{config_title}\n{'- ' * len(config_title)}\n\n"
    contenu_index_html = f"{config_title}\n{'- ' * len(config_title)}\n\n"

    contenu_index_gmi += "\n# Navigation\n-------------------------\n"
    contenu_index_html += "<h1>Navigation</h1>"
    for fichier in files_static:
        # print(" -------- fichier ", fichier)
        link_html = fichier.replace('.gmi', '.html')
        link_org = fichier.replace('.gmi', '.org')
        file_path_org = os.path.join(dossier_parent, "sources", website_name, link_org)
        article_name = trouver_nom_article(file_path_org, 'org')

        if article_name:
            contenu_index_gmi += f"=> {fichier} {article_name}\n"
        else:
            contenu_index_gmi += f"=> {fichier}\n"

        if fichier != "index.gmi":
            # print(' -------- rechercher le nom de l article dans le fichier ')
            if use_article_file_for_name:
                article_name = link_html
            else:
                article_name = trouver_nom_article(file_path_org, 'org')

            if not article_name:
                article_name = link_html
        else:
            article_name = 'Index'
        article_name = article_name.replace('_', ' ')
        contenu_index_html += f"<br><a href=/{link_html}>{article_name}</a>"

    # ne préciser la langue français que si on a des articles en Anglais
    if len(files_en):
        contenu_index_gmi += "\n# Articles en Français\n-------------------------\n"
    lang_folder = "lang_fr/"

    # ----------- indexer les articles en Français ------------------
    for fichier in files_fr:
        date_string, année, slug = find_year_and_slug(fichier)

        contenu_index_gmi += f"=> {fichier}\n"
        link_html = fichier.replace('.gmi', '.html')
        chemin_fichier_this_article_html = chemin_dossier_source + '/lang_fr/converted/' + link_html
        chemin_fichier_this_article_html = chemin_dossier_source + '/lang_fr/converted/' + link_html

        link_org = fichier.replace('.gmi', '.org')
        file_path_org = os.path.join(dossier_parent, "sources", website_name, lang_folder, link_org)
        article_name = trouver_nom_article(file_path_org, 'org')

        if not article_name:
            article_name = slug.replace('-', ' ')

        if global_config["slug_with_year"]:
            new_folder = f"{année}/{slug}"
            new_folder_path_this_article = os.path.join(dossier_parent,
                                                        'html-websites/' + args.source + '/' + new_folder + '/')

            # déplacer le fichier html dans le dossier slug,
            # et le renommer en index.html ensuite pour ne pas modifier l'index du blog
            contenu_index_html += f"<br><a href=/{année}/{slug}>{année} {article_name}</a>"
            os.makedirs(os.path.dirname(new_folder_path_this_article), exist_ok=True)
            shutil.copy(chemin_fichier_this_article_html, new_folder_path_this_article + 'index.html')
        else:
            contenu_index_html += f"<br><a href=/{lang_folder}/{link_html}>{link_html}</a>"

    # ---------------- pareil en anglais TODO
    # contenu_index_gmi += "\n# Articles in English\n-------------------------\n"
    # contenu_index_html += "<h1>Articles in English</h1>"
    # lang_folder="lang_en/"
    # for fichier in files_en:
    # ----------------------------------------

    print('chemin_fichier_index_html', chemin_fichier_index_html)
    print(' ')
    with open(chemin_fichier_index_html, 'w', encoding='utf-8') as file:
        print('contenu_index_html', contenu_index_html)
        contenu_index_html = enrich_one_file(contenu_index_html)
        file.write(contenu_index_html)
        print(f" ------------ build_indexes: Fichier d'index '{chemin_fichier_index_html}' généré avec succès.")

    # Écrit le contenu dans le fichier d'index
    try:
        with open(chemin_fichier_index_gemini, 'w', encoding='utf-8') as file:
            file.write(contenu_index_gmi)
            print(
                f" ------------ build_indexes: Fichier d'index gemini '{chemin_fichier_index_gemini}' généré avec succès.")

    except OSError as e:
        print(f" ------------ build_indexes: Erreur lors de l'écriture du fichier d'index : {e}")


if __name__ == "__main__":
    generer_index(DOSSIER_SOURCE, FICHIER_INDEX)
separate hard to convert files 2024-11-04 00:13:58 +01:00			`import argparse`
up slug for index 2024-11-05 01:14:45 +01:00			`import datetime`
refacto 2024-11-14 13:32:56 +01:00			`import os`
			`import re`
slugify links in website 2024-11-05 23:06:54 +01:00			`import shutil`
add scss converter 2024-11-10 00:01:15 +01:00
refacto 2024-11-14 13:32:56 +01:00			`from enrich_html import enrich_one_file`
			`from website_config import configs_sites, global_config`
variabilize blog params 2024-11-12 00:55:21 +01:00
more complex template html 2024-11-10 18:03:31 +01:00			`# from enrich_html import static_page_path`
separate hard to convert files 2024-11-04 00:13:58 +01:00			`# génère l'index gemini et html des articles rangés par langue`

			`parser = argparse.ArgumentParser(description="Générer un site Web à partir de fichiers HTML.")`
			`parser.add_argument("source", help="Le chemin vers le dossier contenant les fichiers HTML.")`
			`args = parser.parse_args()`
init transformations blog 2024-11-02 18:30:04 +01:00
			`# Variables personnalisables`
refacto 2024-11-14 13:32:56 +01:00			`DOSSIER_SOURCE = 'sources/' + args.source # Nom du dossier contenant les fichiers Markdown`
			`FICHIER_INDEX = 'index_' + args.source # Nom du fichier d'index à générer`
add scss converter 2024-11-10 00:01:15 +01:00			`TITRE_INDEX = f""`
refacto 2024-11-14 13:32:56 +01:00			`source_files_extension = "org"`

			`config_title = configs_sites[args.source]['BLOG_TITLE']`
separate hard to convert files 2024-11-04 00:13:58 +01:00
up slug for index 2024-11-05 01:14:45 +01:00			`# Expression régulière pour extraire la date et le slug du nom de fichier org`
refacto 2024-11-14 13:32:56 +01:00			`regex = r"^(\d{14})(-[a-zA-Z0-9_-]+)\.gmi$"`
			`regex_orgroam = r"^(\d{14})_([a-zA-Z0-9_-]+)\.gmi$"`
separate hard to convert files 2024-11-04 00:13:58 +01:00
refacto 2024-11-14 13:32:56 +01:00			`use_article_file_for_name = (not global_config["slug_with_year"])`
more complex template html 2024-11-10 18:03:31 +01:00			`website_name = args.source`
up displayed pages 2024-11-11 01:25:10 +01:00
rework gemini conversion 2024-11-10 15:58:11 +01:00
site builder ok 2024-11-11 00:58:44 +01:00			`def trouver_nom_article(fichier_org, format="html"):`
refacto 2024-11-14 13:32:56 +01:00			`# print('fichier_org, ', fichier_org)`
rework gemini conversion 2024-11-10 15:58:11 +01:00			`with open(fichier_org, 'r') as file:`
			`lignes = file.readlines()`
refacto 2024-11-14 13:32:56 +01:00
up displayed pages 2024-11-11 01:25:10 +01:00			`nom_article = ''`
site builder ok 2024-11-11 00:58:44 +01:00
refacto 2024-11-14 13:32:56 +01:00			`# print('trouver_nom_article format',format)`
site builder ok 2024-11-11 00:58:44 +01:00			`# Expressions régulières pour trouver les titres de niveau 1 et 2`
			`if format == 'html':`
refacto 2024-11-14 13:32:56 +01:00			`titre_niveau_1 = r'<h1\s+(?:id\|data-created)="[^"]">(.?)</h1>'`
site builder ok 2024-11-11 00:58:44 +01:00			`titre_niveau_2 = r'^\<h2.*?\>(.+)\<\/h2\>$'`
			`else:`
			`titre_niveau_1 = r'^\*+ (.+)$'`
			`titre_niveau_2 = r'^\\+ (.+)$'`

rework gemini conversion 2024-11-10 15:58:11 +01:00			`# Itérer sur les lignes du fichier`
			`for ligne in lignes:`
			`# Rechercher un titre de niveau 1`
			`titre_niveau_1_match = re.match(titre_niveau_1, ligne)`
			`if titre_niveau_1_match:`
			`titre_niveau_1_texte = titre_niveau_1_match.group(1)`
refacto 2024-11-14 13:32:56 +01:00			`if titre_niveau_1_texte.lower() != "article" and titre_niveau_1_texte.lower() != "liens":`
rework gemini conversion 2024-11-10 15:58:11 +01:00			`nom_article = titre_niveau_1_texte`
			`break`
			`else:`
			`# Si le premier titre de niveau 1 est "Article", rechercher le premier titre de niveau 2`
			`titre_niveau_2_match = re.match(titre_niveau_2, ligne)`
			`if titre_niveau_2_match:`
			`nom_article = titre_niveau_2_match.group(1)`
			`break`
refacto 2024-11-14 13:32:56 +01:00			`# print(f"Nom de l'article : {nom_article}")`

			`return nom_article.replace(args.source + '_', '').replace('_', ' ')`
rework gemini conversion 2024-11-10 15:58:11 +01:00

up slug for index 2024-11-05 01:14:45 +01:00			`def find_year_and_slug(fichier):`
refacto 2024-11-14 13:32:56 +01:00			`fichier = fichier.replace('..', '.')`
add scss converter 2024-11-10 00:01:15 +01:00			`# print(f" ------------ build_indexes: find in {fichier} -------------")`
refacto 2024-11-14 13:32:56 +01:00			`slug = fichier.replace('.gmi', '')`
add org files, copy style 2024-11-08 17:40:06 +01:00			`annee = '2024'`
refacto 2024-11-14 13:32:56 +01:00			`date_str = '2024-00-00'`
			`date = '2024-00-00'`
testing slug find in filename 2024-11-06 00:19:50 +01:00			`match = re.match(regex_orgroam, fichier)`
add org files, copy style 2024-11-08 17:40:06 +01:00
testing slug find in filename 2024-11-06 00:19:50 +01:00			`if match:`
			`date_str = match.group(1)`
			`annee = date_str[:4]`
			`slug = match.group(2)`

up slug for index 2024-11-05 01:14:45 +01:00			`match = re.match(regex, fichier)`
			`if match:`
			`date_str = match.group(1)`
			`# Convertir la date en objet datetime`
			`if "-" in date_str:`
			`date = datetime.datetime.strptime(date_str, "%Y-%m-%d")`
			`else:`
			`date = datetime.datetime.strptime(date_str, "%Y%m%d%H%M%S")`
refacto 2024-11-14 13:32:56 +01:00			`date_string_replaced = str(date).replace(' 00:00:00', '')`
			`slug = fichier.replace('.gmi', '')`
			`slug = slug.replace(date_string_replaced, '')`
up slug for index 2024-11-05 01:14:45 +01:00			`slug = enlever_premier_tiret_ou_underscore(slug)`
refacto 2024-11-14 13:32:56 +01:00
			`annee = str(date.year).replace(' 00:00:00', '')`
add org files, copy style 2024-11-08 17:40:06 +01:00			`# else:`
			`# print('ERREUR aucun slug trouvé')`
up slug for index 2024-11-05 01:14:45 +01:00
add scss converter 2024-11-10 00:01:15 +01:00			`# print(f" ------------ build_indexes: ")`
			`# print(f" ------------ build_indexes: Fichier: {fichier}")`
			`# print(f" ------------ build_indexes: année: {annee}")`
			`# print(f" ------------ build_indexes: str(date): {str(date)}")`
			`# print(f" ------------ build_indexes: slug: {slug}")`
			`# print(f" ------------ build_indexes: chemin: {annee}/{slug}/")`
add org files, copy style 2024-11-08 17:40:06 +01:00			`return [date_str, annee, slug]`
rewrite build url 2024-11-05 11:17:52 +01:00

up slug for index 2024-11-05 01:14:45 +01:00			`def enlever_premier_tiret_ou_underscore(chaîne):`
			`if chaîne.startswith('-') or chaîne.startswith('_'):`
			`chaîne = chaîne[1:]`
			`return chaîne`
rewrite build url 2024-11-05 11:17:52 +01:00
slugify links in website 2024-11-05 23:06:54 +01:00
rewrite build url 2024-11-05 11:17:52 +01:00			`# création des dossiers intermédiaires s'il y en a`
			`# déplace le fichier dans le dossier spécifié`
			`def create_path_folders_and_move_file(path, file):`
			`os.makedirs(os.path.dirname(path), exist_ok=True)`
slugify links in website 2024-11-05 23:06:54 +01:00
rewrite build url 2024-11-05 11:17:52 +01:00			`shutil.move(file, path)`

refacto 2024-11-14 13:32:56 +01:00
separate hard to convert files 2024-11-04 00:13:58 +01:00			`def get_files_list_of_folder(folder_path):`
refacto 2024-11-14 13:32:56 +01:00			`# Vérifie si le dossier existe`
separate hard to convert files 2024-11-04 00:13:58 +01:00			`if not os.path.exists(folder_path):`
refacto 2024-11-14 13:32:56 +01:00			`print(f" ------------ build_indexes: Erreur : Le dossier '{folder_path}' n'existe pas.")`
separate hard to convert files 2024-11-04 00:13:58 +01:00			`return`
refacto 2024-11-14 13:32:56 +01:00			`# print('----------- get_files_list_of_folder: folder_path : ', folder_path)`
separate hard to convert files 2024-11-04 00:13:58 +01:00			`# Liste les fichiers articles, trie par nom décroissant`
			`try:`
refacto 2024-11-14 13:32:56 +01:00			`fichiers_md = sorted([f.replace('.' + source_files_extension, '.gmi') for f in os.listdir(folder_path) if`
			`f.endswith(source_files_extension)], reverse=True)`
separate hard to convert files 2024-11-04 00:13:58 +01:00			`print('fichiers trouvés:', len(fichiers_md))`
			`return fichiers_md`
			`except OSError as e:`
add scss converter 2024-11-10 00:01:15 +01:00			`print(f" ------------ build_indexes: Erreur lors de la lecture du dossier : {e}")`
separate hard to convert files 2024-11-04 00:13:58 +01:00			`return`


up slug for index 2024-11-05 01:14:45 +01:00			`# transformer le nom du fichier orgmode en une création de dossier de l'année, et un sous dossier du nom du slug dans le nom de fichier, contenant un seul fichier d'index afin de faire de l'url rewrite en dur.`
			`# le nom de fichier org commence par une date YYYY-MM-DD ou bien YYYYMMDDHHmmss, est suivie d'un slug, et finit par l'extension .org`
separate hard to convert files 2024-11-04 00:13:58 +01:00
refacto 2024-11-14 13:32:56 +01:00			`def generer_index(dossier_source, fichier_index):`
init transformations blog 2024-11-02 18:30:04 +01:00			`# Chemin absolu du dossier parent (pour sauver le fichier d'index)`
			`dossier_parent = os.path.dirname(os.path.abspath(__file__))`
refacto 2024-11-14 13:32:56 +01:00
init transformations blog 2024-11-02 18:30:04 +01:00			`# Chemin complet du dossier contenant les Markdown`
rewrite build url 2024-11-05 11:17:52 +01:00			`chemin_dossier_source = os.path.join(dossier_parent, dossier_source)`
refacto 2024-11-14 13:32:56 +01:00
			`files_static = get_files_list_of_folder(chemin_dossier_source + '/')`
			`files_fr = get_files_list_of_folder(chemin_dossier_source + '/lang_fr')`
			`files_en = get_files_list_of_folder(chemin_dossier_source + '/lang_en')`

init transformations blog 2024-11-02 18:30:04 +01:00			`# Chemin complet pour le fichier d'index`
refacto 2024-11-14 13:32:56 +01:00			`chemin_fichier_index_gemini = os.path.join(dossier_parent, 'gemini-capsules', args.source, 'index.gmi')`
			`chemin_fichier_index_html = os.path.join(dossier_parent, 'html-websites', args.source, 'index.html')`
slugify links in website 2024-11-05 23:06:54 +01:00
			`print('\n index html: ', chemin_fichier_index_html)`
init transformations blog 2024-11-02 18:30:04 +01:00			`# Génère le contenu du fichier d'index`
refacto 2024-11-14 13:32:56 +01:00			`contenu_index_gmi = f"{config_title}\n{'- ' * len(config_title)}\n\n"`
			`contenu_index_html = f"{config_title}\n{'- ' * len(config_title)}\n\n"`
separate hard to convert files 2024-11-04 00:13:58 +01:00
			`contenu_index_gmi += "\n# Navigation\n-------------------------\n"`
sync script 2024-11-04 14:14:28 +01:00			`contenu_index_html += "<h1>Navigation</h1>"`
separate hard to convert files 2024-11-04 00:13:58 +01:00			`for fichier in files_static:`
refacto 2024-11-14 13:32:56 +01:00			`# print(" -------- fichier ", fichier)`
			`link_html = fichier.replace('.gmi', '.html')`
			`link_org = fichier.replace('.gmi', '.org')`
			`file_path_org = os.path.join(dossier_parent, "sources", website_name, link_org)`
			`article_name = trouver_nom_article(file_path_org, 'org')`

			`if article_name:`
			`contenu_index_gmi += f"=> {fichier} {article_name}\n"`
			`else:`
			`contenu_index_gmi += f"=> {fichier}\n"`

more complex template html 2024-11-10 18:03:31 +01:00			`if fichier != "index.gmi":`
refacto 2024-11-14 13:32:56 +01:00			`# print(' -------- rechercher le nom de l article dans le fichier ')`
more complex template html 2024-11-10 18:03:31 +01:00			`if use_article_file_for_name:`
			`article_name = link_html`
			`else:`
refacto 2024-11-14 13:32:56 +01:00			`article_name = trouver_nom_article(file_path_org, 'org')`

more complex template html 2024-11-10 18:03:31 +01:00			`if not article_name:`
			`article_name = link_html`
rework gemini conversion 2024-11-10 15:58:11 +01:00			`else:`
more complex template html 2024-11-10 18:03:31 +01:00			`article_name = 'Index'`
refacto 2024-11-14 13:32:56 +01:00			`article_name = article_name.replace('_', ' ')`
rework gemini conversion 2024-11-10 15:58:11 +01:00			`contenu_index_html += f"<br><a href=/{link_html}>{article_name}</a>"`
separate hard to convert files 2024-11-04 00:13:58 +01:00
slugify links in website 2024-11-05 23:06:54 +01:00			`# ne préciser la langue français que si on a des articles en Anglais`
			`if len(files_en):`
			`contenu_index_gmi += "\n# Articles en Français\n-------------------------\n"`
refacto 2024-11-14 13:32:56 +01:00			`lang_folder = "lang_fr/"`

try finding article name from content 2024-11-11 00:02:50 +01:00			`# ----------- indexer les articles en Français ------------------`
separate hard to convert files 2024-11-04 00:13:58 +01:00			`for fichier in files_fr:`
up slug for index 2024-11-05 01:14:45 +01:00			`date_string, année, slug = find_year_and_slug(fichier)`
try finding article name from content 2024-11-11 00:02:50 +01:00
separate hard to convert files 2024-11-04 00:13:58 +01:00			`contenu_index_gmi += f"=> {fichier}\n"`
refacto 2024-11-14 13:32:56 +01:00			`link_html = fichier.replace('.gmi', '.html')`
			`chemin_fichier_this_article_html = chemin_dossier_source + '/lang_fr/converted/' + link_html`
			`chemin_fichier_this_article_html = chemin_dossier_source + '/lang_fr/converted/' + link_html`
try finding article name from content 2024-11-11 00:02:50 +01:00
refacto 2024-11-14 13:32:56 +01:00			`link_org = fichier.replace('.gmi', '.org')`
			`file_path_org = os.path.join(dossier_parent, "sources", website_name, lang_folder, link_org)`
			`article_name = trouver_nom_article(file_path_org, 'org')`
try finding article name from content 2024-11-11 00:02:50 +01:00
			`if not article_name:`
refacto 2024-11-14 13:32:56 +01:00			`article_name = slug.replace('-', ' ')`

			`if global_config["slug_with_year"]:`
			`new_folder = f"{année}/{slug}"`
			`new_folder_path_this_article = os.path.join(dossier_parent,`
			`'html-websites/' + args.source + '/' + new_folder + '/')`

			`# déplacer le fichier html dans le dossier slug,`
			`# et le renommer en index.html ensuite pour ne pas modifier l'index du blog`
			`contenu_index_html += f"<br><a href=/{année}/{slug}>{année} {article_name}</a>"`
			`os.makedirs(os.path.dirname(new_folder_path_this_article), exist_ok=True)`
			`shutil.copy(chemin_fichier_this_article_html, new_folder_path_this_article + 'index.html')`
			`else:`
			`contenu_index_html += f"<br><a href=/{lang_folder}/{link_html}>{link_html}</a>"`
try finding article name from content 2024-11-11 00:02:50 +01:00
style sass 2024-11-10 18:43:38 +01:00			`# ---------------- pareil en anglais TODO`
rewrite build url 2024-11-05 11:17:52 +01:00			`# contenu_index_gmi += "\n# Articles in English\n-------------------------\n"`
			`# contenu_index_html += "<h1>Articles in English</h1>"`
add org files, copy style 2024-11-08 17:40:06 +01:00			`# lang_folder="lang_en/"`
rewrite build url 2024-11-05 11:17:52 +01:00			`# for fichier in files_en:`
style sass 2024-11-10 18:43:38 +01:00			`# ----------------------------------------`
up 2024-11-08 18:05:08 +01:00
refacto 2024-11-14 13:32:56 +01:00			`print('chemin_fichier_index_html', chemin_fichier_index_html)`
up 2024-11-08 18:05:08 +01:00			`print(' ')`
refacto 2024-11-14 13:32:56 +01:00			`with open(chemin_fichier_index_html, 'w', encoding='utf-8') as file:`
			`print('contenu_index_html', contenu_index_html)`
			`contenu_index_html = enrich_one_file(contenu_index_html)`
			`file.write(contenu_index_html)`
add scss converter 2024-11-10 00:01:15 +01:00			`print(f" ------------ build_indexes: Fichier d'index '{chemin_fichier_index_html}' généré avec succès.")`
refacto 2024-11-14 13:32:56 +01:00
init transformations blog 2024-11-02 18:30:04 +01:00			`# Écrit le contenu dans le fichier d'index`
			`try:`
up 2024-11-08 18:05:08 +01:00			`with open(chemin_fichier_index_gemini, 'w', encoding='utf-8') as file:`
			`file.write(contenu_index_gmi)`
refacto 2024-11-14 13:32:56 +01:00			`print(`
			`f" ------------ build_indexes: Fichier d'index gemini '{chemin_fichier_index_gemini}' généré avec succès.")`

init transformations blog 2024-11-02 18:30:04 +01:00			`except OSError as e:`
add scss converter 2024-11-10 00:01:15 +01:00			`print(f" ------------ build_indexes: Erreur lors de l'écriture du fichier d'index : {e}")`
init transformations blog 2024-11-02 18:30:04 +01:00
refacto 2024-11-14 13:32:56 +01:00
init transformations blog 2024-11-02 18:30:04 +01:00			`if __name__ == "__main__":`
refacto 2024-11-14 13:32:56 +01:00			`generer_index(DOSSIER_SOURCE, FICHIER_INDEX)`