2024-11-03 11:42:44 +01:00
|
|
|
#!/bin/python3
|
2024-11-03 10:29:30 +01:00
|
|
|
import os
|
2024-11-03 11:42:44 +01:00
|
|
|
import argparse
|
2024-11-10 00:16:15 +01:00
|
|
|
import re
|
2024-11-04 00:13:58 +01:00
|
|
|
|
2024-11-03 11:42:44 +01:00
|
|
|
# Command-line interface: the blog folder is mandatory, the site title and
# the stylesheet path are optional.
parser = argparse.ArgumentParser(
    description="Générer un site Web à partir de fichiers HTML.",
)
parser.add_argument(
    "blog_name",
    help="Le chemin vers le dossier contenant les fichiers HTML.",
)
parser.add_argument(
    "--title",
    "-t",
    default="Mon site Web",
    help="Le titre du site Web.",
)
parser.add_argument(
    "--style",
    default="templates/style_general.css",
    help="Le chemin vers le fichier de style CSS.",
)
# Parsed once at module level; the rest of the script reads `args`.
args = parser.parse_args()
|
2024-11-03 10:29:30 +01:00
|
|
|
|
2024-11-04 00:13:58 +01:00
|
|
|
# Stylesheet path chosen on the command line (--style).
style_file = args.style

# Folder given on the command line, and its location under sources/.
blog_name = args.blog_name
source_blog = "sources/" + blog_name

# Template files that belong to this blog.
header_content_path = source_blog + "/templates/converted/header_page.html"
footer_content_path = source_blog + "/templates/converted/footer_page.html"
static_page_path = source_blog + "/templates/html/static.html"

# Placeholders inserted into every page. The footer template at
# footer_content_path is not loaded, so footer_content stays empty.
footer_content = ""
after_article = ""
|
|
|
|
|
2024-11-10 00:01:15 +01:00
|
|
|
# Page template variables.

# Site identity.
BLOG_TITLE = "Cipher Bliss"
BLOG_SUBTITLE = "Code, nouvelles technologies et entrepreneurariat par B. Lemoine"
NDD = "https://www.cipherbliss.com"  # base URL used for links and og:url
EMAIL = "contact@cipherbliss.com"
LOCALE = "fr_FR"

# Per-page values, empty by default.
TITLE = ""
AUTHOR = ""
PAGE_TITLE = ""
DESCRIPTION = ""
ARTICLE = ""
FOOTER = ""

# Icon and header banner.
SITE_ICON = "https://www.cipherbliss.com/wp-content/uploads/2016/12/rond.png"
SITE_ICON_TYPE = "image/png"
BANNIERE_ENTETE = "https://www.cipherbliss.com/wp-content/uploads/2016/11/bg.jpg"
BANNIERE_ENTETE_ALT = "bannière du site"

# Navigation links, inserted verbatim wherever the template uses {NAVIGATION}.
NAVIGATION = """
<nav>
<a href="/">Accueil</a>
<a href="https://portfolio.cipherbliss.com">Portfolio</a>
<a href="/feed">Flux RSS</a>
<a href="/contact">Contact</a>
<a href="/ressources-de-café-vie-privée">Ressources</a>
</nav>
"""
|
2024-11-03 11:42:44 +01:00
|
|
|
|
2024-11-10 18:03:31 +01:00
|
|
|
|
2024-11-11 00:58:44 +01:00
|
|
|
|
2024-11-10 18:03:31 +01:00
|
|
|
def extract_body_content(html_content):
    """Return the inner markup of the first ``<body>`` element.

    Args:
        html_content: Full HTML document as a string.

    Returns:
        The text between the opening ``<body ...>`` tag and the first
        ``</body>`` that follows it, or ``None`` when no such pair exists.
    """
    # HTML tag names are case-insensitive, so <BODY> has to match as well;
    # DOTALL lets the captured body span several lines.
    match = re.search(
        r'<body[^>]*?>(.*?)</body>',
        html_content,
        re.DOTALL | re.IGNORECASE,
    )
    return match.group(1) if match else None
|
|
|
|
|
2024-11-10 00:16:15 +01:00
|
|
|
def remove_properties_section(text):
    """Strip the exported "Article" heading together with the list after it.

    Everything from ``<h1 id="article">Article</h1>`` up to and including the
    next ``</ul>`` is deleted, for every occurrence. Text that does not
    contain that heading is returned unchanged.
    """
    properties_block = re.compile(
        r"<h1 id=\"article\">Article</h1>.+?</ul>",
        re.DOTALL,  # the list normally spans several lines
    )
    return properties_block.sub("", text)
|
|
|
|
|
|
|
|
def remove_article_head_properties_orgmode(text):
    """Delete every ``:PROPERTIES:`` ... ``:END:`` span from ``text``.

    The span may cover several lines and must hold at least one character
    between the two markers; the markers themselves are removed too.
    """
    return re.sub(r":PROPERTIES:.+?:END:", "", text, flags=re.S)
|
2024-11-10 18:03:31 +01:00
|
|
|
|
2024-11-10 00:16:15 +01:00
|
|
|
def remove_hint_html(text):
    """Drop every ``<p>ceci<sub>estduhtml</sub></p>`` marker paragraph."""
    hint_paragraph = re.compile(r"<p>ceci<sub>estduhtml</sub></p>", re.DOTALL)
    cleaned = hint_paragraph.sub("", text)
    return cleaned
|
|
|
|
|
|
|
|
|
2024-11-08 18:05:08 +01:00
|
|
|
|
2024-11-08 23:19:39 +01:00
|
|
|
def enrich_one_file(file, root_path):
    """Wrap one HTML file in the site page template, in place.

    The file is read, cleaned with the ``remove_*`` helpers, reduced to the
    inner content of its ``<body>`` element, inserted into the page template
    (filled from the module-level template variables) and written back to
    the same path, replacing the original content.

    Args:
        file: Name of the HTML file inside ``root_path``.
        root_path: Directory that contains ``file``.

    Raises:
        OSError: If the file (or, when CSS inlining is enabled, the
            stylesheet) cannot be read or written.
    """
    html_path_enriched = os.path.join(root_path, file)
    print(' ----------- enrich_html: file:', html_path_enriched)

    css_content = ""

    # Switch to True to embed the stylesheet in every generated page.
    inline_the_css = False
    print(' ----------- enrich_html: CSS inline: ', inline_the_css)

    # The generated page declares UTF-8, so read and write with that
    # encoding instead of the platform default.
    with open(html_path_enriched, "r", encoding="utf-8") as f:
        html_content = f.read()

    # Remove the parts that must not reach the published page.
    html_content = remove_properties_section(html_content)
    html_content = remove_article_head_properties_orgmode(html_content)
    html_content = remove_hint_html(html_content)

    # Keep only what is inside <body>. A file without a <body> element is
    # wrapped as it is rather than being replaced by the text "None".
    body_content = extract_body_content(html_content)
    if body_content is not None:
        html_content = body_content

    if inline_the_css:
        print(' ----------- enrich_html: include css inline in each html page')
        # The stylesheet is the file given with --style, not the HTML page.
        with open(style_file, "r", encoding="utf-8") as f:
            css_content = f"<style type='text/css'>{f.read()}</style>"

    # Fill the page template.
    # NOTE(review): the head emits charset, viewport, og:locale and the RSS
    # link twice; kept as is so generated pages stay unchanged.
    html_content = f"""

<!DOCTYPE html>
<html>
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1">
<meta property="og:image" content="{SITE_ICON}">
<meta property="og:locale" content="{LOCALE}">
<meta property="og:description" content="{BLOG_SUBTITLE}">
<meta property="og:url" content="{NDD}">
<meta property="og:site_name" content="Cipher Bliss">
<link rel="alternate" type="application/rss+xml" title="Cipher Bliss » Flux" href="{NDD}/feed/">
<link href="/style.css" rel="stylesheet">{css_content}
<meta charset="utf-8">
<meta name="viewport" content="width=device-width, initial-scale=1">
<title>{TITLE}</title>
<meta name="author" content="{AUTHOR}">
<link rel="alternate" type="application/rss+xml" title="{BLOG_TITLE} » Flux"
href="{NDD}/feed/">
<meta property="og:title" content="{PAGE_TITLE}">
<meta property="og:locale" content="{LOCALE}">
<!-- Description de la page -->
<meta name="description" content="{PAGE_TITLE}">
<meta name="reply-to" content="{EMAIL}">
<link rel="icon" type="{SITE_ICON_TYPE}" href="{SITE_ICON}">
</head>

<body>
<div id="page">
<header id="masthead" class="site-header">
<div class="header-image" style="background: url({BANNIERE_ENTETE})">
<a href="/">
<img src="{SITE_ICON}" class="site-icon img">
</a>
<h1 class="blog-title">{BLOG_TITLE}</h1>
<p class="blog-subtitle">{BLOG_SUBTITLE}</p>
</div>
<nav class="navbar is-fixed-top is-dark" role="navigation" aria-label="main navigation">
<div class="navbar-brand">
<a class="navbar-item" href="{NDD}">

</a>

</div>

<div id="navbarBasicExample" class="navbar-menu">
<div class="navbar-start">
<a class="navbar-item" href="{NDD}">
<img src="{SITE_ICON}"
class="img-fluid">
</a>
{NAVIGATION}
</div>
<div class="navbar-end">
<div class="navbar-item">
<form role="search" method="get" class="search-form" action="/">
<label>
<input class="search-field" placeholder="Recherche" value="" name="s"
type="search">
</label>
<input class="is-hidden search-submit" value="Rechercher" type="submit">
</form>
</div>
</div>
</div>
</nav>
</header>
<main class="body-wrap boxed-container">
<article class="content">
{html_content}
<p class="after-article">
{after_article}
</p>
</article>
</main>
<footer class="site-footer has-top-divider">
<div class="container">
<div class="site-footer-inner">



{NAVIGATION}

</div>
</div>
</footer>
</div>
</body>
<!-- généré avec orgmode-to-gemini-blog par Tykayn -->
</html>

"""

    print(' ----------- enrich_html: html_path_enriched ============> ', html_path_enriched)

    # Write the enriched page over the original file.
    with open(html_path_enriched, "w", encoding="utf-8") as f:
        f.write(html_content)

    print('\n ----------- enrich_html: html écrit ', html_path_enriched)
|
2024-11-09 00:19:43 +01:00
|
|
|
|
2024-11-03 10:29:30 +01:00
|
|
|
# Walk the blog folder and enrich every HTML file found in it.
for root, _, files in os.walk(blog_name):
    for file in files:
        if not file.endswith(".html"):
            continue
        enrich_one_file(file, root)
|