mirror of
https://forge.chapril.org/tykayn/orgmode-to-gemini-blog
synced 2025-06-20 09:04:42 +02:00
up atom feed generate
This commit is contained in:
parent
bff1ec1392
commit
791d93ecde
8 changed files with 69 additions and 25 deletions
|
@ -5,57 +5,78 @@ from datetime import datetime
|
|||
# Chemin du dossier source
|
||||
import argparse
|
||||
|
||||
from utils import find_first_level1_title, find_year_and_slug, find_extract_in_content_org
|
||||
from website_config import configs_sites
|
||||
|
||||
# Configuration des arguments de la ligne de commande
|
||||
parser = argparse.ArgumentParser(description="Générer un nouvel article en mode orgmode.")
|
||||
parser.add_argument("blog_dir", help="Le nom du dossier de blog.")
|
||||
|
||||
args = parser.parse_args()
|
||||
|
||||
blog_dir = 'sources/'+args.blog_dir
|
||||
website_ndd = configs_sites[args.blog_dir]['NDD']
|
||||
blog_dir = 'sources/'+args.blog_dir+'/lang_fr/'
|
||||
|
||||
# Expression régulière pour extraire la date du contenu de l'article
|
||||
date_regex = re.compile(r"\b(\d{14})\b")
|
||||
date_regex_org = re.compile(r"\b(\d{4}-\d{2}-\d{2})\b")
|
||||
|
||||
# Liste des fichiers org-mode trouvés
|
||||
org_files = []
|
||||
|
||||
limit_articles_feed=1000
|
||||
count_articles=0
|
||||
print('atom generate: fichiers dans le dossier: ',len((blog_dir)))
|
||||
# Parcourt le dossier source à la recherche de fichiers org-mode
|
||||
for root, dirs, files in os.walk(blog_dir):
|
||||
for file in files:
|
||||
if file.endswith(".org"):
|
||||
print(os.path.join(root, file))
|
||||
date_str, annee, slug = find_year_and_slug(file)
|
||||
# Ouvre le fichier et recherche la première date dans le contenu de l'article
|
||||
with open(os.path.join(root, file), "r", encoding="utf-8") as f:
|
||||
content = f.read()
|
||||
match = date_regex.search(content)
|
||||
extract = find_extract_in_content_org(content)
|
||||
count_articles+=1
|
||||
match = date_regex_org.search(content)
|
||||
if match:
|
||||
date = datetime.strptime(match.group(1), "%Y-%m-%d")
|
||||
# Ajoute le fichier à la liste avec sa date correspondante
|
||||
org_files.append((date, os.path.join(root, file)))
|
||||
org_files.append((date, os.path.join(root, file), annee, slug,extract))
|
||||
|
||||
if count_articles > limit_articles_feed:
|
||||
break
|
||||
if count_articles > limit_articles_feed:
|
||||
break
|
||||
# Tri des fichiers par ordre décroissant de date
|
||||
org_files.sort(reverse=True)
|
||||
|
||||
# Génération du flux Atom
|
||||
atom_feed = {"title": "Flux Atom des articles GMI",
|
||||
"link": "http://www.example.com/atom",
|
||||
"updated": org_files[0][0].strftime("%Y-%m-%dT%H:%M:%SZ"),
|
||||
atom_feed = {"title": "Flux Atom des articles de "+args.blog_dir,
|
||||
"link": f"{website_ndd}/feed",
|
||||
# "updated": org_files[0][0].strftime("%Y-%m-%dT%H:%M:%SZ"),
|
||||
"updated": org_files[0][0],
|
||||
"entries": []}
|
||||
|
||||
for date, file in org_files:
|
||||
for date, file, annee, slug, extract in org_files:
|
||||
# Parse le fichier org-mode pour extraire le titre, la description et la date de publication
|
||||
with open(file, "r", encoding="utf-8") as f:
|
||||
content = f.read()
|
||||
title = re.search(r"\*+ (.+)\n", content).group(1)
|
||||
description = re.search(r"\n+ (.+)\n", content, re.DOTALL).group(1)
|
||||
published = date.strftime("%Y-%m-%dT%H:%M:%SZ")
|
||||
title = find_first_level1_title(content)
|
||||
description = title
|
||||
# published = date_str
|
||||
# Ajoute l'article au flux Atom
|
||||
atom_entry = {"title": title, "link": file, "summary": description, "published": published}
|
||||
atom_entry = {"title": title,
|
||||
"summary": extract,
|
||||
"link": f"{website_ndd}/{annee}/{slug}",
|
||||
"published": date
|
||||
}
|
||||
atom_feed["entries"].append(atom_entry)
|
||||
if published > atom_feed["updated"]:
|
||||
atom_feed["updated"] = published
|
||||
# if published > atom_feed["updated"]:
|
||||
# atom_feed["updated"] = published
|
||||
|
||||
# Enregistrement du flux Atom dans un fichier
|
||||
with open("atom.xml", "w", encoding="utf-8") as f:
|
||||
with open(f"index_{args.blog_dir}.xml", "w", encoding="utf-8") as f:
|
||||
f.write('<?xml version="1.0" encoding="UTF-8"?>\n')
|
||||
f.write('<feed xmlns="http://www.w3.org/2005/Atom">\n')
|
||||
f.write(f' <title>{atom_feed["title"]}</title>\n')
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue