💾 Archived View for gemini.sh0.xyz › development › atom.xml.py captured on 2024-12-17 at 10:19:23.
⬅️ Previous capture (2023-09-08)
-=-=-=-=-=-=-
#!/usr/bin/env python3 import re import os import time from datetime import timezone from datetime import datetime import uuid log_dir = "/srv/gemini/log" #log_dir = "/home/jeff/gemini/log" url = "gemini://gemini.sh0.xyz/log" author = "jecxjo" title = "sh0.xyz captain's log" updated = datetime.strptime("1970-01-01 00:00:00.0000", "%Y-%m-%d %H:%M:%S.%f") feed_urn = uuid.uuid5(uuid.NAMESPACE_DNS, url) body = "" files = sorted(filter(lambda x: x.endswith(".gmi") and not x.endswith("index.gmi"), os.listdir(log_dir))) for f in files: with open(os.path.join(log_dir, f)) as file: contents = file.read() entry_title = re.findall("^# .*|$", contents)[0][1:].strip() entry_link = "{}/{}".format(url,f) entry_urn = uuid.uuid5(uuid.NAMESPACE_URL, entry_link) entry_published = re.findall("\$\s?published:\s?(\d\d\d\d-\d\d-\d\d \d\d:\d\d)\s?\$|$", contents)[0] entry_updated = re.findall("\$\s?updated:\s?(\d\d\d\d-\d\d-\d\d \d\d:\d\d)\s?\$|$", contents)[0] entry_tags = re.findall("\$\s?tags:\s?([- ,A-Za-z0-9]+)+\s?\$|$", contents)[0] if not entry_published: continue if not entry_updated: entry_updated = entry_published entry_published = datetime.strptime(entry_published, '%Y-%m-%d %H:%M') entry_updated = datetime.strptime(entry_updated, '%Y-%m-%d %H:%M') body += " <entry>\n" body += " <title>{}</title>\n".format(entry_title) body += " <link href=\"{}\"/>\n".format(entry_link) body += " <id>urn:uuid:{}</id>\n".format(entry_urn) body += " <published>{}</published>\n".format(entry_published.isoformat('T')) body += " <updated>{}</updated>\n".format(entry_updated.isoformat('T')) if entry_tags: tags = [s.strip() for s in re.split('[,]', entry_tags)] for t in tags: body += " <category term=\"{}\"/>\n".format(t) body += " </entry>\n\n" if entry_updated > updated: updated = entry_updated # Printing print("20 text/xml\r") print("<?xml version=\"1.0\" encoding=\"utf-8\"?>") print("<feed xmlns=\"http://www.w3.org/2005/Atom\">") print("") print(" <title>{}</title>".format(title)) print(" <link href=\"{}\"/>".format(url)) print(" <updated>{}</updated>".format(updated.isoformat('T'))) print(" <author>") print(" <name>{}</name>".format(author)) print(" </author>") print(" <id>urn:uuid:{}</id>".format(feed_urn)) print("") print(body) print("</feed>")