ics2mdwn/ics2mdwn.py

216 lines
7.1 KiB
Python
Raw Normal View History

2021-08-17 22:53:50 +02:00
#!/usr/bin/python3
2021-08-19 18:33:34 +02:00
import logging
2021-08-17 22:53:50 +02:00
import argparse
import os.path
from typing import Iterable
from pathlib import Path
import yaml
from datetime import timedelta
from icalendar import Calendar, Event
def get_parser():
    """
    Build the command line parser of the converter.

    Positional arguments are the input iCalendar files; the options choose
    where output is written and how times are bucketed into slots.

    Returns:
        argparse.ArgumentParser: the fully configured parser.
    """

    def positive_minutes(value):
        # The slot size is used as a modulus when rounding: zero would raise
        # ZeroDivisionError much later and a negative value produces
        # nonsensical slots, so both are rejected while parsing.
        try:
            minutes = int(value)
        except ValueError:
            raise argparse.ArgumentTypeError("invalid int value: %r" % value)
        if minutes <= 0:
            raise argparse.ArgumentTypeError(
                "must be a positive number of minutes, got %r" % value
            )
        return minutes

    p = argparse.ArgumentParser()
    p.add_argument(
        "files",
        nargs="+",
        type=str,
        help="Input iCalendar files; each file name (without extension) "
        "is used as the room name",
    )
    p.add_argument(
        "--out-md-dir",
        help="Output directory for markdown files",
        default="content/talks/",
        type=Path,
    )
    p.add_argument(
        "--out-schedule",
        help="Output schedule.yml file",
        default="data/schedule.yml",
        type=Path,
    )
    p.add_argument(
        "--trust-location",
        type=str,
        nargs="*",
        default=[],
        help="Input files whose events use their own LOCATION property as "
        "talk location instead of the room name derived from the file name",
    )
    p.add_argument(
        "--slot-size",
        type=positive_minutes,
        metavar="MINUTES",
        default=15,
        # The rounding helpers always round down, never to the nearest slot.
        help="Round start times and durations down to a multiple of MINUTES",
    )
    p.add_argument(
        "--night-threshold",
        metavar="HOUR",
        default=5,
        type=int,
        help="Talks starting before HOUR are scheduled on the previous day",
    )
    p.add_argument("--mode", choices=["hugo"], default="hugo")
    return p
def round_down(num, divisor):
    """
    Return ``num`` lowered to a multiple of ``divisor``.

    For a positive ``divisor`` this is the largest multiple that does not
    exceed ``num``.

    >>> round_down(1000, 10)
    1000
    >>> round_down(1001, 10)
    1000
    >>> round_down(1009, 10)
    1000
    """
    _, remainder = divmod(num, divisor)
    return num - remainder
2021-08-24 18:08:27 +02:00
def round_down_time(hhmm: str, divisor: int):
    """
    Round the minutes of an ``HHMM`` time string down to a multiple of ``divisor``.

    The last two characters are read as minutes and everything before them
    as hours. The result is the integer spelled by the hours followed by the
    rounded minutes, zero-padded to two digits.

    >>> round_down_time("1047", 15)
    1045
    >>> round_down_time("0907", 15)
    900
    """
    hours, minutes = hhmm[:-2], int(hhmm[-2:], base=10)
    rounded = round_down(minutes, divisor)
    return int("{}{:02d}".format(hours, rounded), base=10)
2021-08-17 22:53:50 +02:00
class Converter:
    """
    Base converter: loads talks from iCalendar files and drives the conversion.

    Objects are used so that new output formats can be added by subclassing
    and implementing ``output()``.
    """

    def __init__(self, args):
        """
        Args:
            args: parsed command line options; this class reads ``files``
                and ``trust_location`` from it.
        """
        self.args = args
        self.rooms = []
        self.talks = {}  # map talk uid to its VEVENT component
        self.talk_room = {}  # map talk uid to room name
        self.talk_location = {}  # same, but see --trust-location
        self.changed_files = []

    def _fname_to_room(self, fpath: str) -> str:
        """Return the room name of an input file: its base name without extension."""
        return os.path.splitext(os.path.basename(fpath))[0]

    def get_vevents_from_calendar(self, cal: "Calendar") -> Iterable["Event"]:
        """Yield the events that are direct subcomponents of ``cal``."""
        for subc in cal.subcomponents:
            if isinstance(subc, Event):
                yield subc

    def load_input(self):
        """
        Read every input file and index its events by UID.

        Fills ``talks``, ``talk_room`` and ``talk_location``. The location
        defaults to the room name; for files listed in ``--trust-location``
        the event's own LOCATION property is used when it can be read.
        """
        for fpath in self.args.files:
            room = self._fname_to_room(fpath)
            trusted = fpath in self.args.trust_location
            # iCalendar streams are UTF-8 unless declared otherwise, so do
            # not depend on the platform's default encoding.
            with open(fpath, encoding="utf-8") as buf:
                file_content = buf.read()
            for subcal in Calendar.from_ical(file_content, multiple=True):
                for ev in self.get_vevents_from_calendar(subcal):
                    uid = ev.decoded("uid").decode("ascii")
                    self.talks[uid] = ev
                    self.talk_room[uid] = room
                    self.talk_location[uid] = room
                    if not trusted:
                        continue
                    try:
                        self.talk_location[uid] = ev.decoded("location").decode(
                            "utf8"
                        )
                    except KeyError:
                        # The event has no LOCATION: keep the room name.
                        pass
                    except Exception as exc:
                        # Still best-effort (the room name is kept), but an
                        # unreadable location is reported instead of hidden.
                        logging.warning(
                            "Cannot use location of talk %s: %s", uid, exc
                        )

    def output(self):
        """
        Write the converted data; must be implemented by subclasses.

        Raises:
            NotImplementedError: always, in this base class.
        """
        raise NotImplementedError(
            "%s does not implement output()" % type(self).__name__
        )

    def run(self):
        """Load the input, write the output and print every written path."""
        self.rooms = [self._fname_to_room(fpath) for fpath in self.args.files]
        self.load_input()
        self.output()
        for fpath in self.changed_files:
            print(fpath)
class HugoConverter(Converter):
    """
    Output backend selected by ``--mode hugo``.

    Writes one markdown file with YAML front matter per talk, plus a single
    schedule YAML file listing the talks per day and room.
    """

    def _talk_tags(self, talk):
        """
        Return the CATEGORIES of ``talk`` as a flat list of plain strings.

        Parsing is best-effort: on any error a warning is logged and an
        empty list is returned.
        """
        try:
            values = talk.get("CATEGORIES")
            # A property that appears several times is returned as a list.
            if not isinstance(values, list):
                values = [values]
            tags = []
            for value in values:
                if hasattr(value, "cats"):
                    # Category objects keep their entries in ``cats``.
                    tags.extend(str(t) for t in value.cats)
                else:
                    tags.append(str(value))
            return tags
        except Exception as exc:
            logging.warning("Error parsing categories: %s", str(exc))
            return []

    def output_markdown(self):
        """
        Write ``<uid>.md`` for every talk into ``--out-md-dir``.

        The front matter holds key, title, format, start, end, location,
        duration in minutes and tags; talks tagged ``base`` also get
        ``level: beginner``. The DESCRIPTION, if any, becomes the body.
        """
        for uid in sorted(self.talks):
            talk = self.talks[uid]
            fpath = self.args.out_md_dir / ("%s.md" % uid)
            self.changed_files.append(fpath)

            start = talk.decoded("DTSTART")
            end = talk.decoded("DTEND")
            frontmatter = dict(
                key=uid,
                title=talk.decoded("SUMMARY").decode("utf8"),
                format="conference",
                start=start,
                end=end,
                location=self.talk_location[uid],
                duration=int((end - start).total_seconds() // 60),
                tags=self._talk_tags(talk) if "CATEGORIES" in talk else [],
            )
            if "base" in frontmatter["tags"]:
                frontmatter["level"] = "beginner"

            # The description is written verbatim and may hold non-ASCII
            # text, so the encoding must not depend on the platform.
            with open(str(fpath), "w", encoding="utf-8") as buf:
                buf.write("---\n")
                yaml.safe_dump(frontmatter, buf)
                buf.write("---\n\n")
                # body
                if "DESCRIPTION" in talk:
                    buf.write(talk.decoded("DESCRIPTION").decode("utf8"))

    def output_schedule(self):
        """
        Write the schedule file given by ``--out-schedule``.

        The document is ``{"schedule": [day, ...]}``; every day has ``day``,
        ``start`` (earliest talk, ``HH:MM``) and ``rooms``, a list of
        ``{"room": ..., "slots": [{"slot": ..., "talk": uid}, ...]}``.
        """
        days = {}
        for uid in sorted(self.talks):
            talk = self.talks[uid]
            dtstart = talk.decoded("dtstart")
            hour = dtstart.time().hour
            minute = dtstart.time().minute

            # A talk starting before --night-threshold belongs to the
            # preceding day, with its hour counted past 24.
            after_midnight = hour < self.args.night_threshold
            if after_midnight:
                day = (dtstart - timedelta(days=1)).strftime("%Y-%m-%d")
                hour += 24
            else:
                day = dtstart.strftime("%Y-%m-%d")

            # Zero-padded, so plain string comparison orders the times.
            start = "%02d:%02d" % (hour, minute)
            if day not in days:
                days[day] = dict(day=day, start=start, rooms={})
            if days[day]["start"] > start:
                days[day]["start"] = start

            room = self.talk_room[uid]
            days[day]["rooms"].setdefault(room, dict(room=room, slots=[]))

            talkstart = round_down_time(
                "%02d%02d" % (hour, minute), self.args.slot_size
            )
            duration = talk.decoded("dtend") - dtstart
            duration_minutes = int(duration.total_seconds() // 60)
            duration_minutes = round_down(duration_minutes, self.args.slot_size)
            slot = "%04d-%dmin" % (talkstart, duration_minutes)
            days[day]["rooms"][room]["slots"].append(dict(slot=slot, talk=uid))

        # convert from our intermediate format to the correct one
        for d in sorted(days):
            # vanity: let's sort
            for room in sorted(days[d]["rooms"]):
                days[d]["rooms"][room]["slots"].sort(key=lambda x: x["slot"])
            # convert dict to list
            days[d]["rooms"] = [days[d]["rooms"][k] for k in sorted(days[d]["rooms"])]
        out = {"schedule": [days[k] for k in sorted(days)]}

        # dump, finally
        with open(str(self.args.out_schedule), "w", encoding="utf-8") as buf:
            yaml.safe_dump(out, buf)
        self.changed_files.append(self.args.out_schedule)

    def output(self):
        """Write the per-talk markdown files, then the schedule file."""
        self.output_markdown()
        self.output_schedule()
def main():
    """Parse the command line and run the converter chosen by ``--mode``."""
    options = get_parser().parse_args()
    # Maps every accepted --mode value to the class implementing it.
    available = {"hugo": HugoConverter}
    converter_cls = available[options.mode]
    converter_cls(options).run()


if __name__ == "__main__":
    main()