-#!/usr/bin/env python
# Parse markdown table into tuple of lists
# Armaan Bhojwani 2021
from bs4 import BeautifulSoup
import markdown
+from .deck import Card
+
def md2html(file):
- with open(file, "r", encoding="utf-8") as input_file:
- return markdown.markdown(input_file.read(), extensions=['tables'])
+ """Use the markdown module to convert input to HTML"""
+ try:
+ return markdown.markdown(open(file, "r").read(), extensions=["tables"])
+ except FileNotFoundError:
+ sys.exit(f'lightcards: "{file}": No such file or directory')
def parse_html(html):
+ """Use BeautifulSoup to parse the HTML"""
+
def clean_text(inp):
return inp.get_text().rstrip()
- def clean_list(inp):
- for z in inp:
- if not len(z) == 2:
- inp.remove(z)
- return inp
-
- soup = BeautifulSoup(html, 'html.parser')
+ soup = BeautifulSoup(html, "html.parser").find("table")
outp = []
- for x in soup.find_all("tr"):
- outp.append([clean_text(y) for y in x.find_all("td")])
+ try:
+ for x in soup.find_all("tr"):
+ outp.append(Card(tuple([clean_text(y) for y in x.find_all("td")])))
+ except AttributeError:
+ sys.exit("lightcards: No table found")
+
+ ths = soup.find_all("th")
+ if len(ths) != 2:
+ sys.exit("lightcards: Headings malformed")
- return ([clean_text(x) for x in soup.find_all("th")],
- clean_list(outp))
+ # Return a tuple of nested lists
+ return ([clean_text(x) for x in ths], outp[1:])
def main(file):