#!/usr/bin/env python3
# lighttext.py — LightText (.lt) to HTML, Markdown or EPUB converter
# Usage: python3 lighttext.py input.lt output.html
#        python3 lighttext.py input.lt output.md
#        python3 lighttext.py input.lt output.epub

import sys
import os
import re
import zipfile
import uuid
from datetime import datetime


# Characters that may be backslash-escaped. The position of a character in
# this string is the number embedded in its placeholder token.
_ESCAPABLE = "*_[]>-\\"

# One backslash followed by one escapable character.
_ESCAPE_RE = re.compile(r'\\([*_\[\]>\-\\])')

# Placeholder token: NUL, "E", index into _ESCAPABLE, NUL. It deliberately
# contains none of the markup characters (* _ [ ] >), so the link and
# emphasis regexes can never match inside a token.
_PLACEHOLDER_RE = re.compile("\x00E([0-6])\x00")

# LightText link syntax: [label > url]
_LINK_RE = re.compile(r'\[([^\]>]+?)\s*>\s*([^\]]+)\]')


def html_escape(text: str) -> str:
    """Return *text* with ``&``, ``<``, ``>`` and ``"`` replaced by entities.

    The result is safe both as element text and inside a double-quoted
    attribute value.
    """
    # "&" must be replaced first so the entities produced by the later
    # replacements are not escaped a second time.
    return (text
            .replace("&", "&amp;")
            .replace("<", "&lt;")
            .replace(">", "&gt;")
            .replace('"', "&quot;"))


def _protect_escapes(text: str) -> str:
    """Replace backslash-escaped characters with inert placeholder tokens.

    The text is scanned once, left to right, so ``\\\\*`` is read as an
    escaped backslash followed by a live ``*`` (not a backslash followed by
    an escaped star). Undo with :func:`_restore_escapes`.
    """
    return _ESCAPE_RE.sub(
        lambda m: f"\x00E{_ESCAPABLE.index(m.group(1))}\x00", text)


def _restore_escapes(text: str) -> str:
    """Turn placeholder tokens from :func:`_protect_escapes` back into the
    literal characters they stand for (without the backslash)."""
    return _PLACEHOLDER_RE.sub(lambda m: _ESCAPABLE[int(m.group(1))], text)


def _emphasis_html(text: str) -> str:
    """Convert ``*bold*`` and ``_italic_`` spans in already-escaped text."""
    text = re.sub(r'\*([^*]+)\*', r'<strong>\1</strong>', text)
    return re.sub(r'_([^_]+)_', r'<em>\1</em>', text)


def inline_html(text: str) -> str:
    """Convert LightText inline markup in *text* to an HTML fragment.

    Handles backslash escapes, ``[label > url]`` links, ``*bold*`` and
    ``_italic_``. Everything else is HTML-escaped.
    """
    text = _protect_escapes(text)
    links = {}

    def stash(m):
        # Swap each link for a marker-free key so that neither html_escape
        # nor the emphasis regexes can touch the generated tag.
        key = f"\x00L{len(links)}\x00"
        label = _emphasis_html(html_escape(m.group(1).strip()))
        # The URL is escaped but never emphasis-formatted: "_" and "*" are
        # ordinary URL characters.
        url = html_escape(m.group(2).strip())
        links[key] = f'<a href="{url}">{label}</a>'
        return key

    text = _LINK_RE.sub(stash, text)
    text = _emphasis_html(html_escape(text))
    # Re-insert the link tags only after emphasis has run (see stash).
    for key, tag in links.items():
        text = text.replace(key, tag)
    return _restore_escapes(text)


def inline_md(text: str) -> str:
    """Convert LightText inline markup in *text* to Markdown.

    Links become ``[label](url)`` and ``*bold*`` becomes ``**bold**``;
    ``_italic_`` is left as is.
    """
    # NOTE(review): escaped characters are emitted bare, so "\*x\*" comes out
    # as "*x*" in the Markdown output — confirm whether the backslash should
    # be kept for the Markdown target.
    text = _protect_escapes(text)
    text = _LINK_RE.sub(
        lambda m: f'[{m.group(1).strip()}]({m.group(2).strip()})', text)
    text = re.sub(r'\*([^*]+)\*', r'**\1**', text)
    return _restore_escapes(text)


def is_heading(line: str) -> bool:
    """Return True if *line* has at least one letter and every letter is
    upper case (digits, spaces and punctuation are ignored)."""
    letters = [c for c in line if c.isalpha()]
    return bool(letters) and all(c.isupper() for c in letters)


# NOTE(review): the definition of `parse` starts at this point of the file.
# In this copy its body (on the following lines) has lost its markup string
# literals and is cut off, so it is left untouched here. Its header text,
# verbatim:
# def parse(lines, fmt): """Parse .lt lines and return a list of output lines
in fmt (html/md/xhtml).""" is_html = fmt in ("html", "xhtml") inline = inline_html if is_html else inline_md out = [] in_ul = False in_ol = False para_lines = [] prev_blank = True ol_counter = 0 def flush_para(): if para_lines: joined = " ".join(para_lines) out.append(f"

{inline(joined)}

" if is_html else f"{inline_md(joined)}") para_lines.clear() def flush_list(): nonlocal in_ul, in_ol, ol_counter if in_ul: if is_html: out.append("") in_ul = False if in_ol: if is_html: out.append("") in_ol = False ol_counter = 0 for raw in lines: line = raw.rstrip("\n").rstrip("\r") if not line.strip(): flush_para() flush_list() if not is_html: out.append("") prev_blank = True continue if prev_blank and is_heading(line): flush_para(); flush_list() out.append(f"

{inline(line)}

" if is_html else f"# {inline_md(line)}\n") prev_blank = False continue if re.match(r'^- .+', line): flush_para() if in_ol: flush_list() if not in_ul: if is_html: out.append("

{inline(content)}

{inline(content)}

{html_escape(title)}

{html_escape(title)} en {doc_id}