2023-01-04 21:14:48 -05:00
|
|
|
;;; md4tj --- Summary
|
2022-12-28 14:04:54 -05:00
|
|
|
|
|
|
|
;;; Commentary:
|
|
|
|
|
|
|
|
;;; Code:
|
2022-12-29 11:21:53 -05:00
|
|
|
|
2022-12-28 14:04:54 -05:00
|
|
|
(require 'cl-lib)
|
2023-03-25 19:42:47 -04:00
|
|
|
;(load "md4tj-util.el")
|
2022-12-28 14:04:54 -05:00
|
|
|
|
|
|
|
(defun md4tj-begin-tag (tag &optional attrs)
|
|
|
|
"Return beginning html tag for TAG with optional ATTRS."
|
|
|
|
(concat "<" tag
|
2022-12-29 11:51:11 -05:00
|
|
|
(mapconcat 'identity (cl-map 'listp (lambda (l) (concat " " (nth 0 l) "=" "\"" (nth 1 l) "\"")) attrs) "")
|
2022-12-28 14:04:54 -05:00
|
|
|
">"))
|
|
|
|
|
|
|
|
(defun md4tj-end-tag (tag)
|
|
|
|
"Return end html tag for TAG."
|
|
|
|
(concat "</" tag ">"))
|
|
|
|
|
|
|
|
(defun md4tj-process-header (line)
|
|
|
|
"Process LINE known to be header, return HTML."
|
|
|
|
(let ((level (length (nth 0 (split-string line)))))
|
|
|
|
(if (or (< level 0) (> level 6))
|
|
|
|
(error (concat "Error parsing: " line "\n"))
|
|
|
|
(concat (md4tj-begin-tag (concat "h" (number-to-string level)))
|
|
|
|
(mapconcat 'identity (cdr (split-string line)) " ")
|
|
|
|
(md4tj-end-tag (concat "h" (number-to-string level)))))))
|
|
|
|
|
|
|
|
(defun md4tj-process-paragraph (line)
|
|
|
|
"Process LINE that is paragraph, return HTML."
|
|
|
|
(concat (md4tj-begin-tag "p") line (md4tj-end-tag "p")))
|
|
|
|
|
2022-12-28 15:02:19 -05:00
|
|
|
(defun md4tj-process-line (line)
|
|
|
|
"Process all inline elements of the LINE, return HTML."
|
2023-01-04 12:07:33 -05:00
|
|
|
;; Finally strikethrough
|
2022-12-28 15:02:19 -05:00
|
|
|
(replace-regexp-in-string
|
2023-01-04 12:07:33 -05:00
|
|
|
"~~\\(.*\\)~~"
|
|
|
|
"<s>\\1</s>"
|
|
|
|
;; Then highlight
|
2022-12-28 15:02:19 -05:00
|
|
|
(replace-regexp-in-string
|
2023-01-04 12:07:33 -05:00
|
|
|
"==\\(.*\\)=="
|
|
|
|
"<mark>\\1</mark>"
|
|
|
|
;; Then links
|
2023-01-03 18:34:40 -05:00
|
|
|
(replace-regexp-in-string
|
2023-01-04 12:38:23 -05:00
|
|
|
"\\[\\([^\\[]*\\)](\\([^\\[(]*\\))"
|
2023-01-04 12:07:33 -05:00
|
|
|
(concat (md4tj-begin-tag "a" (list '("href" "\\2"))) "\\1" (md4tj-end-tag "a"))
|
|
|
|
;; Then images
|
2022-12-28 15:18:47 -05:00
|
|
|
(replace-regexp-in-string
|
2023-01-04 12:38:23 -05:00
|
|
|
"!\\[\\([^\\[]*\\)](\\([^\\[(]*\\))"
|
2023-01-04 12:07:33 -05:00
|
|
|
(md4tj-begin-tag "img" (list '("src" "\\2") '("alt" "\\1")))
|
|
|
|
;; Then videos
|
2022-12-28 15:18:47 -05:00
|
|
|
(replace-regexp-in-string
|
2023-01-04 12:38:23 -05:00
|
|
|
"!!\\[\\([^\\[]*\\)](\\([^\\[(]*\\))"
|
2023-01-04 12:07:33 -05:00
|
|
|
(concat (md4tj-begin-tag "video" (list '("src" "\\2") '("type" "video/webm") '("controls" "true"))) "\\1" (md4tj-end-tag "video"))
|
|
|
|
;; Then emphasis
|
|
|
|
(replace-regexp-in-string
|
|
|
|
"\\*\\(.*\\)\\*"
|
|
|
|
"<em>\\1</em>"
|
|
|
|
;; Then strong
|
|
|
|
(replace-regexp-in-string
|
|
|
|
"\\*\\*\\(.*\\)\\*\\*"
|
|
|
|
"<strong>\\1</strong>"
|
|
|
|
;; First code
|
|
|
|
(replace-regexp-in-string
|
|
|
|
"`\\(.*\\)`"
|
|
|
|
"<code>\\1</code>" line)))))))))
|
2022-12-29 11:21:53 -05:00
|
|
|
|
2022-12-29 11:33:30 -05:00
|
|
|
(defun md4tj-convert-line-to-html (line state)
|
|
|
|
"Process LINE with STATE and return html."
|
2023-03-25 19:42:47 -04:00
|
|
|
(let ((cleanline (md4tj-util-clean-multiline line)))
|
2022-12-29 14:17:59 -05:00
|
|
|
;; If this is a signal to include another file
|
|
|
|
(cond ((string-match "^@@INCLUDE" line) (md4tj-parse-to-string (nth 1 (split-string line))))
|
2023-01-04 13:41:20 -05:00
|
|
|
((string-match "^@@LASTUPDATED" line) (concat
|
|
|
|
(md4tj-begin-tag "p" (list (list "id" "lastupdated")))
|
|
|
|
"Last updated: " (current-time-string)
|
|
|
|
(md4tj-end-tag "p")))
|
2023-01-04 15:09:58 -05:00
|
|
|
((string-match "^@@DIV" line) (md4tj-begin-tag "div" (list (list "class" (nth 1 (split-string line))))))
|
|
|
|
((string-match "^@@ENDDIV" line) (md4tj-end-tag "div"))
|
2023-01-04 14:57:27 -05:00
|
|
|
((and (string-match "^$$.*$$" line) (eq (nth 1 state) 'normal)) ;; LaTeX formula
|
|
|
|
(shell-command (concat "./pnglatex"
|
|
|
|
" -d 300"
|
|
|
|
" -f "
|
|
|
|
"\""
|
|
|
|
(string-replace "$$" "" line)
|
|
|
|
"\""
|
|
|
|
" -o "
|
|
|
|
"./teximg/"
|
|
|
|
(md5 (string-replace "$$" "" line)) ".png"))
|
|
|
|
(md4tj-begin-tag "img" (list (list "class" "teximg") ;; give teximgs their own class
|
|
|
|
(list "src" (concat "./teximg/" (md5 (string-replace "$$" "" line)) ".png"))
|
|
|
|
(list "alt" (string-replace "$$" "" line)))))
|
2022-12-29 14:17:59 -05:00
|
|
|
;; If this is some other signal, ignore
|
|
|
|
((string-match "^@@" line) "")
|
|
|
|
;; Otherwise, process as normal
|
|
|
|
(t
|
|
|
|
(concat
|
2023-01-04 13:35:28 -05:00
|
|
|
;; Beginning multiline block/ending prev multiline block
|
|
|
|
(mapconcat #'md4tj-state-to-html state "\n")
|
2022-12-29 14:17:59 -05:00
|
|
|
|
|
|
|
;; Body
|
2023-03-25 19:42:47 -04:00
|
|
|
(cond ((or (eq (nth 1 state) 'code) (eq (nth 1 state) 'begincode)) (md4tj-util-escape-chars cleanline))
|
2022-12-29 14:17:59 -05:00
|
|
|
((string-match "^#+ " cleanline) (md4tj-process-header (md4tj-process-line cleanline)))
|
|
|
|
((string= "---" cleanline) "<hr>") ;; horizontal line
|
2023-01-04 15:14:28 -05:00
|
|
|
((= (length cleanline) 0) "<br>") ;; blank line
|
2022-12-29 14:17:59 -05:00
|
|
|
(t (md4tj-process-paragraph (md4tj-process-line cleanline))))
|
|
|
|
|
|
|
|
;; End of multiline block
|
2023-01-04 13:35:28 -05:00
|
|
|
(cond ((or (eq (nth 1 state) 'ul) (eq (nth 1 state) 'beginul)) "</li>")
|
|
|
|
((or (eq (nth 1 state) 'ol) (eq (nth 1 state) 'beginol)) "</li>")
|
|
|
|
((eq (nth 1 state) 'code) "")
|
2022-12-29 14:17:59 -05:00
|
|
|
(t "")))))))
|
2022-12-29 11:21:53 -05:00
|
|
|
|
2023-01-04 13:35:28 -05:00
|
|
|
(defun md4tj-state-to-html (state)
|
|
|
|
"Convert STATE to html."
|
|
|
|
(cond ((eq state 'beginul) "<ul>\n<li>")
|
|
|
|
((eq state 'beginol) "<ol>\n<li>")
|
|
|
|
((eq state 'begincode) "<pre>\n<code>")
|
|
|
|
((eq state 'ul) "<li>")
|
|
|
|
((eq state 'ol) "<li>")
|
|
|
|
((eq state 'code) "")
|
|
|
|
((eq state 'endul) "</ul>\n")
|
|
|
|
((eq state 'endol) "</ol>\n")
|
|
|
|
((eq state 'endcode) "</code>\n</pre>\n")
|
|
|
|
(t "")))
|
|
|
|
|
2022-12-29 11:21:53 -05:00
|
|
|
(defun md4tj-next-state (currline prevstate)
|
|
|
|
"Return the state based on CURRLINE and PREVSTATE."
|
2023-01-04 13:35:28 -05:00
|
|
|
(list
|
|
|
|
;; End state
|
|
|
|
(cond ((and (string-match "^- " currline) (or (eq prevstate 'ol) (eq prevstate 'beginol))) 'endol)
|
|
|
|
((and (string-match "^[0-9]+\\. " currline) (or (eq prevstate 'ul) (eq prevstate 'beginul))) 'endul)
|
|
|
|
((and (not (string-match "^- " currline)) (or (eq prevstate 'beginul) (eq prevstate 'ul))) 'endul)
|
|
|
|
((and (not (string-match "[0-9]+\\. " currline)) (or (eq prevstate 'beginol) (eq prevstate 'ol))) 'endul)
|
|
|
|
((and (string-match "```$" currline) (or (eq prevstate 'code) (eq prevstate 'begincode))) 'endcode)
|
|
|
|
(t 'nothing))
|
|
|
|
|
|
|
|
;; Begin state (or next line's prevstate)
|
|
|
|
(cond ((and (string-match "^- " currline) (not (or (eq prevstate 'beginul) (eq prevstate 'ul))) 'beginul))
|
|
|
|
((and (string-match "^- " currline) (or (eq prevstate 'beginul) (eq prevstate 'ul)) 'ul))
|
|
|
|
((and (string-match "^[0-9]+\\. " currline) (not (or (eq prevstate 'beginol) (eq prevstate 'ol))) 'beginol))
|
|
|
|
((and (string-match "^[0-9]+\\. " currline) (or (eq prevstate 'beginol) (eq prevstate 'ol)) 'ol))
|
|
|
|
((and (string-match "^```" currline) (not (or (eq prevstate 'begincode) (eq prevstate 'code))) 'begincode))
|
|
|
|
((and (not (string-match "```$" currline)) (or (eq prevstate 'begincode) (eq prevstate 'code)) 'code))
|
|
|
|
(t 'normal))))
|
2022-12-29 11:21:53 -05:00
|
|
|
|
2022-12-29 13:41:39 -05:00
|
|
|
(defun md4tj-begin ()
|
2023-01-04 14:57:27 -05:00
|
|
|
"Insert beginning code for all html, initialize."
|
|
|
|
(shell-command "mkdir -p ./teximg") ;; Ensure ./teximg folder exists
|
2022-12-29 13:41:39 -05:00
|
|
|
(concat "<!DOCTYPE html>\n"
|
2023-01-04 12:31:29 -05:00
|
|
|
(md4tj-begin-tag "html"
|
|
|
|
(list (list "lang"
|
|
|
|
(or (nth 1 (car (cl-remove-if-not (lambda (meta) (string= (car meta) "@@LANG")) (md4tj-find-metas)))) "en"))))
|
|
|
|
"\n"))
|
2022-12-29 13:41:39 -05:00
|
|
|
|
2022-12-29 11:21:53 -05:00
|
|
|
(defun md4tj-finalize (state)
|
|
|
|
"Finalizes HTML document by inserting missing end tags based on STATE."
|
|
|
|
(concat
|
|
|
|
(cond ((or (eq state 'beginul) (eq state 'ul)) "</ul>")
|
|
|
|
((or (eq state 'beginol) (eq state 'ol)) "</ol>")
|
|
|
|
((or (eq state 'begincode) (eq state 'code)) "</code>")
|
|
|
|
(t ""))
|
|
|
|
"</body>\n"
|
|
|
|
"</html>"))
|
2022-12-28 14:04:54 -05:00
|
|
|
|
2022-12-29 13:41:39 -05:00
|
|
|
(defun md4tj-find-metas ()
|
|
|
|
"Return all lines starting with @@ as list of split strings."
|
|
|
|
(save-excursion
|
|
|
|
(let ((meta-list nil))
|
|
|
|
(goto-char (point-min))
|
|
|
|
(while (re-search-forward "^@@" nil t)
|
2023-03-25 19:42:47 -04:00
|
|
|
(setq meta-list (cons (split-string (md4tj-util-getline)) meta-list)))
|
2022-12-29 13:41:39 -05:00
|
|
|
meta-list)))
|
|
|
|
|
|
|
|
(defun md4tj-list-to-tuple-list (list)
|
|
|
|
"Convert LIST to tuple list."
|
|
|
|
(let ((tuples nil))
|
|
|
|
(dolist (i (number-sequence 0 (- (length list) 1) 2))
|
|
|
|
(setq tuples (cons (cons (nth i list) (list (nth (+ i 1) list))) tuples)))
|
|
|
|
(reverse tuples)))
|
|
|
|
|
|
|
|
(defun md4tj-meta-to-html (meta)
|
|
|
|
"Convert META to html."
|
|
|
|
(cond ((string= (nth 0 meta) "@@TITLE")
|
|
|
|
(concat "<title>" (mapconcat 'identity (cdr meta) " ") "</title>\n"))
|
|
|
|
((string= (nth 0 meta) "@@META")
|
2023-01-02 20:08:12 -05:00
|
|
|
(concat (md4tj-begin-tag "meta" (md4tj-list-to-tuple-list (cdr meta)))))
|
|
|
|
((string= (nth 0 meta) "@@CSS")
|
|
|
|
(concat (md4tj-begin-tag "link" (list (list "rel" "stylesheet") (list "href" (nth 1 meta))))))))
|
2022-12-29 13:41:39 -05:00
|
|
|
|
|
|
|
(defun md4tj-head ()
|
|
|
|
"Return text for head element on current buffer."
|
|
|
|
(concat
|
|
|
|
(md4tj-begin-tag "head") "\n"
|
|
|
|
(mapconcat 'md4tj-meta-to-html (md4tj-find-metas) "\n")
|
|
|
|
"\n"
|
|
|
|
(md4tj-end-tag "head") "\n"))
|
|
|
|
|
2022-12-28 14:04:54 -05:00
|
|
|
(defun md4tj-parse (mdfile outfile)
|
|
|
|
"Entry point to parse MDFILE and output to OUTFILE."
|
2022-12-28 16:43:54 -05:00
|
|
|
(let ((inbuf (generate-new-buffer " in"))
|
2022-12-29 11:21:53 -05:00
|
|
|
(outbuf (generate-new-buffer " out"))
|
2023-01-04 13:35:28 -05:00
|
|
|
(fullstate (list 'nothing 'normal))
|
2022-12-29 11:21:53 -05:00
|
|
|
(line nil))
|
2022-12-28 16:43:54 -05:00
|
|
|
(set-buffer inbuf)
|
2022-12-28 14:04:54 -05:00
|
|
|
(insert-file-contents mdfile)
|
|
|
|
(goto-char (point-min))
|
2022-12-28 16:43:54 -05:00
|
|
|
(set-buffer outbuf)
|
2022-12-29 13:41:39 -05:00
|
|
|
(insert (md4tj-begin))
|
|
|
|
(insert (with-current-buffer inbuf (md4tj-head)))
|
|
|
|
(insert (md4tj-begin-tag "body"))
|
2022-12-28 16:43:54 -05:00
|
|
|
(while (with-current-buffer inbuf (< (point) (point-max)))
|
2023-03-25 19:42:47 -04:00
|
|
|
(setq line (with-current-buffer inbuf (md4tj-util-getline)))
|
2023-01-04 13:35:28 -05:00
|
|
|
(setq fullstate (md4tj-next-state line (nth 1 fullstate)))
|
2022-12-28 16:43:54 -05:00
|
|
|
;; Insert next line(s) into output file
|
2023-01-04 13:35:28 -05:00
|
|
|
(insert (concat (md4tj-convert-line-to-html line fullstate) "\n"))
|
2022-12-28 16:43:54 -05:00
|
|
|
;; Advance input file by a line
|
|
|
|
(with-current-buffer inbuf (forward-line)))
|
2023-01-04 13:35:28 -05:00
|
|
|
(insert (md4tj-finalize (nth 1 fullstate)))
|
2022-12-29 11:21:53 -05:00
|
|
|
;; Write outbuf to outfile
|
2022-12-28 16:43:54 -05:00
|
|
|
(write-region nil nil outfile nil)))
|
2022-12-28 14:04:54 -05:00
|
|
|
|
2022-12-29 14:17:59 -05:00
|
|
|
(defun md4tj-parse-to-string (mdfile)
|
|
|
|
"Parse MDFILE, return conversion to HTML as string."
|
|
|
|
(with-temp-buffer
|
|
|
|
(let ((acc nil)
|
|
|
|
(line nil)
|
2023-01-04 13:35:28 -05:00
|
|
|
(fullstate (list 'nothing 'normal)))
|
2022-12-29 14:17:59 -05:00
|
|
|
(insert-file-contents mdfile)
|
|
|
|
(goto-char (point-min))
|
|
|
|
(while (< (point) (point-max))
|
2023-03-25 19:42:47 -04:00
|
|
|
(setq line (md4tj-util-getline))
|
2023-01-04 13:35:28 -05:00
|
|
|
(setq fullstate (md4tj-next-state line (nth 1 fullstate)))
|
|
|
|
(setq acc (concat acc (md4tj-convert-line-to-html line fullstate) "\n"))
|
2022-12-29 14:17:59 -05:00
|
|
|
(forward-line))
|
|
|
|
acc)))
|
2023-01-04 21:14:48 -05:00
|
|
|
|
|
|
|
(provide 'md4tj)
|
|
|
|
;;; md4tj.el ends here
|