hasp: add a libasciidoc preprocessor

This commit is contained in:
Přemysl Eric Janouch 2018-10-07 18:07:18 +02:00
parent 7d51aaa9a4
commit 228c3f3914
Signed by: p
GPG Key ID: A0420B94F92B9493
2 changed files with 96 additions and 0 deletions

5
README
View File

@ -185,6 +185,11 @@ An improved replacement for autocutsel in selection synchronization "mode":
Only UTF8_STRING-convertible selections are synchronized.
hasp -- (lib)asciidoc syntax preprocessor
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
Provisional tool to make libasciidoc understand more syntax, namely two-line/
underlined titles for my Gitea projects.
ht -- terminal emulator
~~~~~~~~~~~~~~~~~~~~~~~
Similar scope to st(1). Clever display of internal padding for better looks.

91
hasp/main.go Normal file
View File

@ -0,0 +1,91 @@
// Program hasp is a preprocessor for libasciidoc to make it understand
// two-line/underlined titles, intended to be used in Gitea.
package main
import (
"bytes"
"context"
"encoding/xml"
"io"
"io/ioutil"
"os"
"strings"
"unicode"
"unicode/utf8"
"github.com/bytesparadise/libasciidoc"
"github.com/bytesparadise/libasciidoc/pkg/renderer"
)
// isTitle returns the title level if the lines seem to form a title,
// zero otherwise. Input lines may inclide trailing newlines.
func isTitle(line1, line2 []byte) int {
// This is a very naïve method, we should target graphemes (thus at least
// NFC normalize the lines first) and account for wide characters.
diff := utf8.RuneCount(line1) - utf8.RuneCount(line2)
if len(line2) < 2 || diff < -1 || diff > 1 {
return 0
}
// "Don't be fooled by back-to-back delimited blocks."
// Still gets fooled by other things, though.
if bytes.IndexFunc(line1, func(r rune) bool {
return unicode.IsLetter(r) || unicode.IsNumber(r)
}) < 0 {
return 0
}
// The underline must be homogenous.
for _, r := range bytes.TrimRight(line2, "\r\n") {
if r != line2[0] {
return 0
}
}
return 1 + strings.IndexByte("=-~^+", line2[0])
}
func writeLine(w *io.PipeWriter, cur, next []byte) []byte {
if level := isTitle(cur, next); level > 0 {
w.Write(append(bytes.Repeat([]byte{'='}, level), ' '))
next = nil
}
w.Write(cur)
return next
}
// ConvertTitles converts AsciiDoc two-line (underlined) titles to single-line.
func ConvertTitles(w *io.PipeWriter, input []byte) {
var last []byte
for _, cur := range bytes.SplitAfter(input, []byte{'\n'}) {
last = writeLine(w, last, cur)
}
writeLine(w, last, nil)
}
func main() {
input, err := ioutil.ReadAll(os.Stdin)
if err != nil {
panic(err)
}
pr, pw := io.Pipe()
go func() {
defer pw.Close()
ConvertTitles(pw, input)
}()
// io.Copy(os.Stdout, pr)
// return
_, err = libasciidoc.ConvertToHTML(context.Background(), pr, os.Stdout,
renderer.IncludeHeaderFooter(true))
if err != nil {
// Fallback: output all the text sanitized for direct inclusion.
os.Stdout.WriteString("<pre>")
for _, line := range bytes.Split(input, []byte{'\n'}) {
xml.EscapeText(os.Stdout, line)
os.Stdout.WriteString("\n")
}
os.Stdout.WriteString("</pre>")
}
}