html2gmi/html2gmi.go

122 lines
2.9 KiB
Go
Raw Normal View History

2020-07-31 12:08:27 +02:00
package main
import (
"bufio"
"errors"
"fmt"
"github.com/LukeEmmet/html2gemini"
flag "github.com/spf13/pflag"
"io"
"io/ioutil"
"os"
2020-07-31 12:08:27 +02:00
)
var version = "0.2.3"
2020-07-31 12:08:27 +02:00
var (
output = flag.StringP("output", "o", "", "Output path. Otherwise uses stdout")
input = flag.StringP("input", "i", "", "Input path. Otherwise uses stdin")
citationStart = flag.IntP("citationStart", "c", 1, "Start citations from this index")
citationMarkers = flag.BoolP("citationMarkers", "m", false, "Use footnote style citation markers")
numberedLinks = flag.BoolP("numberedLinks", "n", false, "Number the links")
linkEmitFrequency = flag.IntP("linkEmitFrequency", "l", 2, "Emit gathered links through the document after this number of paragraphs")
verFlag = flag.BoolP("version", "v", false, "Find out what version of html2gmi you're running")
2020-07-31 12:08:27 +02:00
)
// check panics with e when e is non-nil and does nothing otherwise.
// It is the program's catch-all handler for errors it cannot recover from.
func check(e error) {
	if e != nil {
		panic(e)
	}
}
func saveFile(contents []byte, path string) {
d1 := contents
err := ioutil.WriteFile(path, d1, 0644)
check(err)
2020-07-31 12:08:27 +02:00
}
// readStdin reads standard input until EOF and returns everything read as a
// string.
//
// The input is decoded one rune at a time, so each invalid UTF-8 byte appears
// in the result as U+FFFD. A read error other than io.EOF panics, matching the
// way the rest of this program treats unrecoverable errors.
func readStdin() string {
	// based on https://flaviocopes.com/go-shell-pipes/
	reader := bufio.NewReader(os.Stdin) // default buffer size is 4096 bytes
	var runes []rune

	for {
		r, _, err := reader.ReadRune()
		if err == io.EOF {
			break
		}
		if err != nil {
			// Stop on any other failure; carrying on would append a zero
			// rune per failed read and could loop forever.
			panic(err)
		}
		runes = append(runes, r)
	}

	return string(runes)
}
func getInput() (string, error) {
var inputHtml string
info, err := os.Stdin.Stat()
check(err)
if *input != "" {
//get the input file from the command line
dat, err := ioutil.ReadFile(*input)
check(err)
inputHtml = string(dat)
} else if info.Mode()&os.ModeNamedPipe != 0 {
// we have a pipe input
inputHtml = readStdin()
} else {
//we shouldn't get here
return "", errors.New("invalid option for input - use -i <path> or pipe to stdin")
}
return inputHtml, nil
2020-07-31 12:08:27 +02:00
}
func main() {
var inputHtml string
flag.Parse()
if *verFlag {
fmt.Println("html2gmi " + version)
return
}
//get the input from commandline or stdin
inputHtml, err := getInput()
check(err)
//convert html to gmi
options := html2gemini.NewOptions()
options.PrettyTables = true
options.CitationStart = *citationStart
options.LinkEmitFrequency = *linkEmitFrequency
options.CitationMarkers = *citationMarkers
options.NumberedLinks = *numberedLinks
//use slightly nicer Unicode borders, otherwise can use +,|,-
options.PrettyTablesOptions.CenterSeparator = "┼"
options.PrettyTablesOptions.ColumnSeparator = "│"
options.PrettyTablesOptions.RowSeparator = "─"
//dont use an extra line to separate header from body, but
//do separate each row visually
options.PrettyTablesOptions.HeaderLine = false
options.PrettyTablesOptions.RowLine = true
text, err := html2gemini.FromString(inputHtml, *options)
check(err)
//process the output
if *output == "" {
fmt.Print(text + "\n") //terminate with a new line
} else {
//save to the specified output
gmiBytes := []byte(text)
saveFile(gmiBytes, *output)
}
2020-07-31 12:08:27 +02:00
}