2021-12-27 16:19:05 -05:00
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bytes"
|
|
|
|
"fmt"
|
|
|
|
"github.com/PuerkitoBio/goquery"
|
|
|
|
"io/ioutil"
|
|
|
|
"strings"
|
|
|
|
)
|
|
|
|
|
|
|
|
// parse single file for links
|
|
|
|
func parse(dir, pathPrefix string) []Link {
|
|
|
|
// read file
|
|
|
|
source, err := ioutil.ReadFile(dir)
|
|
|
|
if err != nil {
|
|
|
|
panic(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// parse md
|
|
|
|
var links []Link
|
2022-04-02 11:53:14 -07:00
|
|
|
fmt.Printf("[Parsing note] %s => ", trim(dir, pathPrefix, ".md"))
|
2021-12-27 16:19:05 -05:00
|
|
|
|
|
|
|
var buf bytes.Buffer
|
|
|
|
if err := md.Convert(source, &buf); err != nil {
|
|
|
|
panic(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
doc, err := goquery.NewDocumentFromReader(&buf)
|
|
|
|
var n int
|
|
|
|
doc.Find("a").Each(func(i int, s *goquery.Selection) {
|
|
|
|
text := strings.TrimSpace(s.Text())
|
|
|
|
target, ok := s.Attr("href")
|
|
|
|
if !ok {
|
|
|
|
target = "#"
|
|
|
|
}
|
|
|
|
|
2022-04-02 11:53:14 -07:00
|
|
|
target = processTarget(target)
|
|
|
|
source := processSource(trim(dir, pathPrefix, ".md"))
|
2021-12-27 16:19:05 -05:00
|
|
|
|
2022-04-02 11:53:14 -07:00
|
|
|
// fmt.Printf(" '%s' => %s\n", source, target)
|
2021-12-27 16:19:05 -05:00
|
|
|
links = append(links, Link{
|
2022-04-02 11:53:14 -07:00
|
|
|
Source: source,
|
|
|
|
Target: target,
|
2021-12-27 16:19:05 -05:00
|
|
|
Text: text,
|
|
|
|
})
|
|
|
|
n++
|
|
|
|
})
|
2022-04-02 11:53:14 -07:00
|
|
|
fmt.Printf("found: %d links\n", n)
|
2021-12-27 16:19:05 -05:00
|
|
|
|
|
|
|
return links
|
|
|
|
}
|