hugo-obsidian/walk.go

93 lines
2.0 KiB
Go
Raw Permalink Normal View History

2021-12-27 16:19:05 -05:00
package main
import (
"fmt"
"github.com/gernest/front"
"io/fs"
"io/ioutil"
2021-12-27 16:58:21 -05:00
"os"
2021-12-27 16:19:05 -05:00
"path/filepath"
"strings"
"time"
2021-12-27 16:19:05 -05:00
)
// recursively walk directory and return all files with given extension
2021-12-27 16:51:36 -05:00
func walk(root, ext string, index bool, ignorePaths map[string]struct{}) (res []Link, i ContentIndex) {
2021-12-27 16:19:05 -05:00
fmt.Printf("Scraping %s\n", root)
i = make(ContentIndex)
m := front.NewMatter()
m.Handle("---", front.YAMLHandler)
nPrivate := 0
start := time.Now()
2022-03-15 00:50:03 -07:00
err := filepath.WalkDir(root, func(fp string, d fs.DirEntry, e error) error {
2021-12-27 16:19:05 -05:00
if e != nil {
return e
}
2022-03-15 00:50:03 -07:00
// path normalize fp
s := filepath.ToSlash(fp)
2021-12-27 16:51:36 -05:00
if _, ignored := ignorePaths[s]; ignored {
fmt.Printf("[Ignored] %s\n", d.Name())
2021-12-27 16:58:21 -05:00
nPrivate++
2021-12-27 16:51:36 -05:00
} else if filepath.Ext(d.Name()) == ext {
2021-12-27 16:19:05 -05:00
res = append(res, parse(s, root)...)
if index {
text := getText(s)
frontmatter, body, err := m.Parse(strings.NewReader(text))
if err != nil {
frontmatter = map[string]interface{}{}
body = text
}
var title string
if parsedTitle, ok := frontmatter["title"]; ok {
title = parsedTitle.(string)
} else {
title = "Untitled Page"
}
// check if page is private
if parsedPrivate, ok := frontmatter["draft"]; !ok || !parsedPrivate.(bool) {
2021-12-27 16:58:21 -05:00
info, _ := os.Stat(s)
source := processSource(trim(s, root, ".md"))
// adjustedPath := UnicodeSanitize(strings.Replace(hugoPathTrim(trim(s, root, ".md")), " ", "-", -1))
i[source] = Content{
2021-12-27 16:58:21 -05:00
LastModified: info.ModTime(),
2022-03-15 00:50:03 -07:00
Title: title,
Content: body,
2021-12-27 16:19:05 -05:00
}
} else {
2021-12-27 16:58:21 -05:00
fmt.Printf("[Ignored] %s\n", d.Name())
2021-12-27 16:19:05 -05:00
nPrivate++
}
}
}
return nil
})
if err != nil {
panic(err)
}
end := time.Now()
fmt.Printf("[DONE] in %s\n", end.Sub(start).Round(time.Millisecond))
2021-12-27 16:19:05 -05:00
fmt.Printf("Ignored %d private files \n", nPrivate)
fmt.Printf("Parsed %d total links \n", len(res))
return res, i
}
func getText(dir string) string {
// read file
fileBytes, err := ioutil.ReadFile(dir)
if err != nil {
panic(err)
}
return string(fileBytes)
}