zord-tree/tree.go

678 lines
13 KiB
Go
Raw Normal View History

2021-05-04 20:26:41 +00:00
package zord_tree
import (
"bufio"
"bytes"
2023-06-26 21:44:32 +00:00
"crypto/md5"
"errors"
2021-05-11 22:10:18 +00:00
"fmt"
2023-06-26 21:44:32 +00:00
"io"
2021-05-04 20:26:41 +00:00
"io/fs"
"net/url"
2021-05-04 20:26:41 +00:00
"os"
"path"
2021-05-11 22:10:18 +00:00
"path/filepath"
"regexp"
2021-05-04 20:26:41 +00:00
"strings"
2024-01-09 07:43:24 +00:00
2025-01-07 06:26:35 +00:00
abcex "g.arns.lt/zordsdavini/abcex/v4"
2024-01-09 07:43:24 +00:00
"golang.org/x/exp/slices"
2021-05-04 20:26:41 +00:00
)
2024-01-09 07:43:24 +00:00
type Config struct {
ReadableFormats []string
AttachmentDirName string
CustomMeta map[string]func() string
Excludes []string
2025-01-11 22:18:49 +00:00
Apps map[string]AppCallback
2024-01-09 07:43:24 +00:00
}
2025-01-11 22:18:49 +00:00
type AppCallback func(dir string, content string, info os.FileInfo) (string, error)
2025-01-11 21:30:59 +00:00
2021-05-04 20:26:41 +00:00
type File struct {
2021-05-12 05:17:43 +00:00
Id string
Name string
FullPath string
Category []string
Tags []string
Meta map[string]string
2021-05-04 20:26:41 +00:00
}
type Tree struct {
2021-05-12 05:17:43 +00:00
Path string
Dirs []Tree
Files []File
2021-05-04 20:26:41 +00:00
}
func (t Tree) FileById(id string) (File, error) {
for _, f := range t.Files {
if f.Id == id {
return f, nil
}
}
for _, t2 := range t.Dirs {
f, err := t2.FileById(id)
if err == nil {
return f, nil
}
}
return File{}, errors.New("file was not found")
}
func (t Tree) Slice(path string) (Tree, error) {
if t.Path == path {
return t, nil
}
for _, t2 := range t.Dirs {
t3, err := t2.Slice(path)
if err == nil {
return t3, nil
}
}
return Tree{}, errors.New("tree was not found")
}
2022-08-30 16:39:40 +00:00
func (t Tree) Filter(filter map[string][]string) (Tree, bool) {
filtered := Tree{}
filtered.Path = t.Path
found := false
for _, f := range t.Files {
addFile := false
2024-08-09 09:20:34 +00:00
exclude := false
2022-08-30 16:39:40 +00:00
for option, values := range filter {
2024-08-09 09:20:34 +00:00
negative := false
if string(option[0]) == "-" {
negative = true
option = option[1:]
}
2022-08-30 16:39:40 +00:00
for _, value := range values {
2024-08-09 09:20:34 +00:00
if !negative && option == "tag" {
2022-08-30 16:39:40 +00:00
for _, tag := range f.Tags {
if tag == value {
addFile = true
}
}
2022-08-30 16:39:40 +00:00
continue
}
2024-08-09 09:20:34 +00:00
if negative && option == "tag" {
for _, tag := range f.Tags {
if tag == value {
exclude = true
}
}
continue
}
2024-08-09 09:43:20 +00:00
if negative && option == "category" {
for _, category := range f.Category {
if category == value {
exclude = true
}
}
continue
}
2024-08-09 09:20:34 +00:00
if !negative && strings.Contains(f.Meta[option], value) {
2022-08-30 16:39:40 +00:00
addFile = true
2024-08-09 09:20:34 +00:00
continue
}
if negative && strings.Contains(f.Meta[option], value) {
exclude = true
}
}
2024-08-09 09:39:02 +00:00
if negative && !exclude {
addFile = true
}
}
2024-08-09 09:20:34 +00:00
if addFile && !exclude {
found = true
filtered.Files = append(filtered.Files, f)
}
}
for _, t2 := range t.Dirs {
filteredChild, foundChild := t2.Filter(filter)
if foundChild {
found = true
filtered.Dirs = append(filtered.Dirs, filteredChild)
}
}
return filtered, found
}
2024-01-09 07:43:24 +00:00
func NewConfig(
readableFormats []string,
attachmentDirName string,
customMeta map[string]func() string,
excludes []string,
2025-01-11 22:18:49 +00:00
apps map[string]AppCallback,
2024-01-09 07:43:24 +00:00
) Config {
return Config{
ReadableFormats: readableFormats,
AttachmentDirName: attachmentDirName,
CustomMeta: customMeta,
Excludes: excludes,
2025-01-11 22:15:45 +00:00
Apps: apps,
2024-01-09 07:43:24 +00:00
}
}
func BuildTree(dirPath string, meta []string, config Config) (Tree, error) {
return readPath(dirPath, []string{}, meta, config)
2021-05-04 20:26:41 +00:00
}
2024-01-09 07:43:24 +00:00
func PopulateTree(sourcePath string, meta []string, config Config) error {
var err error
var attachmentRegistry map[string]string
2023-06-26 21:44:32 +00:00
2025-01-11 21:30:59 +00:00
for _, app := range config.Apps {
err = applyApp(app, sourcePath, config)
if err != nil {
return err
}
}
2024-01-09 07:43:24 +00:00
attachmentRegistry, err = moveAttachments(sourcePath, config)
2023-06-26 21:44:32 +00:00
if err != nil {
return err
}
2024-01-09 07:43:24 +00:00
err = fixFormat(sourcePath, attachmentRegistry, config)
if err != nil {
return err
}
2022-05-08 20:19:55 +00:00
var id int64 = 0
id, err = getMaxId(sourcePath)
2021-05-11 22:10:18 +00:00
if err != nil {
return err
}
id++
err = addMissingId(sourcePath, id)
if err != nil {
return err
}
2024-01-09 07:43:24 +00:00
err = addMissingMeta(sourcePath, meta, config.CustomMeta)
2021-05-11 22:10:18 +00:00
return err
}
2024-01-09 07:43:24 +00:00
func moveAttachments(dir string, config Config) (map[string]string, error) {
2023-06-26 21:44:32 +00:00
attachmentRegistry := make(map[string]string)
err := filepath.Walk(dir, func(fullPath string, info os.FileInfo, e error) error {
if e != nil {
return e
}
2024-01-09 07:43:24 +00:00
clearDir := strings.TrimPrefix(dir, "./")
if info.Mode().IsRegular() {
for _, pattern := range config.Excludes {
matched, err := regexp.Match(pattern, []byte(fullPath))
if err == nil && matched {
return nil
}
}
}
if info.Mode().IsRegular() &&
!slices.Contains(config.ReadableFormats, path.Ext(fullPath)) &&
!strings.HasPrefix(fullPath, fmt.Sprintf("%s/%s", clearDir, config.AttachmentDirName)) {
2023-06-26 21:44:32 +00:00
f, err := os.Open(fullPath)
if err != nil {
return err
}
defer f.Close()
h := md5.New()
if _, err := io.Copy(h, f); err != nil {
return err
}
2024-01-09 07:43:24 +00:00
_ = os.Mkdir(fmt.Sprintf("%s/%s", dir, config.AttachmentDirName), 0755)
attachmentRegistry[fullPath] = fmt.Sprintf(
"%s/%x%s",
config.AttachmentDirName,
h.Sum(nil),
path.Ext(fullPath),
)
newPath := fmt.Sprintf(
"%s/%s/%x%s",
dir,
config.AttachmentDirName,
h.Sum(nil),
path.Ext(fullPath),
)
2023-06-26 21:44:32 +00:00
err = os.Rename(fullPath, newPath)
if err != nil {
return err
}
}
return nil
})
return attachmentRegistry, err
}
2025-01-11 22:18:49 +00:00
func applyApp(app AppCallback, dir string, config Config) error {
2025-01-11 21:30:59 +00:00
err := filepath.Walk(dir, func(fullPath string, info os.FileInfo, e error) error {
if e != nil {
return e
}
if info.Mode().IsRegular() && slices.Contains(config.ReadableFormats, path.Ext(fullPath)) {
osf, err := os.Open(fullPath)
if err != nil {
return err
}
// remove all empty lines and separate split line
content := ""
format := true
scanner := bufio.NewScanner(osf)
scanner.Split(bufio.ScanLines)
for scanner.Scan() {
line := scanner.Text()
if line == "---" {
format = false
}
if format {
line = strings.Trim(line, " ")
if line != "" {
content = content + "\n" + line
}
} else {
content = content + "\n" + line
}
}
2025-01-11 22:30:28 +00:00
content, err = app(path.Dir(fullPath), content, info)
2025-01-11 21:30:59 +00:00
if err != nil {
return err
}
data := []byte(content)
err = os.WriteFile(fullPath, data, 0644)
if err != nil {
return err
}
}
return nil
})
return err
}
2024-01-09 07:43:24 +00:00
func fixFormat(dir string, attachmentRegistry map[string]string, config Config) error {
2023-06-26 21:44:32 +00:00
err := filepath.Walk(dir, func(fullPath string, info os.FileInfo, e error) error {
if e != nil {
return e
}
2024-01-09 07:43:24 +00:00
if info.Mode().IsRegular() && slices.Contains(config.ReadableFormats, path.Ext(fullPath)) {
2023-06-26 21:44:32 +00:00
osf, err := os.Open(fullPath)
if err != nil {
return err
}
// remove all empty lines and separate split line
content := ""
format := true
scanner := bufio.NewScanner(osf)
scanner.Split(bufio.ScanLines)
for scanner.Scan() {
line := scanner.Text()
if line == "---" {
format = false
}
2022-05-08 20:19:55 +00:00
if format {
line = strings.Trim(line, " ")
2022-05-08 20:19:55 +00:00
if line != "" {
content = content + "\n" + line
}
} else {
content = content + "\n" + line
}
}
// fix attachments
data := []byte(content)
re := regexp.MustCompile(`!?\[([^\]*]*)\]\(([^\) ]*)\)`)
for _, match := range re.FindAllSubmatch(data, -1) {
_, err := url.ParseRequestURI(string(match[2][:]))
if err != nil {
2024-01-09 07:43:24 +00:00
aPath := path.Clean(
fmt.Sprintf("%s/%s", path.Dir(fullPath), string(match[2][:])),
)
if _, ok := attachmentRegistry[aPath]; ok {
2023-06-27 08:25:32 +00:00
link := fmt.Sprintf("![%s](%s)", match[1], attachmentRegistry[aPath])
data = bytes.Replace(data, match[0], []byte(link), 1)
}
}
}
2024-01-09 07:43:24 +00:00
err = os.WriteFile(fullPath, data, 0644)
// format split line
2024-01-09 07:43:24 +00:00
b, err := os.ReadFile(fullPath) // just pass the file name
2022-05-08 21:58:00 +00:00
if err != nil {
return err
}
str := string(b)
str = strings.Replace(str, "\n---\n", "\n\n---\n", 1)
2024-01-09 07:43:24 +00:00
err = os.WriteFile(fullPath, []byte(str), 0644)
}
return nil
})
return err
}
func addMissingMeta(dir string, meta []string, customMeta map[string]func() string) error {
2021-05-11 22:10:18 +00:00
err := filepath.Walk(dir, func(path string, info os.FileInfo, e error) error {
if e != nil {
return e
}
if info.Mode().IsRegular() {
check := map[string]bool{}
for _, option := range meta {
check[option] = false
}
osf, err := os.Open(path)
if err != nil {
return err
}
scanner := bufio.NewScanner(osf)
scanner.Split(bufio.ScanLines)
for scanner.Scan() {
line := scanner.Text()
for _, option := range meta {
2022-07-30 06:36:59 +00:00
if strings.HasPrefix(line, "* "+option+":") {
2021-05-11 22:10:18 +00:00
check[option] = true
}
}
if line == "---" {
for option, process := range check {
if !process {
defaultValue := ""
if _, ok := customMeta[option]; ok {
defaultValue = customMeta[option]()
}
err = addMeta(path, option, defaultValue)
2021-05-11 22:10:18 +00:00
if err != nil {
return err
}
}
}
break
}
}
}
return nil
})
2022-05-08 20:19:55 +00:00
return err
2021-05-11 22:10:18 +00:00
}
func addMissingId(dir string, id int64) error {
err := filepath.Walk(dir, func(path string, info os.FileInfo, e error) error {
if e != nil {
return e
}
if info.Mode().IsRegular() {
osf, err := os.Open(path)
if err != nil {
return err
}
scanner := bufio.NewScanner(osf)
scanner.Split(bufio.ScanLines)
for scanner.Scan() {
line := scanner.Text()
2022-08-01 14:16:56 +00:00
if strings.HasPrefix(line, "* id:") {
2021-05-11 22:10:18 +00:00
break
}
if line == "---" {
2025-01-07 06:26:35 +00:00
err = addMeta(path, "id", abcex.Encode(id, abcex.BASE36))
2021-05-11 22:10:18 +00:00
if err != nil {
return err
}
id++
break
}
}
}
return nil
})
if err != nil {
return err
}
2022-05-08 20:19:55 +00:00
return nil
2021-05-11 22:10:18 +00:00
}
func addMeta(path string, option string, value string) error {
2024-01-09 07:43:24 +00:00
b, err := os.ReadFile(path) // just pass the file name
2021-05-11 22:10:18 +00:00
if err != nil {
2022-05-08 20:19:55 +00:00
return err
2021-05-11 22:10:18 +00:00
}
str := string(b)
2022-07-30 06:36:59 +00:00
str = strings.Replace(str, "\n\n---\n", fmt.Sprintf("\n* %s: %s\n\n---\n", option, value), 1)
2024-01-09 07:43:24 +00:00
err = os.WriteFile(path, []byte(str), 0644)
2021-05-11 22:10:18 +00:00
2022-05-08 20:19:55 +00:00
return err
2021-05-11 22:10:18 +00:00
}
func getMaxId(dir string) (int64, error) {
var max int64 = 0
err := filepath.Walk(dir, func(path string, info os.FileInfo, e error) error {
if e != nil {
return e
}
if info.Mode().IsRegular() {
osf, err := os.Open(path)
if err != nil {
return err
}
scanner := bufio.NewScanner(osf)
scanner.Split(bufio.ScanLines)
for scanner.Scan() {
line := scanner.Text()
if line == "---" {
break
}
2022-08-01 14:16:56 +00:00
if strings.HasPrefix(line, "* id:") {
line = strings.TrimPrefix(line, "* id:")
2025-01-07 06:26:35 +00:00
i := abcex.Decode(strings.Trim(line, " "), abcex.BASE36)
2021-05-11 22:10:18 +00:00
if i > max {
max = i
}
}
}
}
return nil
})
if err != nil {
return max, err
}
return max, nil
}
2024-01-09 07:43:24 +00:00
func readPath(dirPath string, category []string, meta []string, config Config) (Tree, error) {
clearDir := strings.TrimPrefix(dirPath, "./")
2021-05-04 20:26:41 +00:00
2023-06-26 21:44:32 +00:00
tree := Tree{}
tree.Path = clearDir
2021-05-04 20:26:41 +00:00
2024-01-09 07:43:24 +00:00
files, err := os.ReadDir(dirPath)
2021-05-04 20:26:41 +00:00
if err != nil {
return tree, err
}
2024-01-09 07:43:24 +00:00
FILE_LOOP:
2021-05-04 20:26:41 +00:00
for _, file := range files {
if strings.HasPrefix(file.Name(), ".") {
continue
}
2021-05-04 20:26:41 +00:00
fullPath := path.Join(dirPath, file.Name())
if file.IsDir() {
2024-01-09 07:43:24 +00:00
if strings.HasPrefix(
fullPath,
fmt.Sprintf("%s/%s", clearDir, config.AttachmentDirName),
) {
2023-06-26 21:44:32 +00:00
continue
}
2024-01-09 07:43:24 +00:00
nextDir, err := readPath(fullPath, append(category, file.Name()), meta, config)
2021-05-04 20:26:41 +00:00
if err != nil {
return tree, err
}
2021-05-12 05:17:43 +00:00
tree.Dirs = append(tree.Dirs, nextDir)
2021-05-04 20:26:41 +00:00
continue
2024-01-09 07:43:24 +00:00
} else {
for _, pattern := range config.Excludes {
matched, err := regexp.Match(pattern, []byte(fullPath))
if err == nil && matched {
continue FILE_LOOP
}
}
2021-05-04 20:26:41 +00:00
}
2024-01-09 07:43:24 +00:00
_, err := os.ReadFile(fullPath)
2021-05-04 20:26:41 +00:00
if err != nil {
return tree, err
}
2021-05-09 18:17:07 +00:00
nextFile, err := readFile(file, fullPath, category, meta)
2021-05-04 20:26:41 +00:00
if err != nil {
return tree, err
}
2021-05-12 05:17:43 +00:00
tree.Files = append(tree.Files, nextFile)
2021-05-04 20:26:41 +00:00
}
return tree, nil
}
2024-01-09 07:43:24 +00:00
func readFile(file fs.DirEntry, fullPath string, category []string, meta []string) (File, error) {
2021-05-04 20:26:41 +00:00
f := File{
2021-05-12 05:17:43 +00:00
Name: file.Name(),
FullPath: fullPath,
Category: category,
2021-05-04 20:26:41 +00:00
}
2025-01-11 21:30:59 +00:00
id, tags, fileMeta, err := GetFileParams(fullPath, meta)
if err != nil {
return f, err
}
f.Id = id
f.Tags = tags
f.Meta = fileMeta
return f, nil
}
func GetFileParams(fullPath string, meta []string) (string, []string, map[string]string, error) {
fileMeta := map[string]string{}
tags := []string{}
id := ""
2021-05-04 20:26:41 +00:00
osf, err := os.Open(fullPath)
if err != nil {
2025-01-11 21:30:59 +00:00
return id, tags, fileMeta, err
2021-05-04 20:26:41 +00:00
}
2025-01-11 21:30:59 +00:00
2021-05-04 20:26:41 +00:00
scanner := bufio.NewScanner(osf)
scanner.Split(bufio.ScanLines)
for scanner.Scan() {
line := scanner.Text()
if line == "---" {
break
}
2022-07-30 06:36:59 +00:00
if strings.HasPrefix(line, "* tags:") {
line = strings.TrimPrefix(line, "* tags:")
2021-05-04 20:26:41 +00:00
t := strings.Split(line, ",")
for _, tag := range t {
tags = append(tags, strings.Trim(tag, " "))
}
2021-05-12 05:17:43 +00:00
}
2022-07-30 06:36:59 +00:00
if strings.HasPrefix(line, "* id:") {
line = strings.TrimPrefix(line, "* id:")
2025-01-11 21:30:59 +00:00
id = strings.Trim(line, " ")
2021-05-04 20:26:41 +00:00
}
2021-05-09 18:17:07 +00:00
for _, option := range meta {
2022-07-30 06:36:59 +00:00
if strings.HasPrefix(line, "* "+option) {
line = strings.TrimPrefix(line, "* "+option+":")
2025-01-11 21:30:59 +00:00
fileMeta[option] = strings.Trim(line, " ")
2021-05-09 18:17:07 +00:00
}
2021-05-04 20:26:41 +00:00
}
}
2022-05-08 20:19:55 +00:00
_ = osf.Close()
2021-05-04 20:26:41 +00:00
2025-01-11 21:30:59 +00:00
return id, tags, fileMeta, nil
2021-05-04 20:26:41 +00:00
}
func ReadFileContent(file File) (string, error) {
2022-05-08 20:19:55 +00:00
osf, err := os.Open(file.FullPath)
if err != nil {
2022-05-08 20:19:55 +00:00
return "", err
}
content := ""
2022-05-08 21:58:00 +00:00
separator := ""
removeEmptyLine := true
isMetaPart := true
scanner := bufio.NewScanner(osf)
scanner.Split(bufio.ScanLines)
for scanner.Scan() {
line := scanner.Text()
if line == "---" {
isMetaPart = false
continue
}
2022-05-08 20:19:55 +00:00
if isMetaPart {
continue
}
2022-05-08 20:19:55 +00:00
if removeEmptyLine {
line = strings.Trim(line, " ")
2022-05-08 20:19:55 +00:00
if line == "" {
continue
} else {
removeEmptyLine = false
}
}
2022-05-08 21:58:00 +00:00
content = content + separator + line
if separator == "" {
separator = "\n"
}
}
2022-05-08 20:19:55 +00:00
_ = osf.Close()
return content, nil
}