2021-12-21 04:02:07 +00:00
|
|
|
package yqlib
|
|
|
|
|
|
|
|
import (
|
2022-10-28 03:16:46 +00:00
|
|
|
"bufio"
|
2022-11-25 01:05:56 +00:00
|
|
|
"bytes"
|
2022-10-28 03:16:46 +00:00
|
|
|
"errors"
|
2021-12-21 04:02:07 +00:00
|
|
|
"io"
|
2022-10-28 03:16:46 +00:00
|
|
|
"regexp"
|
|
|
|
"strings"
|
2021-12-21 04:02:07 +00:00
|
|
|
|
|
|
|
yaml "gopkg.in/yaml.v3"
|
|
|
|
)
|
|
|
|
|
|
|
|
type yamlDecoder struct {
|
|
|
|
decoder yaml.Decoder
|
2022-11-25 01:05:56 +00:00
|
|
|
|
|
|
|
prefs YamlPreferences
|
|
|
|
|
2022-10-28 03:16:46 +00:00
|
|
|
// work around of various parsing issues by yaml.v3 with document headers
|
|
|
|
leadingContent string
|
2022-11-25 01:05:56 +00:00
|
|
|
bufferRead bytes.Buffer
|
|
|
|
|
|
|
|
readAnything bool
|
|
|
|
firstFile bool
|
2021-12-21 04:02:07 +00:00
|
|
|
}
|
|
|
|
|
2022-10-28 03:16:46 +00:00
|
|
|
func NewYamlDecoder(prefs YamlPreferences) Decoder {
|
|
|
|
return &yamlDecoder{prefs: prefs, firstFile: true}
|
2021-12-21 04:02:07 +00:00
|
|
|
}
|
|
|
|
|
2022-10-28 03:16:46 +00:00
|
|
|
func (dec *yamlDecoder) processReadStream(reader *bufio.Reader) (io.Reader, string, error) {
|
|
|
|
var commentLineRegEx = regexp.MustCompile(`^\s*#`)
|
2022-11-14 06:22:13 +00:00
|
|
|
var yamlDirectiveLineRegEx = regexp.MustCompile(`^\s*%YA`)
|
2022-10-28 03:16:46 +00:00
|
|
|
var sb strings.Builder
|
|
|
|
for {
|
|
|
|
peekBytes, err := reader.Peek(3)
|
|
|
|
if errors.Is(err, io.EOF) {
|
|
|
|
// EOF are handled else where..
|
|
|
|
return reader, sb.String(), nil
|
|
|
|
} else if err != nil {
|
|
|
|
return reader, sb.String(), err
|
2022-12-08 02:33:06 +00:00
|
|
|
} else if string(peekBytes[0]) == "\n" {
|
|
|
|
_, err := reader.ReadString('\n')
|
|
|
|
sb.WriteString("\n")
|
|
|
|
if errors.Is(err, io.EOF) {
|
|
|
|
return reader, sb.String(), nil
|
|
|
|
} else if err != nil {
|
|
|
|
return reader, sb.String(), err
|
|
|
|
}
|
2022-10-28 03:16:46 +00:00
|
|
|
} else if string(peekBytes) == "---" {
|
|
|
|
_, err := reader.ReadString('\n')
|
2023-09-18 23:52:36 +00:00
|
|
|
sb.WriteString("$yqDocSeparator$\n")
|
2022-10-28 03:16:46 +00:00
|
|
|
if errors.Is(err, io.EOF) {
|
|
|
|
return reader, sb.String(), nil
|
|
|
|
} else if err != nil {
|
|
|
|
return reader, sb.String(), err
|
|
|
|
}
|
2022-11-14 06:22:13 +00:00
|
|
|
} else if commentLineRegEx.MatchString(string(peekBytes)) || yamlDirectiveLineRegEx.MatchString(string(peekBytes)) {
|
2022-10-28 03:16:46 +00:00
|
|
|
line, err := reader.ReadString('\n')
|
|
|
|
sb.WriteString(line)
|
|
|
|
if errors.Is(err, io.EOF) {
|
|
|
|
return reader, sb.String(), nil
|
|
|
|
} else if err != nil {
|
|
|
|
return reader, sb.String(), err
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
return reader, sb.String(), nil
|
|
|
|
}
|
|
|
|
}
|
2021-12-21 04:02:07 +00:00
|
|
|
}
|
|
|
|
|
2022-10-28 03:16:46 +00:00
|
|
|
func (dec *yamlDecoder) Init(reader io.Reader) error {
|
|
|
|
readerToUse := reader
|
|
|
|
leadingContent := ""
|
2022-11-25 01:05:56 +00:00
|
|
|
dec.bufferRead = bytes.Buffer{}
|
2022-10-28 03:16:46 +00:00
|
|
|
var err error
|
|
|
|
// if we 'evaluating together' - we only process the leading content
|
|
|
|
// of the first file - this ensures comments from subsequent files are
|
|
|
|
// merged together correctly.
|
|
|
|
if dec.prefs.LeadingContentPreProcessing && (!dec.prefs.EvaluateTogether || dec.firstFile) {
|
|
|
|
readerToUse, leadingContent, err = dec.processReadStream(bufio.NewReader(reader))
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2022-11-25 01:05:56 +00:00
|
|
|
} else if !dec.prefs.LeadingContentPreProcessing {
|
|
|
|
// if we're not process the leading content
|
|
|
|
// keep a copy of what we've read. This is incase its a
|
|
|
|
// doc with only comments - the decoder will return nothing
|
|
|
|
// then we can read the comments from bufferRead
|
|
|
|
readerToUse = io.TeeReader(reader, &dec.bufferRead)
|
2022-10-28 03:16:46 +00:00
|
|
|
}
|
|
|
|
dec.leadingContent = leadingContent
|
|
|
|
dec.readAnything = false
|
|
|
|
dec.decoder = *yaml.NewDecoder(readerToUse)
|
|
|
|
dec.firstFile = false
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (dec *yamlDecoder) Decode() (*CandidateNode, error) {
|
|
|
|
var dataBucket yaml.Node
|
|
|
|
err := dec.decoder.Decode(&dataBucket)
|
|
|
|
if errors.Is(err, io.EOF) && dec.leadingContent != "" && !dec.readAnything {
|
|
|
|
// force returning an empty node with a comment.
|
|
|
|
dec.readAnything = true
|
|
|
|
return dec.blankNodeWithComment(), nil
|
2022-11-25 01:05:56 +00:00
|
|
|
} else if errors.Is(err, io.EOF) && !dec.prefs.LeadingContentPreProcessing && !dec.readAnything {
|
|
|
|
// didn't find any yaml,
|
|
|
|
// check the tee buffer, maybe there were comments
|
|
|
|
dec.readAnything = true
|
|
|
|
dec.leadingContent = dec.bufferRead.String()
|
|
|
|
if dec.leadingContent != "" {
|
|
|
|
return dec.blankNodeWithComment(), nil
|
|
|
|
}
|
|
|
|
return nil, err
|
2022-10-28 03:16:46 +00:00
|
|
|
} else if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
candidateNode := &CandidateNode{
|
|
|
|
Node: &dataBucket,
|
|
|
|
}
|
|
|
|
|
|
|
|
if dec.leadingContent != "" {
|
|
|
|
candidateNode.LeadingContent = dec.leadingContent
|
|
|
|
dec.leadingContent = ""
|
|
|
|
}
|
2022-11-25 01:05:56 +00:00
|
|
|
dec.readAnything = true
|
2022-10-28 03:16:46 +00:00
|
|
|
// move document comments into candidate node
|
|
|
|
// otherwise unwrap drops them.
|
|
|
|
candidateNode.TrailingContent = dataBucket.FootComment
|
|
|
|
dataBucket.FootComment = ""
|
|
|
|
return candidateNode, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (dec *yamlDecoder) blankNodeWithComment() *CandidateNode {
|
|
|
|
return &CandidateNode{
|
|
|
|
Document: 0,
|
|
|
|
Filename: "",
|
|
|
|
Node: &yaml.Node{Kind: yaml.DocumentNode, Content: []*yaml.Node{{Tag: "!!null", Kind: yaml.ScalarNode}}},
|
|
|
|
FileIndex: 0,
|
|
|
|
LeadingContent: dec.leadingContent,
|
|
|
|
}
|
2021-12-21 04:02:07 +00:00
|
|
|
}
|