2020-11-22 00:56:28 +00:00
|
|
|
package yqlib
|
|
|
|
|
|
|
|
import (
|
|
|
|
"container/list"
|
2021-11-23 22:27:17 +00:00
|
|
|
"errors"
|
2021-12-06 06:25:32 +00:00
|
|
|
"fmt"
|
2020-11-22 00:56:28 +00:00
|
|
|
"io"
|
|
|
|
"os"
|
|
|
|
|
|
|
|
yaml "gopkg.in/yaml.v3"
|
|
|
|
)
|
|
|
|
|
2021-01-11 05:46:28 +00:00
|
|
|
// A yaml expression evaluator that runs the expression multiple times for each given yaml document.
|
|
|
|
// Uses less memory than loading all documents and running the expression once, but this cannot process
|
|
|
|
// cross document expressions.
|
2020-11-22 00:56:28 +00:00
|
|
|
type StreamEvaluator interface {
|
2021-07-19 09:52:51 +00:00
|
|
|
Evaluate(filename string, reader io.Reader, node *ExpressionNode, printer Printer, leadingContent string) (uint, error)
|
2021-10-15 00:43:48 +00:00
|
|
|
EvaluateFiles(expression string, filenames []string, printer Printer, leadingContentPreProcessing bool) error
|
2021-07-19 09:52:51 +00:00
|
|
|
EvaluateNew(expression string, printer Printer, leadingContent string) error
|
2020-11-22 00:56:28 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
type streamEvaluator struct {
|
|
|
|
treeNavigator DataTreeNavigator
|
2021-01-12 23:18:53 +00:00
|
|
|
treeCreator ExpressionParser
|
2020-11-22 00:56:28 +00:00
|
|
|
fileIndex int
|
2021-12-16 06:50:09 +00:00
|
|
|
decoder Decoder
|
2020-11-22 00:56:28 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func NewStreamEvaluator() StreamEvaluator {
|
2021-01-12 23:18:53 +00:00
|
|
|
return &streamEvaluator{treeNavigator: NewDataTreeNavigator(), treeCreator: NewExpressionParser()}
|
2020-11-22 00:56:28 +00:00
|
|
|
}
|
|
|
|
|
2021-07-19 09:52:51 +00:00
|
|
|
func (s *streamEvaluator) EvaluateNew(expression string, printer Printer, leadingContent string) error {
|
2021-01-12 23:18:53 +00:00
|
|
|
node, err := s.treeCreator.ParseExpression(expression)
|
2020-12-01 03:06:49 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
candidateNode := &CandidateNode{
|
2021-11-12 04:02:28 +00:00
|
|
|
Document: 0,
|
|
|
|
Filename: "",
|
|
|
|
Node: &yaml.Node{Kind: yaml.DocumentNode, Content: []*yaml.Node{{Tag: "!!null", Kind: yaml.ScalarNode}}},
|
|
|
|
FileIndex: 0,
|
|
|
|
LeadingContent: leadingContent,
|
2020-12-01 03:06:49 +00:00
|
|
|
}
|
|
|
|
inputList := list.New()
|
|
|
|
inputList.PushBack(candidateNode)
|
|
|
|
|
2021-02-02 07:17:59 +00:00
|
|
|
result, errorParsing := s.treeNavigator.GetMatchingNodes(Context{MatchingNodes: inputList}, node)
|
2020-12-01 03:06:49 +00:00
|
|
|
if errorParsing != nil {
|
|
|
|
return errorParsing
|
|
|
|
}
|
2021-07-20 00:19:55 +00:00
|
|
|
return printer.PrintResults(result.MatchingNodes)
|
2020-12-01 03:06:49 +00:00
|
|
|
}
|
|
|
|
|
2021-10-15 00:43:48 +00:00
|
|
|
func (s *streamEvaluator) EvaluateFiles(expression string, filenames []string, printer Printer, leadingContentPreProcessing bool) error {
|
2021-12-20 22:30:08 +00:00
|
|
|
var totalProcessDocs uint
|
2021-01-12 23:18:53 +00:00
|
|
|
node, err := s.treeCreator.ParseExpression(expression)
|
2020-11-22 00:56:28 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2021-07-19 09:52:51 +00:00
|
|
|
var firstFileLeadingContent string
|
|
|
|
|
2021-07-14 10:48:16 +00:00
|
|
|
for index, filename := range filenames {
|
2021-10-15 00:43:48 +00:00
|
|
|
reader, leadingContent, err := readStream(filename, leadingContentPreProcessing)
|
2021-07-19 09:52:51 +00:00
|
|
|
|
|
|
|
if index == 0 {
|
|
|
|
firstFileLeadingContent = leadingContent
|
2021-07-14 10:48:16 +00:00
|
|
|
}
|
2021-07-19 09:52:51 +00:00
|
|
|
|
2020-11-22 00:56:28 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2021-07-19 09:52:51 +00:00
|
|
|
processedDocs, err := s.Evaluate(filename, reader, node, printer, leadingContent)
|
2020-11-22 00:56:28 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2021-07-16 11:08:20 +00:00
|
|
|
totalProcessDocs = totalProcessDocs + processedDocs
|
2020-11-22 00:56:28 +00:00
|
|
|
|
|
|
|
switch reader := reader.(type) {
|
|
|
|
case *os.File:
|
|
|
|
safelyCloseFile(reader)
|
|
|
|
}
|
|
|
|
}
|
2021-07-16 11:08:20 +00:00
|
|
|
|
|
|
|
if totalProcessDocs == 0 {
|
2021-07-19 09:52:51 +00:00
|
|
|
return s.EvaluateNew(expression, printer, firstFileLeadingContent)
|
2021-07-16 11:08:20 +00:00
|
|
|
}
|
|
|
|
|
2020-11-22 00:56:28 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-07-19 09:52:51 +00:00
|
|
|
func (s *streamEvaluator) Evaluate(filename string, reader io.Reader, node *ExpressionNode, printer Printer, leadingContent string) (uint, error) {
|
2020-11-22 00:56:28 +00:00
|
|
|
|
|
|
|
var currentIndex uint
|
2021-12-16 11:20:37 +00:00
|
|
|
decoder := NewXmlDecoder(reader, "+", "")
|
2020-11-22 00:56:28 +00:00
|
|
|
for {
|
|
|
|
var dataBucket yaml.Node
|
|
|
|
errorReading := decoder.Decode(&dataBucket)
|
|
|
|
|
2021-11-22 06:43:38 +00:00
|
|
|
if errors.Is(errorReading, io.EOF) {
|
2020-11-22 00:56:28 +00:00
|
|
|
s.fileIndex = s.fileIndex + 1
|
2021-07-16 11:08:20 +00:00
|
|
|
return currentIndex, nil
|
2020-11-22 00:56:28 +00:00
|
|
|
} else if errorReading != nil {
|
2021-12-06 06:25:32 +00:00
|
|
|
return currentIndex, fmt.Errorf("bad file '%v': %w", filename, errorReading)
|
2020-11-22 00:56:28 +00:00
|
|
|
}
|
2021-11-12 04:02:28 +00:00
|
|
|
|
2020-11-22 00:56:28 +00:00
|
|
|
candidateNode := &CandidateNode{
|
|
|
|
Document: currentIndex,
|
|
|
|
Filename: filename,
|
|
|
|
Node: &dataBucket,
|
|
|
|
FileIndex: s.fileIndex,
|
|
|
|
}
|
2021-11-12 04:02:28 +00:00
|
|
|
if currentIndex == 0 {
|
|
|
|
candidateNode.LeadingContent = leadingContent
|
|
|
|
}
|
2020-11-22 00:56:28 +00:00
|
|
|
inputList := list.New()
|
|
|
|
inputList.PushBack(candidateNode)
|
|
|
|
|
2021-02-02 07:17:59 +00:00
|
|
|
result, errorParsing := s.treeNavigator.GetMatchingNodes(Context{MatchingNodes: inputList}, node)
|
2020-11-22 00:56:28 +00:00
|
|
|
if errorParsing != nil {
|
2021-07-16 11:08:20 +00:00
|
|
|
return currentIndex, errorParsing
|
2020-11-22 00:56:28 +00:00
|
|
|
}
|
2021-07-20 00:19:55 +00:00
|
|
|
err := printer.PrintResults(result.MatchingNodes)
|
2021-07-19 09:52:51 +00:00
|
|
|
|
2020-11-22 00:56:28 +00:00
|
|
|
if err != nil {
|
2021-07-16 11:08:20 +00:00
|
|
|
return currentIndex, err
|
2020-11-22 00:56:28 +00:00
|
|
|
}
|
|
|
|
currentIndex = currentIndex + 1
|
|
|
|
}
|
|
|
|
}
|