miller/pkg/transformers/having_fields.go
Adam Lesperance 085e831668
The package version must match the major tag version (#1654)
* Update package version

* Update makefile targets

* Update readme packages

* Remaining old packages via rg/sd
2024-09-20 12:10:11 -04:00

354 lines
10 KiB
Go

package transformers
import (
"container/list"
"fmt"
"os"
"regexp"
"strings"
"github.com/johnkerl/miller/v6/pkg/cli"
"github.com/johnkerl/miller/v6/pkg/lib"
"github.com/johnkerl/miller/v6/pkg/types"
)
type tHavingFieldsCriterion int
const (
havingFieldsCriterionUnspecified tHavingFieldsCriterion = iota
havingFieldsAtLeast
havingFieldsWhichAre
havingFieldsAtMost
havingAllFieldsMatching
havingAnyFieldsMatching
havingNoFieldsMatching
)
// ----------------------------------------------------------------
const verbNameHavingFields = "having-fields"
var HavingFieldsSetup = TransformerSetup{
Verb: verbNameHavingFields,
UsageFunc: transformerHavingFieldsUsage,
ParseCLIFunc: transformerHavingFieldsParseCLI,
IgnoresInput: false,
}
func transformerHavingFieldsUsage(
o *os.File,
) {
exeName := "mlr"
verb := verbNameHavingFields
fmt.Fprintf(o, "Usage: %s %s [options]\n", "mlr", verbNameHavingFields)
fmt.Fprintf(o, "Conditionally passes through records depending on each record's field names.\n")
fmt.Fprintf(o, "Options:\n")
fmt.Fprintf(o, " --at-least {comma-separated names}\n")
fmt.Fprintf(o, " --which-are {comma-separated names}\n")
fmt.Fprintf(o, " --at-most {comma-separated names}\n")
fmt.Fprintf(o, " --all-matching {regular expression}\n")
fmt.Fprintf(o, " --any-matching {regular expression}\n")
fmt.Fprintf(o, " --none-matching {regular expression}\n")
fmt.Fprintf(o, "Examples:\n")
fmt.Fprintf(o, " %s %s --which-are amount,status,owner\n", exeName, verb)
fmt.Fprintf(o, " %s %s --any-matching 'sda[0-9]'\n", exeName, verb)
fmt.Fprintf(o, " %s %s --any-matching '\"sda[0-9]\"'\n", exeName, verb)
fmt.Fprintf(o, " %s %s --any-matching '\"sda[0-9]\"i' (this is case-insensitive)\n", exeName, verb)
}
func transformerHavingFieldsParseCLI(
pargi *int,
argc int,
args []string,
_ *cli.TOptions,
doConstruct bool, // false for first pass of CLI-parse, true for second pass
) IRecordTransformer {
havingFieldsCriterion := havingFieldsCriterionUnspecified
var fieldNames []string = nil
regexString := ""
// Skip the verb name from the current spot in the mlr command line
argi := *pargi
verb := args[argi]
argi++
for argi < argc /* variable increment: 1 or 2 depending on flag */ {
opt := args[argi]
if !strings.HasPrefix(opt, "-") {
break // No more flag options to process
}
if args[argi] == "--" {
break // All transformers must do this so main-flags can follow verb-flags
}
argi++
if opt == "-h" || opt == "--help" {
transformerHavingFieldsUsage(os.Stdout)
os.Exit(0)
} else if opt == "--at-least" {
havingFieldsCriterion = havingFieldsAtLeast
fieldNames = cli.VerbGetStringArrayArgOrDie(verb, opt, args, &argi, argc)
regexString = ""
} else if opt == "--which-are" {
havingFieldsCriterion = havingFieldsWhichAre
fieldNames = cli.VerbGetStringArrayArgOrDie(verb, opt, args, &argi, argc)
regexString = ""
} else if opt == "--at-most" {
havingFieldsCriterion = havingFieldsAtMost
fieldNames = cli.VerbGetStringArrayArgOrDie(verb, opt, args, &argi, argc)
regexString = ""
} else if opt == "--all-matching" {
havingFieldsCriterion = havingAllFieldsMatching
regexString = cli.VerbGetStringArgOrDie(verb, opt, args, &argi, argc)
fieldNames = nil
} else if opt == "--any-matching" {
havingFieldsCriterion = havingAnyFieldsMatching
regexString = cli.VerbGetStringArgOrDie(verb, opt, args, &argi, argc)
fieldNames = nil
} else if opt == "--none-matching" {
havingFieldsCriterion = havingNoFieldsMatching
regexString = cli.VerbGetStringArgOrDie(verb, opt, args, &argi, argc)
fieldNames = nil
} else {
transformerHavingFieldsUsage(os.Stderr)
os.Exit(1)
}
}
if havingFieldsCriterion == havingFieldsCriterionUnspecified {
transformerHavingFieldsUsage(os.Stderr)
os.Exit(1)
}
if fieldNames == nil && regexString == "" {
transformerHavingFieldsUsage(os.Stderr)
os.Exit(1)
}
*pargi = argi
if !doConstruct { // All transformers must do this for main command-line parsing
return nil
}
transformer, err := NewTransformerHavingFields(
havingFieldsCriterion,
fieldNames,
regexString,
)
if err != nil {
fmt.Fprintln(os.Stderr, err)
os.Exit(1)
}
return transformer
}
// ----------------------------------------------------------------
type TransformerHavingFields struct {
fieldNames []string
numFieldNames int64
fieldNameSet map[string]bool
regex *regexp.Regexp
recordTransformerFunc RecordTransformerFunc
}
// ----------------------------------------------------------------
func NewTransformerHavingFields(
havingFieldsCriterion tHavingFieldsCriterion,
fieldNames []string,
regexString string,
) (*TransformerHavingFields, error) {
tr := &TransformerHavingFields{}
if fieldNames != nil {
tr.fieldNames = fieldNames
tr.numFieldNames = int64(len(fieldNames))
tr.fieldNameSet = lib.StringListToSet(fieldNames)
if havingFieldsCriterion == havingFieldsAtLeast {
tr.recordTransformerFunc = tr.transformHavingFieldsAtLeast
} else if havingFieldsCriterion == havingFieldsWhichAre {
tr.recordTransformerFunc = tr.transformHavingFieldsWhichAre
} else if havingFieldsCriterion == havingFieldsAtMost {
tr.recordTransformerFunc = tr.transformHavingFieldsAtMost
} else {
lib.InternalCodingErrorIf(true)
}
} else {
// Let them type in a.*b if they want, or "a.*b", or "a.*b"i.
// Strip off the leading " and trailing " or "i.
regex, err := lib.CompileMillerRegex(regexString)
if err != nil {
fmt.Fprintf(
os.Stderr,
"%s %s: cannot compile regex \"%s\"\n",
"mlr",
verbNameHavingFields,
regexString,
)
os.Exit(1)
// return nil, err
}
tr.regex = regex
if havingFieldsCriterion == havingAllFieldsMatching {
tr.recordTransformerFunc = tr.transformHavingAllFieldsMatching
} else if havingFieldsCriterion == havingAnyFieldsMatching {
tr.recordTransformerFunc = tr.transformHavingAnyFieldsMatching
} else if havingFieldsCriterion == havingNoFieldsMatching {
tr.recordTransformerFunc = tr.transformHavingNoFieldsMatching
} else {
lib.InternalCodingErrorIf(true)
}
}
return tr, nil
}
// ----------------------------------------------------------------
func (tr *TransformerHavingFields) Transform(
inrecAndContext *types.RecordAndContext,
outputRecordsAndContexts *list.List, // list of *types.RecordAndContext
inputDownstreamDoneChannel <-chan bool,
outputDownstreamDoneChannel chan<- bool,
) {
HandleDefaultDownstreamDone(inputDownstreamDoneChannel, outputDownstreamDoneChannel)
tr.recordTransformerFunc(inrecAndContext, outputRecordsAndContexts, inputDownstreamDoneChannel, outputDownstreamDoneChannel)
}
// ----------------------------------------------------------------
func (tr *TransformerHavingFields) transformHavingFieldsAtLeast(
inrecAndContext *types.RecordAndContext,
outputRecordsAndContexts *list.List, // list of *types.RecordAndContext
inputDownstreamDoneChannel <-chan bool,
outputDownstreamDoneChannel chan<- bool,
) {
if !inrecAndContext.EndOfStream {
inrec := inrecAndContext.Record
numFound := int64(0)
for pe := inrec.Head; pe != nil; pe = pe.Next {
if tr.fieldNameSet[pe.Key] {
numFound++
if numFound == tr.numFieldNames {
outputRecordsAndContexts.PushBack(inrecAndContext)
return
}
}
}
} else {
outputRecordsAndContexts.PushBack(inrecAndContext)
}
}
func (tr *TransformerHavingFields) transformHavingFieldsWhichAre(
inrecAndContext *types.RecordAndContext,
outputRecordsAndContexts *list.List, // list of *types.RecordAndContext
inputDownstreamDoneChannel <-chan bool,
outputDownstreamDoneChannel chan<- bool,
) {
if !inrecAndContext.EndOfStream {
inrec := inrecAndContext.Record
if inrec.FieldCount != tr.numFieldNames {
return
}
for pe := inrec.Head; pe != nil; pe = pe.Next {
if !tr.fieldNameSet[pe.Key] {
return
}
}
outputRecordsAndContexts.PushBack(inrecAndContext)
} else {
outputRecordsAndContexts.PushBack(inrecAndContext)
}
}
func (tr *TransformerHavingFields) transformHavingFieldsAtMost(
inrecAndContext *types.RecordAndContext,
outputRecordsAndContexts *list.List, // list of *types.RecordAndContext
inputDownstreamDoneChannel <-chan bool,
outputDownstreamDoneChannel chan<- bool,
) {
if !inrecAndContext.EndOfStream {
inrec := inrecAndContext.Record
for pe := inrec.Head; pe != nil; pe = pe.Next {
if !tr.fieldNameSet[pe.Key] {
return
}
}
outputRecordsAndContexts.PushBack(inrecAndContext)
} else {
outputRecordsAndContexts.PushBack(inrecAndContext)
}
}
// ----------------------------------------------------------------
func (tr *TransformerHavingFields) transformHavingAllFieldsMatching(
inrecAndContext *types.RecordAndContext,
outputRecordsAndContexts *list.List, // list of *types.RecordAndContext
inputDownstreamDoneChannel <-chan bool,
outputDownstreamDoneChannel chan<- bool,
) {
if !inrecAndContext.EndOfStream {
inrec := inrecAndContext.Record
for pe := inrec.Head; pe != nil; pe = pe.Next {
if !tr.regex.MatchString(pe.Key) {
return
}
}
outputRecordsAndContexts.PushBack(inrecAndContext)
} else {
outputRecordsAndContexts.PushBack(inrecAndContext)
}
}
func (tr *TransformerHavingFields) transformHavingAnyFieldsMatching(
inrecAndContext *types.RecordAndContext,
outputRecordsAndContexts *list.List, // list of *types.RecordAndContext
inputDownstreamDoneChannel <-chan bool,
outputDownstreamDoneChannel chan<- bool,
) {
if !inrecAndContext.EndOfStream {
inrec := inrecAndContext.Record
for pe := inrec.Head; pe != nil; pe = pe.Next {
if tr.regex.MatchString(pe.Key) {
outputRecordsAndContexts.PushBack(inrecAndContext)
return
}
}
} else {
outputRecordsAndContexts.PushBack(inrecAndContext)
}
}
func (tr *TransformerHavingFields) transformHavingNoFieldsMatching(
inrecAndContext *types.RecordAndContext,
outputRecordsAndContexts *list.List, // list of *types.RecordAndContext
inputDownstreamDoneChannel <-chan bool,
outputDownstreamDoneChannel chan<- bool,
) {
if !inrecAndContext.EndOfStream {
inrec := inrecAndContext.Record
for pe := inrec.Head; pe != nil; pe = pe.Next {
if tr.regex.MatchString(pe.Key) {
return
}
}
outputRecordsAndContexts.PushBack(inrecAndContext)
} else {
outputRecordsAndContexts.PushBack(inrecAndContext)
}
}