miller/pkg/transformers/seqgen.go
2025-03-09 14:59:16 -04:00

218 lines
5.9 KiB
Go

package transformers
import (
"fmt"
"os"
"strings"
"github.com/johnkerl/miller/v6/pkg/bifs"
"github.com/johnkerl/miller/v6/pkg/cli"
"github.com/johnkerl/miller/v6/pkg/mlrval"
"github.com/johnkerl/miller/v6/pkg/types"
)
// ----------------------------------------------------------------
// verbNameSeqgen is the name of this verb; it is used in SeqgenSetup and in
// the first line of the usage text.
const verbNameSeqgen = "seqgen"
// SeqgenSetup bundles the seqgen verb's name with its usage-printing and
// CLI-parsing functions. IgnoresInput is set to true, consistent with the
// usage text, which says the verb discards the input record stream.
var SeqgenSetup = TransformerSetup{
Verb: verbNameSeqgen,
UsageFunc: transformerSeqgenUsage,
ParseCLIFunc: transformerSeqgenParseCLI,
IgnoresInput: true,
}
// transformerSeqgenUsage writes the help text for the seqgen verb to o.
//
// The caller chooses the destination: the CLI parser passes os.Stdout for
// -h/--help and os.Stderr when it encounters an unrecognized option.
func transformerSeqgenUsage(
	o *os.File,
) {
	fmt.Fprintf(o, "Usage: %s %s [options]\n", "mlr", verbNameSeqgen)
	// The summary below describes a generator that ignores its input. An
	// earlier, contradictory sentence claiming that input records are passed
	// directly to output has been removed.
	fmt.Fprintf(o, "Produces a sequence of counters. Discards the input record stream. Produces\n")
	fmt.Fprintf(o, "output as specified by the options\n")
	fmt.Fprintf(o, "\n")
	fmt.Fprintf(o, "Options:\n")
	fmt.Fprintf(o, "-f {name} (default \"i\") Field name for counters.\n")
	fmt.Fprintf(o, "--start {value} (default 1) Inclusive start value.\n")
	fmt.Fprintf(o, "--step {value} (default 1) Step value.\n")
	fmt.Fprintf(o, "--stop {value} (default 100) Inclusive stop value.\n")
	fmt.Fprintf(o, "-h|--help Show this message.\n")
	fmt.Fprintf(o, "Start, stop, and/or step may be floating-point. Output is integer if start,\n")
	fmt.Fprintf(o, "stop, and step are all integers. Step may be negative. It may not be zero\n")
	fmt.Fprintf(o, "unless start == stop.\n")
}
// transformerSeqgenParseCLI consumes the seqgen verb and its flags from args,
// starting at index *pargi, and writes the index of the first unconsumed
// argument back to *pargi.
//
// Recognized flags are -f, --start, --stop, --step (each taking one value) and
// -h/--help. Help prints usage to stdout and exits 0; any other dash-prefixed
// argument prints usage to stderr and exits 1. Flag scanning stops at the
// first argument that does not begin with "-", or at "--".
//
// When doConstruct is false only the argument index is advanced and nil is
// returned. Otherwise the transformer is built; a construction error is
// printed to stderr and the process exits 1.
func transformerSeqgenParseCLI(
	pargi *int,
	argc int,
	args []string,
	_ *cli.TOptions,
	doConstruct bool, // false for first pass of CLI-parse, true for second pass
) IRecordTransformer {
	// Step over the verb name itself.
	argi := *pargi
	verb := args[argi]
	argi++

	// Defaults, overridden by flags below.
	var (
		fieldName   = "i"
		startString = "1"
		stopString  = "100"
		stepString  = "1"
	)

	// Each pass advances argi by one (bare flag) or two (flag plus value).
	for argi < argc {
		opt := args[argi]
		// Stop at the first non-flag, or at "--" so that main-flags can
		// follow verb-flags.
		if opt == "--" || !strings.HasPrefix(opt, "-") {
			break
		}
		argi++

		switch opt {
		case "-h", "--help":
			transformerSeqgenUsage(os.Stdout)
			os.Exit(0)
		case "-f":
			fieldName = cli.VerbGetStringArgOrDie(verb, opt, args, &argi, argc)
		case "--start":
			startString = cli.VerbGetStringArgOrDie(verb, opt, args, &argi, argc)
		case "--stop":
			stopString = cli.VerbGetStringArgOrDie(verb, opt, args, &argi, argc)
		case "--step":
			stepString = cli.VerbGetStringArgOrDie(verb, opt, args, &argi, argc)
		default:
			transformerSeqgenUsage(os.Stderr)
			os.Exit(1)
		}
	}

	*pargi = argi

	// First pass of command-line parsing: position only, no construction.
	if !doConstruct {
		return nil
	}

	transformer, err := NewTransformerSeqgen(fieldName, startString, stopString, stepString)
	if err != nil {
		fmt.Fprintln(os.Stderr, err)
		os.Exit(1)
	}
	return transformer
}
// ----------------------------------------------------------------
// TransformerSeqgen holds the state for the seqgen verb: the output field
// name, the start/stop/step values, and the comparison used to decide when
// the sequence is finished.
type TransformerSeqgen struct {
// fieldName is the key under which each counter value is written.
fieldName string
// start is the initial counter value used by Transform.
start *mlrval.Mlrval
// stop is the value the counter is compared against on each iteration.
stop *mlrval.Mlrval
// step is added to the counter after each emitted record.
step *mlrval.Mlrval
// doneComparator is called as doneComparator(counter, stop); Transform
// stops generating when the result's boolean value is true.
doneComparator bifs.BinaryFunc
// mdone stores the most recent result of doneComparator.
mdone *mlrval.Mlrval
}
// ----------------------------------------------------------------
// NewTransformerSeqgen builds a seqgen transformer from string-valued
// start/stop/step settings.
//
// Each string is type-inferred via mlrval.FromInferredType and must be
// numeric; otherwise an error naming the offending value is returned. The
// sign of step selects the termination test applied to (counter, stop):
// greater-than for a positive step, less-than for a negative step. A zero
// step is accepted only when start equals stop, in which case the equality
// comparator is used; otherwise an error is returned.
//
// NOTE(review): with step zero and start == stop, Transform's first check
// compares the starting counter to stop using BIF_equals -- presumably true,
// which would end the loop before any record is emitted. Confirm this is the
// intended behavior.
func NewTransformerSeqgen(
	fieldName string,
	startString string,
	stopString string,
	stepString string,
) (*TransformerSeqgen, error) {
	start := mlrval.FromInferredType(startString)
	stop := mlrval.FromInferredType(stopString)
	step := mlrval.FromInferredType(stepString)

	// Validate in start, stop, step order so the first bad value is reported.
	fstart, ok := start.GetNumericToFloatValue()
	if !ok {
		return nil, fmt.Errorf("mlr seqgen: start value should be number; got \"%s\"", startString)
	}
	fstop, ok := stop.GetNumericToFloatValue()
	if !ok {
		return nil, fmt.Errorf("mlr seqgen: stop value should be number; got \"%s\"", stopString)
	}
	fstep, ok := step.GetNumericToFloatValue()
	if !ok {
		return nil, fmt.Errorf("mlr seqgen: step value should be number; got \"%s\"", stepString)
	}

	// Pick the "are we past stop?" test according to the step direction.
	var doneComparator bifs.BinaryFunc
	switch {
	case fstep > 0:
		doneComparator = bifs.BIF_greater_than
	case fstep < 0:
		doneComparator = bifs.BIF_less_than
	case fstart == fstop:
		doneComparator = bifs.BIF_equals
	default:
		return nil, fmt.Errorf("mlr seqgen: step must not be zero unless start == stop")
	}

	tr := &TransformerSeqgen{
		fieldName:      fieldName,
		start:          start,
		stop:           stop,
		step:           step,
		doneComparator: doneComparator,
		mdone:          mlrval.FALSE,
	}
	return tr, nil
}
// Transform generates the whole counter sequence in a single call and appends
// it, followed by an end-of-stream marker, to outputRecordsAndContexts. The
// inrecAndContext argument is not consulted.
//
// Starting from tr.start, each iteration first polls the downstream-done
// channel, then evaluates tr.doneComparator(counter, tr.stop); if neither
// signals completion, a one-field record {fieldName: counter} is emitted and
// the counter is advanced by tr.step.
func (tr *TransformerSeqgen) Transform(
	inrecAndContext *types.RecordAndContext,
	outputRecordsAndContexts *types.List[*types.RecordAndContext],
	inputDownstreamDoneChannel <-chan bool,
	outputDownstreamDoneChannel chan<- bool,
) {
	context := types.NewNilContext()
	context.UpdateForStartOfFile("seqgen")

generate:
	for counter := tr.start; ; counter = bifs.BIF_plus_binary(counter, tr.step) {
		// See ChainTransformer. If a downstream transformer is discarding
		// all further input -- e.g. head -n 10 -- and no intervening
		// transformer is interested either, stop generating. This is what
		// lets 'mlr seqgen --stop 1000000000 then head -n 10' finish
		// quickly. The poll is non-blocking; the flag is relayed onward
		// before leaving the loop.
		select {
		case b := <-inputDownstreamDoneChannel:
			outputDownstreamDoneChannel <- b
			break generate
		default:
		}

		// Check whether the counter has reached the end of the sequence.
		tr.mdone = tr.doneComparator(counter, tr.stop)
		if done, _ := tr.mdone.GetBoolValue(); done {
			break
		}

		outrec := mlrval.NewMlrmapAsRecord()
		outrec.PutCopy(tr.fieldName, counter)
		context.UpdateForInputRecord()
		outputRecordsAndContexts.PushBack(types.NewRecordAndContext(outrec, context))
	}

	outputRecordsAndContexts.PushBack(types.NewEndOfStreamMarker(context))
}