miller/pkg/dsl/cst/builtin_function_manager.go
John Kerl 268a96d002
Export library code in pkg/ (#1391)
* Export library code in `pkg/`

* new doc page
2023-09-10 17:15:13 -04:00

2748 lines
90 KiB
Go

// ================================================================
// Adding a new builtin function:
// * New entry in makeBuiltinFunctionLookupTable
// * Implement the function in mlrval_functions.go
//
// Note: Miller-DSL functions, e.g. sec2gmt, are implemented by Go functions
// with names like BIF_sec2gmt not Sec2GMT. This is an intentional departure
// from Go naming conventions: it makes it easier to mentally pair up
// Miller-DSL functions with their Go implementations. Please preserve this
// naming convention.
// ================================================================
package cst
import (
"fmt"
"os"
"regexp"
"sort"
"strings"
"github.com/johnkerl/miller/pkg/bifs"
"github.com/johnkerl/miller/pkg/colorizer"
"github.com/johnkerl/miller/pkg/lib"
)
type TFunctionClass string
const (
FUNC_CLASS_ARITHMETIC TFunctionClass = "arithmetic"
FUNC_CLASS_MATH TFunctionClass = "math"
FUNC_CLASS_STATS TFunctionClass = "stats"
FUNC_CLASS_BOOLEAN TFunctionClass = "boolean"
FUNC_CLASS_STRING TFunctionClass = "string"
FUNC_CLASS_HASHING TFunctionClass = "hashing"
FUNC_CLASS_CONVERSION TFunctionClass = "conversion"
FUNC_CLASS_TYPING TFunctionClass = "typing"
FUNC_CLASS_COLLECTIONS TFunctionClass = "collections"
FUNC_CLASS_HOFS TFunctionClass = "higher-order-functions"
FUNC_CLASS_SYSTEM TFunctionClass = "system"
FUNC_CLASS_TIME TFunctionClass = "time"
)
// ================================================================
type BuiltinFunctionInfo struct {
name string
class TFunctionClass
// For source-code storage, these have newlines in them. For any presentation to the user, they must be
// formatted using the JoinHelp() method which joins newlines. This is crucial for rendering of
// help-strings for manual page, webdocs, etc wherein we must let the user's resizing of the terminal
// window or browser determine -- at their choosing -- where lines wrap.
help string
examples []string
hasMultipleArities bool
minimumVariadicArity int
maximumVariadicArity int // 0 means no max
zaryFunc bifs.ZaryFunc
unaryFunc bifs.UnaryFunc
binaryFunc bifs.BinaryFunc
ternaryFunc bifs.TernaryFunc
variadicFunc bifs.VariadicFunc
unaryFuncWithContext bifs.UnaryFuncWithContext // asserting_{typename}
regexCaptureBinaryFunc bifs.RegexCaptureBinaryFunc // =~ and !=~
binaryFuncWithState BinaryFuncWithState // select, apply, reduce
ternaryFuncWithState TernaryFuncWithState // fold
variadicFuncWithState VariadicFuncWithState // sort
}
// ================================================================
func isLetter(c byte) bool {
return ('a' <= c && c <= 'z') || ('A' <= c && c <= 'Z')
}
func startsWithLetter(s string) bool {
if len(s) < 1 {
return false
} else {
return isLetter(s[0])
}
}
func makeBuiltinFunctionLookupTable() []BuiltinFunctionInfo {
lookupTable := []BuiltinFunctionInfo{
// ----------------------------------------------------------------
// FUNC_CLASS_ARITHMETIC
{
name: "+",
class: FUNC_CLASS_ARITHMETIC,
help: `Addition as binary operator; unary plus operator.`,
unaryFunc: bifs.BIF_plus_unary,
binaryFunc: bifs.BIF_plus_binary,
hasMultipleArities: true,
},
{
name: "-",
class: FUNC_CLASS_ARITHMETIC,
help: `Subtraction as binary operator; unary negation operator.`,
unaryFunc: bifs.BIF_minus_unary,
binaryFunc: bifs.BIF_minus_binary,
hasMultipleArities: true,
},
{
name: "*",
class: FUNC_CLASS_ARITHMETIC,
help: `Multiplication, with integer*integer overflow to float.`,
binaryFunc: bifs.BIF_times,
},
{
name: "/",
class: FUNC_CLASS_ARITHMETIC,
help: `Division. Integer / integer is integer when exact, else floating-point: e.g. 6/3 is 2 but 6/4 is 1.5.`,
binaryFunc: bifs.BIF_divide,
},
{
name: "//",
class: FUNC_CLASS_ARITHMETIC,
help: `Pythonic integer division, rounding toward negative.`,
binaryFunc: bifs.BIF_int_divide,
},
{
name: "**",
class: FUNC_CLASS_ARITHMETIC,
help: `Exponentiation. Same as pow, but as an infix operator.`,
binaryFunc: bifs.BIF_pow,
},
{
name: "pow",
class: FUNC_CLASS_ARITHMETIC,
help: `Exponentiation. Same as **, but as a function.`,
binaryFunc: bifs.BIF_pow,
},
{
name: ".+",
class: FUNC_CLASS_ARITHMETIC,
help: `Addition, with integer-to-integer overflow.`,
binaryFunc: bifs.BIF_dot_plus,
},
{
name: ".-",
class: FUNC_CLASS_ARITHMETIC,
help: `Subtraction, with integer-to-integer overflow.`,
binaryFunc: bifs.BIF_dot_minus,
},
{
name: ".*",
class: FUNC_CLASS_ARITHMETIC,
help: `Multiplication, with integer-to-integer overflow.`,
binaryFunc: bifs.BIF_dot_times,
},
{
name: "./",
class: FUNC_CLASS_ARITHMETIC,
help: `Integer division, rounding toward zero.`,
binaryFunc: bifs.BIF_dot_divide,
},
{
name: "%",
class: FUNC_CLASS_ARITHMETIC,
help: `Remainder; never negative-valued (pythonic).`,
binaryFunc: bifs.BIF_modulus,
},
{
name: "~",
class: FUNC_CLASS_ARITHMETIC,
help: `Bitwise NOT. Beware '$y=~$x' since =~ is the regex-match operator: try '$y = ~$x'.`,
unaryFunc: bifs.BIF_bitwise_not,
},
{
name: "&",
class: FUNC_CLASS_ARITHMETIC,
help: `Bitwise AND.`,
binaryFunc: bifs.BIF_bitwise_and,
},
{
name: "|",
class: FUNC_CLASS_ARITHMETIC,
help: `Bitwise OR.`,
binaryFunc: bifs.BIF_bitwise_or,
},
{
name: "^",
help: `Bitwise XOR.`,
class: FUNC_CLASS_ARITHMETIC,
binaryFunc: bifs.BIF_bitwise_xor,
},
{
name: "<<",
class: FUNC_CLASS_ARITHMETIC,
help: `Bitwise left-shift.`,
binaryFunc: bifs.BIF_left_shift,
},
{
name: ">>",
class: FUNC_CLASS_ARITHMETIC,
help: `Bitwise signed right-shift.`,
binaryFunc: bifs.BIF_signed_right_shift,
},
{
name: ">>>",
class: FUNC_CLASS_ARITHMETIC,
help: `Bitwise unsigned right-shift.`,
binaryFunc: bifs.BIF_unsigned_right_shift,
},
{
name: "bitcount",
class: FUNC_CLASS_ARITHMETIC,
help: "Count of 1-bits.",
unaryFunc: bifs.BIF_bitcount,
},
{
name: "madd",
class: FUNC_CLASS_ARITHMETIC,
help: `a + b mod m (integers)`,
ternaryFunc: bifs.BIF_mod_add,
},
{
name: "msub",
class: FUNC_CLASS_ARITHMETIC,
help: `a - b mod m (integers)`,
ternaryFunc: bifs.BIF_mod_sub,
},
{
name: "mmul",
class: FUNC_CLASS_ARITHMETIC,
help: `a * b mod m (integers)`,
ternaryFunc: bifs.BIF_mod_mul,
},
{
name: "mexp",
class: FUNC_CLASS_ARITHMETIC,
help: `a ** b mod m (integers)`,
ternaryFunc: bifs.BIF_mod_exp,
},
// ----------------------------------------------------------------
// FUNC_CLASS_BOOLEAN
{
name: "!",
class: FUNC_CLASS_BOOLEAN,
help: `Logical negation.`,
unaryFunc: bifs.BIF_logical_NOT,
},
{
name: "==",
class: FUNC_CLASS_BOOLEAN,
help: `String/numeric equality. Mixing number and string results in string compare.`,
binaryFunc: bifs.BIF_equals,
},
{
name: "!=",
class: FUNC_CLASS_BOOLEAN,
help: `String/numeric inequality. Mixing number and string results in string compare.`,
binaryFunc: bifs.BIF_not_equals,
},
{
name: ">",
help: `String/numeric greater-than. Mixing number and string results in string compare.`,
class: FUNC_CLASS_BOOLEAN,
binaryFunc: bifs.BIF_greater_than,
},
{
name: ">=",
help: `String/numeric greater-than-or-equals. Mixing number and string results in string compare.`,
class: FUNC_CLASS_BOOLEAN,
binaryFunc: bifs.BIF_greater_than_or_equals,
},
{
name: "<=>",
help: `Comparator, nominally for sorting. Given a <=> b, returns <0, 0, >0 as a < b, a == b, or a > b, respectively.`,
class: FUNC_CLASS_BOOLEAN,
binaryFunc: bifs.BIF_cmp,
},
{
name: "<",
class: FUNC_CLASS_BOOLEAN,
help: `String/numeric less-than. Mixing number and string results in string compare.`,
binaryFunc: bifs.BIF_less_than,
},
{
name: "<=",
class: FUNC_CLASS_BOOLEAN,
help: `String/numeric less-than-or-equals. Mixing number and string results in string compare.`,
binaryFunc: bifs.BIF_less_than_or_equals,
},
{
name: "=~",
class: FUNC_CLASS_BOOLEAN,
help: `String (left-hand side) matches regex (right-hand side), e.g.
'$name =~ "^a.*b$"'.
Capture groups \1 through \9 are matched from (...) in the right-hand side, and can be
used within subsequent DSL statements. See also "Regular expressions" at ` + lib.DOC_URL + `.`,
examples: []string{
`With if-statement: if ($url =~ "http.*com") { ... }`,
`Without if-statement: given $line = "index ab09 file", and $line =~ "([a-z][a-z])([0-9][0-9])", then $label = "[\1:\2]", $label is "[ab:09]"`,
},
regexCaptureBinaryFunc: bifs.BIF_string_matches_regexp,
},
{
name: "!=~",
class: FUNC_CLASS_BOOLEAN,
help: `String (left-hand side) does not match regex (right-hand side), e.g. '$name !=~ "^a.*b$"'.`,
regexCaptureBinaryFunc: bifs.BIF_string_does_not_match_regexp,
},
{
name: "&&",
class: FUNC_CLASS_BOOLEAN,
help: `Logical AND.`,
binaryFunc: BinaryShortCircuitPlaceholder,
},
{
name: "||",
class: FUNC_CLASS_BOOLEAN,
help: `Logical OR.`,
binaryFunc: BinaryShortCircuitPlaceholder,
},
{
name: "^^",
class: FUNC_CLASS_BOOLEAN,
help: `Logical XOR.`,
binaryFunc: bifs.BIF_logical_XOR,
},
{
name: "??",
class: FUNC_CLASS_BOOLEAN,
help: `Absent-coalesce operator. $a ?? 1 evaluates to 1 if $a isn't defined in the current record.`,
binaryFunc: BinaryShortCircuitPlaceholder,
},
{
name: "???",
class: FUNC_CLASS_BOOLEAN,
help: `Absent/empty-coalesce operator. $a ??? 1 evaluates to 1 if $a isn't defined in the current record, or has empty value.`,
binaryFunc: BinaryShortCircuitPlaceholder,
},
{
name: "?:",
class: FUNC_CLASS_BOOLEAN,
help: `Standard ternary operator.`,
ternaryFunc: TernaryShortCircuitPlaceholder,
},
// ----------------------------------------------------------------
// FUNC_CLASS_STRING
{
name: ".",
class: FUNC_CLASS_STRING,
help: `String concatenation. Non-strings are coerced, so you can do '"ax".98' etc.`,
binaryFunc: bifs.BIF_dot,
},
{
name: "capitalize",
class: FUNC_CLASS_STRING,
help: "Convert string's first character to uppercase.",
unaryFunc: bifs.BIF_capitalize,
},
{
name: "clean_whitespace",
class: FUNC_CLASS_STRING,
help: "Same as collapse_whitespace and strip.",
unaryFunc: bifs.BIF_clean_whitespace,
},
{
name: "collapse_whitespace",
class: FUNC_CLASS_STRING,
help: "Strip repeated whitespace from string.",
unaryFunc: bifs.BIF_collapse_whitespace,
},
{
name: "lstrip",
class: FUNC_CLASS_STRING,
help: "Strip leading whitespace from string.",
unaryFunc: bifs.BIF_lstrip,
},
{
name: "regextract",
class: FUNC_CLASS_STRING,
help: `Extracts a substring (the first, if there are multiple matches), matching a
regular expression, from the input. Does not use capture groups; see also the =~ operator which does.`,
binaryFunc: bifs.BIF_regextract,
examples: []string{
`regextract("index ab09 file", "[a-z][a-z][0-9][0-9]") gives "ab09"`,
`regextract("index a999 file", "[a-z][a-z][0-9][0-9]") gives (absent), which will result in an assignment not happening.`,
},
},
{
name: "regextract_or_else",
class: FUNC_CLASS_STRING,
help: `Like regextract but the third argument is the return value in case the input string (first
argument) doesn't match the pattern (second argument).`,
ternaryFunc: bifs.BIF_regextract_or_else,
examples: []string{
`regextract_or_else("index ab09 file", "[a-z][a-z][0-9][0-9]", "nonesuch") gives "ab09"`,
`regextract_or_else("index a999 file", "[a-z][a-z][0-9][0-9]", "nonesuch") gives "nonesuch"`,
},
},
{
name: "rstrip",
class: FUNC_CLASS_STRING,
help: "Strip trailing whitespace from string.",
unaryFunc: bifs.BIF_rstrip,
},
{
name: "strip",
class: FUNC_CLASS_STRING,
help: "Strip leading and trailing whitespace from string.",
unaryFunc: bifs.BIF_strip,
},
{
name: "strlen",
class: FUNC_CLASS_STRING,
help: "String length.",
unaryFunc: bifs.BIF_strlen,
},
{
name: "ssub",
class: FUNC_CLASS_STRING,
help: `Like sub but does no regexing. No characters are special.`,
ternaryFunc: bifs.BIF_ssub,
examples: []string{
`ssub("abc.def", ".", "X") gives "abcXdef"`,
},
},
{
name: "gssub",
class: FUNC_CLASS_STRING,
help: `Like gsub but does no regexing. No characters are special.`,
ternaryFunc: bifs.BIF_gssub,
examples: []string{
`gssub("ab.d.fg", ".", "X") gives "abXdXfg"`,
},
},
{
name: "sub",
class: FUNC_CLASS_STRING,
help: `'$name = sub($name, "old", "new")': replace once (first match, if there are multiple matches),
with support for regular expressions. Capture groups \1 through \9 in the new part are matched from (...) in
the old part, and must be used within the same call to sub -- they don't persist for subsequent DSL
statements. See also =~ and regextract. See also "Regular expressions" at ` + lib.DOC_URL + `.`,
ternaryFunc: bifs.BIF_sub,
examples: []string{
`sub("ababab", "ab", "XY") gives "XYabab"`,
`sub("abc.def", ".", "X") gives "Xbc.def"`,
`sub("abc.def", "\.", "X") gives "abcXdef"`,
`sub("abcdefg", "[ce]", "X") gives "abXdefg"`,
`sub("prefix4529:suffix8567", "suffix([0-9]+)", "name\1") gives "prefix4529:name8567"`,
},
},
{
name: "gsub",
class: FUNC_CLASS_STRING,
help: `'$name = gsub($name, "old", "new")': replace all, with support for regular expressions.
Capture groups \1 through \9 in the new part are matched from (...) in the old part, and must be
used within the same call to gsub -- they don't persist for subsequent DSL statements. See also
=~ and regextract. See also "Regular expressions" at ` + lib.DOC_URL + `.`,
ternaryFunc: bifs.BIF_gsub,
examples: []string{
`gsub("ababab", "ab", "XY") gives "XYXYXY"`,
`gsub("abc.def", ".", "X") gives "XXXXXXX"`,
`gsub("abc.def", "\.", "X") gives "abcXdef"`,
`gsub("abcdefg", "[ce]", "X") gives "abXdXfg"`,
`gsub("prefix4529:suffix8567", "(....ix)([0-9]+)", "[\1 : \2]") gives "[prefix : 4529]:[suffix : 8567]"`,
},
},
{
name: "substr0",
class: FUNC_CLASS_STRING,
help: `substr0(s,m,n) gives substring of s from 0-up position m to n inclusive.
Negative indices -len .. -1 alias to 0 .. len-1. See also substr and substr1.`,
ternaryFunc: bifs.BIF_substr_0_up,
},
{
name: "substr1",
class: FUNC_CLASS_STRING,
help: `substr1(s,m,n) gives substring of s from 1-up position m to n inclusive.
Negative indices -len .. -1 alias to 1 .. len. See also substr and substr0.`,
ternaryFunc: bifs.BIF_substr_1_up,
},
{
name: "substr",
class: FUNC_CLASS_STRING,
help: `substr is an alias for substr0. See also substr1. Miller is generally 1-up with all
array and string indices, but, this is a backward-compatibility issue with Miller 5 and below.
Arrays are new in Miller 6; the substr function is older.`,
ternaryFunc: bifs.BIF_substr_0_up,
},
{
name: "index",
class: FUNC_CLASS_STRING,
help: `Returns the index (1-based) of the second argument within the first. Returns -1 if the second argument isn't a substring of the first. Stringifies non-string inputs. Uses UTF-8 encoding to count characters, not bytes.`,
binaryFunc: bifs.BIF_index,
examples: []string{
`index("abcde", "e") gives 5`,
`index("abcde", "x") gives -1`,
`index(12345, 34) gives 3`,
`index("forêt", "t") gives 5`,
},
},
{
name: "contains",
class: FUNC_CLASS_STRING,
help: `Returns true if the first argument contains the second as a substring. This is like saying ` + "`index(arg1, arg2) >= 0`" + `but with less keystroking.`,
binaryFunc: bifs.BIF_contains,
examples: []string{
`contains("abcde", "e") gives true`,
`contains("abcde", "x") gives false`,
`contains(12345, 34) gives true`,
`contains("forêt", "ê") gives true`,
},
},
{
name: "tolower",
class: FUNC_CLASS_STRING,
help: "Convert string to lowercase.",
unaryFunc: bifs.BIF_tolower,
},
{
name: "toupper",
class: FUNC_CLASS_STRING,
help: "Convert string to uppercase.",
unaryFunc: bifs.BIF_toupper,
},
{
name: "truncate",
class: FUNC_CLASS_STRING,
help: `Truncates string first argument to max length of int second argument.`,
binaryFunc: bifs.BIF_truncate,
},
{
name: "leftpad",
class: FUNC_CLASS_STRING,
help: `Left-pads first argument to at most the specified length (second, integer argument) using specified pad value (third, string argument). If the first argument is not a string, it will be stringified first.`,
ternaryFunc: bifs.BIF_leftpad,
examples: []string{
`leftpad("abcdefg", 10 , "*") gives "***abcdefg".`,
`leftpad("abcdefg", 10 , "XY") gives "XYabcdefg".`,
`leftpad("1234567", 10 , "0") gives "0001234567".`,
},
},
{
name: "rightpad",
class: FUNC_CLASS_STRING,
help: `Right-pads first argument to at most the specified length (second, integer argument) using specified pad value (third, string argument). If the first argument is not a string, it will be stringified first.`,
ternaryFunc: bifs.BIF_rightpad,
examples: []string{
`rightpad("abcdefg", 10 , "*") gives "abcdefg***".`,
`rightpad("abcdefg", 10 , "XY") gives "abcdefgXY".`,
`rightpad("1234567", 10 , "0") gives "1234567000".`,
},
},
{
name: "format",
class: FUNC_CLASS_STRING,
help: `Using first argument as format string, interpolate remaining arguments in place of
each "{}" in the format string. Too-few arguments are treated as the empty string; too-many arguments are discarded.`,
examples: []string{
`format("{}:{}:{}", 1,2) gives "1:2:".`,
`format("{}:{}:{}", 1,2,3) gives "1:2:3".`,
`format("{}:{}:{}", 1,2,3,4) gives "1:2:3".`,
},
variadicFunc: bifs.BIF_format,
},
{
name: "unformat",
class: FUNC_CLASS_STRING,
help: `Using first argument as format string, unpacks second argument into an array of matches,
with type-inference. On non-match, returns error -- use is_error() to check.`,
examples: []string{
`unformat("{}:{}:{}", "1:2:3") gives [1, 2, 3].`,
`unformat("{}h{}m{}s", "3h47m22s") gives [3, 47, 22].`,
`is_error(unformat("{}h{}m{}s", "3:47:22")) gives true.`,
},
binaryFunc: bifs.BIF_unformat,
},
{
name: "unformatx",
class: FUNC_CLASS_STRING,
help: `Same as unformat, but without type-inference.`,
examples: []string{
`unformatx("{}:{}:{}", "1:2:3") gives ["1", "2", "3"].`,
`unformatx("{}h{}m{}s", "3h47m22s") gives ["3", "47", "22"].`,
`is_error(unformatx("{}h{}m{}s", "3:47:22")) gives true.`,
},
binaryFunc: bifs.BIF_unformatx,
},
{
name: "latin1_to_utf8",
class: FUNC_CLASS_STRING,
help: `Tries to convert Latin-1-encoded string to UTF-8-encoded string.
If argument is array or map, recurses into it.`,
examples: []string{
`$y = latin1_to_utf8($x)`,
`$* = latin1_to_utf8($*)`,
},
unaryFunc: bifs.BIF_latin1_to_utf8,
},
{
name: "utf8_to_latin1",
class: FUNC_CLASS_STRING,
help: `Tries to convert UTF-8-encoded string to Latin-1-encoded string.
If argument is array or map, recurses into it.`,
examples: []string{
`$y = utf8_to_latin1($x)`,
`$* = utf8_to_latin1($*)`,
},
unaryFunc: bifs.BIF_utf8_to_latin1,
},
// ----------------------------------------------------------------
// FUNC_CLASS_HASHING
{
name: "md5",
class: FUNC_CLASS_HASHING,
help: `MD5 hash.`,
unaryFunc: bifs.BIF_md5,
},
{
name: "sha1",
class: FUNC_CLASS_HASHING,
help: `SHA1 hash.`,
unaryFunc: bifs.BIF_sha1,
},
{
name: "sha256",
class: FUNC_CLASS_HASHING,
help: `SHA256 hash.`,
unaryFunc: bifs.BIF_sha256,
},
{
name: "sha512",
class: FUNC_CLASS_HASHING,
help: `SHA512 hash.`,
unaryFunc: bifs.BIF_sha512,
},
// ----------------------------------------------------------------
// FUNC_CLASS_MATH
{
name: "abs",
class: FUNC_CLASS_MATH,
help: "Absolute value.",
unaryFunc: bifs.BIF_abs,
},
{
name: "acos",
class: FUNC_CLASS_MATH,
help: "Inverse trigonometric cosine.",
unaryFunc: bifs.BIF_acos,
},
{
name: "acosh",
class: FUNC_CLASS_MATH,
help: "Inverse hyperbolic cosine.",
unaryFunc: bifs.BIF_acosh,
},
{
name: "asin",
class: FUNC_CLASS_MATH,
help: "Inverse trigonometric sine.",
unaryFunc: bifs.BIF_asin,
},
{
name: "asinh",
class: FUNC_CLASS_MATH,
help: "Inverse hyperbolic sine.",
unaryFunc: bifs.BIF_asinh,
},
{
name: "atan",
class: FUNC_CLASS_MATH,
help: "One-argument arctangent.",
unaryFunc: bifs.BIF_atan,
},
{
name: "atan2",
class: FUNC_CLASS_MATH,
help: "Two-argument arctangent.",
binaryFunc: bifs.BIF_atan2,
},
{
name: "atanh",
class: FUNC_CLASS_MATH,
help: "Inverse hyperbolic tangent.",
unaryFunc: bifs.BIF_atanh,
},
{
name: "cbrt",
class: FUNC_CLASS_MATH,
help: "Cube root.",
unaryFunc: bifs.BIF_cbrt,
},
{
name: "ceil",
class: FUNC_CLASS_MATH,
help: "Ceiling: nearest integer at or above.",
unaryFunc: bifs.BIF_ceil,
},
{
name: "cos",
class: FUNC_CLASS_MATH,
help: "Trigonometric cosine.",
unaryFunc: bifs.BIF_cos,
},
{
name: "cosh",
class: FUNC_CLASS_MATH,
help: "Hyperbolic cosine.",
unaryFunc: bifs.BIF_cosh,
},
{
name: "erf",
class: FUNC_CLASS_MATH,
help: "Error function.",
unaryFunc: bifs.BIF_erf,
},
{
name: "erfc",
class: FUNC_CLASS_MATH,
help: "Complementary error function.",
unaryFunc: bifs.BIF_erfc,
},
{
name: "exp",
class: FUNC_CLASS_MATH,
help: "Exponential function e**x.",
unaryFunc: bifs.BIF_exp,
},
{
name: "expm1",
class: FUNC_CLASS_MATH,
help: "e**x - 1.",
unaryFunc: bifs.BIF_expm1,
},
{
name: "floor",
class: FUNC_CLASS_MATH,
help: "Floor: nearest integer at or below.",
unaryFunc: bifs.BIF_floor,
},
{
name: "invqnorm",
class: FUNC_CLASS_MATH,
help: `Inverse of normal cumulative distribution function. Note that invqorm(urand())
is normally distributed.`,
unaryFunc: bifs.BIF_invqnorm,
},
{
name: "log",
class: FUNC_CLASS_MATH,
help: "Natural (base-e) logarithm.",
unaryFunc: bifs.BIF_log,
},
{
name: "log10",
class: FUNC_CLASS_MATH,
help: "Base-10 logarithm.",
unaryFunc: bifs.BIF_log10,
},
{
name: "log1p",
class: FUNC_CLASS_MATH,
help: "log(1-x).",
unaryFunc: bifs.BIF_log1p,
},
{
name: "logifit",
class: FUNC_CLASS_MATH,
help: `Given m and b from logistic regression, compute fit: $yhat=logifit($x,$m,$b).`,
ternaryFunc: bifs.BIF_logifit,
},
{
name: "max",
class: FUNC_CLASS_MATH,
help: `Max of n numbers; null loses. The min and max functions also recurse into arrays and maps, so they can be used to get min/max stats on array/map values.`,
variadicFunc: bifs.BIF_max_variadic,
},
{
name: "min",
class: FUNC_CLASS_MATH,
help: `Min of n numbers; null loses. The min and max functions also recurse into arrays and maps, so they can be used to get min/max stats on array/map values.`,
variadicFunc: bifs.BIF_min_variadic,
},
{
name: "qnorm",
class: FUNC_CLASS_MATH,
help: `Normal cumulative distribution function.`,
unaryFunc: bifs.BIF_qnorm,
},
{
name: "round",
class: FUNC_CLASS_MATH,
help: "Round to nearest integer.",
unaryFunc: bifs.BIF_round,
},
{
name: "sgn",
class: FUNC_CLASS_MATH,
help: `+1, 0, -1 for positive, zero, negative input respectively.`,
unaryFunc: bifs.BIF_sgn,
},
{
name: "sin",
class: FUNC_CLASS_MATH,
help: "Trigonometric sine.",
unaryFunc: bifs.BIF_sin,
},
{
name: "sinh",
class: FUNC_CLASS_MATH,
help: "Hyperbolic sine.",
unaryFunc: bifs.BIF_sinh,
},
{
name: "sqrt",
class: FUNC_CLASS_MATH,
help: "Square root.",
unaryFunc: bifs.BIF_sqrt,
},
{
name: "tan",
class: FUNC_CLASS_MATH,
help: "Trigonometric tangent.",
unaryFunc: bifs.BIF_tan,
},
{
name: "tanh",
class: FUNC_CLASS_MATH,
help: "Hyperbolic tangent.",
unaryFunc: bifs.BIF_tanh,
},
{
name: "roundm",
class: FUNC_CLASS_MATH,
help: `Round to nearest multiple of m: roundm($x,$m) is the same as round($x/$m)*$m.`,
binaryFunc: bifs.BIF_roundm,
},
{
name: "urand",
class: FUNC_CLASS_MATH,
help: `Floating-point numbers uniformly distributed on the unit interval.`,
examples: []string{
"Int-valued example: '$n=floor(20+urand()*11)'.",
},
zaryFunc: bifs.BIF_urand,
},
{
name: "urandint",
class: FUNC_CLASS_MATH,
help: `Integer uniformly distributed between inclusive integer endpoints.`,
binaryFunc: bifs.BIF_urandint,
},
{
name: "urandrange",
class: FUNC_CLASS_MATH,
help: `Floating-point numbers uniformly distributed on the interval [a, b).`,
binaryFunc: bifs.BIF_urandrange,
},
{
name: "urand32",
class: FUNC_CLASS_MATH,
help: `Integer uniformly distributed 0 and 2**32-1 inclusive.`,
zaryFunc: bifs.BIF_urand32,
},
{
name: "urandelement",
class: FUNC_CLASS_MATH,
help: `Random sample from the first argument, which must be an non-empty array.`,
unaryFunc: bifs.BIF_urandelement,
},
// ----------------------------------------------------------------
// FUNC_CLASS_STATS
{
name: "count",
class: FUNC_CLASS_STATS,
help: `Returns the length of an array or map. Returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_count,
examples: []string{
"count([7,8,9]) is 3",
`count({"a":7,"b":8,"c":9}) is 3`,
},
},
{
name: "distinct_count",
class: FUNC_CLASS_STATS,
help: `Returns the number of disinct values in an array or map. Returns error for non-array/non-map types. Values are stringified for comparison, so for example string "1" and integer 1 are not distinct.`,
unaryFunc: bifs.BIF_distinct_count,
examples: []string{
`distinct_count([7,8,9,7]) is 3`,
`distinct_count([1,"1"]) is 1`,
`distinct_count([1,1.0]) is 2`,
},
},
{
name: "null_count",
class: FUNC_CLASS_STATS,
help: `Returns the number of values in an array or map which are empty-string (AKA void) or JSON null. Returns error for non-array/non-map types. Values are stringified for comparison, so for example string "1" and integer 1 are not distinct.`,
unaryFunc: bifs.BIF_null_count,
examples: []string{
`null_count(["a", "", "c"]) is 1`,
},
},
{
name: "mode",
class: FUNC_CLASS_STATS,
help: `Returns the most frequently occurring value in an array or map. Returns error for non-array/non-map types. Values are stringified for comparison, so for example string "1" and integer 1 are not distinct. In cases of ties, first-found wins.`,
unaryFunc: bifs.BIF_mode,
examples: []string{
`mode([3,3,4,4,4]) is 4`,
`mode([3,3,4,4]) is 3`,
},
},
{
name: "antimode",
class: FUNC_CLASS_STATS,
help: `Returns the least frequently occurring value in an array or map. Returns error for non-array/non-map types. Values are stringified for comparison, so for example string "1" and integer 1 are not distinct. In cases of ties, first-found wins.`,
unaryFunc: bifs.BIF_antimode,
examples: []string{
`antimode([3,3,4,4,4]) is 3`,
`antimode([3,3,4,4]) is 3`,
},
},
{
name: "sum",
class: FUNC_CLASS_STATS,
help: `Returns the sum of values in an array or map. Returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_sum,
examples: []string{
`sum([1,2,3,4,5]) is 15`,
},
},
{
name: "sum2",
class: FUNC_CLASS_STATS,
help: `Returns the sum of squares of values in an array or map. Returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_sum2,
examples: []string{
`sum2([1,2,3,4,5]) is 55`,
},
},
{
name: "sum3",
class: FUNC_CLASS_STATS,
help: `Returns the sum of cubes of values in an array or map. Returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_sum3,
examples: []string{
`sum3([1,2,3,4,5]) is 225`,
},
},
{
name: "sum4",
class: FUNC_CLASS_STATS,
help: `Returns the sum of fourth powers of values in an array or map. Returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_sum4,
examples: []string{
`sum4([1,2,3,4,5]) is 979`,
},
},
{
name: "mean",
class: FUNC_CLASS_STATS,
help: `Returns the arithmetic mean of values in an array or map. Returns empty string AKA void for empty array/map; returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_mean,
examples: []string{
`mean([4,5,7,10]) is 6.5`,
},
},
{
name: "meaneb",
class: FUNC_CLASS_STATS,
help: `Returns the error bar for arithmetic mean of values in an array or map, assuming the values are independent and identically distributed. Returns empty string AKA void for array/map of length less than two; returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_meaneb,
examples: []string{
`meaneb([4,5,7,10]) is 1.3228756`,
},
},
{
name: "variance",
class: FUNC_CLASS_STATS,
help: `Returns the sample variance of values in an array or map. Returns empty string AKA void for array/map of length less than two; returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_variance,
examples: []string{
`variance([4,5,9,10,11]) is 9.7`,
},
},
{
name: "stddev",
class: FUNC_CLASS_STATS,
help: `Returns the sample standard deviation of values in an array or map. Returns empty string AKA void for array/map of length less than two; returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_stddev,
examples: []string{
`stddev([4,5,9,10,11]) is 3.1144823`,
},
},
{
name: "skewness",
class: FUNC_CLASS_STATS,
help: `Returns the sample skewness of values in an array or map. Returns empty string AKA void for array/map of length less than two; returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_skewness,
examples: []string{
`skewness([4,5,9,10,11]) is -0.2097285`,
},
},
{
name: "kurtosis",
class: FUNC_CLASS_STATS,
help: `Returns the sample kurtosis of values in an array or map. Returns empty string AKA void for array/map of length less than two; returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_kurtosis,
examples: []string{
`kurtosis([4,5,9,10,11]) is -1.6703688`,
},
},
{
name: "minlen",
class: FUNC_CLASS_STATS,
help: `Returns the minimum string length of values in an array or map. Returns empty string AKA void for array/map of length less than two; returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_minlen,
examples: []string{
`minlen(["año", "alto"]) is 3`,
},
},
{
name: "maxlen",
class: FUNC_CLASS_STATS,
help: `Returns the maximum string length of values in an array or map. Returns empty string AKA void for array/map of length less than two; returns error for non-array/non-map types.`,
unaryFunc: bifs.BIF_maxlen,
examples: []string{
`maxlen(["año", "alto"]) is 4`,
},
},
{
name: "median",
class: FUNC_CLASS_STATS,
help: `Returns the median of values in an array or map. Returns empty string AKA void for empty array/map; returns error for non-array/non-map types. Please see the percentiles function for information on optional flags, and on performance for large inputs.`,
unaryFunc: bifs.BIF_median,
binaryFunc: bifs.BIF_median_with_options,
hasMultipleArities: true,
examples: []string{
`median([3,4,5,6,9,10]) is 6`,
`median([3,4,5,6,9,10],{"interpolate_linearly":true}) is 5.5`,
`median(["abc", "def", "ghi", "ghi"]) is "ghi"`,
},
},
{
name: "percentile",
class: FUNC_CLASS_STATS,
help: `Returns the given percentile of values in an array or map. Returns empty string AKA void for empty array/map; returns error for non-array/non-map types. Please see the percentiles function for information on optional flags, and on performance for large inputs.`,
binaryFunc: bifs.BIF_percentile,
ternaryFunc: bifs.BIF_percentile_with_options,
hasMultipleArities: true,
examples: []string{
`percentile([3,4,5,6,9,10], 90) is 10`,
`percentile([3,4,5,6,9,10], 90, {"interpolate_linearly":true}) is 9.5`,
`percentile(["abc", "def", "ghi", "ghi"], 90) is "ghi"`,
},
},
{
name: "percentiles",
class: FUNC_CLASS_STATS,
help: `Returns the given percentiles of values in an array or map. Returns empty string AKA void for empty array/map; returns error for non-array/non-map types. See examples for information on the three option flags.`,
binaryFunc: bifs.BIF_percentiles,
ternaryFunc: bifs.BIF_percentiles_with_options,
hasMultipleArities: true,
examples: []string{
``,
`Defaults are to not interpolate linearly, to produce a map keyed by percentile name, and to sort the input before computing percentiles:`,
``,
` percentiles([3,4,5,6,9,10], [25,75]) is { "25": 4, "75": 9 }`,
` percentiles(["abc", "def", "ghi", "ghi"], [25,75]) is { "25": "def", "75": "ghi" }`,
``,
`Use "output_array_not_map" (or shorthand "oa") to get the outputs as an array:`,
``,
` percentiles([3,4,5,6,9,10], [25,75], {"output_array_not_map":true}) is [4, 9]`,
``,
`Use "interpolate_linearly" (or shorthand "il") to do linear interpolation -- note this produces error values on string inputs:`,
``,
` percentiles([3,4,5,6,9,10], [25,75], {"interpolate_linearly":true}) is { "25": 4.25, "75": 8.25 }`,
``,
`The percentiles function always sorts its inputs before computing percentiles. If you know your input is already sorted -- see also the sort_collection function -- then computation will be faster on large input if you pass in "array_is_sorted" (shorthand: "ais"):`,
``,
` x = [6,5,9,10,4,3]`,
` percentiles(x, [25,75], {"ais":true}) gives { "25": 5, "75": 4 } which is incorrect`,
` x = sort_collection(x)`,
` percentiles(x, [25,75], {"ais":true}) gives { "25": 4, "75": 9 } which is correct`,
``,
`You can also leverage this feature to compute percentiles on a sort of your choosing. For example:`,
``,
` Non-sorted input:`,
``,
` x = splitax("the quick brown fox jumped loquaciously over the lazy dogs", " ")`,
` x is: ["the", "quick", "brown", "fox", "jumped", "loquaciously", "over", "the", "lazy", "dogs"]`,
``,
` Percentiles are taken over the original positions of the words in the array -- "dogs" is last and hence appears as p99:`,
``,
` percentiles(x, [50, 99], {"oa":true, "ais":true}) gives ["loquaciously", "dogs"]`,
``,
` With sorting done inside percentiles, "the" is alphabetically last and is therefore the p99:`,
``,
` percentiles(x, [50, 99], {"oa":true}) gives ["loquaciously", "the"]`,
``,
` With default sorting done outside percentiles, the same:`,
``,
` x = sort(x) # or x = sort_collection(x)`,
` x is: ["brown", "dogs", "fox", "jumped", "lazy", "loquaciously", "over", "quick", "the", "the"]`,
` percentiles(x, [50, 99], {"oa":true, "ais":true}) gives ["loquaciously", "the"]`,
` percentiles(x, [50, 99], {"oa":true}) gives ["loquaciously", "the"]`,
``,
` Now sorting by word length, "loquaciously" is longest and hence is the p99:`,
``,
` x = sort(x, func(a,b) { return strlen(a) <=> strlen(b) } )`,
` x is: ["fox", "the", "the", "dogs", "lazy", "over", "brown", "quick", "jumped", "loquaciously"]`,
` percentiles(x, [50, 99], {"oa":true, "ais":true})`,
` ["over", "loquaciously"]`,
},
},
{
name: "sort_collection",
class: FUNC_CLASS_STATS,
help: `This is a helper function for the percentiles function; please see its online help for details.`,
unaryFunc: bifs.BIF_sort_collection,
examples: []string{},
},
// ----------------------------------------------------------------
// FUNC_CLASS_TIME
{
name: "gmt2sec",
class: FUNC_CLASS_TIME,
help: `Parses GMT timestamp as integer seconds since the epoch.`,
examples: []string{
`gmt2sec("2001-02-03T04:05:06Z") = 981173106`,
},
unaryFunc: bifs.BIF_gmt2sec,
},
{
name: "gmt2nsec",
class: FUNC_CLASS_TIME,
help: `Parses GMT timestamp as integer nanoseconds since the epoch.`,
examples: []string{
`gmt2nsec("2001-02-03T04:05:06Z") = 981173106000000000`,
},
unaryFunc: bifs.BIF_gmt2nsec,
},
{
name: "localtime2sec",
class: FUNC_CLASS_TIME,
help: `Parses local timestamp as integer seconds since the epoch. Consults $TZ environment variable,
unless second argument is supplied.`,
examples: []string{
`localtime2sec("2001-02-03 04:05:06") = 981165906 with TZ="Asia/Istanbul"`,
`localtime2sec("2001-02-03 04:05:06", "Asia/Istanbul") = 981165906"`,
},
unaryFunc: bifs.BIF_localtime2sec_unary,
binaryFunc: bifs.BIF_localtime2sec_binary,
hasMultipleArities: true,
},
{
name: "localtime2nsec",
class: FUNC_CLASS_TIME,
help: `Parses local timestamp as integer nanoseconds since the epoch. Consults $TZ environment variable,
unless second argument is supplied.`,
examples: []string{
`localtime2nsec("2001-02-03 04:05:06") = 981165906000000000 with TZ="Asia/Istanbul"`,
`localtime2nsec("2001-02-03 04:05:06", "Asia/Istanbul") = 981165906000000000"`,
},
unaryFunc: bifs.BIF_localtime2nsec_unary,
binaryFunc: bifs.BIF_localtime2nsec_binary,
hasMultipleArities: true,
},
{
name: "sec2gmt",
class: FUNC_CLASS_TIME,
help: `Formats seconds since epoch as GMT timestamp. Leaves non-numbers as-is. With second integer
argument n, includes n decimal places for the seconds part.`,
examples: []string{
`sec2gmt(1234567890) = "2009-02-13T23:31:30Z"`,
`sec2gmt(1234567890.123456) = "2009-02-13T23:31:30Z"`,
`sec2gmt(1234567890.123456, 6) = "2009-02-13T23:31:30.123456Z"`,
},
unaryFunc: bifs.BIF_sec2gmt_unary,
binaryFunc: bifs.BIF_sec2gmt_binary,
hasMultipleArities: true,
},
{
name: "nsec2gmt",
class: FUNC_CLASS_TIME,
help: `Formats integer nanoseconds since epoch as GMT timestamp. Leaves non-numbers as-is. With second integer
argument n, includes n decimal places for the seconds part.`,
examples: []string{
`nsec2gmt(1234567890000000000) = "2009-02-13T23:31:30Z"`,
`nsec2gmt(1234567890123456789) = "2009-02-13T23:31:30Z"`,
`nsec2gmt(1234567890123456789, 6) = "2009-02-13T23:31:30.123456Z"`,
},
unaryFunc: bifs.BIF_nsec2gmt_unary,
binaryFunc: bifs.BIF_nsec2gmt_binary,
hasMultipleArities: true,
},
{
name: "sec2localtime",
class: FUNC_CLASS_TIME,
help: `Formats seconds since epoch (integer part) as local timestamp. Consults $TZ
environment variable unless third argument is supplied. Leaves non-numbers as-is. With second integer argument n,
includes n decimal places for the seconds part`,
examples: []string{
`sec2localtime(1234567890) = "2009-02-14 01:31:30" with TZ="Asia/Istanbul"`,
`sec2localtime(1234567890.123456) = "2009-02-14 01:31:30" with TZ="Asia/Istanbul"`,
`sec2localtime(1234567890.123456, 6) = "2009-02-14 01:31:30.123456" with TZ="Asia/Istanbul"`,
`sec2localtime(1234567890.123456, 6, "Asia/Istanbul") = "2009-02-14 01:31:30.123456"`,
},
unaryFunc: bifs.BIF_sec2localtime_unary,
binaryFunc: bifs.BIF_sec2localtime_binary,
ternaryFunc: bifs.BIF_sec2localtime_ternary,
hasMultipleArities: true,
},
{
name: "nsec2localtime",
class: FUNC_CLASS_TIME,
help: `Formats integer nanoseconds since epoch as local timestamp. Consults $TZ
environment variable unless third argument is supplied. Leaves non-numbers as-is. With second integer argument n,
includes n decimal places for the seconds part`,
examples: []string{
`nsec2localtime(1234567890000000000) = "2009-02-14 01:31:30" with TZ="Asia/Istanbul"`,
`nsec2localtime(1234567890123456789) = "2009-02-14 01:31:30" with TZ="Asia/Istanbul"`,
`nsec2localtime(1234567890123456789, 6) = "2009-02-14 01:31:30.123456" with TZ="Asia/Istanbul"`,
`nsec2localtime(1234567890123456789, 6, "Asia/Istanbul") = "2009-02-14 01:31:30.123456"`,
},
unaryFunc: bifs.BIF_nsec2localtime_unary,
binaryFunc: bifs.BIF_nsec2localtime_binary,
ternaryFunc: bifs.BIF_nsec2localtime_ternary,
hasMultipleArities: true,
},
{
name: "sec2gmtdate",
class: FUNC_CLASS_TIME,
help: `Formats seconds since epoch (integer part) as GMT timestamp with year-month-date.
Leaves non-numbers as-is.`,
examples: []string{
`sec2gmtdate(1440768801.7) = "2015-08-28".`,
},
unaryFunc: bifs.BIF_sec2gmtdate,
},
{
name: "nsec2gmtdate",
class: FUNC_CLASS_TIME,
help: `Formats integer nanoseconds since epoch as GMT timestamp with year-month-date.
Leaves non-numbers as-is.`,
examples: []string{
`sec2gmtdate(1440768801700000000) = "2015-08-28".`,
},
unaryFunc: bifs.BIF_nsec2gmtdate,
},
{
name: "sec2localdate",
class: FUNC_CLASS_TIME,
help: `Formats seconds since epoch (integer part) as local timestamp with year-month-date.
Leaves non-numbers as-is. Consults $TZ environment variable unless second argument is supplied.`,
examples: []string{
`sec2localdate(1440768801.7) = "2015-08-28" with TZ="Asia/Istanbul"`,
`sec2localdate(1440768801.7, "Asia/Istanbul") = "2015-08-28"`,
},
unaryFunc: bifs.BIF_sec2localdate_unary,
binaryFunc: bifs.BIF_sec2localdate_binary,
hasMultipleArities: true,
},
{
name: "nsec2localdate",
class: FUNC_CLASS_TIME,
help: `Formats integer nanoseconds since epoch as local timestamp with year-month-date.
Leaves non-numbers as-is. Consults $TZ environment variable unless second argument is supplied.`,
examples: []string{
`nsec2localdate(1440768801700000000) = "2015-08-28" with TZ="Asia/Istanbul"`,
`nsec2localdate(1440768801700000000, "Asia/Istanbul") = "2015-08-28"`,
},
unaryFunc: bifs.BIF_nsec2localdate_unary,
binaryFunc: bifs.BIF_nsec2localdate_binary,
hasMultipleArities: true,
},
{
name: "localtime2gmt",
class: FUNC_CLASS_TIME,
help: `Convert from a local-time string to a GMT-time string. Consults $TZ unless second argument
is supplied.`,
examples: []string{
`localtime2gmt("2000-01-01 00:00:00") = "1999-12-31T22:00:00Z" with TZ="Asia/Istanbul"`,
`localtime2gmt("2000-01-01 00:00:00", "Asia/Istanbul") = "1999-12-31T22:00:00Z"`,
},
unaryFunc: bifs.BIF_localtime2gmt_unary,
binaryFunc: bifs.BIF_localtime2gmt_binary,
hasMultipleArities: true,
},
{
name: "gmt2localtime",
class: FUNC_CLASS_TIME,
help: `Convert from a GMT-time string to a local-time string. Consulting $TZ unless second argument
is supplied.`,
examples: []string{
`gmt2localtime("1999-12-31T22:00:00Z") = "2000-01-01 00:00:00" with TZ="Asia/Istanbul"`,
`gmt2localtime("1999-12-31T22:00:00Z", "Asia/Istanbul") = "2000-01-01 00:00:00"`,
},
unaryFunc: bifs.BIF_gmt2localtime_unary,
binaryFunc: bifs.BIF_gmt2localtime_binary,
hasMultipleArities: true,
},
{
name: "strftime",
class: FUNC_CLASS_TIME,
help: `Formats seconds since the epoch as timestamp. Format strings are as at
https://pkg.go.dev/github.com/lestrrat-go/strftime, with the Miller-specific addition of "%1S"
through "%9S" which format the seconds with 1 through 9 decimal places, respectively. ("%S" uses no
decimal places.) See also ` + lib.DOC_URL + `/en/latest/reference-dsl-time/ for more information on the differences from the C library ("man strftime" on your system).
See also strftime_local.`,
examples: []string{
`strftime(1440768801.7,"%Y-%m-%dT%H:%M:%SZ") = "2015-08-28T13:33:21Z"`,
`strftime(1440768801.7,"%Y-%m-%dT%H:%M:%3SZ") = "2015-08-28T13:33:21.700Z"`,
},
binaryFunc: bifs.BIF_strftime,
},
{
name: "strfntime",
class: FUNC_CLASS_TIME,
help: `Formats integer nanoseconds since the epoch as timestamp. Format strings are as at
https://pkg.go.dev/github.com/lestrrat-go/strftime, with the Miller-specific addition of "%1S"
through "%9S" which format the seconds with 1 through 9 decimal places, respectively. ("%S" uses no
decimal places.) See also ` + lib.DOC_URL + `/en/latest/reference-dsl-time/ for more information on the differences from the C library ("man strftime" on your system).
See also strftime_local.`,
examples: []string{
`strfntime(1440768801123456789,"%Y-%m-%dT%H:%M:%SZ") = "2015-08-28T13:33:21Z"`,
`strfntime(1440768801123456789,"%Y-%m-%dT%H:%M:%3SZ") = "2015-08-28T13:33:21.123Z"`,
`strfntime(1440768801123456789,"%Y-%m-%dT%H:%M:%6SZ") = "2015-08-28T13:33:21.123456Z"`,
},
binaryFunc: bifs.BIF_strfntime,
},
{
name: "strftime_local",
class: FUNC_CLASS_TIME,
help: `Like strftime but consults the $TZ environment variable to get local time zone.`,
examples: []string{
`strftime_local(1440768801.7, "%Y-%m-%d %H:%M:%S %z") = "2015-08-28 16:33:21 +0300" with TZ="Asia/Istanbul"`,
`strftime_local(1440768801.7, "%Y-%m-%d %H:%M:%3S %z") = "2015-08-28 16:33:21.700 +0300" with TZ="Asia/Istanbul"`,
`strftime_local(1440768801.7, "%Y-%m-%d %H:%M:%3S %z", "Asia/Istanbul") = "2015-08-28 16:33:21.700 +0300"`,
},
binaryFunc: bifs.BIF_strftime_local_binary,
ternaryFunc: bifs.BIF_strftime_local_ternary,
hasMultipleArities: true,
},
{
name: "strfntime_local",
class: FUNC_CLASS_TIME,
help: `Like strfntime but consults the $TZ environment variable to get local time zone.`,
examples: []string{
`strfntime_local(1440768801123456789, "%Y-%m-%d %H:%M:%S %z") = "2015-08-28 16:33:21 +0300" with TZ="Asia/Istanbul"`,
`strfntime_local(1440768801123456789, "%Y-%m-%d %H:%M:%3S %z") = "2015-08-28 16:33:21.123 +0300" with TZ="Asia/Istanbul"`,
`strfntime_local(1440768801123456789, "%Y-%m-%d %H:%M:%3S %z", "Asia/Istanbul") = "2015-08-28 16:33:21.123 +0300"`,
`strfntime_local(1440768801123456789, "%Y-%m-%d %H:%M:%9S %z", "Asia/Istanbul") = "2015-08-28 16:33:21.123456789 +0300"`,
},
binaryFunc: bifs.BIF_strfntime_local_binary,
ternaryFunc: bifs.BIF_strfntime_local_ternary,
hasMultipleArities: true,
},
{
name: "strptime",
class: FUNC_CLASS_TIME,
help: `strptime: Parses timestamp as floating-point seconds since the epoch. See also strptime_local.`,
examples: []string{
`strptime("2015-08-28T13:33:21Z", "%Y-%m-%dT%H:%M:%SZ") = 1440768801.000000`,
`strptime("2015-08-28T13:33:21.345Z", "%Y-%m-%dT%H:%M:%SZ") = 1440768801.345000`,
`strptime("1970-01-01 00:00:00 -0400", "%Y-%m-%d %H:%M:%S %z") = 14400`,
`strptime("1970-01-01 00:00:00 +0200", "%Y-%m-%d %H:%M:%S %z") = -7200`,
},
binaryFunc: bifs.BIF_strptime,
},
{
name: "strpntime",
class: FUNC_CLASS_TIME,
help: `strpntime: Parses timestamp as integer nanoseconds since the epoch. See also strpntime_local.`,
examples: []string{
`strpntime("2015-08-28T13:33:21Z", "%Y-%m-%dT%H:%M:%SZ") = 1440768801000000000`,
`strpntime("2015-08-28T13:33:21.345Z", "%Y-%m-%dT%H:%M:%SZ") = 1440768801345000000`,
`strpntime("1970-01-01 00:00:00 -0400", "%Y-%m-%d %H:%M:%S %z") = 14400000000000`,
`strpntime("1970-01-01 00:00:00 +0200", "%Y-%m-%d %H:%M:%S %z") = -7200000000000`,
},
binaryFunc: bifs.BIF_strpntime,
},
{
name: "strptime_local",
class: FUNC_CLASS_TIME,
help: `Like strptime but consults the $TZ environment variable to get local time zone.`,
examples: []string{
`strptime_local("2015-08-28T13:33:21Z", "%Y-%m-%dT%H:%M:%SZ") = 1440758001 with TZ="Asia/Istanbul"`,
`strptime_local("2015-08-28T13:33:21.345Z","%Y-%m-%dT%H:%M:%SZ") = 1440758001.345 with TZ="Asia/Istanbul"`,
`strptime_local("2015-08-28 13:33:21", "%Y-%m-%d %H:%M:%S") = 1440758001 with TZ="Asia/Istanbul"`,
`strptime_local("2015-08-28 13:33:21", "%Y-%m-%d %H:%M:%S", "Asia/Istanbul") = 1440758001`,
// TODO: fix parse error on decimal part
//`strptime_local("2015-08-28 13:33:21.345","%Y-%m-%d %H:%M:%S") = 1440758001.345`,
},
binaryFunc: bifs.BIF_strptime_local_binary,
ternaryFunc: bifs.BIF_strptime_local_ternary,
hasMultipleArities: true,
},
{
name: "strpntime_local",
class: FUNC_CLASS_TIME,
help: `Like strpntime but consults the $TZ environment variable to get local time zone.`,
examples: []string{
`strpntime_local("2015-08-28T13:33:21Z", "%Y-%m-%dT%H:%M:%SZ") = 1440758001000000000 with TZ="Asia/Istanbul"`,
`strpntime_local("2015-08-28T13:33:21.345Z","%Y-%m-%dT%H:%M:%SZ") = 1440758001345000000 with TZ="Asia/Istanbul"`,
`strpntime_local("2015-08-28 13:33:21", "%Y-%m-%d %H:%M:%S") = 1440758001000000000 with TZ="Asia/Istanbul"`,
`strpntime_local("2015-08-28 13:33:21", "%Y-%m-%d %H:%M:%S", "Asia/Istanbul") = 1440758001000000000`,
// TODO: fix parse error on decimal part
//`strpntime_local("2015-08-28 13:33:21.345","%Y-%m-%d %H:%M:%S") = 1440758001.345`,
},
binaryFunc: bifs.BIF_strpntime_local_binary,
ternaryFunc: bifs.BIF_strpntime_local_ternary,
hasMultipleArities: true,
},
{
name: "dhms2fsec",
class: FUNC_CLASS_TIME,
help: `Recovers floating-point seconds as in dhms2fsec("5d18h53m20.250000s") = 500000.250000`,
unaryFunc: bifs.BIF_dhms2fsec,
},
{
name: "dhms2sec",
class: FUNC_CLASS_TIME,
help: `Recovers integer seconds as in dhms2sec("5d18h53m20s") = 500000`,
unaryFunc: bifs.BIF_dhms2sec,
},
{
name: "fsec2dhms",
class: FUNC_CLASS_TIME,
help: `Formats floating-point seconds as in fsec2dhms(500000.25) = "5d18h53m20.250000s"`,
unaryFunc: bifs.BIF_fsec2dhms,
},
{
name: "fsec2hms",
class: FUNC_CLASS_TIME,
help: `Formats floating-point seconds as in fsec2hms(5000.25) = "01:23:20.250000"`,
unaryFunc: bifs.BIF_fsec2hms,
},
{
name: "hms2fsec",
class: FUNC_CLASS_TIME,
help: `Recovers floating-point seconds as in hms2fsec("01:23:20.250000") = 5000.250000`,
unaryFunc: bifs.BIF_hms2fsec,
},
{
name: "hms2sec",
class: FUNC_CLASS_TIME,
help: `Recovers integer seconds as in hms2sec("01:23:20") = 5000`,
unaryFunc: bifs.BIF_hms2sec,
},
{
name: "sec2dhms",
class: FUNC_CLASS_TIME,
help: `Formats integer seconds as in sec2dhms(500000) = "5d18h53m20s"`,
unaryFunc: bifs.BIF_sec2dhms,
},
{
name: "sec2hms",
class: FUNC_CLASS_TIME,
help: `Formats integer seconds as in sec2hms(5000) = "01:23:20"`,
unaryFunc: bifs.BIF_sec2hms,
},
{
name: "systime",
class: FUNC_CLASS_TIME,
help: "Returns the system time in floating-point seconds since the epoch.",
zaryFunc: bifs.BIF_systime,
},
{
name: "sysntime",
class: FUNC_CLASS_TIME,
help: "Returns the system time in 64-bit nanoseconds since the epoch.",
zaryFunc: bifs.BIF_sysntime,
},
{
name: "systimeint",
class: FUNC_CLASS_TIME,
help: "Returns the system time in integer seconds since the epoch.",
zaryFunc: bifs.BIF_systimeint,
},
{
name: "uptime",
class: FUNC_CLASS_TIME,
help: "Returns the time in floating-point seconds since the current Miller program was started.",
zaryFunc: bifs.BIF_uptime,
},
{
name: "upntime",
class: FUNC_CLASS_TIME,
help: "Returns the time in 64-bit nanoseconds since the current Miller program was started.",
zaryFunc: bifs.BIF_upntime,
},
// ----------------------------------------------------------------
// FUNC_CLASS_TYPING
{
name: "is_absent",
class: FUNC_CLASS_TYPING,
help: "False if field is present in input, true otherwise",
unaryFunc: bifs.BIF_is_absent,
},
{
name: "is_array",
class: FUNC_CLASS_TYPING,
help: "True if argument is an array.",
unaryFunc: bifs.BIF_is_array,
},
{
name: "is_bool",
class: FUNC_CLASS_TYPING,
help: "True if field is present with boolean value. Synonymous with is_boolean.",
unaryFunc: bifs.BIF_is_bool,
},
{
name: "is_boolean",
class: FUNC_CLASS_TYPING,
help: "True if field is present with boolean value. Synonymous with is_bool.",
unaryFunc: bifs.BIF_is_boolean,
},
{
name: "is_empty",
class: FUNC_CLASS_TYPING,
help: "True if field is present in input with empty string value, false otherwise.",
unaryFunc: bifs.BIF_is_empty,
},
{
name: "is_empty_map",
class: FUNC_CLASS_TYPING,
help: "True if argument is a map which is empty.",
unaryFunc: bifs.BIF_is_emptymap,
},
{
name: "is_error",
class: FUNC_CLASS_TYPING,
help: "True if if argument is an error, such as taking string length of an integer.",
unaryFunc: bifs.BIF_is_error,
},
{
name: "is_float",
class: FUNC_CLASS_TYPING,
help: "True if field is present with value inferred to be float",
unaryFunc: bifs.BIF_is_float,
},
{
name: "is_int",
class: FUNC_CLASS_TYPING,
help: "True if field is present with value inferred to be int",
unaryFunc: bifs.BIF_is_int,
},
{
name: "is_map",
class: FUNC_CLASS_TYPING,
help: "True if argument is a map.",
unaryFunc: bifs.BIF_is_map,
},
{
name: "is_nonempty_map",
class: FUNC_CLASS_TYPING,
help: "True if argument is a map which is non-empty.",
unaryFunc: bifs.BIF_is_nonemptymap,
},
{
name: "is_not_empty",
class: FUNC_CLASS_TYPING,
help: "True if field is present in input with non-empty value, false otherwise",
unaryFunc: bifs.BIF_is_notempty,
},
{
name: "is_not_map",
class: FUNC_CLASS_TYPING,
help: "True if argument is not a map.",
unaryFunc: bifs.BIF_is_notmap,
},
{
name: "is_not_array",
class: FUNC_CLASS_TYPING,
help: "True if argument is not an array.",
unaryFunc: bifs.BIF_is_notarray,
},
{
name: "is_not_null",
class: FUNC_CLASS_TYPING,
help: "False if argument is null (empty, absent, or JSON null), true otherwise.",
unaryFunc: bifs.BIF_is_notnull,
},
{
name: "is_null",
class: FUNC_CLASS_TYPING,
help: "True if argument is null (empty, absent, or JSON null), false otherwise.",
unaryFunc: bifs.BIF_is_null,
},
{
name: "is_numeric",
class: FUNC_CLASS_TYPING,
help: "True if field is present with value inferred to be int or float",
unaryFunc: bifs.BIF_is_numeric,
},
{
name: "is_present",
class: FUNC_CLASS_TYPING,
help: "True if field is present in input, false otherwise.",
unaryFunc: bifs.BIF_is_present,
},
{
name: "is_string",
class: FUNC_CLASS_TYPING,
help: "True if field is present with string (including empty-string) value",
unaryFunc: bifs.BIF_is_string,
},
{
name: "is_nan",
class: FUNC_CLASS_TYPING,
help: `True if the argument is the NaN (not-a-number) floating-point value.
Note that NaN has the property that NaN != NaN, so you need 'is_nan(x)' rather than 'x == NaN'.`,
unaryFunc: bifs.BIF_is_nan,
},
{
name: "asserting_absent",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_absent on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_absent,
},
{
name: "asserting_array",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_array on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_array,
},
{
name: "asserting_bool",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_bool on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_bool,
},
{
name: "asserting_boolean",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_boolean on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_boolean,
},
{
name: "asserting_error",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_error on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_error,
},
{
name: "asserting_empty",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_empty on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_empty,
},
{
name: "asserting_empty_map",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_empty_map on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_emptyMap,
},
{
name: "asserting_float",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_float on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_float,
},
{
name: "asserting_int",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_int on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_int,
},
{
name: "asserting_map",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_map on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_map,
},
{
name: "asserting_nonempty_map",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_nonempty_map on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_nonempty_map,
},
{
name: "asserting_not_empty",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_not_empty on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_not_empty,
},
{
name: "asserting_not_map",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_not_map on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_not_map,
},
{
name: "asserting_not_array",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_not_array on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_not_array,
},
{
name: "asserting_not_null",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_not_null on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_not_null,
},
{
name: "asserting_null",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_null on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_null,
},
{
name: "asserting_numeric",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_numeric on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_numeric,
},
{
name: "asserting_present",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_present on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_present,
},
{
name: "asserting_string",
class: FUNC_CLASS_TYPING,
help: `Aborts with an error if is_string on the argument returns false, else returns its argument.`,
unaryFuncWithContext: bifs.BIF_asserting_string,
},
{
name: "typeof",
class: FUNC_CLASS_TYPING,
help: "Convert argument to type of argument (e.g. \"str\"). For debug.",
unaryFunc: bifs.BIF_typeof,
},
// ----------------------------------------------------------------
// FUNC_CLASS_CONVERSION
{
name: "boolean",
class: FUNC_CLASS_CONVERSION,
help: "Convert int/float/bool/string to boolean.",
unaryFunc: bifs.BIF_boolean,
},
{
name: "float",
class: FUNC_CLASS_CONVERSION,
help: "Convert int/float/bool/string to float.",
unaryFunc: bifs.BIF_float,
},
{
name: "fmtnum",
class: FUNC_CLASS_CONVERSION,
help: `Convert int/float/bool to string using printf-style format string (https://pkg.go.dev/fmt), e.g.
'$s = fmtnum($n, "%08d")' or '$t = fmtnum($n, "%.6e")'. This function recurses on array and map values.`,
binaryFunc: bifs.BIF_fmtnum,
examples: []string{
`$x = fmtnum($x, "%.6f")`,
},
},
{
name: "fmtifnum",
class: FUNC_CLASS_CONVERSION,
help: `Identical to fmtnum, except returns the first argument as-is if the output would be an error.`,
binaryFunc: bifs.BIF_fmtifnum,
examples: []string{
`fmtifnum(3.4, "%.6f") gives 3.400000"`,
`fmtifnum("abc", "%.6f") gives abc"`,
`$* = fmtifnum($*, "%.6f") formats numeric fields in the current record, leaving non-numeric ones alone`,
},
},
{
name: "hexfmt",
class: FUNC_CLASS_CONVERSION,
help: `Convert int to hex string, e.g. 255 to "0xff".`,
unaryFunc: bifs.BIF_hexfmt,
},
{
name: "int",
class: FUNC_CLASS_CONVERSION,
help: `Convert int/float/bool/string to int.
If the second argument is omitted and the first argument is a string, base is inferred from the first argument's prefix.
If the second argument is provided and the first argument is a string, the second argument is used as the base.
If the second argument is provided and the first argument is not a string, the second argument is ignored.`,
unaryFunc: bifs.BIF_int,
binaryFunc: bifs.BIF_int_with_base,
hasMultipleArities: true,
examples: []string{
`int("345") gives decimal 345 (base-10/decimal input is inferred)`,
`int("0xff") gives decimal 255 (base-16/hexadecimal input is inferred)`,
`int("0377") gives decimal 255 (base-8/octal input is inferred)`,
`int("0b11010011") gives decimal 211 which is hexadecimal 0xd3 (base-2/binary input is inferred)`,
`int("0377", 10) gives decimal 377`,
`int(345, 16) gives decimal 345`,
`int(string(345), 16) gives decimal 837`,
},
},
{
name: "joink",
class: FUNC_CLASS_CONVERSION,
help: `Makes string from map/array keys. First argument is map/array; second is separator string.`,
examples: []string{
`joink({"a":3,"b":4,"c":5}, ",") = "a,b,c".`,
`joink([1,2,3], ",") = "1,2,3".`,
},
binaryFunc: bifs.BIF_joink,
},
{
name: "joinv",
class: FUNC_CLASS_CONVERSION,
help: `Makes string from map/array values. First argument is map/array; second is separator string.`,
examples: []string{
`joinv([3,4,5], ",") = "3,4,5"`,
`joinv({"a":3,"b":4,"c":5}, ",") = "3,4,5"`,
},
binaryFunc: bifs.BIF_joinv,
},
{
name: "joinkv",
class: FUNC_CLASS_CONVERSION,
help: `Makes string from map/array key-value pairs. First argument is map/array;
second is pair-separator string; third is field-separator string. Mnemonic: the "=" comes before the "," in the output and in the arguments to joinkv.`,
examples: []string{
`joinkv([3,4,5], "=", ",") = "1=3,2=4,3=5"`,
`joinkv({"a":3,"b":4,"c":5}, ":", ";") = "a:3;b:4;c:5"`,
},
ternaryFunc: bifs.BIF_joinkv,
},
{
name: "splita",
class: FUNC_CLASS_CONVERSION,
help: `Splits string into array with type inference. First argument is string to split;
second is the separator to split on.`,
examples: []string{
`splita("3,4,5", ",") = [3,4,5]`,
},
binaryFunc: bifs.BIF_splita,
},
{
name: "splitax",
class: FUNC_CLASS_CONVERSION,
help: `Splits string into array without type inference. First argument is string to split;
second is the separator to split on.`,
examples: []string{
`splitax("3,4,5", ",") = ["3","4","5"]`,
},
binaryFunc: bifs.BIF_splitax,
},
{
name: "splitkv",
class: FUNC_CLASS_CONVERSION,
help: `Splits string by separators into map with type inference. First argument is string to split;
second argument is pair separator; third argument is field separator.`,
examples: []string{
`splitkv("a=3,b=4,c=5", "=", ",") = {"a":3,"b":4,"c":5}`,
},
ternaryFunc: bifs.BIF_splitkv,
},
{
name: "splitkvx",
class: FUNC_CLASS_CONVERSION,
help: `Splits string by separators into map without type inference
(keys and values are strings). First argument is string to split; second
argument is pair separator; third argument is field separator.`,
examples: []string{
`splitkvx("a=3,b=4,c=5", "=", ",") = {"a":"3","b":"4","c":"5"}`,
},
ternaryFunc: bifs.BIF_splitkvx,
},
{
name: "splitnv",
class: FUNC_CLASS_CONVERSION,
help: `Splits string by separator into integer-indexed map with type inference. First argument is
string to split; second argument is separator to split on.`,
examples: []string{
`splitnv("a,b,c", ",") = {"1":"a","2":"b","3":"c"}`,
},
binaryFunc: bifs.BIF_splitnv,
},
{
name: "splitnvx",
class: FUNC_CLASS_CONVERSION,
help: `Splits string by separator into integer-indexed map without
type inference (values are strings). First argument is string to split; second
argument is separator to split on.`,
examples: []string{
`splitnvx("3,4,5", ",") = {"1":"3","2":"4","3":"5"}`,
},
binaryFunc: bifs.BIF_splitnvx,
},
{
name: "string",
class: FUNC_CLASS_CONVERSION,
help: "Convert int/float/bool/string/array/map to string.",
unaryFunc: bifs.BIF_string,
},
// ----------------------------------------------------------------
// FUNC_CLASS_COLLECTIONS
{
name: "append",
class: FUNC_CLASS_COLLECTIONS,
help: "Appends second argument to end of first argument, which must be an array.",
binaryFunc: bifs.BIF_append,
},
{
name: "arrayify",
class: FUNC_CLASS_COLLECTIONS,
help: `Walks through a nested map/array, converting any map with consecutive keys
"1", "2", ... into an array. Useful to wrap the output of unflatten.`,
unaryFunc: bifs.BIF_arrayify,
},
{
name: "concat",
class: FUNC_CLASS_COLLECTIONS,
help: `Returns the array concatenation of the arguments. Non-array arguments are treated as
single-element arrays.`,
examples: []string{
`concat(1,2,3) is [1,2,3]`,
`concat([1,2],3) is [1,2,3]`,
`concat([1,2],[3]) is [1,2,3]`,
},
variadicFunc: bifs.BIF_concat,
},
{
name: "depth",
class: FUNC_CLASS_COLLECTIONS,
help: "Prints maximum depth of map/array. Scalars have depth 0.",
unaryFunc: bifs.BIF_depth,
},
{
name: "flatten",
class: FUNC_CLASS_COLLECTIONS,
help: `Flattens multi-level maps to single-level ones. Useful for nested JSON-like structures
for non-JSON file formats like CSV. With two arguments, the first argument is a map (maybe $*) and
the second argument is the flatten separator. With three arguments, the first argument is prefix,
the second is the flatten separator, and the third argument is a map; flatten($*, ".") is the
same as flatten("", ".", $*). See "Flatten/unflatten: converting between JSON and tabular formats"
at ` + lib.DOC_URL + ` for more information.`,
examples: []string{
`flatten({"a":[1,2],"b":3}, ".") is {"a.1": 1, "a.2": 2, "b": 3}.`,
`flatten("a", ".", {"b": { "c": 4 }}) is {"a.b.c" : 4}.`,
`flatten("", ".", {"a": { "b": 3 }}) is {"a.b" : 3}.`,
},
binaryFunc: bifs.BIF_flatten_binary,
ternaryFunc: bifs.BIF_flatten,
hasMultipleArities: true,
},
{
name: "unflatten",
class: FUNC_CLASS_COLLECTIONS,
help: `Reverses flatten. Useful for nested JSON-like structures for non-JSON file formats like CSV.
The first argument is a map, and the second argument is the flatten separator. See also arrayify.
See "Flatten/unflatten: converting between JSON and tabular formats" at ` + lib.DOC_URL + ` for more
information.`,
examples: []string{
`unflatten({"a.b.c" : 4}, ".") is {"a": "b": { "c": 4 }}.`,
},
binaryFunc: bifs.BIF_unflatten,
},
{
name: "get_keys",
class: FUNC_CLASS_COLLECTIONS,
help: "Returns array of keys of map or array",
unaryFunc: bifs.BIF_get_keys,
},
{
name: "get_values",
class: FUNC_CLASS_COLLECTIONS,
help: "Returns array of values of map or array -- in the latter case, returns a copy of the array",
unaryFunc: bifs.BIF_get_values,
},
{
name: "haskey",
class: FUNC_CLASS_COLLECTIONS,
help: `True/false if map has/hasn't key, e.g. 'haskey($*, "a")' or 'haskey(mymap, mykey)',
or true/false if array index is in bounds / out of bounds. Error if 1st argument is not a map or array. Note
-n..-1 alias to 1..n in Miller arrays.`,
binaryFunc: bifs.BIF_haskey,
},
{
name: "json_parse",
class: FUNC_CLASS_COLLECTIONS,
help: `Converts value from JSON-formatted string.`,
unaryFunc: bifs.BIF_json_parse,
},
{
name: "json_stringify",
class: FUNC_CLASS_COLLECTIONS,
help: `Converts value to JSON-formatted string. Default output is single-line.
With optional second boolean argument set to true, produces multiline output.`,
unaryFunc: bifs.BIF_json_stringify_unary,
binaryFunc: bifs.BIF_json_stringify_binary,
hasMultipleArities: true,
},
{
name: "leafcount",
class: FUNC_CLASS_COLLECTIONS,
help: `Counts total number of terminal values in map/array. For single-level map/array, same as length.`,
unaryFunc: bifs.BIF_leafcount,
},
{
name: "length",
class: FUNC_CLASS_COLLECTIONS,
help: "Counts number of top-level entries in array/map. Scalars have length 1.",
unaryFunc: bifs.BIF_length,
},
{
name: "mapdiff",
class: FUNC_CLASS_COLLECTIONS,
help: `With 0 args, returns empty map. With 1 arg, returns copy of arg. With 2 or more,
returns copy of arg 1 with all keys from any of remaining argument maps removed.`,
variadicFunc: bifs.BIF_mapdiff,
},
{
name: "mapexcept",
class: FUNC_CLASS_COLLECTIONS,
help: `Returns a map with keys from remaining arguments, if any, unset.
Remaining arguments can be strings or arrays of string. E.g. 'mapexcept({1:2,3:4,5:6}, 1, 5, 7)' is '{3:4}'
and 'mapexcept({1:2,3:4,5:6}, [1, 5, 7])' is '{3:4}'.`,
variadicFunc: bifs.BIF_mapexcept,
minimumVariadicArity: 1,
},
{
name: "mapselect",
class: FUNC_CLASS_COLLECTIONS,
help: `Returns a map with only keys from remaining arguments set.
Remaining arguments can be strings or arrays of string. E.g. 'mapselect({1:2,3:4,5:6}, 1, 5, 7)' is
'{1:2,5:6}' and 'mapselect({1:2,3:4,5:6}, [1, 5, 7])' is '{1:2,5:6}'.`,
variadicFunc: bifs.BIF_mapselect,
minimumVariadicArity: 1,
},
{
name: "mapsum",
class: FUNC_CLASS_COLLECTIONS,
help: `With 0 args, returns empty map. With >= 1 arg, returns a map with key-value pairs
from all arguments. Rightmost collisions win, e.g. 'mapsum({1:2,3:4},{1:5})' is '{1:5,3:4}'.`,
variadicFunc: bifs.BIF_mapsum,
},
// ----------------------------------------------------------------
// FUNC_CLASS_HOFS
// Note: most UDFs are in the types package, but these use UDFs which are in the dsl/cst.
{
name: "select",
class: FUNC_CLASS_HOFS,
help: `Given a map or array as first argument and a function as second argument, includes each
input element in the output if the function returns true. For arrays, the function should take one argument,
for array element; for maps, it should take two, for map-element key and value. In either case it should
return a boolean.`,
examples: []string{
`Array example: select([1,2,3,4,5], func(e) {return e >= 3}) returns [3, 4, 5].`,
`Map example: select({"a":1, "b":3, "c":5}, func(k,v) {return v >= 3}) returns {"b":3, "c": 5}.`,
},
binaryFuncWithState: SelectHOF,
},
{
name: "apply",
class: FUNC_CLASS_HOFS,
help: `Given a map or array as first argument and a function as second argument, applies the
function to each element of the array/map. For arrays, the function should take one argument, for array
element; it should return a new element. For maps, it should take two arguments, for map-element key and
value; it should return a new key-value pair (i.e. a single-entry map).`,
examples: []string{
`Array example: apply([1,2,3,4,5], func(e) {return e ** 3}) returns [1, 8, 27, 64, 125].`,
`Map example: apply({"a":1, "b":3, "c":5}, func(k,v) {return {toupper(k): v ** 2}}) returns {"A": 1, "B":9, "C": 25}",`,
},
binaryFuncWithState: ApplyHOF,
},
{
name: "reduce",
class: FUNC_CLASS_HOFS,
help: `Given a map or array as first argument and a function as second argument, accumulates entries
into a final output -- for example, sum or product. For arrays, the function should take two arguments, for
accumulated value and array element, and return the accumulated element. For maps, it should take four
arguments, for accumulated key and value, and map-element key and value; it should return the updated
accumulator as a new key-value pair (i.e. a single-entry map). The start value for the accumulator is the
first element for arrays, or the first element's key-value pair for maps.`,
examples: []string{
`Array example: reduce([1,2,3,4,5], func(acc,e) {return acc + e**3}) returns 225.`,
`Map example: reduce({"a":1, "b":3, "c": 5}, func(acck,accv,ek,ev) {return {"sum_of_squares": accv + ev**2}}) returns {"sum_of_squares": 35}.`,
},
binaryFuncWithState: ReduceHOF,
},
{
name: "fold",
class: FUNC_CLASS_HOFS,
help: `Given a map or array as first argument and a function as second argument, accumulates
entries into a final output -- for example, sum or product. For arrays, the function should take two
arguments, for accumulated value and array element. For maps, it should take four arguments, for accumulated
key and value, and map-element key and value; it should return the updated accumulator as a new key-value pair
(i.e. a single-entry map). The start value for the accumulator is taken from the third argument.`,
examples: []string{
`Array example: fold([1,2,3,4,5], func(acc,e) {return acc + e**3}, 10000) returns 10225.`,
`Map example: fold({"a":1, "b":3, "c": 5}, func(acck,accv,ek,ev) {return {"sum": accv+ev**2}}, {"sum":10000}) returns 10035.`,
},
ternaryFuncWithState: FoldHOF,
},
{
name: "sort",
class: FUNC_CLASS_HOFS,
help: `Given a map or array as first argument and string flags or function as optional second argument,
returns a sorted copy of the input. With one argument, sorts array elements with numbers first
numerically and then strings lexically, and map elements likewise by map keys. If the second
argument is a string, it can contain any of "f" for lexical ("n" is for the above default), "c" for
case-folded lexical, or "t" for natural sort order. An additional "r" in that string is for reverse.
An additional "v" in that string means sort maps by value, rather than by key. If the second
argument is a function, then for arrays it should take two arguments a and b, returning < 0, 0, or >
0 as a < b, a == b, or a > b respectively; for maps the function should take four arguments ak, av,
bk, and bv, again returning < 0, 0, or
> 0, using a and b's keys and values.`,
examples: []string{
`Default sorting: sort([3,"A",1,"B",22]) returns [1, 3, 20, "A", "B"].`,
` Note that this is numbers before strings.`,
`Default sorting: sort(["E","a","c","B","d"]) returns ["B", "E", "a", "c", "d"].`,
` Note that this is uppercase before lowercase.`,
`Case-folded ascending: sort(["E","a","c","B","d"], "c") returns ["a", "B", "c", "d", "E"].`,
`Case-folded descending: sort(["E","a","c","B","d"], "cr") returns ["E", "d", "c", "B", "a"].`,
`Natural sorting: sort(["a1","a10","a100","a2","a20","a200"], "t") returns ["a1", "a2", "a10", "a20", "a100", "a200"].`,
`Array with function: sort([5,2,3,1,4], func(a,b) {return b <=> a}) returns [5,4,3,2,1].`,
`Map with function: sort({"c":2,"a":3,"b":1}, func(ak,av,bk,bv) {return bv <=> av}) returns {"a":3,"c":2,"b":1}.`,
`Map without function: sort({"c":2,"a":3,"b":1}) returns {"a":3,"b":1,"c":2}.`,
`Map without function: sort({"c":2,"a":3,"b":1}, "v") returns {"b":1,"c":2,"a":3}.`,
`Map without function: sort({"c":2,"a":3,"b":1}, "vnr") returns {"a":3,"c":2,"b":1}.`,
},
variadicFuncWithState: SortHOF,
minimumVariadicArity: 1,
maximumVariadicArity: 2,
},
{
name: "any",
class: FUNC_CLASS_HOFS,
help: `Given a map or array as first argument and a function as second argument, yields a boolean true
if the argument function returns true for any array/map element, false otherwise. For arrays, the function
should take one argument, for array element; for maps, it should take two, for map-element key and value. In
either case it should return a boolean.`,
examples: []string{
`Array example: any([10,20,30], func(e) {return $index == e})`,
`Map example: any({"a": "foo", "b": "bar"}, func(k,v) {return $[k] == v})`,
},
binaryFuncWithState: AnyHOF,
},
{
name: "every",
class: FUNC_CLASS_HOFS,
help: `Given a map or array as first argument and a function as second argument, yields a boolean true
if the argument function returns true for every array/map element, false otherwise. For arrays, the function
should take one argument, for array element; for maps, it should take two, for map-element key and value. In
either case it should return a boolean.`,
examples: []string{
`Array example: every(["a", "b", "c"], func(e) {return $[e] >= 0})`,
`Map example: every({"a": "foo", "b": "bar"}, func(k,v) {return $[k] == v})`,
},
binaryFuncWithState: EveryHOF,
},
// ----------------------------------------------------------------
// FUNC_CLASS_SYSTEM
{
name: "hostname",
class: FUNC_CLASS_SYSTEM,
help: `Returns the hostname as a string.`,
zaryFunc: bifs.BIF_hostname,
},
{
name: "os",
class: FUNC_CLASS_SYSTEM,
help: `Returns the operating-system name as a string.`,
zaryFunc: bifs.BIF_os,
},
{
name: "system",
class: FUNC_CLASS_SYSTEM,
help: `Run command string, yielding its stdout minus final carriage return.`,
unaryFunc: bifs.BIF_system,
},
{
name: "exec",
class: FUNC_CLASS_SYSTEM,
help: `'$output = exec(
"command",
["arg1", "arg2"],
{"env": ["ENV_VAR=ENV_VALUE", "ENV_VAR2=ENV_VALUE2"],
"dir": "/tmp/run_command_here",
"stdin_string": "this is input fed to program",
"combined_output": true
)'
Run a command via executable, path, args and environment, yielding its stdout minus final carriage return.`,
examples: []string{
`exec("echo", ["I don't do", "$SHELL things"], {"env": "SHELL=sh"}) outputs "I don't do $SHELL things"`,
},
variadicFunc: bifs.BIF_exec,
},
{
name: "version",
class: FUNC_CLASS_SYSTEM,
help: `Returns the Miller version as a string.`,
zaryFunc: bifs.BIF_version,
},
}
// Sort the function table. Useful for online help and autogenned docs / manpage.
// Go sort API: for ascending sort, return true if element i < element j.
// Put symbols like '||' after text like 'gsub', not before.
sort.Slice(lookupTable, func(i, j int) bool {
namei := lookupTable[i].name
namej := lookupTable[j].name
si := startsWithLetter(namei)
sj := startsWithLetter(namej)
if si && !sj {
return true
} else if !si && sj {
return false
} else {
if namei < namej {
return true
} else {
return false
}
}
})
return lookupTable
}
// ================================================================
type BuiltinFunctionManager struct {
// We need both the array and the hashmap since Go maps are not
// insertion-order-preserving: to produce a sensical help-all-functions
// list, etc., we want the original ordering.
lookupTable *[]BuiltinFunctionInfo
hashTable map[string]*BuiltinFunctionInfo
}
func NewBuiltinFunctionManager() *BuiltinFunctionManager {
lookupTable := makeBuiltinFunctionLookupTable()
hashTable := hashifyLookupTable(&lookupTable)
return &BuiltinFunctionManager{
lookupTable: &lookupTable,
hashTable: hashTable,
}
}
func (manager *BuiltinFunctionManager) LookUp(functionName string) *BuiltinFunctionInfo {
return manager.hashTable[functionName]
}
func hashifyLookupTable(lookupTable *[]BuiltinFunctionInfo) map[string]*BuiltinFunctionInfo {
hashTable := make(map[string]*BuiltinFunctionInfo)
for _, builtinFunctionInfo := range *lookupTable {
// Each function name should appear only once in the table. If it has
// multiple arities (e.g. unary and binary "-") there should be
// multiple function-pointers in a single row.
if hashTable[builtinFunctionInfo.name] != nil {
fmt.Fprintf(
os.Stderr,
"Internal coding error: function name \"%s\" is non-unique",
builtinFunctionInfo.name,
)
os.Exit(1)
}
clone := builtinFunctionInfo
hashTable[builtinFunctionInfo.name] = &clone
}
return hashTable
}
// ----------------------------------------------------------------
func (manager *BuiltinFunctionManager) ListBuiltinFunctionClasses() {
classesList := manager.getBuiltinFunctionClasses()
for _, class := range classesList {
fmt.Println(class)
}
}
func (manager *BuiltinFunctionManager) getBuiltinFunctionClasses() []string {
classesSeen := make(map[string]bool)
classesList := make([]string, 0)
for _, builtinFunctionInfo := range *manager.lookupTable {
class := string(builtinFunctionInfo.class)
if classesSeen[class] == false {
classesList = append(classesList, class)
classesSeen[class] = true
}
}
sort.Strings(classesList)
return classesList
}
// ----------------------------------------------------------------
func (manager *BuiltinFunctionManager) ListBuiltinFunctionsInClass(class string) {
for _, builtinFunctionInfo := range *manager.lookupTable {
if string(builtinFunctionInfo.class) == class {
fmt.Println(builtinFunctionInfo.name)
}
}
}
func (manager *BuiltinFunctionManager) ListBuiltinFunctionNamesVertically() {
for _, builtinFunctionInfo := range *manager.lookupTable {
fmt.Println(builtinFunctionInfo.name)
}
}
func (manager *BuiltinFunctionManager) ListBuiltinFunctionNamesAsParagraph() {
functionNames := make([]string, len(*manager.lookupTable))
for i, builtinFunctionInfo := range *manager.lookupTable {
functionNames[i] = builtinFunctionInfo.name
}
lib.PrintWordsAsParagraph(functionNames)
}
func (manager *BuiltinFunctionManager) ListBuiltinFunctionsAsTable() {
fmt.Printf("%-30s %-12s %s\n", "Name", "Class", "Args")
for _, builtinFunctionInfo := range *manager.lookupTable {
fmt.Printf("%-30s %-12s %s\n",
builtinFunctionInfo.name,
builtinFunctionInfo.class,
describeNargs(&builtinFunctionInfo),
)
}
}
// ----------------------------------------------------------------
func (manager *BuiltinFunctionManager) ListBuiltinFunctionUsages() {
for i, builtinFunctionInfo := range *manager.lookupTable {
if i > 0 {
fmt.Println()
}
manager.showSingleUsage(&builtinFunctionInfo)
}
}
func (manager *BuiltinFunctionManager) ListBuiltinFunctionUsagesByClass() {
classesList := manager.getBuiltinFunctionClasses()
for _, class := range classesList {
fmt.Println()
fmt.Println(colorizer.MaybeColorizeHelp(strings.ToUpper(class), true))
fmt.Println()
for _, builtinFunctionInfo := range *manager.lookupTable {
if string(builtinFunctionInfo.class) != class {
continue
}
manager.showSingleUsage(&builtinFunctionInfo)
}
}
}
func (manager *BuiltinFunctionManager) ListBuiltinFunctionUsage(functionName string) {
if !manager.TryListBuiltinFunctionUsage(functionName) {
fmt.Fprintf(os.Stderr, "Function \"%s\" not found.\n", functionName)
}
}
func (manager *BuiltinFunctionManager) TryListBuiltinFunctionUsage(
functionName string,
) bool {
builtinFunctionInfo := manager.LookUp(functionName)
if builtinFunctionInfo == nil {
return false
}
manager.listBuiltinFunctionUsageExact(builtinFunctionInfo)
return true
}
func (manager *BuiltinFunctionManager) TryListBuiltinFunctionUsageApproximate(
searchString string,
) bool {
found := false
for _, builtinFunctionInfo := range *manager.lookupTable {
if strings.Contains(builtinFunctionInfo.name, searchString) {
manager.showSingleUsage(&builtinFunctionInfo)
found = true
}
}
return found
}
func (manager *BuiltinFunctionManager) listBuiltinFunctionUsageExact(
builtinFunctionInfo *BuiltinFunctionInfo,
) {
manager.showSingleUsage(builtinFunctionInfo)
}
func (manager *BuiltinFunctionManager) showSingleUsage(
builtinFunctionInfo *BuiltinFunctionInfo,
) {
lib.InternalCodingErrorIf(builtinFunctionInfo.help == "")
fmt.Printf("%s (class=%s #args=%s) %s\n",
colorizer.MaybeColorizeHelp(builtinFunctionInfo.name, true),
builtinFunctionInfo.class,
describeNargs(builtinFunctionInfo),
builtinFunctionInfo.JoinHelp(),
)
if len(builtinFunctionInfo.examples) == 1 {
fmt.Println("Example:")
}
if len(builtinFunctionInfo.examples) > 1 {
fmt.Println("Examples:")
}
for _, example := range builtinFunctionInfo.examples {
fmt.Println(example)
}
}
func (manager *BuiltinFunctionManager) ListBuiltinFunctionUsageApproximate(
text string,
) bool {
found := false
for _, builtinFunctionInfo := range *manager.lookupTable {
if strings.Contains(builtinFunctionInfo.name, text) {
fmt.Printf(" %s\n", builtinFunctionInfo.name)
found = true
}
}
return found
}
func describeNargs(info *BuiltinFunctionInfo) string {
if info.hasMultipleArities {
pieces := make([]string, 0)
if info.zaryFunc != nil {
pieces = append(pieces, "0")
}
if info.unaryFunc != nil {
pieces = append(pieces, "1")
}
if info.unaryFuncWithContext != nil {
pieces = append(pieces, "1")
}
if info.binaryFunc != nil {
pieces = append(pieces, "2")
}
if info.regexCaptureBinaryFunc != nil {
pieces = append(pieces, "2")
}
if info.ternaryFunc != nil {
pieces = append(pieces, "3")
}
return strings.Join(pieces, ",")
} else {
if info.zaryFunc != nil {
return "0"
}
if info.unaryFunc != nil {
return "1"
}
if info.unaryFuncWithContext != nil {
return "1"
}
if info.binaryFunc != nil {
return "2"
}
if info.binaryFuncWithState != nil {
return "2"
}
if info.regexCaptureBinaryFunc != nil {
return "2"
}
if info.ternaryFunc != nil {
return "3"
}
if info.ternaryFuncWithState != nil {
return "3"
}
if info.variadicFunc != nil || info.variadicFuncWithState != nil {
if info.maximumVariadicArity != 0 {
return fmt.Sprintf("%d-%d", info.minimumVariadicArity, info.maximumVariadicArity)
} else {
return "variadic"
}
}
}
lib.InternalCodingErrorIf(true)
return "(error)" // solely to appease the Go compiler; not reached
}
var multiSpaceRegex = regexp.MustCompile(`\s+`)
// JoinHelp must be used to format any function help-strings for output. for
// source-code storage, these have newlines in them. For any presentation to
// the user, they must be formatted using the JoinHelp() method which joins
// newlines. This is crucial for rendering of help-strings for manual page,
// webdocs, etc wherein we must let the user's resizing of the terminal window
// or browser determine -- at their choosing -- where lines wrap.
func (info *BuiltinFunctionInfo) JoinHelp() string {
return multiSpaceRegex.ReplaceAllString(strings.ReplaceAll(info.help, "\n", " "), " ")
}
// ================================================================
// This is a singleton so the online-help functions can query it for listings,
// online help, etc.
var BuiltinFunctionManagerInstance *BuiltinFunctionManager = NewBuiltinFunctionManager()