1
1
mirror of https://github.com/wader/fq.git synced 2024-11-24 11:16:09 +03:00
fq/pkg/interp/decode.go

709 lines
16 KiB
Go
Raw Normal View History

2020-06-08 03:29:51 +03:00
package interp
import (
"bytes"
2020-06-08 03:29:51 +03:00
"errors"
2021-08-12 00:51:00 +03:00
"fmt"
2020-06-08 03:29:51 +03:00
"io"
"io/ioutil"
2020-06-08 03:29:51 +03:00
"math/big"
"strings"
"time"
2020-06-08 03:29:51 +03:00
"github.com/mitchellh/mapstructure"
"github.com/wader/fq/internal/bitioextra"
"github.com/wader/fq/internal/gojqextra"
"github.com/wader/fq/internal/ioextra"
"github.com/wader/fq/pkg/bitio"
"github.com/wader/fq/pkg/decode"
"github.com/wader/fq/pkg/scalar"
"github.com/wader/gojq"
2020-06-08 03:29:51 +03:00
)
func init() {
functionRegisterFns = append(functionRegisterFns, func(i *Interp) []Function {
return []Function{
{"_registry", 0, 0, i._registry, nil},
{"_tovalue", 1, 1, i._toValue, nil},
{"_decode", 2, 2, i._decode, nil},
}
})
}
2021-08-12 00:51:00 +03:00
// expectedExtkeyError reports that Key was looked up as an extkey but is not
// one that the value supports.
type expectedExtkeyError struct {
	Key string
}

// Error implements the error interface.
func (e expectedExtkeyError) Error() string {
	const prefix = "expected a extkey but got: "
	return prefix + e.Key
}
// TODO: redo/rename
// used by _isDecodeValue
2021-09-23 19:35:04 +03:00
type DecodeValue interface {
2021-09-27 12:01:14 +03:00
Value
ToBinary
2021-09-23 19:35:04 +03:00
DecodeValue() *decode.Value
2020-06-08 03:29:51 +03:00
}
// _registry returns a description of the format registry as a jq object of
// the shape:
//
//	{groups: {<group name>: [<format name>, ...]}, formats: {<format name>: {...}}}
//
// Every format object carries name, description, probe_order, root_name,
// root_array and to_repr. dependencies and groups are only present when
// non-empty, files only when the format has a file set; files maps each entry
// name to its content as a string.
//
// An error from listing, opening or reading a format's files is returned as
// the function's value. The arguments c and a are not used.
func (i *Interp) _registry(c interface{}, a []interface{}) interface{} {
	uniqueFormats := map[string]decode.Format{}

	groups := map[string]interface{}{}
	formats := map[string]interface{}{}

	for fsName := range i.registry.Groups {
		var group []interface{}

		for _, f := range i.registry.MustGroup(fsName) {
			group = append(group, f.Name)
			// a format can be a member of several groups, describe it once
			if _, ok := uniqueFormats[f.Name]; ok {
				continue
			}
			uniqueFormats[f.Name] = f
		}

		groups[fsName] = group
	}

	for _, f := range uniqueFormats {
		vf := map[string]interface{}{
			"name":        f.Name,
			"description": f.Description,
			"probe_order": f.ProbeOrder,
			"root_name":   f.RootName,
			"root_array":  f.RootArray,
			"to_repr":     f.ToRepr,
		}

		var dependenciesVs []interface{}
		for _, d := range f.Dependencies {
			var dNamesVs []interface{}
			for _, n := range d.Names {
				dNamesVs = append(dNamesVs, n)
			}
			dependenciesVs = append(dependenciesVs, dNamesVs)
		}
		if len(dependenciesVs) > 0 {
			vf["dependencies"] = dependenciesVs
		}

		var groupsVs []interface{}
		for _, n := range f.Groups {
			groupsVs = append(groupsVs, n)
		}
		if len(groupsVs) > 0 {
			vf["groups"] = groupsVs
		}

		if f.Files != nil {
			files := map[string]interface{}{}

			entries, err := f.Files.ReadDir(".")
			if err != nil {
				return err
			}

			for _, e := range entries {
				fh, err := f.Files.Open(e.Name())
				if err != nil {
					return err
				}
				b, err := ioutil.ReadAll(fh)
				// Release the handle on every path before looking at the read
				// error. The handle is read-only so a close error can't lose data.
				_ = fh.Close()
				if err != nil {
					return err
				}
				files[e.Name()] = string(b)
			}

			vf["files"] = files
		}

		formats[f.Name] = vf
	}

	return map[string]interface{}{
		"groups":  groups,
		"formats": formats,
	}
}
// _toValue converts the input c to a plain jq value using toValue, with
// options taken from a[0]. The "ok" result of toValue is dropped, so an input
// that can't be converted yields nil.
func (i *Interp) _toValue(c interface{}, a []interface{}) interface{} {
	// handed over as a closure so Options is only built if the conversion
	// actually asks for it
	lazyOpts := func() Options { return i.Options(a[0]) }
	converted, _ := toValue(lazyOpts, c)
	return converted
}
// _decode decodes the input c using the format or group named by a[0] and
// returns the resulting decode value wrapped as a jq value.
//
// a[1] holds the options: filename, force and _progress are picked out, all
// remaining keys are passed on as format options. If c is an *openFile its
// filename replaces the filename option and, when _progress is set, a
// throttled progress callback is installed for the duration of the decode.
//
// Errors from converting c to a binary, converting a[0] to a string or looking
// up the format are returned as-is. If decoding yields no value a valueError
// is returned, carrying either the list of per-format error values or the
// plain error.
func (i *Interp) _decode(c interface{}, a []interface{}) interface{} {
var opts struct {
Filename string `mapstructure:"filename"`
Force bool `mapstructure:"force"`
Progress string `mapstructure:"_progress"`
Remain map[string]interface{} `mapstructure:",remain"`
}
// NOTE(review): the error from decoding the options is explicitly discarded;
// confirm that malformed options are meant to be ignored silently.
_ = mapstructure.Decode(a[1], &opts)
// TODO: progress hack
// would be nice to move all progress code into decode but it might be
// tricky to keep track of absolute positions in the underlying readers
// when it uses BitBuf slices, maybe only in Pos()?
if bbf, ok := c.(*openFile); ok {
opts.Filename = bbf.filename
if opts.Progress != "" {
// evalProgress calls the function named by opts.Progress with c as input,
// discarding both its output and its result
evalProgress := func(c interface{}) {
// {approx_read_bytes: 123, total_size: 123} | opts.Progress
_, _ = i.EvalFuncValues(
i.evalInstance.ctx,
c,
opts.Progress,
nil,
EvalOpts{output: ioextra.DiscardCtxWriter{Ctx: i.evalInstance.ctx}},
)
}
lastProgress := time.Now()
bbf.progressFn = func(approxReadBytes, totalSize int64) {
// make sure to not call too often as it's quite expensive
n := time.Now()
if n.Sub(lastProgress) < 200*time.Millisecond {
return
}
lastProgress = n
evalProgress(
map[string]interface{}{
"approx_read_bytes": approxReadBytes,
"total_size": totalSize,
},
)
}
// when done decoding, tell progress function we're done and disable it
defer func() {
bbf.progressFn = nil
evalProgress(nil)
}()
}
}
bv, err := toBinary(c)
if err != nil {
return err
}
formatName, err := toString(a[0])
if err != nil {
return err
}
decodeFormat, err := i.registry.Group(formatName)
if err != nil {
return err
}
dv, _, err := decode.Decode(i.evalInstance.ctx, bv.br, decodeFormat,
decode.Options{
IsRoot: true,
FillGaps: true,
Force: opts.Force,
Range: bv.r,
Description: opts.Filename,
FormatOptions: opts.Remain,
},
)
// err is only inspected when no value at all was produced; when a value is
// returned it is used regardless of err
if dv == nil {
var decodeFormatsErr decode.FormatsError
if errors.As(err, &decodeFormatsErr) {
var vs []interface{}
for _, fe := range decodeFormatsErr.Errs {
vs = append(vs, fe.Value())
}
return valueError{vs}
}
return valueError{err}
}
return makeDecodeValue(dv)
}
2021-09-28 00:06:46 +03:00
// valueKey dispatches a key lookup by name: names starting with "_" are
// resolved by a, every other name by b. The result of the chosen function is
// returned unchanged.
func valueKey(name string, a, b func(name string) interface{}) interface{} {
	if strings.HasPrefix(name, "_") {
		return a(name)
	}
	return b(name)
}
2021-09-28 00:06:46 +03:00
// valueHas answers a "has key" query. A string key starting with "_" is
// looked up with a: if that lookup yields an error the error is returned,
// otherwise true. Any other key, string or not, is delegated to b.
func valueHas(key interface{}, a func(name string) interface{}, b func(key interface{}) interface{}) interface{} {
	name, isString := key.(string)
	if !isString || !strings.HasPrefix(name, "_") {
		return b(key)
	}

	if lookupErr, failed := a(name).(error); failed {
		return lookupErr
	}
	return true
}
2021-08-12 00:51:00 +03:00
// toValue converts v to a plain jq value. The second result reports whether v
// was of a supported type.
//
// Values implementing JQValueEx are converted with options, values
// implementing gojq.JQValue without; plain jq types are returned as they are.
//
// optsFn is a function rather than a value as toValue is used by tovalue/0
// and needs to be fast.
func toValue(optsFn func() Options, v interface{}) (interface{}, bool) {
	if ex, ok := v.(JQValueEx); ok {
		return ex.JQValueToGoJQEx(optsFn), true
	}
	if jv, ok := v.(gojq.JQValue); ok {
		return jv.JQValueToGoJQ(), true
	}

	switch v.(type) {
	case nil, bool, float64, int, string, *big.Int, map[string]interface{}, []interface{}:
		return v, true
	}
	return nil, false
}
func makeDecodeValue(dv *decode.Value) interface{} {
2020-06-08 03:29:51 +03:00
switch vv := dv.V.(type) {
case *decode.Compound:
if vv.IsArray {
return NewArrayDecodeValue(dv, vv)
2020-06-08 03:29:51 +03:00
}
return NewStructDecodeValue(dv, vv)
case *scalar.S:
switch vv := vv.Value().(type) {
case bitio.ReaderAtSeeker:
// is lazy so that in situations where the decode value is only used to
// create another binary we don't have to read and create a string, ex:
// .unknown0 | tobytes[1:] | ...
return decodeValue{
JQValue: &gojqextra.Lazy{
Type: "string",
IsScalar: true,
Fn: func() (gojq.JQValue, error) {
buf := &bytes.Buffer{}
vvC, err := bitioextra.Clone(vv)
if err != nil {
return nil, err
}
if _, err := bitioextra.CopyBits(buf, vvC); err != nil {
return nil, err
}
return gojqextra.String([]rune(buf.String())), nil
},
},
decodeValueBase: decodeValueBase{dv},
bitsFormat: true,
}
case bool:
return decodeValue{
JQValue: gojqextra.Boolean(vv),
decodeValueBase: decodeValueBase{dv},
}
case int:
return decodeValue{
JQValue: gojqextra.Number{V: vv},
decodeValueBase: decodeValueBase{dv},
}
case int64:
return decodeValue{
JQValue: gojqextra.Number{V: big.NewInt(vv)},
decodeValueBase: decodeValueBase{dv},
}
case uint64:
return decodeValue{
JQValue: gojqextra.Number{V: new(big.Int).SetUint64(vv)},
decodeValueBase: decodeValueBase{dv},
}
case float64:
return decodeValue{
JQValue: gojqextra.Number{V: vv},
decodeValueBase: decodeValueBase{dv},
}
case string:
return decodeValue{
JQValue: gojqextra.String(vv),
decodeValueBase: decodeValueBase{dv},
}
case []interface{}:
return decodeValue{
JQValue: gojqextra.Array(vv),
decodeValueBase: decodeValueBase{dv},
}
case map[string]interface{}:
return decodeValue{
JQValue: gojqextra.Object(vv),
decodeValueBase: decodeValueBase{dv},
}
case nil:
return decodeValue{
JQValue: gojqextra.Null{},
decodeValueBase: decodeValueBase{dv},
}
case *big.Int:
return decodeValue{
JQValue: gojqextra.Number{V: vv},
decodeValueBase: decodeValueBase{dv},
}
default:
panic(fmt.Sprintf("unreachable vv %#+v", vv))
2020-06-08 03:29:51 +03:00
}
default:
panic(fmt.Sprintf("unreachable dv %#+v", dv))
2020-06-08 03:29:51 +03:00
}
}
// decodeValueBase holds the decode value behind a jq value and carries the
// methods shared by the scalar, array and struct decode value types, which
// all embed it.
type decodeValueBase struct {
dv *decode.Value
}
2021-09-23 19:35:04 +03:00
// DecodeValue returns the underlying decode value.
func (dvb decodeValueBase) DecodeValue() *decode.Value {
return dvb.dv
}
2020-06-08 03:29:51 +03:00
// Display delegates to dump, passing the underlying decode value, w and opts.
func (dvb decodeValueBase) Display(w io.Writer, opts Options) error { return dump(dvb.dv, w, opts) }
func (dvb decodeValueBase) ToBinary() (Binary, error) {
return Binary{br: dvb.dv.RootReader, r: dvb.dv.InnerRange(), unit: 8}, nil
2020-06-08 03:29:51 +03:00
}
// ExtType returns the extended type name, which is "decode_value" for all
// decode values.
func (decodeValueBase) ExtType() string { return "decode_value" }
2020-06-08 03:29:51 +03:00
func (dvb decodeValueBase) ExtKeys() []string {
kv := []string{
"_start",
"_stop",
"_len",
"_name",
"_root",
"_buffer_root",
"_format_root",
"_parent",
"_actual",
"_sym",
2020-06-08 03:29:51 +03:00
"_description",
"_path",
"_bits",
"_bytes",
"_unknown",
"_index", // TODO: only if parent is array?
2020-06-08 03:29:51 +03:00
}
if _, ok := dvb.dv.V.(*decode.Compound); ok {
kv = append(kv,
"_error",
"_format",
)
if dvb.dv.Index != -1 {
kv = append(kv, "_index")
}
2020-06-08 03:29:51 +03:00
}
return kv
}
func (dvb decodeValueBase) JQValueKey(name string) interface{} {
2021-08-12 00:51:00 +03:00
dv := dvb.dv
switch name {
case "_start":
return big.NewInt(dv.Range.Start)
case "_stop":
return big.NewInt(dv.Range.Stop())
case "_len":
return big.NewInt(dv.Range.Len)
case "_name":
return dv.Name
case "_root":
return makeDecodeValue(dv.Root())
case "_buffer_root":
// TODO: rename?
return makeDecodeValue(dv.BufferRoot())
case "_format_root":
// TODO: rename?
return makeDecodeValue(dv.FormatRoot())
case "_parent":
if dv.Parent == nil {
return nil
}
return makeDecodeValue(dv.Parent)
case "_actual":
switch vv := dv.V.(type) {
case *scalar.S:
jv, ok := gojqextra.ToGoJQValue(vv.Actual)
if !ok {
return fmt.Errorf("can't convert actual value jq value %#+v", vv.Actual)
}
return jv
default:
return nil
}
case "_sym":
switch vv := dv.V.(type) {
case *scalar.S:
jv, ok := gojqextra.ToGoJQValue(vv.Sym)
if !ok {
return fmt.Errorf("can't convert sym value jq value %#+v", vv.Actual)
}
return jv
default:
return nil
}
2021-08-12 00:51:00 +03:00
case "_description":
switch vv := dv.V.(type) {
case *decode.Compound:
if vv.Description == "" {
return nil
}
return vv.Description
case *scalar.S:
if vv.Description == "" {
return nil
}
return vv.Description
default:
return nil
}
2021-08-12 00:51:00 +03:00
case "_path":
return valuePath(dv)
case "_error":
switch vv := dv.V.(type) {
case *decode.Compound:
var formatErr decode.FormatError
if errors.As(vv.Err, &formatErr) {
return formatErr.Value()
2021-08-12 00:51:00 +03:00
}
return vv.Err
default:
return nil
2020-06-08 03:29:51 +03:00
}
2021-08-12 00:51:00 +03:00
case "_bits":
return Binary{
br: dv.RootReader,
2021-10-05 23:26:05 +03:00
r: dv.Range,
unit: 1,
2021-08-12 00:51:00 +03:00
}
case "_bytes":
return Binary{
br: dv.RootReader,
2021-10-05 23:26:05 +03:00
r: dv.Range,
unit: 8,
2021-08-12 00:51:00 +03:00
}
case "_format":
switch vv := dv.V.(type) {
case *decode.Compound:
if vv.Format != nil {
return vv.Format.Name
}
return nil
case *scalar.S:
// TODO: hack, Scalar interface?
switch vv.Actual.(type) {
case map[string]interface{}, []interface{}:
return "json"
default:
return nil
}
default:
2021-08-12 00:51:00 +03:00
return nil
}
case "_unknown":
switch vv := dv.V.(type) {
case *scalar.S:
return vv.Unknown
default:
return false
}
case "_index":
if dv.Index != -1 {
return dv.Index
}
2020-06-08 03:29:51 +03:00
}
2021-08-12 00:51:00 +03:00
return expectedExtkeyError{Key: name}
2020-06-08 03:29:51 +03:00
}
2021-09-23 19:35:04 +03:00
var _ DecodeValue = decodeValue{}
2020-06-08 03:29:51 +03:00
type decodeValue struct {
2021-08-12 00:51:00 +03:00
gojq.JQValue
decodeValueBase
bitsFormat bool
2021-08-12 00:51:00 +03:00
}
func (v decodeValue) JQValueKey(name string) interface{} {
2021-09-28 00:06:46 +03:00
return valueKey(name, v.decodeValueBase.JQValueKey, v.JQValue.JQValueKey)
}
func (v decodeValue) JQValueHas(key interface{}) interface{} {
return valueHas(key, v.decodeValueBase.JQValueKey, v.JQValue.JQValueHas)
2021-08-12 00:51:00 +03:00
}
func (v decodeValue) JQValueToGoJQEx(optsFn func() Options) interface{} {
if !v.bitsFormat {
return v.JQValueToGoJQ()
2021-08-12 00:51:00 +03:00
}
bv, err := v.decodeValueBase.ToBinary()
if err != nil {
return err
2020-06-08 03:29:51 +03:00
}
br, err := bv.toReader()
if err != nil {
return err
}
brC, err := bitioextra.Clone(br)
if err != nil {
return err
2020-06-08 03:29:51 +03:00
}
s, err := optsFn().BitsFormatFn(brC)
if err != nil {
return err
}
return s
2020-06-08 03:29:51 +03:00
}
// decode value array
2021-09-23 19:35:04 +03:00
var _ DecodeValue = ArrayDecodeValue{}
2020-06-08 03:29:51 +03:00
2021-09-27 12:01:14 +03:00
type ArrayDecodeValue struct {
2021-08-12 00:51:00 +03:00
gojqextra.Base
decodeValueBase
*decode.Compound
2020-06-08 03:29:51 +03:00
}
func NewArrayDecodeValue(dv *decode.Value, c *decode.Compound) ArrayDecodeValue {
2021-09-27 12:01:14 +03:00
return ArrayDecodeValue{
2021-08-12 00:51:00 +03:00
decodeValueBase: decodeValueBase{dv},
Base: gojqextra.Base{Typ: "array"},
Compound: c,
2021-08-12 00:51:00 +03:00
}
}
2021-09-27 12:01:14 +03:00
func (v ArrayDecodeValue) JQValueKey(name string) interface{} {
2021-09-28 00:06:46 +03:00
return valueKey(name, v.decodeValueBase.JQValueKey, v.Base.JQValueKey)
2021-08-12 00:51:00 +03:00
}
// JQValueSliceLen returns the number of children of the array.
func (v ArrayDecodeValue) JQValueSliceLen() interface{} { return len(v.Compound.Children) }
// JQValueLength returns the number of children of the array.
func (v ArrayDecodeValue) JQValueLength() interface{} { return len(v.Compound.Children) }
2021-09-27 12:01:14 +03:00
func (v ArrayDecodeValue) JQValueIndex(index int) interface{} {
2020-06-08 03:29:51 +03:00
// -1 outside after string, -2 outside before string
if index < 0 {
return nil
}
return makeDecodeValue((v.Compound.Children)[index])
2020-06-08 03:29:51 +03:00
}
2021-09-27 12:01:14 +03:00
func (v ArrayDecodeValue) JQValueSlice(start int, end int) interface{} {
2020-06-08 03:29:51 +03:00
vs := make([]interface{}, end-start)
for i, e := range (v.Compound.Children)[start:end] {
vs[i] = makeDecodeValue(e)
2020-06-08 03:29:51 +03:00
}
return vs
}
2021-09-27 12:01:14 +03:00
// JQValueUpdate always fails with a NonUpdatableTypeError naming the key and
// the "array" type; u and delpath are ignored.
func (v ArrayDecodeValue) JQValueUpdate(key interface{}, u interface{}, delpath bool) interface{} {
return gojqextra.NonUpdatableTypeError{Key: fmt.Sprintf("%v", key), Typ: "array"}
}
2021-09-27 12:01:14 +03:00
func (v ArrayDecodeValue) JQValueEach() interface{} {
props := make([]gojq.PathValue, len(v.Compound.Children))
for i, f := range v.Compound.Children {
props[i] = gojq.PathValue{Path: i, Value: makeDecodeValue(f)}
2020-06-08 03:29:51 +03:00
}
return props
}
2021-09-27 12:01:14 +03:00
func (v ArrayDecodeValue) JQValueKeys() interface{} {
vs := make([]interface{}, len(v.Compound.Children))
for i := range v.Compound.Children {
2020-06-08 03:29:51 +03:00
vs[i] = i
}
return vs
}
2021-09-27 12:01:14 +03:00
func (v ArrayDecodeValue) JQValueHas(key interface{}) interface{} {
2021-09-28 00:06:46 +03:00
return valueHas(
key,
v.decodeValueBase.JQValueKey,
func(key interface{}) interface{} {
intKey, ok := key.(int)
if !ok {
return gojqextra.HasKeyTypeError{L: "array", R: fmt.Sprintf("%v", key)}
}
return intKey >= 0 && intKey < len(v.Compound.Children)
2021-09-28 00:06:46 +03:00
})
2020-06-08 03:29:51 +03:00
}
2021-09-27 12:01:14 +03:00
func (v ArrayDecodeValue) JQValueToGoJQ() interface{} {
vs := make([]interface{}, len(v.Compound.Children))
for i, f := range v.Compound.Children {
vs[i] = makeDecodeValue(f)
2020-06-08 03:29:51 +03:00
}
return vs
}
// decode value struct
2021-09-23 19:35:04 +03:00
var _ DecodeValue = StructDecodeValue{}
2020-06-08 03:29:51 +03:00
2021-09-27 12:01:14 +03:00
type StructDecodeValue struct {
2021-08-12 00:51:00 +03:00
gojqextra.Base
decodeValueBase
*decode.Compound
2020-06-08 03:29:51 +03:00
}
func NewStructDecodeValue(dv *decode.Value, c *decode.Compound) StructDecodeValue {
2021-09-27 12:01:14 +03:00
return StructDecodeValue{
2021-08-12 00:51:00 +03:00
decodeValueBase: decodeValueBase{dv},
Base: gojqextra.Base{Typ: "object"},
Compound: c,
2021-08-12 00:51:00 +03:00
}
}
// JQValueLength returns the number of children (fields) of the struct.
func (v StructDecodeValue) JQValueLength() interface{} { return len(v.Compound.Children) }
// JQValueSliceLen returns the number of children (fields) of the struct.
func (v StructDecodeValue) JQValueSliceLen() interface{} { return len(v.Compound.Children) }
2021-09-27 12:01:14 +03:00
func (v StructDecodeValue) JQValueKey(name string) interface{} {
2021-08-12 00:51:00 +03:00
if strings.HasPrefix(name, "_") {
return v.decodeValueBase.JQValueKey(name)
}
for _, f := range v.Compound.Children {
2020-06-08 03:29:51 +03:00
if f.Name == name {
return makeDecodeValue(f)
2020-06-08 03:29:51 +03:00
}
}
return nil
}
2021-09-27 12:01:14 +03:00
// JQValueUpdate always fails with a NonUpdatableTypeError naming the key and
// the "object" type; u and delpath are ignored.
func (v StructDecodeValue) JQValueUpdate(key interface{}, u interface{}, delpath bool) interface{} {
return gojqextra.NonUpdatableTypeError{Key: fmt.Sprintf("%v", key), Typ: "object"}
}
2021-09-27 12:01:14 +03:00
func (v StructDecodeValue) JQValueEach() interface{} {
props := make([]gojq.PathValue, len(v.Compound.Children))
for i, f := range v.Compound.Children {
props[i] = gojq.PathValue{Path: f.Name, Value: makeDecodeValue(f)}
2020-06-08 03:29:51 +03:00
}
return props
}
2021-09-27 12:01:14 +03:00
func (v StructDecodeValue) JQValueKeys() interface{} {
vs := make([]interface{}, len(v.Compound.Children))
for i, f := range v.Compound.Children {
2020-06-08 03:29:51 +03:00
vs[i] = f.Name
}
return vs
}
2021-09-27 12:01:14 +03:00
func (v StructDecodeValue) JQValueHas(key interface{}) interface{} {
2021-09-28 00:06:46 +03:00
return valueHas(
key,
v.decodeValueBase.JQValueKey,
func(key interface{}) interface{} {
stringKey, ok := key.(string)
if !ok {
return gojqextra.HasKeyTypeError{L: "object", R: fmt.Sprintf("%v", key)}
}
for _, f := range v.Compound.Children {
2021-09-28 00:06:46 +03:00
if f.Name == stringKey {
return true
}
}
return false
},
)
2020-06-08 03:29:51 +03:00
}
2021-09-27 12:01:14 +03:00
func (v StructDecodeValue) JQValueToGoJQ() interface{} {
vm := make(map[string]interface{}, len(v.Compound.Children))
for _, f := range v.Compound.Children {
vm[f.Name] = makeDecodeValue(f)
2020-06-08 03:29:51 +03:00
}
return vm
}