forked from johnkerl/miller
-
Notifications
You must be signed in to change notification settings - Fork 0
/
group_like.go
125 lines (102 loc) · 3.22 KB
/
group_like.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
package transformers
import (
"container/list"
"fmt"
"os"
"strings"
"github.com/johnkerl/miller/internal/pkg/cli"
"github.com/johnkerl/miller/internal/pkg/lib"
"github.com/johnkerl/miller/internal/pkg/types"
)
// ----------------------------------------------------------------
const verbNameGroupLike = "group-like"
var GroupLikeSetup = TransformerSetup{
Verb: verbNameGroupLike,
UsageFunc: transformerGroupLikeUsage,
ParseCLIFunc: transformerGroupLikeParseCLI,
IgnoresInput: false,
}
func transformerGroupLikeUsage(
o *os.File,
) {
fmt.Fprintf(o, "Usage: %s %s [options]\n", "mlr", verbNameGroupLike)
fmt.Fprintln(o, "Outputs records in batches having identical field names.")
fmt.Fprintln(o, "Options:")
fmt.Fprintln(o, "-h|--help Show this message.")
}
func transformerGroupLikeParseCLI(
pargi *int,
argc int,
args []string,
_ *cli.TOptions,
doConstruct bool, // false for first pass of CLI-parse, true for second pass
) IRecordTransformer {
// Skip the verb name from the current spot in the mlr command line
argi := *pargi
argi++
for argi < argc /* variable increment: 1 or 2 depending on flag */ {
opt := args[argi]
if !strings.HasPrefix(opt, "-") {
break // No more flag options to process
}
if args[argi] == "--" {
break // All transformers must do this so main-flags can follow verb-flags
}
argi++
if opt == "-h" || opt == "--help" {
transformerGroupLikeUsage(os.Stdout)
os.Exit(0)
} else {
transformerGroupLikeUsage(os.Stderr)
os.Exit(1)
}
}
*pargi = argi
if !doConstruct { // All transformers must do this for main command-line parsing
return nil
}
transformer, err := NewTransformerGroupLike()
if err != nil {
fmt.Fprintln(os.Stderr, err)
os.Exit(1)
}
return transformer
}
// ----------------------------------------------------------------
type TransformerGroupLike struct {
// map from string to *list.List
recordListsByGroup *lib.OrderedMap
}
func NewTransformerGroupLike() (*TransformerGroupLike, error) {
tr := &TransformerGroupLike{
recordListsByGroup: lib.NewOrderedMap(),
}
return tr, nil
}
// ----------------------------------------------------------------
func (tr *TransformerGroupLike) Transform(
inrecAndContext *types.RecordAndContext,
outputRecordsAndContexts *list.List, // list of *types.RecordAndContext
inputDownstreamDoneChannel <-chan bool,
outputDownstreamDoneChannel chan<- bool,
) {
HandleDefaultDownstreamDone(inputDownstreamDoneChannel, outputDownstreamDoneChannel)
if !inrecAndContext.EndOfStream {
inrec := inrecAndContext.Record
groupingKey := inrec.GetKeysJoined()
recordListForGroup := tr.recordListsByGroup.Get(groupingKey)
if recordListForGroup == nil { // first time
recordListForGroup = list.New()
tr.recordListsByGroup.Put(groupingKey, recordListForGroup)
}
recordListForGroup.(*list.List).PushBack(inrecAndContext)
} else {
for outer := tr.recordListsByGroup.Head; outer != nil; outer = outer.Next {
recordListForGroup := outer.Value.(*list.List)
for inner := recordListForGroup.Front(); inner != nil; inner = inner.Next() {
outputRecordsAndContexts.PushBack(inner.Value.(*types.RecordAndContext))
}
}
outputRecordsAndContexts.PushBack(inrecAndContext) // end-of-stream marker
}
}