From 28c0f0d30cf61163e636c88f285b0f41dba6bece Mon Sep 17 00:00:00 2001 From: marco Date: Tue, 7 Jan 2025 23:18:45 +0100 Subject: [PATCH] log warning if local items have conflicting names --- cmd/crowdsec-cli/clihub/items.go | 2 +- pkg/cwhub/hub.go | 1 + pkg/cwhub/state.go | 3 +- pkg/cwhub/state_test.go | 1 + pkg/cwhub/sync.go | 376 +++++++++++++++++---------- test/bats/20_hub_items.bats | 17 +- test/bats/cscli-hubtype-install.bats | 32 +++ test/bats/cscli-hubtype-list.bats | 2 +- 8 files changed, 288 insertions(+), 146 deletions(-) diff --git a/cmd/crowdsec-cli/clihub/items.go b/cmd/crowdsec-cli/clihub/items.go index 730d2208be0..87cb10b1f93 100644 --- a/cmd/crowdsec-cli/clihub/items.go +++ b/cmd/crowdsec-cli/clihub/items.go @@ -63,7 +63,7 @@ func ListItems(out io.Writer, wantColor string, itemTypes []string, items map[st continue } - listHubItemTable(out, wantColor, "\n"+strings.ToUpper(itemType), items[itemType]) + listHubItemTable(out, wantColor, strings.ToUpper(itemType), items[itemType]) nothingToDisplay = false } diff --git a/pkg/cwhub/hub.go b/pkg/cwhub/hub.go index 998a4032359..aeccb3268f7 100644 --- a/pkg/cwhub/hub.go +++ b/pkg/cwhub/hub.go @@ -171,6 +171,7 @@ func (h *Hub) Update(ctx context.Context, indexProvider IndexProvider, withConte return nil } +// addItem adds an item to the hub. It silently replaces an existing item with the same type and name. func (h *Hub) addItem(item *Item) { if h.items[item.Type] == nil { h.items[item.Type] = make(map[string]*Item) diff --git a/pkg/cwhub/state.go b/pkg/cwhub/state.go index 518185aff1c..03e10671afb 100644 --- a/pkg/cwhub/state.go +++ b/pkg/cwhub/state.go @@ -11,6 +11,7 @@ type ItemState struct { LocalVersion string `json:"local_version,omitempty" yaml:"local_version,omitempty"` LocalHash string `json:"local_hash,omitempty" yaml:"local_hash,omitempty"` Installed bool `json:"installed"` + local bool Downloaded bool `json:"downloaded"` UpToDate bool `json:"up_to_date"` Tainted bool `json:"tainted"` @@ -20,7 +21,7 @@ type ItemState struct { // IsLocal returns true if the item has been create by a user (not downloaded from the hub). func (s *ItemState) IsLocal() bool { - return s.Installed && !s.Downloaded + return s.local } // Text returns the status of the item as a string (eg. "enabled,update-available"). diff --git a/pkg/cwhub/state_test.go b/pkg/cwhub/state_test.go index 3ed3de16fcc..20741809ae2 100644 --- a/pkg/cwhub/state_test.go +++ b/pkg/cwhub/state_test.go @@ -40,6 +40,7 @@ func TestItemStateText(t *testing.T) { ItemState{ Installed: true, UpToDate: false, + local: true, Tainted: false, Downloaded: false, }, diff --git a/pkg/cwhub/sync.go b/pkg/cwhub/sync.go index ee8e49f2bf0..53fd9aa1d24 100644 --- a/pkg/cwhub/sync.go +++ b/pkg/cwhub/sync.go @@ -50,9 +50,8 @@ func resolveSymlink(path string) (string, error) { } // isPathInside checks if a path is inside the given directory -// it can return false negatives if the filesystem is case insensitive func isPathInside(path, dir string) (bool, error) { - absFilePath, err := filepath.Abs(path) + absFile, err := filepath.Abs(path) if err != nil { return false, err } @@ -62,103 +61,145 @@ func isPathInside(path, dir string) (bool, error) { return false, err } - return strings.HasPrefix(absFilePath, absDir), nil -} + rel, err := filepath.Rel(absDir, absFile) + if err != nil { + return false, err + } -// information used to create a new Item, from a file path. -type itemFileInfo struct { - fname string - stage string - ftype string - fauthor string - inhub bool + return !strings.HasPrefix(rel, ".."), nil } -func (h *Hub) getItemFileInfo(path string, logger *logrus.Logger) (*itemFileInfo, error) { - var ret *itemFileInfo +// itemSpec contains some information needed to complete the items +// after they have been parsed from the index. itemSpecs are created by +// scanning the hub (/etc/crowdsec/hub/*) and install (/etc/crowdsec/*) directories. +// Only directories for the known types are scanned. +type itemSpec struct { + path string // full path to the file (or link) + fname string // name of the item: + // for local item, taken from the file content or defaults to the filename (including extension) + // for non-local items, always {author}/{name} + stage string // stage for parsers and overflows + ftype string // type, plural (collections, contexts etc.) + fauthor string // author - empty for local items + inhub bool // true if the spec comes from the hub dir + target string // the target of path if it's a link, otherwise == path + local bool // is this a spec for a local item? +} - hubDir := h.local.HubDir - installDir := h.local.InstallDir +func newHubItemSpec(path string, subs []string, logger *logrus.Logger) (*itemSpec, error) { + // .../hub/parsers/s00-raw/crowdsecurity/skip-pretag.yaml + // .../hub/scenarios/crowdsecurity/ssh_bf.yaml + // .../hub/profiles/crowdsecurity/linux.yaml + if len(subs) < 3 { + return nil, fmt.Errorf("path is too short: %s (%d)", path, len(subs)) + } - subsHub := relativePathComponents(path, hubDir) - subsInstall := relativePathComponents(path, installDir) + ftype := subs[0] + if !slices.Contains(ItemTypes, ftype) { + // this doesn't really happen anymore, because we only scan the {hubtype} directories + return nil, fmt.Errorf("unknown configuration type '%s'", ftype) + } - switch { - case len(subsHub) > 0: - logger.Tracef("in hub dir") + stage := "" + fauthor := subs[1] + fname := subs[2] - // .../hub/parsers/s00-raw/crowdsecurity/skip-pretag.yaml - // .../hub/scenarios/crowdsecurity/ssh_bf.yaml - // .../hub/profiles/crowdsecurity/linux.yaml - if len(subsHub) < 3 { - return nil, fmt.Errorf("path is too short: %s (%d)", path, len(subsHub)) + if ftype == PARSERS || ftype == POSTOVERFLOWS { + if len(subs) < 4 { + return nil, fmt.Errorf("path is too short: %s (%d)", path, len(subs)) } - ftype := subsHub[0] - if !slices.Contains(ItemTypes, ftype) { - // this doesn't really happen anymore, because we only scan the {hubtype} directories - return nil, fmt.Errorf("unknown configuration type '%s'", ftype) - } + stage = subs[1] + fauthor = subs[2] + fname = subs[3] + } - stage := "" - fauthor := subsHub[1] - fname := subsHub[2] + spec := itemSpec{ + path: path, + inhub: true, + ftype: ftype, + stage: stage, + fauthor: fauthor, + fname: fname, + } - if ftype == PARSERS || ftype == POSTOVERFLOWS { - if len(subsHub) < 4 { - return nil, fmt.Errorf("path is too short: %s (%d)", path, len(subsHub)) - } + return &spec, nil +} - stage = subsHub[1] - fauthor = subsHub[2] - fname = subsHub[3] - } +func newInstallItemSpec(path string, subs []string, logger *logrus.Logger) (*itemSpec, error) { + logger.Tracef("%s in install dir", path) - ret = &itemFileInfo{ - inhub: true, - ftype: ftype, - stage: stage, - fauthor: fauthor, - fname: fname, - } + // .../config/parser/stage/file.yaml + // .../config/postoverflow/stage/file.yaml + // .../config/scenarios/scenar.yaml + // .../config/collections/linux.yaml //file is empty - case len(subsInstall) > 0: - logger.Tracef("in install dir") + if len(subs) < 2 { + return nil, fmt.Errorf("path is too short: %s (%d)", path, len(subs)) + } - // .../config/parser/stage/file.yaml - // .../config/postoverflow/stage/file.yaml - // .../config/scenarios/scenar.yaml - // .../config/collections/linux.yaml //file is empty + // this can be in any number of subdirs, we join them to compose the item name - if len(subsInstall) < 2 { - return nil, fmt.Errorf("path is too short: %s (%d)", path, len(subsInstall)) - } + ftype := subs[0] + stage := "" + fname := strings.Join(subs[1:], "/") - // this can be in any number of subdirs, we join them to compose the item name + if ftype == PARSERS || ftype == POSTOVERFLOWS { + stage = subs[1] + fname = strings.Join(subs[2:], "/") + } - ftype := subsInstall[0] - stage := "" - fname := strings.Join(subsInstall[1:], "/") + spec := itemSpec{ + path: path, + inhub: false, + ftype: ftype, + stage: stage, + fauthor: "", + fname: fname, + } - if ftype == PARSERS || ftype == POSTOVERFLOWS { - stage = subsInstall[1] - fname = strings.Join(subsInstall[2:], "/") - } + return &spec, nil +} + +func newItemSpec(path, hubDir, installDir string, logger *logrus.Logger) (*itemSpec, error) { + var ( + spec *itemSpec + err error + ) - ret = &itemFileInfo{ - inhub: false, - ftype: ftype, - stage: stage, - fauthor: "", - fname: fname, + if subs := relativePathComponents(path, hubDir); len(subs) > 0 { + spec, err = newHubItemSpec(path, subs, logger) + if err != nil { + return nil, err + } + } else if subs := relativePathComponents(path, installDir); len(subs) > 0 { + spec, err = newInstallItemSpec(path, subs, logger) + if err != nil { + return nil, err } - default: + } + + if spec == nil { return nil, fmt.Errorf("file '%s' is not from hub '%s' nor from the configuration directory '%s'", path, hubDir, installDir) } - logger.Tracef("CORRECTED [%s] by [%s] in stage [%s] of type [%s]", ret.fname, ret.fauthor, ret.stage, ret.ftype) + // follow the link to see if it falls in the hub directory + // if it's not a link, target == path + spec.target, err = resolveSymlink(spec.path) + if err != nil { + // target does not exist, the user might have removed the file + // or switched to a hub branch without it; or symlink loop + return nil, err + } - return ret, nil + targetInHub, err := isPathInside(spec.target, hubDir) + if err != nil { + return nil, ErrSkipPath + } + + spec.local = !targetInHub + + return spec, nil } // sortedVersions returns the input data, sorted in reverse order (new, old) by semver. @@ -185,7 +226,7 @@ func sortedVersions(raw []string) ([]string, error) { return ret, nil } -func newLocalItem(h *Hub, path string, info *itemFileInfo) (*Item, error) { +func newLocalItem(h *Hub, path string, spec *itemSpec) (*Item, error) { type localItemName struct { Name string `yaml:"name"` } @@ -194,12 +235,13 @@ func newLocalItem(h *Hub, path string, info *itemFileInfo) (*Item, error) { item := &Item{ hub: h, - Name: info.fname, - Stage: info.stage, - Type: info.ftype, + Name: spec.fname, + Stage: spec.stage, + Type: spec.ftype, FileName: fileName, State: ItemState{ LocalPath: path, + local: true, Installed: true, UpToDate: true, }, @@ -225,22 +267,25 @@ func newLocalItem(h *Hub, path string, info *itemFileInfo) (*Item, error) { return item, nil } -func (h *Hub) itemVisit(path string, f os.DirEntry, err error) error { +// A sentinel to skip regular files because "nil, nil" is ambiguous. Returning SkipDir with files would skip the rest of the directory. +var ErrSkipPath = errors.New("sentinel") + +func (h *Hub) itemVisit(path string, f os.DirEntry, err error) (*itemSpec, error) { if err != nil { h.logger.Debugf("while syncing hub dir: %s", err) // there is a path error, we ignore the file - return nil + return nil, ErrSkipPath + } + + // permission errors, files removed while reading, etc. + if f == nil { + return nil, ErrSkipPath } // only happens if the current working directory was removed (!) path, err = filepath.Abs(path) if err != nil { - return err - } - - // permission errors, files removed while reading, etc. - if f == nil { - return nil + return nil, err } if f.IsDir() { @@ -249,101 +294,126 @@ func (h *Hub) itemVisit(path string, f os.DirEntry, err error) error { // - double dot prefix is used by k8s to mount config maps if strings.HasPrefix(f.Name(), ".") { h.logger.Tracef("skipping hidden directory %s", path) - return filepath.SkipDir + return nil, filepath.SkipDir } // keep traversing - return nil + return nil, nil } // we only care about YAML files if !isYAMLFileName(f.Name()) { - return nil + return nil, ErrSkipPath } - info, err := h.getItemFileInfo(path, h.logger) + spec, err := newItemSpec(path, h.local.HubDir, h.local.InstallDir, h.logger) if err != nil { h.logger.Warningf("Ignoring file %s: %s", path, err) - return nil + return nil, ErrSkipPath } - // follow the link to see if it falls in the hub directory - // if it's not a link, target == path - target, err := resolveSymlink(path) - if err != nil { - // target does not exist, the user might have removed the file - // or switched to a hub branch without it; or symlink loop - h.logger.Warningf("Ignoring file %s: %s", path, err) - return nil - } - - targetInHub, err := isPathInside(target, h.local.HubDir) - if err != nil { - h.logger.Warningf("Ignoring file %s: %s", path, err) - return nil - } - - // local (custom) item if the file or link target is not inside the hub dir - if !targetInHub { - h.logger.Tracef("%s is a local file, skip", path) - - item, err := newLocalItem(h, path, info) - if err != nil { - return err - } + return spec, nil +} - h.addItem(item) +func updateNonLocalItem(h *Hub, path string, spec *itemSpec, symlinkTarget string) (*Item, error) { + // look for the matching item - return nil + tot := 0 + for range h.GetItemMap(spec.ftype) { + tot++ } - hubpath := target - - // try to find which configuration item it is - h.logger.Tracef("check [%s] of %s", info.fname, info.ftype) - - for _, item := range h.GetItemMap(info.ftype) { - if info.fname != item.FileName { + for _, item := range h.GetItemMap(spec.ftype) { + if spec.fname != item.FileName { continue } - if item.Stage != info.stage { + if item.Stage != spec.stage { continue } - // if we are walking hub dir, just mark present files as downloaded - if info.inhub { + // Downloaded item, in the hub dir. + if spec.inhub { // not the item we're looking for - if !item.validPath(info.fauthor, info.fname) { + if !item.validPath(spec.fauthor, spec.fname) { continue } src, err := item.DownloadPath() if err != nil { - return err + return nil, err } - if path == src { + if spec.path == src { h.logger.Tracef("marking %s as downloaded", item.Name) item.State.Downloaded = true } - } else if !hasPathSuffix(hubpath, item.RemotePath) { + } else if !hasPathSuffix(symlinkTarget, item.RemotePath) { // wrong file // ///.yaml continue } - err := item.setVersionState(path, info.inhub) + err := item.setVersionState(spec.path, spec.inhub) + if err != nil { + return nil, err + } + + return item, nil + } + + return nil, nil +} + +// addItemFromSpec adds an item to the hub based on the spec, or updates it if already present. +// +// When the item is: +// +// Local - an itemSpec instance is created while scanning the install directory +// and an Item instance will be added to the hub.items map. +// +// Not downloaded, not installed - an Item instance is already on hub.items (decoded from index) and left untouched. +// +// Downloaded, not installed - an Item instance is on hub.items (decoded from index) and an itemSpec instance is created +// to complete it (i.e. set version and state flags). +// +// Downloaded, installed - an Item instance is on hub.items and is complemented with two itemSpecs: one from the file +// on the hub directory, one from the link in the install directory. +func (h *Hub) addItemFromSpec(spec *itemSpec) error { + var ( + item *Item + err error + ) + + // Local item: links outside the hub directory. + // We add it, or overwrite the existing one if it happened to have the same name. + if spec.local { + item, err = newLocalItem(h, spec.path, spec) if err != nil { return err } - h.pathIndex[path] = item + // we now have the name declared in the file (for local), + // see if there's another installed item of the same name + theOtherItem := h.GetItem(spec.ftype, item.Name) + if theOtherItem != nil { + if theOtherItem.State.Installed { + h.logger.Warnf("multiple %s named %s: ignoring %s", spec.ftype, item.Name, theOtherItem.State.LocalPath) + } + } + } else { + item, err = updateNonLocalItem(h, spec.path, spec, spec.target) + if err != nil { + return err + } + } + if item == nil { + h.logger.Infof("Ignoring file %s of type %s", spec.path, spec.ftype) return nil } - h.logger.Infof("Ignoring file %s of type %s", path, info.ftype) + h.addItem(item) return nil } @@ -411,6 +481,8 @@ func (i *Item) checkSubItemVersions() []string { // syncDir scans a directory for items, and updates the Hub state accordingly. func (h *Hub) syncDir(dir string) error { + specs := []*itemSpec{} + // For each, scan PARSERS, POSTOVERFLOWS... and COLLECTIONS last for _, scan := range ItemTypes { // cpath: top-level item directory, either downloaded or installed items. @@ -423,11 +495,43 @@ func (h *Hub) syncDir(dir string) error { // explicit check for non existing directory, avoid spamming log.Debug if _, err = os.Stat(cpath); os.IsNotExist(err) { - h.logger.Tracef("directory %s doesn't exist, skipping", cpath) continue } - if err = filepath.WalkDir(cpath, h.itemVisit); err != nil { + // wrap itemVisit to collect spec results + var specCollector = func(path string, f os.DirEntry, err error) error { + spec, err := h.itemVisit(path, f, err) + if err == nil && spec != nil { + specs = append(specs, spec) + } + if errors.Is(err, ErrSkipPath) { + return nil + } + + return err + } + + if err = filepath.WalkDir(cpath, specCollector); err != nil { + return err + } + } + + // add non-local items first, so they can find the place in the index + // before it's overridden by local items in case of name collision + for _, spec := range specs { + if spec.local { + continue + } + if err := h.addItemFromSpec(spec); err != nil { + return err + } + } + + for _, spec := range specs { + if !spec.local { + continue + } + if err := h.addItemFromSpec(spec); err != nil { return err } } diff --git a/test/bats/20_hub_items.bats b/test/bats/20_hub_items.bats index 8ebe505c6e1..34034816004 100644 --- a/test/bats/20_hub_items.bats +++ b/test/bats/20_hub_items.bats @@ -99,13 +99,6 @@ teardown() { rune -0 cscli parsers remove crowdsecurity/syslog-logs --purge assert_output "Nothing to do." - - rune -0 cscli parsers remove --all --error --purge --force - assert_output "Nothing to do." - refute_stderr - rune -0 cscli collections remove --all --error --purge --force - assert_output "Nothing to do." - refute_stderr } @test "a local item is not tainted" { @@ -199,6 +192,16 @@ teardown() { assert_json '[]' } +@test "replacing a symlink with a regular file makes a local item" { + rune -0 cscli parsers install crowdsecurity/caddy-logs + rune -0 rm "$CONFIG_DIR/parsers/s01-parse/caddy-logs.yaml" + rune -0 cp "$HUB_DIR/parsers/s01-parse/crowdsecurity/caddy-logs.yaml" "$CONFIG_DIR/parsers/s01-parse/caddy-logs.yaml" + rune -0 cscli hub list + rune -0 cscli parsers inspect crowdsecurity/caddy-logs -o json + rune -0 jq -e '[.tainted,.local,.local_version==false,true,"?"]' <(output) + refute_stderr +} + @test "tainted hub file, not enabled, install --force should repair" { rune -0 cscli scenarios install crowdsecurity/ssh-bf rune -0 cscli scenarios inspect crowdsecurity/ssh-bf -o json diff --git a/test/bats/cscli-hubtype-install.bats b/test/bats/cscli-hubtype-install.bats index 2304e5a72cc..5283929a2a9 100644 --- a/test/bats/cscli-hubtype-install.bats +++ b/test/bats/cscli-hubtype-install.bats @@ -267,3 +267,35 @@ teardown() { assert_line 'enabling contexts:crowdsecurity/bf_base' assert_line 'enabling collections:crowdsecurity/sshd' } + +@test "a local item can override an official one, if it's not installed" { + mkdir -p "$CONFIG_DIR/parsers/s02-enrich" + rune -0 cscli parsers install crowdsecurity/whitelists --download-only + echo "name: crowdsecurity/whitelists" > "$CONFIG_DIR/parsers/s02-enrich/hi.yaml" + # no warning + rune -0 cscli parsers list + refute_stderr + rune -0 cscli parsers list -o json + rune -0 jq -e '.installed,.local==true,true' <(output) +} + +@test "conflicting item names: local and non local - the local one has priority" { + mkdir -p "$CONFIG_DIR/parsers/s02-enrich" + rune -0 cscli parsers install crowdsecurity/whitelists + echo "name: crowdsecurity/whitelists" > "$CONFIG_DIR/parsers/s02-enrich/hi.yaml" + rune -0 cscli parsers list -o json + rune -0 jq -e '.installed,.local==true,true' <(output) + rune -0 cscli parsers list + assert_stderr --partial "multiple parsers named crowdsecurity/sshd-logs: ignoring $CONFIG_DIR/parsers/s01-parse/one.yaml" +} + +@test "conflicting item names: both local, the last one wins" { + mkdir -p "$CONFIG_DIR/parsers/s02-enrich" + echo "name: crowdsecurity/whitelists" > "$CONFIG_DIR/parsers/s02-enrich/one.yaml" + echo "name: crowdsecurity/whitelists" > "$CONFIG_DIR/parsers/s02-enrich/two.yaml" + rune -0 cscli parsers inspect crowdsecurity/whitelists -o json + rune -0 jq -r '.local_path' <(output) + assert_output --partial "/parsers/s02-enrich/one.yaml" + rune -0 cscli parsers list + assert_stderr --partial "multiple parsers named crowdsecurity/whitelists: ignoring $CONFIG_DIR/parsers/s02-enrich/two.yaml" +} diff --git a/test/bats/cscli-hubtype-list.bats b/test/bats/cscli-hubtype-list.bats index b3db4743eb9..14113650c74 100644 --- a/test/bats/cscli-hubtype-list.bats +++ b/test/bats/cscli-hubtype-list.bats @@ -80,7 +80,7 @@ teardown() { # the list should be the same in all formats, and sorted (not case sensitive) list_raw=$(cscli parsers list -o raw -a | tail -n +2 | cut -d, -f1) - list_human=$(cscli parsers list -o human -a | tail -n +7 | head -n -1 | cut -d' ' -f2) + list_human=$(cscli parsers list -o human -a | tail -n +6 | head -n -1 | cut -d' ' -f2) list_json=$(cscli parsers list -o json -a | jq -r '.parsers[].name') # use python to sort because it handles "_" like go