summaryrefslogtreecommitdiff
path: root/internal
diff options
context:
space:
mode:
author Paul Buetow <paul@buetow.org> 2026-06-09 22:18:42 +0300
committer Paul Buetow <paul@buetow.org> 2026-06-09 22:18:42 +0300
commit 7031211501884555139351bb676fc0592c9df14c (patch)
tree dc5bf201bacb706c355f477413ad375a6d8fbe5b /internal
parent bab929022f4f4bba77439c63d130c833595758b6 (diff)
feat(parquet): surface epoll_ctl op/target-fd/events metadata
epoll_ctl's BPF handler already decodes the operation (args[1]), target descriptor (args[2]), and requested event mask (args[3]->events) into an EpollCtlEvent, but the single resolved-epfd `fd` column was the only epoll detail reaching the output schema. Consumers could not see which descriptor was registered or which operation was performed.

Surface the metadata as three additive, backward-compatible columns, mirroring the existing dedicated optional-column convention used by requested_sleep_ns and address_space_bytes:

- epoll_op (String): ADD/MOD/DEL, or the raw decimal for unknown ops; empty for non-epoll_ctl rows.
- epoll_target_fd (Int32): registered descriptor (args[2]); 0 otherwise.
- epoll_events (UInt32): requested event mask; 0 otherwise.

Data flows EpollCtlEvent -> event.Pair (new EpollCtl/HasEpoll fields, populated in handleEpollCtlExit) -> streamrow.Row -> parquet.Record. The op-to-string mapping lives on event.EpollCtl.OpName.

Docs (docs/parquet-querying.md) and the Magefile parquetValidate column list are updated in lockstep (also adding the previously-undocumented address_space_bytes/requested_sleep_ns columns).

The polling parquet integration test now asserts that epoll_ctl rows carry a decoded op and a valid target fd, and that other syscalls leave epoll_op empty.

Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
Diffstat (limited to 'internal')
-rw-r--r-- internal/event/pair.go 38
-rw-r--r-- internal/eventloop_exit.go 9
-rw-r--r-- internal/parquet/schema.go 10
-rw-r--r-- internal/streamrow/row.go 16
4 files changed, 73 insertions, 0 deletions
diff --git a/internal/event/pair.go b/internal/event/pair.go
index 523f961..afc9bed 100644
--- a/internal/event/pair.go
+++ b/internal/event/pair.go
@@ -31,6 +31,44 @@ type Pair struct {
AddressSpaceBytes uint64
// RequestedSleepNs tracks requested sleep duration for nanosleep-style syscalls.
RequestedSleepNs int64
+ // Epoll carries epoll_ctl control metadata (op, target fd, requested event
+ // mask). It is only populated for epoll_ctl pairs; HasEpoll reports whether
+ // it is set. The Pair-level File still resolves to the epoll instance (epfd);
+ // Epoll.TargetFD is the descriptor being registered/modified/removed.
+ Epoll EpollCtl
+ HasEpoll bool
+}
+
// EpollCtl is the decoded argument set of a single epoll_ctl call as
// surfaced from the BPF EpollCtlEvent.
type EpollCtl struct {
	// Op is the requested operation (EPOLL_CTL_ADD/DEL/MOD).
	Op int32
	// TargetFD is the descriptor the operation applies to (args[2]).
	TargetFD int32
	// Events is the requested epoll event mask (args[3]->events).
	Events uint32
}

// Linux epoll_ctl op values from <sys/epoll.h>: ADD=1, DEL=2, MOD=3.
const (
	epollCtlAdd = iota + 1
	epollCtlDel
	epollCtlMod
)

// OpName returns a human-readable token for the epoll_ctl operation:
// "ADD", "DEL" or "MOD". Any other value is rendered in decimal so the raw
// op is never lost.
func (c EpollCtl) OpName() string {
	var name string
	switch c.Op {
	case epollCtlAdd:
		name = "ADD"
	case epollCtlDel:
		name = "DEL"
	case epollCtlMod:
		name = "MOD"
	default:
		// Unknown op: keep the numeric value instead of dropping it.
		name = strconv.Itoa(int(c.Op))
	}
	return name
}
func NewPair(enterEv Event) *Pair {
diff --git a/internal/eventloop_exit.go b/internal/eventloop_exit.go
index ae085c6..105d9ac 100644
--- a/internal/eventloop_exit.go
+++ b/internal/eventloop_exit.go
@@ -385,7 +385,16 @@ func (e *eventLoop) handleEventfdExit(ep *event.Pair, eventfdEv *types.EventfdEv
}
func (e *eventLoop) handleEpollCtlExit(ep *event.Pair, epollCtlEv *types.EpollCtlEvent) bool {
+ // File resolves to the epoll instance (epfd); the decoded op/target-fd/events
+ // are surfaced separately via ep.Epoll so consumers can see which descriptor
+ // was registered and the operation performed.
ep.File = e.fdState().resolve(epollCtlEv.Epfd, epollCtlEv.Pid)
+ ep.Epoll = event.EpollCtl{
+ Op: epollCtlEv.Op,
+ TargetFD: epollCtlEv.Fd,
+ Events: epollCtlEv.Events,
+ }
+ ep.HasEpoll = true
return e.finishPairForTid(ep, epollCtlEv.GetTid())
}
diff --git a/internal/parquet/schema.go b/internal/parquet/schema.go
index f39361c..b7ed381 100644
--- a/internal/parquet/schema.go
+++ b/internal/parquet/schema.go
@@ -30,6 +30,13 @@ type Record struct {
File string `parquet:"file"`
IsError bool `parquet:"is_error"`
FilterEpoch uint64 `parquet:"filter_epoch"`
+ // EpollOp/EpollTargetFD/EpollEvents surface epoll_ctl control metadata: the
+ // operation (ADD/MOD/DEL), the target descriptor registered (args[2]), and
+ // the requested event mask (args[3]->events). EpollOp is empty and the
+ // numeric fields are zero for all non-epoll_ctl rows.
+ EpollOp string `parquet:"epoll_op"`
+ EpollTargetFD int32 `parquet:"epoll_target_fd"`
+ EpollEvents uint32 `parquet:"epoll_events"`
}
// FileMetadata captures constant metadata written once into the parquet file.
@@ -74,6 +81,9 @@ func RecordFromStream(row streamrow.Row, filterEpoch uint64) Record {
File: row.FileName,
IsError: row.IsError,
FilterEpoch: filterEpoch,
+ EpollOp: row.EpollOp,
+ EpollTargetFD: row.EpollTargetFD,
+ EpollEvents: row.EpollEvents,
}
}
diff --git a/internal/streamrow/row.go b/internal/streamrow/row.go
index a6ccdf7..c846346 100644
--- a/internal/streamrow/row.go
+++ b/internal/streamrow/row.go
@@ -30,6 +30,13 @@ type Row struct {
RetVal int64
IsError bool
FD int32
+ // EpollOp is the epoll_ctl operation as a readable token (ADD/MOD/DEL),
+ // empty for non-epoll_ctl rows. EpollTargetFD and EpollEvents hold the
+ // registered descriptor (args[2]) and requested event mask (args[3]->events)
+ // for epoll_ctl rows; both are zero when EpollOp is empty.
+ EpollOp string
+ EpollTargetFD int32
+ EpollEvents uint32
}
func (r Row) SyscallValue() string {
@@ -122,6 +129,15 @@ func New(seq uint64, pair *event.Pair) Row {
row.FD = fd
}
+ // Surface epoll_ctl control metadata when present. The Pair's FD/File still
+ // reflect the epoll instance (epfd); these fields expose the target fd and
+ // operation so consumers can see which descriptor was registered.
+ if pair.HasEpoll {
+ row.EpollOp = pair.Epoll.OpName()
+ row.EpollTargetFD = pair.Epoll.TargetFD
+ row.EpollEvents = pair.Epoll.Events
+ }
+
if retEv, ok := pair.ExitEv.(*types.RetEvent); ok {
row.RetVal = retEv.Ret
row.IsError = retEv.Ret < 0