operator-framework
diff --git a/.gitignore b/.gitignore
Lines changed: 10 additions & 2 deletions
diff --git a/Makefile b/Makefile
Lines changed: 14 additions & 2 deletions
diff --git a/hack/tools/e2e-profiling/README.md b/hack/tools/e2e-profiling/README.md
Lines changed: 234 additions & 0 deletions
@@ -38,8 +38,13 @@ vendor/
 \#*\#
 .\#*
 
-# AI temp files files
-.claude/
+# AI temp/local files
+.claude/settings.local.json
+.claude/history/
+.claude/cache/
+.claude/logs/
+.claude/.session*
+.claude/*.log
 
 # documentation website asset folder
 site
@@ -50,3 +55,6 @@ site
 
 # Temporary files and directories
 /test/regression/convert/testdata/tmp/*
+
+# E2E profiling artifacts
+e2e-profiles/
@@ -106,11 +106,11 @@ CATALOGS_MANIFEST := $(MANIFEST_HOME)/default-catalogs.yaml
 
 .PHONY: help
 help: #HELP Display essential help.
-	@awk 'BEGIN {FS = ":[^#]*#HELP"; printf "\nUsage:\n  make \033[36m<target>\033[0m\n\n"} /^[a-zA-Z_0-9-]+:.*#HELP / { printf "  \033[36m%-21s\033[0m %s\n", $$1, $$2 } ' $(MAKEFILE_LIST)
+	@awk 'BEGIN {FS = ":[^#]*#HELP"; printf "\nUsage:\n  make \033[36m<target>\033[0m\n\n"} /^[a-zA-Z_0-9\/%-]+:.*#HELP / { printf "  \033[36m%-21s\033[0m %s\n", $$1, $$2 } ' $(MAKEFILE_LIST)
 
 .PHONY: help-extended
 help-extended: #HELP Display extended help.
-	@awk 'BEGIN {FS = ":.*#(EX)?HELP"; printf "\nUsage:\n  make \033[36m<target>\033[0m\n"} /^[a-zA-Z_0-9-]+:.*#(EX)?HELP / { printf "  \033[36m%-25s\033[0m %s\n", $$1, $$2 } /^#SECTION / { printf "\n\033[1m%s\033[0m\n", substr($$0, 10) } ' $(MAKEFILE_LIST)
+	@awk 'BEGIN {FS = ":.*#(EX)?HELP"; printf "\nUsage:\n  make \033[36m<target>\033[0m\n"} /^[a-zA-Z_0-9\/%-]+:.*#(EX)?HELP / { printf "  \033[36m%-25s\033[0m %s\n", $$1, $$2 } /^#SECTION / { printf "\n\033[1m%s\033[0m\n", substr($$0, 10) } ' $(MAKEFILE_LIST)
 
 #SECTION Development
 
@@ -335,6 +335,18 @@ test-upgrade-experimental-e2e: $(TEST_UPGRADE_E2E_TASKS) #HELP Run upgrade e2e t
 e2e-coverage:
 	COVERAGE_NAME=$(COVERAGE_NAME) ./hack/test/e2e-coverage.sh
 
+.PHONY: start-profiling
+start-profiling: #EXHELP Start profiling in background with auto-generated name (timestamp). Use start-profiling/<name> for custom name.
+	./hack/tools/e2e-profiling/start-profiling.sh
+
+# No .PHONY for this rule: .PHONY takes literal target names, not % patterns, so it cannot cover start-profiling/<name> goals.
+start-profiling/%: #EXHELP Start profiling in background with specified name. Usage: make start-profiling/<name>
+	./hack/tools/e2e-profiling/start-profiling.sh "$*"
+
+.PHONY: stop-profiling
+stop-profiling: #EXHELP Stop profiling and generate analysis report
+	./hack/tools/e2e-profiling/stop-profiling.sh
+
 #SECTION KIND Cluster Operations
 
 .PHONY: kind-load
 
@@ -0,0 +1,234 @@
+# E2E Profiling Tools
+
+Automated profiling and analysis for operator-controller e2e tests. Collect heap and CPU profiles during test runs, analyze memory usage patterns, and compare optimizations.
+
+## Quick Start
+
+### Simple Start/Stop Workflow
+
+```bash
+# Start profiling — run ONE of the following: auto-generated (timestamp) name, or a custom name
+make start-profiling
+make start-profiling/baseline
+
+# Run your tests
+make test-e2e
+
+# Stop and analyze
+make stop-profiling
+```
+
+The profiler:
+- Waits for cluster components to be ready
+- Collects profiles every 10 seconds (configurable)
+- Handles cluster teardown automatically
+- Generates analysis reports
+
+### Automated Test Runner
+
+```bash
+# Run baseline
+./hack/tools/e2e-profiling/e2e-profile.sh run baseline
+
+# Make changes, then run optimized version
+./hack/tools/e2e-profiling/e2e-profile.sh run optimized
+
+# Compare results
+./hack/tools/e2e-profiling/e2e-profile.sh compare baseline optimized
+```
+
+View reports:
+```bash
+cat e2e-profiles/baseline/analysis.md
+cat e2e-profiles/comparisons/baseline-vs-optimized.md
+```
+
+## Commands
+
+### `run <name> [test-target]`
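+Run an e2e test target with profiling. `test-target` is optional; the default test target is `test-experimental-e2e` (see `E2E_PROFILE_TEST_TARGET` under Configuration).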
+
+```bash
+./hack/tools/e2e-profiling/e2e-profile.sh run my-test [test-e2e|test-experimental-e2e|...]
+```
+
+Output:
+- `e2e-profiles/<name>/operator-controller/*.pprof` - Profile snapshots
+- `e2e-profiles/<name>/catalogd/*.pprof` - Catalogd profiles
+- `e2e-profiles/<name>/analysis.md` - Analysis report
+
+### `analyze <name>`
+Analyze collected profiles.
+
+```bash
+./hack/tools/e2e-profiling/e2e-profile.sh analyze my-test
+```
+
+### `compare <test1> <test2>`
+Compare two test runs.
+
+```bash
+./hack/tools/e2e-profiling/e2e-profile.sh compare baseline optimized
+```
+
+Output: `e2e-profiles/comparisons/<test1>-vs-<test2>.md`
+
+### `collect`
+Manually collect a single heap profile.
+
+```bash
+./hack/tools/e2e-profiling/e2e-profile.sh collect
+```
+
+## Configuration
+
+```bash
+# Namespace (default: olmv1-system)
+export E2E_PROFILE_NAMESPACE=olmv1-system
+
+# Collection interval in seconds (default: 10)
+export E2E_PROFILE_INTERVAL=10
+
+# CPU profiling duration in seconds (default: 10)
+export E2E_PROFILE_CPU_DURATION=10
+
+# Profile mode: both, heap, cpu (default: both)
+export E2E_PROFILE_MODE=both
+
+# Output directory (default: ./e2e-profiles)
+export E2E_PROFILE_DIR=./e2e-profiles
+
+# Test target (default: test-experimental-e2e)
+export E2E_PROFILE_TEST_TARGET=test-experimental-e2e
+```
+
+**Note:** If `E2E_PROFILE_CPU_DURATION >= E2E_PROFILE_INTERVAL`, CPU profiling runs continuously.
+
+## Output Structure
+
+```
+e2e-profiles/
+├── baseline/
+│   ├── operator-controller/
+│   │   ├── heap*.pprof      # Heap snapshots
+│   │   └── cpu*.pprof       # CPU profiles
+│   ├── catalogd/
+│   │   ├── heap*.pprof
+│   │   └── cpu*.pprof
+│   ├── test.log
+│   ├── collection.log
+│   └── analysis.md
+└── comparisons/
+    └── baseline-vs-optimized.md
+```
+
+## Examples
+
+### Profile Optimization
+
+```bash
+# Baseline
+make start-profiling/baseline
+make test-e2e
+make stop-profiling
+
+# Implement changes, then profile optimized version
+make start-profiling/optimized
+make test-e2e
+make stop-profiling
+
+# Compare
+./hack/tools/e2e-profiling/e2e-profile.sh compare baseline optimized
+```
+
+### Heap-Only Profiling
+
+```bash
+# Reduced overhead for memory-focused analysis
+E2E_PROFILE_MODE=heap make start-profiling/memory-test
+make test-e2e
+make stop-profiling
+```
+
+### Different Test Suites
+
+```bash
+./hack/tools/e2e-profiling/e2e-profile.sh run standard test-e2e
+./hack/tools/e2e-profiling/e2e-profile.sh run upgrade test-upgrade-e2e
+./hack/tools/e2e-profiling/e2e-profile.sh compare standard upgrade
+```
+
+## Interactive Analysis
+
+```bash
+cd e2e-profiles/my-test/operator-controller
+
+# Top allocators (heap0.pprof / heap23.pprof are example names; substitute snapshot files from your run)
+go tool pprof -top heap23.pprof
+
+# Interactive mode
+go tool pprof heap23.pprof
+# Commands: top, list, web, pdf
+
+# Compare snapshots
+go tool pprof -base=heap0.pprof -top heap23.pprof
+
+# Filter specific patterns
+go tool pprof -text heap23.pprof | grep -i openapi
+```
+
+## Troubleshooting
+
+**No profiles collected:**
+- Check deployment is ready: `kubectl get deployment -n olmv1-system`
+- Verify pprof endpoint: `curl http://localhost:6060/debug/pprof/` (needs an active port-forward to port 6060; see **Port-forward issues** below)
+- Review `collection.log` for connection errors
+
+**Test exits early:**
+- Run test manually first to verify it works
+- Check `test.log` for errors
+
+**Analysis fails:**
+- Verify files exist: `find e2e-profiles -name "*.pprof"`
+- Check `go tool pprof --help` works
+
+**Port-forward issues:**
+- Test manually: `kubectl port-forward -n olmv1-system deployment/operator-controller-controller-manager 6060:6060`
+- Kill stuck processes: `pkill -f "kubectl port-forward.*6060"`
+
+## Requirements
+
+- kubectl (cluster access)
+- go (for `go tool pprof`)
+- make
+- curl
+- bash 4.0+
+
+## Real-World Results
+
+OpenAPI caching optimization:
+- **Memory:** 49.6 MB → 41.2 MB (-16.9%)
+- **OpenAPI allocations:** 13 MB → 3.5 MB (-73%)
+- **Key insight:** Repeated schema fetching was #1 memory consumer
+
+## Architecture
+
+**Scripts:**
+- `profile-collector-daemon.sh` - Background collection process
+- `start-profiling.sh` - Start daemon mode profiling
+- `stop-profiling.sh` - Stop daemon and cleanup
+- `run-profiled-test.sh` - Orchestrate test + profiling
+- `analyze-profiles.sh` - Generate analysis reports
+- `compare-profiles.sh` - Create comparison reports
+- `common.sh` - Shared utilities and logging
+
+**Key Features:**
+- Deployment-based port-forwarding (survives pod restarts)
+- Automatic retry with 30s timeout
+- Graceful cleanup on exit/interrupt
+- Multi-component support (operator-controller + catalogd)
+
+## See Also
+
+- [Go pprof documentation](https://pkg.go.dev/net/http/pprof)
+- [Profiling Go Programs](https://go.dev/blog/pprof)