Commit 6230429

UPSTREAM: <carry>: migrate olmv1 QE stress cases
1 parent c310c42 commit 6230429

26 files changed, +834 -8 lines changed

openshift/tests-extension/.openshift-tests-extension/openshift_payload_olmv1.json

Lines changed: 16 additions & 0 deletions
@@ -565,6 +565,22 @@
       "exclude": "topology==\"External\""
     }
   },
+  {
+    "name": "[sig-olmv1][Jira:OLM] OLM v1 for stress PolarionID:81509-[OTP][Skipped:Disconnected][OlmStress]olmv1 create mass operator to see if they all are installed successfully [Slow][Timeout:330m]",
+    "labels": {
+      "Extended": {},
+      "NonHyperShiftHOST": {},
+      "StressTest": {}
+    },
+    "resources": {
+      "isolation": {}
+    },
+    "source": "openshift:payload:olmv1",
+    "lifecycle": "blocking",
+    "environmentSelector": {
+      "exclude": "topology==\"External\""
+    }
+  },
   {
     "name": "[sig-olmv1][OCPFeatureGate:NewOLM][Skipped:Disconnected] OLMv1 Catalogs should be installed",
     "labels": {},
openshift/tests-extension/test/qe/README.md

Lines changed: 14 additions & 1 deletion
@@ -244,7 +244,20 @@ All migrated test case code needs the following changes to run in the new test f
 
 **Environment Validation for Disconnected-Supporting Migrated Test Cases:**
 
-If your test case supports disconnected environments, you MUST call `ValidateAccessEnvironment` at the beginning of the test:
+**When to use `ValidateAccessEnvironment`:**
+
+1. **Test cases that create ClusterCatalog or ClusterExtension**:
+   - If your test supports disconnected environments (both connected and disconnected, or disconnected-only)
+   - AND your test creates ClusterCatalog or ClusterExtension resources
+   - you **MUST** call `ValidateAccessEnvironment(oc)` at the beginning of the test
+   - This applies to both newly created and migrated test cases
+
+2. **Test cases that do NOT create ClusterCatalog or ClusterExtension**:
+   - Calling `ValidateAccessEnvironment(oc)` is optional
+   - Using it won't cause errors, but it's not required
+   - The validation is primarily for ensuring catalog images can be mirrored
+
+**Usage example:**
 
 ```go
 g.It("test case supporting disconnected", func() {
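
The diff view cuts the usage example off at its opening line. As a rough sketch only (not the README's actual continuation, and assuming `ValidateAccessEnvironment` is exported from the `olmv1util` package used elsewhere in this commit), the call typically sits first in the spec body:

```go
g.It("test case supporting disconnected", func() {
	// Hypothetical placement: validate catalog-image access up front so
	// unsupported environments bail out before any resources are created.
	olmv1util.ValidateAccessEnvironment(oc)
	// ... actual test steps ...
})
```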
openshift/tests-extension/test/qe/specs/olmv1_stress.go

Lines changed: 145 additions & 0 deletions

@@ -0,0 +1,145 @@
package specs

import (
	"fmt"
	"path/filepath"
	"time"

	g "github.com/onsi/ginkgo/v2"
	o "github.com/onsi/gomega"
	e2e "k8s.io/kubernetes/test/e2e/framework"

	exutil "github.com/openshift/operator-framework-operator-controller/openshift/tests-extension/test/qe/util"
	olmv1util "github.com/openshift/operator-framework-operator-controller/openshift/tests-extension/test/qe/util/olmv1util"
)

var _ = g.Describe("[sig-olmv1][Jira:OLM] OLM v1 for stress", func() {

	defer g.GinkgoRecover()
	var (
		oc = exutil.NewCLIWithoutNamespace("default")
	)

	g.BeforeEach(func() {
		exutil.SkipMicroshift(oc)
		exutil.SkipNoOLMv1Core(oc)
	})

	// author: [email protected]
	g.It("PolarionID:81509-[OTP][Skipped:Disconnected][OlmStress]olmv1 create mass operator to see if they all are installed successfully [Slow][Timeout:330m]", g.Label("StressTest"), g.Label("NonHyperShiftHOST"), func() {
		var (
			caseID                       = "81509"
			prefixCatalog                = "catalog-" + caseID
			prefixSa                     = "sa-" + caseID
			prefixCe                     = "ce-" + caseID
			prefixNs                     = "ns-" + caseID
			prefixPackage                = "stress-olmv1-c"
			prefixImage                  = "quay.io/olmqe/stress-index:vokv"
			nsOc                         = "openshift-operator-controller"
			nsCatalog                    = "openshift-catalogd"
			catalogLabel                 = "control-plane=catalogd-controller-manager"
			ocLabel                      = "control-plane=operator-controller-controller-manager"
			baseDir                      = exutil.FixturePath("testdata", "olm")
			clustercatalogTemplate       = filepath.Join(baseDir, "clustercatalog.yaml")
			clusterextensionTemplate     = filepath.Join(baseDir, "clusterextension.yaml")
			saClusterRoleBindingTemplate = filepath.Join(baseDir, "sa-admin.yaml")
		)

		if !olmv1util.IsPodReady(oc, nsCatalog, catalogLabel) {
			_, _ = olmv1util.Get(oc, "pod", "-n", nsCatalog, "-l", catalogLabel, "-o", "yaml")
			exutil.AssertWaitPollNoErr(fmt.Errorf("the pod with %s is not correct", catalogLabel), "the pod with app=catalog-operator is not correct")
		}
		if !olmv1util.IsPodReady(oc, nsOc, ocLabel) {
			_, _ = olmv1util.Get(oc, "pod", "-n", nsOc, "-l", ocLabel, "-o", "yaml")
			exutil.AssertWaitPollNoErr(fmt.Errorf("the pod with %s is not correct", ocLabel), "the pod with app=olm-operator is not correct")
		}

		startTime := time.Now().UTC()
		e2e.Logf("Start time: %s", startTime.Format(time.RFC3339))

		// for i := 0; i < 500; i++ {
		for i := 900; i < 969; i++ {
			// 330m is not enough for one case if we run 100 iterations
			e2e.Logf("=================it is round %v=================", i)
			ns := fmt.Sprintf("%s-%d", prefixNs, i)
			clustercatalog := olmv1util.ClusterCatalogDescription{
				Name:     fmt.Sprintf("%s-%d", prefixCatalog, i),
				Imageref: fmt.Sprintf("%s%d", prefixImage, i),
				Template: clustercatalogTemplate,
			}
			saCrb := olmv1util.SaCLusterRolebindingDescription{
				Name:      fmt.Sprintf("%s-%d", prefixSa, i),
				Namespace: ns,
				Template:  saClusterRoleBindingTemplate,
			}
			ce := olmv1util.ClusterExtensionDescription{
				Name:             fmt.Sprintf("%s-%d", prefixCe, i),
				PackageName:      fmt.Sprintf("%s%d", prefixPackage, i),
				Channel:          "alpha",
				Version:          ">=0.0.1",
				InstallNamespace: ns,
				SaName:           fmt.Sprintf("%s-%d", prefixSa, i),
				Template:         clusterextensionTemplate,
			}
			g.By(fmt.Sprintf("Create namespace for %d", i))
			// defer oc.WithoutNamespace().AsAdmin().Run("delete").Args("ns", ns, "--ignore-not-found").Execute()
			// deleting the namespaces takes time and is unnecessary; 5.5h is currently not enough to delete them all,
			// so we keep the namespaces to save case duration
			err := oc.WithoutNamespace().AsAdmin().Run("create").Args("ns", ns).Execute()
			o.Expect(err).NotTo(o.HaveOccurred())
			o.Expect(olmv1util.Appearance(oc, exutil.Appear, "ns", ns)).To(o.BeTrue())

			g.By(fmt.Sprintf("Create clustercatalog for %d", i))
			e2e.Logf("=========Create clustercatalog %v=========", clustercatalog.Name)
			defer clustercatalog.Delete(oc)
			err = clustercatalog.CreateWithoutCheck(oc)
			o.Expect(err).NotTo(o.HaveOccurred())
			clustercatalog.WaitCatalogStatus(oc, "true", "Serving", 0)

			g.By(fmt.Sprintf("Create SA for clusterextension for %d", i))
			defer saCrb.Delete(oc)
			saCrb.Create(oc)

			g.By(fmt.Sprintf("check ce to be installed for %d", i))
			e2e.Logf("=========Create clusterextension %v=========", ce.Name)
			defer ce.Delete(oc)
			err = ce.CreateWithoutCheck(oc)
			o.Expect(err).NotTo(o.HaveOccurred())
			ce.CheckClusterExtensionCondition(oc, "Progressing", "reason", "Succeeded", 10, 600, 0)
			ce.WaitClusterExtensionCondition(oc, "Installed", "True", 0)
		}

		endTime := time.Now().UTC()
		e2e.Logf("End time: %v", endTime.Format(time.RFC3339))

		duration := endTime.Sub(startTime)
		minutes := int(duration.Minutes())
		if minutes < 1 {
			minutes = 1
		}

		podName, err := oc.AsAdmin().WithoutNamespace().Run("get").Args("pods", "-l", catalogLabel, "-o=jsonpath={.items[0].metadata.name}", "-n", nsCatalog).Output()
		if err == nil {
			if !olmv1util.WriteErrToArtifactDir(oc, nsCatalog, podName, "error", "Unhandled|Reconciler error|level=info", caseID, minutes) {
				e2e.Logf("no error log into artifact for pod %s in %s", podName, nsCatalog)
			}
		}
		podName, err = oc.AsAdmin().WithoutNamespace().Run("get").Args("pods", "-l", ocLabel, "-o=jsonpath={.items[0].metadata.name}", "-n", nsOc).Output()
		if err == nil {
			if !olmv1util.WriteErrToArtifactDir(oc, nsOc, podName, "error", "Unhandled|Reconciler error|level=info", caseID, minutes) {
				e2e.Logf("no error log into artifact for pod %s in %s", podName, nsOc)
			}
		}

		if !olmv1util.IsPodReady(oc, nsCatalog, catalogLabel) {
			_, _ = olmv1util.Get(oc, "pod", "-n", nsCatalog, "-l", catalogLabel, "-o", "yaml")
			exutil.AssertWaitPollNoErr(fmt.Errorf("the pod with %s is not correct", catalogLabel), "the pod with app=catalog-operator is not correct")
		}
		if !olmv1util.IsPodReady(oc, nsOc, ocLabel) {
			_, _ = olmv1util.Get(oc, "pod", "-n", nsOc, "-l", ocLabel, "-o", "yaml")
			exutil.AssertWaitPollNoErr(fmt.Errorf("the pod with %s is not correct", ocLabel), "the pod with app=olm-operator is not correct")
		}

	})
})
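
Since the loop bounds above are easy to misread: the spec runs 69 rounds (i = 900 through 968), and the round counter feeds every resource name plus the catalog image tag, so each round installs a distinct pre-built index image. A small standalone illustration of that naming scheme (derived from the constants above, not part of the committed file):

```go
package main

import "fmt"

func main() {
	// Walk the first and last rounds of the naming scheme used by PolarionID:81509.
	const caseID = "81509"
	for _, i := range []int{900, 968} {
		fmt.Printf("round %d:\n", i)
		fmt.Printf("  namespace: ns-%s-%d\n", caseID, i)
		fmt.Printf("  catalog:   catalog-%s-%d\n", caseID, i)
		fmt.Printf("  image:     quay.io/olmqe/stress-index:vokv%d\n", i)
		fmt.Printf("  package:   stress-olmv1-c%d\n", i)
	}
}
```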

openshift/tests-extension/test/qe/util/architecture/architecture.go

Lines changed: 6 additions & 6 deletions
@@ -80,10 +80,10 @@ func SkipNonAmd64SingleArch(oc *exutil.CLI) Architecture {
 func getNodeArchitectures(oc *exutil.CLI) []string {
 	output, err := oc.WithoutNamespace().AsAdmin().Run("get").Args("nodes", "-o=jsonpath={.items[*].status.nodeInfo.architecture}").Output()
 	if err != nil {
-		e2e.Failf("unable to get cluster node architectures: %v", err)
+		g.Skip(fmt.Sprintf("unable to get cluster node architectures: %v", err))
 	}
 	if output == "" {
-		e2e.Failf("no nodes found or architecture information missing")
+		g.Skip("no nodes found or architecture information missing")
 	}
 	return strings.Fields(output) // Use Fields instead of Split to handle multiple spaces
 }
@@ -97,7 +97,7 @@ func getNodeArchitectures(oc *exutil.CLI) []string {
 func GetAvailableArchitecturesSet(oc *exutil.CLI) []Architecture {
 	architectureStrings := getNodeArchitectures(oc)
 	if len(architectureStrings) == 0 {
-		e2e.Failf("no node architectures found")
+		g.Skip("no node architectures found")
 	}
 
 	// Use map for deduplication with Architecture as key
@@ -199,7 +199,7 @@ func (a Architecture) String() string {
 func ClusterArchitecture(oc *exutil.CLI) Architecture {
 	architectureStrings := getNodeArchitectures(oc)
 	if len(architectureStrings) == 0 {
-		e2e.Failf("no node architectures found")
+		g.Skip("no node architectures found")
 	}
 
 	// Filter out empty strings and convert to Architecture
@@ -211,7 +211,7 @@ func ClusterArchitecture(oc *exutil.CLI) Architecture {
 	}
 
 	if len(architectures) == 0 {
-		e2e.Failf("no valid node architectures found")
+		g.Skip("no valid node architectures found")
 	}
 
 	// Check if all architectures are the same
@@ -267,7 +267,7 @@ func GetControlPlaneArch(oc *exutil.CLI) Architecture {
 
 	architectureStr = strings.TrimSpace(architectureStr)
 	if architectureStr == "" {
-		e2e.Failf("Control plane node %s has no architecture information", masterNode)
+		g.Skip(fmt.Sprintf("Control plane node %s has no architecture information", masterNode))
 	}
 
 	return FromString(architectureStr)

openshift/tests-extension/test/qe/util/olmv1util/helper.go

Lines changed: 1 addition & 1 deletion
@@ -590,7 +590,7 @@ func HasExternalNetworkAccess(oc *exutil.CLI) bool {
 	// Note: In disconnected environments, curl will fail and bash will return non-zero exit code,
 	// causing DebugNodeWithChroot to return an error. We ignore this error and rely on output checking.
 	cmd := `timeout 10 curl -k https://quay.io > /dev/null 2>&1; [ $? -eq 0 ] && echo "connected"`
-	output, _ := exutil.DebugNodeWithChroot(oc, masterNode, "bash", "-c", cmd)
+	output, _ := exutil.DebugNodeWithOptionsAndChroot(oc, masterNode, []string{"--to-namespace=default"}, "bash", "-c", cmd)
 
 	// Check if the output contains "connected"
 	// - Connected environment: curl succeeds -> echo "connected" -> output contains "connected"
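
The replacement passes `--to-namespace=default`, so the node debug pod runs in the `default` namespace instead of whatever namespace the CLI currently targets. A minimal sketch of how a spec might gate on this helper (the guard below is illustrative, not part of this commit):

```go
// Hypothetical connected-only guard, using the same imports as the
// stress spec above (olmv1util, g for ginkgo).
if !olmv1util.HasExternalNetworkAccess(oc) {
	g.Skip("cluster nodes cannot reach quay.io; skipping connected-only scenario")
}
```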
Lines changed: 80 additions & 0 deletions
@@ -0,0 +1,80 @@
# OLM v1 Stress Testing Tools

This directory contains tools and configuration files for OLM v1 stress testing. These tools are used by the `openshift-e2e-test-olm-qe-stress` Prow job chain.

## Directory Structure

```
stress/
├── manifests/
│   └── config/
│       └── pkg-ins-v1/                  # OLM v1 stress test configurations
│           ├── pkg-ins-v1.yml           # Main kube-burner configuration
│           ├── metrics-endpoint.yml
│           ├── metrics-profiles/
│           │   └── metrics-aggregated.yml
│           └── templates/               # Resource templates for stress testing
│               ├── catalogd.yml         # ClusterCatalog template
│               ├── ce.yml               # ClusterExtension template
│               ├── sa.yml               # ServiceAccount template
│               ├── clusterrole.yml
│               └── clusterrolebinding.yml
└── util/
    └── ma/                              # Metrics analysis Python package
        ├── cli/                         # CLI commands
        │   ├── cmd_group.py
        │   └── cmd_check_ccpu.py
        └── helper/                      # Helper modules
            ├── util.py
            ├── containercpu.py
            ├── exceptions.py
            ├── algo.py
            └── const.py
```

## Purpose

This directory supports stress testing for OLM v1 by providing:

1. **Kube-burner Configuration**: `pkg-ins-v1.yml` defines the stress test job that creates multiple ClusterCatalogs and ClusterExtensions (see the sketch after this list)
2. **Resource Templates**: YAML templates for creating OLM v1 resources at scale
3. **Metrics Analysis**: Python tools for analyzing CPU and performance metrics during stress tests
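
A minimal sketch of what a kube-burner job definition of this shape could look like. This is illustrative only: the field names follow the public kube-burner job schema, but all values, iteration counts, and template pairings are assumptions, not the contents of the real `pkg-ins-v1.yml` (which this commit adds but this page does not display):

```yaml
# Hypothetical kube-burner configuration sketch (values are assumptions).
jobs:
  - name: pkg-ins-v1
    jobIterations: 100          # rounds of object creation
    qps: 5                      # client-side request rate
    burst: 10
    namespacedIterations: true  # give each iteration its own namespace
    namespace: stress-olmv1
    waitWhenFinished: true      # block until created objects settle
    objects:
      - objectTemplate: templates/sa.yml        # ServiceAccount per round
        replicas: 1
      - objectTemplate: templates/catalogd.yml  # ClusterCatalog per round
        replicas: 1
      - objectTemplate: templates/ce.yml        # ClusterExtension per round
        replicas: 1
```

The Prow step would then drive it with an invocation along the lines of `kube-burner init -c pkg-ins-v1.yml --metrics-endpoint metrics-endpoint.yml --uuid <run-id>` (flags per the kube-burner documentation linked below; the exact command used by the job is not shown in this commit).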
## Usage Context

These tools are **NOT** used by the Golang test cases directly. Instead, they are used by:

- **Prow Job**: `openshift-e2e-test-olm-qe-stress`
- **Test Chain**: `stress-olm` (referenced in CI operator config)

The Prow job uses kube-burner with these configurations to create hundreds of OLM v1 resources concurrently and measure system behavior under load.

## Relationship to Test Cases

The Golang test case in `specs/olmv1_stress.go` (PolarionID:81509) is a **functional stress test** that validates OLM v1 can install mass operators correctly. It differs from these kube-burner tools:

- **Golang Test (81509)**: Validates functional correctness of installing many operators
- **Kube-burner Tools**: Measure performance and resource usage under extreme load

Both are important for ensuring OLM v1 can handle production workloads at scale.

## Metrics Analysis

The `ma` (Metrics Analysis) Python package provides tools to analyze metrics collected during stress tests:

- **cmd_check_ccpu.py**: Check catalogd controller CPU usage
- **containercpu.py**: Analyze container CPU metrics
- **algo.py**: Statistical analysis algorithms for metrics

## Maintenance Notes

- This directory contains **OLM v1 specific** stress tools only
- OLM v0 stress tools (`pkg-ins`) have been removed during migration
- Template files reference OLM v1 resources: ClusterCatalog, ClusterExtension
- Image prefix: `quay.io/olmqe/stress-index:vokv*` (stress test catalog images)

## Related Documentation

- [Kube-burner Documentation](https://kube-burner.readthedocs.io/)
- [OLM v1 Stress Test Case](../../specs/olmv1_stress.go)
- [CI Operator Config](https://github.com/openshift/release/tree/master/ci-operator/config/openshift/openshift-tests-private)
stress/manifests/config/pkg-ins-v1/metrics-endpoint.yml

Lines changed: 9 additions & 0 deletions

@@ -0,0 +1,9 @@
- endpoint: {{.PROMETHEUS_URL}}
  token: {{.PROMETHEUS_TOKEN}}
  step: 10s
  skipTLSVerify: true
  metrics:
    - metrics-profiles/metrics-aggregated.yml
  indexer:
    type: local
    metricsDirectory: collected-metrics-{{.UUID}}
stress/manifests/config/pkg-ins-v1/metrics-profiles/metrics-aggregated.yml

Lines changed: 7 additions & 0 deletions

@@ -0,0 +1,7 @@
# Containers & pod metrics

- query: (sum(irate(container_cpu_usage_seconds_total{container="manager",namespace="openshift-catalogd"}[2m]) * 100) by (container, pod)) > 0
  metricName: containerCPU-Catlogd

- query: (sum(irate(container_cpu_usage_seconds_total{container="manager",namespace="openshift-operator-controller"}[2m]) * 100) by (container, pod)) > 0
  metricName: containerCPU-OpCon
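
Reading the two queries: `irate(container_cpu_usage_seconds_total{...}[2m])` gives each `manager` container's per-second CPU consumption in cores over a 2-minute window; multiplying by 100 and summing `by (container, pod)` expresses that as a percentage of one core per pod, and the trailing `> 0` drops idle series so only active pods get indexed. The metric names distinguish catalogd (`containerCPU-Catlogd`, spelled as in the committed config) from operator-controller (`containerCPU-OpCon`).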
