
Commit 3f631ff

Merge pull request #1 from canonical/DPE-5997-py-wrapper
[DPE-6253] Add benchmark wrapper logic
2 parents 894773b + 464a6a8 commit 3f631ff

10 files changed: +3332 -0 lines changed

poetry.lock

+2,333
Some generated files are not rendered by default.

pyproject.toml

+129
@@ -0,0 +1,129 @@
# Copyright 2023 Canonical Ltd.
# See LICENSE file for licensing details.

[tool.poetry]
package-mode = false
requires-poetry = ">=2.0.0"

[tool.poetry.dependencies]
python = "^3.10"
ops = "^2.17.0"
tenacity = "^9.0.0"
jinja2 = "^3.1.4"
overrides = "7.7.0"
requests = "2.32.3"
shortuuid = "1.0.13"
cryptography = "^43.0.1"
jsonschema = "^4.23.0"
prometheus-client = ">=0.19.0"
pydantic = "^1.10.18, <2"
# pydantic = ">=2.0,<3.0"
fastapi = ">=0.115.0"
uvicorn = ">0.11.5"
kafka-python = ">=2.0"

[tool.poetry.group.charm-libs.dependencies]
# data_platform_libs/v0/data_interfaces.py
ops = "^2.17"
# data_platform_libs/v0/upgrade.py
# grafana_agent/v0/cos_agent.py requires pydantic <2
pydantic = "^1.10, <2"
# tls_certificates_interface/v1/tls_certificates.py
cryptography = "^43.0.0"
jsonschema = "^4.23.0"
# grafana_agent/v0/cos_agent.py
cosl = "^0.0.41"
bcrypt = "^4.1.3"

[tool.poetry.group.format]
optional = true

[tool.poetry.group.format.dependencies]
ruff = "^0.6.8"

[tool.poetry.group.lint]
optional = true

[tool.poetry.group.lint.dependencies]
codespell = "^2.3.0"
shellcheck-py = "^0.10.0.1"

[tool.poetry.group.unit.dependencies]
pytest = "^8.3.3"
pytest-asyncio = "^0.21.2"
coverage = {extras = ["toml"], version = "^7.6.1"}
parameterized = "^0.9.0"

[tool.poetry.group.integration.dependencies]
pytest = "^8.3.3"
pytest-github-secrets = {git = "https://github.com/canonical/data-platform-workflows", tag = "v24.0.6", subdirectory = "python/pytest_plugins/github_secrets"}
pytest-operator = "^0.37.0"
pytest-operator-cache = {git = "https://github.com/canonical/data-platform-workflows", tag = "v24.0.6", subdirectory = "python/pytest_plugins/pytest_operator_cache"}
pytest-operator-groups = {git = "https://github.com/canonical/data-platform-workflows", tag = "v24.0.6", subdirectory = "python/pytest_plugins/pytest_operator_groups"}
pytest-microceph = {git = "https://github.com/canonical/data-platform-workflows", tag = "v24.0.6", subdirectory = "python/pytest_plugins/microceph"}
juju = "^3.5.2"
ops = "^2.17.0"
tenacity = "^9.0.0"
pyyaml = "^6.0.2"
urllib3 = "^2.2.3"
protobuf = "5.28.2"

[tool.coverage.run]
branch = true

[tool.coverage.report]
show_missing = true

[tool.pytest.ini_options]
minversion = "6.0"
log_cli_level = "INFO"
markers = ["unstable"]
asyncio_mode = "auto"

# Formatting tools configuration
[tool.black]
line-length = 99
target-version = ["py310"]

# Linting tools configuration
[tool.ruff]
# preview and explicit preview are enabled for CPY001
preview = true
target-version = "py310"
src = ["src", "."]
line-length = 99

[tool.ruff.lint]
explicit-preview-rules = true
select = ["A", "E", "W", "F", "C", "N", "D", "I001", "CPY001"]
extend-ignore = [
    "D203",
    "D204",
    "D213",
    "D215",
    "D400",
    "D404",
    "D406",
    "D407",
    "D408",
    "D409",
    "D413",
]
# Ignore E501 because using black creates errors with this
# Ignore D107 Missing docstring in __init__
ignore = ["E501", "D107"]

[tool.ruff.lint.per-file-ignores]
"tests/*" = ["D100", "D101", "D102", "D103", "D104"]

[tool.ruff.lint.flake8-copyright]
# Check for properly formatted copyright header in each file
author = "Canonical Ltd."
notice-rgx = "Copyright\\s\\d{4}([-,]\\d{4})*\\s+"
min-file-size = 1

[tool.ruff.lint.mccabe]
max-complexity = 10

[tool.ruff.lint.pydocstyle]
convention = "google"
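
Note: pydantic is pinned to the 1.x series here (the 2.x constraint is left commented out), in part because grafana_agent's cos_agent charm library still requires pydantic <2. The wrapper code later in this commit therefore relies on pydantic v1 APIs. The snippet below is a minimal illustration of what the pin implies; the Example model is made up for illustration and is not part of the diff.

# pydantic v1 API used by the wrapper code in this commit (see core.py and main.py below);
# the "^1.10.18, <2" pin keeps these calls available.
from pydantic import BaseModel


class Example(BaseModel):  # illustrative model, not part of the diff
    threads: int = 1


sample = Example.parse_obj({"threads": 4})  # pydantic 2 deprecates this in favour of model_validate()
as_dict = sample.dict()                     # pydantic 2 deprecates this in favour of model_dump()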

src/benchmark/literals.py

+6
@@ -0,0 +1,6 @@
# Copyright 2024 Canonical Ltd.
# See LICENSE file for licensing details.

"""This module contains the constants and models used by the sysbench charm."""

BENCHMARK_WORKLOAD_PATH = "/root/.benchmark/charmed_parameters"

src/benchmark/wrapper/core.py

+133
@@ -0,0 +1,133 @@
# Copyright 2024 Canonical Ltd.
# See LICENSE file for licensing details.

"""The core models for the wrapper script."""

from enum import Enum

from prometheus_client import Gauge
from pydantic import BaseModel


class BenchmarkCommand(str, Enum):
    """Enum to hold the benchmark phase."""

    PREPARE = "prepare"
    RUN = "run"
    STOP = "stop"
    COLLECT = "collect"
    UPLOAD = "upload"
    CLEANUP = "cleanup"


class ProcessStatus(str, Enum):
    """Enum to hold the process status."""

    RUNNING = "running"
    STOPPED = "stopped"
    ERROR = "error"
    TO_START = "to_start"


class ProcessModel(BaseModel):
    """Model to hold the process information."""

    cmd: str
    pid: int = -1
    status: str = ProcessStatus.TO_START
    user: str | None = None
    group: str | None = None
    cwd: str | None = None


class MetricOptionsModel(BaseModel):
    """Model to hold the metrics."""

    label: str | None = None
    extra_labels: list[str] = []
    description: str | None = None


class WorkloadCLIArgsModel(BaseModel):
    """Model to hold the workload options."""

    test_name: str
    command: BenchmarkCommand
    workload: str
    threads: int
    parallel_processes: int
    duration: int
    run_count: int
    report_interval: int
    extra_labels: str
    peers: str
    log_file: str = "/var/log/dpe_benchmark_workload.log"
    is_coordinator: bool


class BenchmarkMetrics:
    """Class to hold the benchmark metrics."""

    def __init__(
        self,
        options: MetricOptionsModel,
    ):
        self.options = options
        self.metrics = {}

    def add(self, sample: BaseModel):
        """Add the benchmark to the prometheus metric."""
        for key, value in sample.dict().items():
            if f"{self.options.label}_{key}" not in self.metrics:
                self.metrics[f"{self.options.label}_{key}"] = Gauge(
                    f"{self.options.label}_{key}",
                    f"{self.options.description} {key}",
                    ["model", "unit"],
                )
            self.metrics[f"{self.options.label}_{key}"].labels(*self.options.extra_labels).set(
                value
            )


class KafkaBenchmarkSample(BaseModel):
    """Sample from the benchmark tool."""

    produce_rate: float  # in msgs / s
    produce_throughput: float  # in MB/s
    produce_error_rate: float  # in err/s

    produce_latency_avg: float  # in (ms)
    produce_latency_50: float
    produce_latency_99: float
    produce_latency_99_9: float
    produce_latency_max: float

    produce_delay_latency_avg: float  # in (us)
    produce_delay_latency_50: float
    produce_delay_latency_99: float
    produce_delay_latency_99_9: float
    produce_delay_latency_max: float

    consume_rate: float  # in msgs / s
    consume_throughput: float  # in MB/s
    consume_backlog: float  # in KB


class KafkaBenchmarkSampleMatcher(Enum):
    """Hard-coded regexes to process the benchmark sample."""

    produce_rate: str = r"Pub rate\s+(.*?)\s+msg/s"
    produce_throughput: str = r"Pub rate\s+\d+.\d+\s+msg/s\s+/\s+(.*?)\s+MB/s"
    produce_error_rate: str = r"Pub err\s+(.*?)\s+err/s"
    produce_latency_avg: str = r"Pub Latency \(ms\) avg:\s+(.*?)\s+"
    # Match: Pub Latency (ms) avg: 1478.1 - 50%: 1312.6 - 99%: 4981.5 - 99.9%: 5104.7 - Max: 5110.5
    # Generates: [('1478.1', '1312.6', '4981.5', '5104.7', '5110.5')]
    produce_latency_percentiles: str = r"Pub Latency \(ms\) avg:\s+(.*?)\s+- 50%:\s+(.*?)\s+- 99%:\s+(.*?)\s+- 99.9%:\s+(.*?)\s+- Max:\s+(.*?)\s+"

    # Pub Delay Latency (us) avg: 21603452.9 - 50%: 21861759.0 - 99%: 23621631.0 - 99.9%: 24160895.0 - Max: 24163839.0
    # Generates: [('21603452.9', '21861759.0', '23621631.0', '24160895.0', '24163839.0')]
    produce_latency_delay_percentiles: str = r"Pub Delay Latency \(us\) avg:\s+(.*?)\s+- 50%:\s+(.*?)\s+- 99%:\s+(.*?)\s+- 99.9%:\s+(.*?)\s+- Max:\s+(\d+\.\d+)"

    consume_rate: str = r"Cons rate\s+(.*?)\s+msg/s"
    consume_throughput: str = r"Cons rate\s+\d+.\d+\s+msg/s\s+/\s+(.*?)\s+MB/s"
    consume_backlog: str = r"Backlog:\s+(.*?)\s+K"
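
The matcher regexes above can be checked directly against the sample lines quoted in the comments. The snippet below is a minimal sketch, not part of this commit, assuming the flat import layout used by main.py below.

# Illustrative sketch (not part of the diff): applying one of the matcher
# regexes to the sample line quoted in the comments above.
import re

from core import KafkaBenchmarkSampleMatcher  # assumes the flat imports used by main.py

# Note the trailing space: the pattern ends with \s+ after the Max value.
line = "Pub Latency (ms) avg: 1478.1 - 50%: 1312.6 - 99%: 4981.5 - 99.9%: 5104.7 - Max: 5110.5 "
# findall returns one tuple per match because the pattern defines several groups
percentiles = re.findall(KafkaBenchmarkSampleMatcher.produce_latency_percentiles.value, line)
# percentiles == [('1478.1', '1312.6', '4981.5', '5104.7', '5110.5')]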

src/benchmark/wrapper/main.py

+75
@@ -0,0 +1,75 @@
#!/usr/bin/python3
# Copyright 2024 Canonical Ltd.
# See LICENSE file for licensing details.

"""This script runs the benchmark tool, collects its output and forwards to prometheus."""

import logging
import signal

from core import WorkloadCLIArgsModel
from process import WorkloadToProcessMapping
from prometheus_client import start_http_server


class MainWrapper:
    """Main class to manage the benchmark tool."""

    mapping: WorkloadToProcessMapping

    def __init__(self, args: WorkloadCLIArgsModel):
        self.args = args

    def run(self):
        """Prepares the workload and runs the benchmark."""
        manager, _ = self.mapping.map(self.args.command)

        logging.basicConfig(filename=self.args.log_file, encoding="utf-8", level=logging.INFO)

        def _exit(*args, **kwargs):
            manager.stop()

        signal.signal(signal.SIGINT, _exit)
        signal.signal(signal.SIGTERM, _exit)
        start_http_server(8008)

        # Start the manager and process the output
        manager.start()
        # Now, start the event loop to monitor the processes:
        manager.run()


# EXAMPLE
# The code below is an example usage of the main function + the wrapper classes
#
# if __name__ == "__main__":
#     parser = argparse.ArgumentParser(
#         prog="wrapper", description="Runs the benchmark command as an argument."
#     )
#     parser.add_argument("--test_name", type=str, help="Test name to be used")
#     parser.add_argument("--command", type=str, help="Command to be executed", default="run")
#     parser.add_argument(
#         "--workload", type=str, help="Name of the workload to be executed", default="default"
#     )
#     parser.add_argument("--report_interval", type=int, default=10)
#     parser.add_argument("--parallel_processes", type=int, default=1)
#     parser.add_argument("--threads", type=int, default=1)
#     parser.add_argument("--duration", type=int, default=0)
#     parser.add_argument("--run_count", type=int, default=1)
#     parser.add_argument(
#         "--target_hosts", type=str, default="", help="comma-separated list of target hosts"
#     )
#     parser.add_argument(
#         "--log_file", type=str, default="/var/log/dpe_benchmark_workload.log", help="Log file for all threads"
#     )
#     parser.add_argument(
#         "--extra_labels",
#         type=str,
#         help="comma-separated list of extra labels to be used.",
#         default="",
#     )
#     # Parse the arguments as dictionary, using the same logic as:
#     # https://github.com/python/cpython/blob/ \
#     # 47c5a0f307cff3ed477528536e8de095c0752efa/Lib/argparse.py#L134
#     args = parser.parse_args().__dict__ | {"command": BenchmarkCommand(parser.parse_args().command)}
#     MainWrapper(WorkloadCLIArgsModel.parse_obj(args)).run()
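
MainWrapper declares mapping as a class attribute but never assigns it, so a workload-specific entry point is expected to supply a WorkloadToProcessMapping (defined in this commit's process module, which is imported above but not shown in this excerpt) before run() is called. The fragment below is a hypothetical sketch of that wiring; the KafkaMainWrapper name and its constructor are assumptions, not part of this PR.

# Hypothetical wiring, not part of this commit: a workload entry point that
# supplies the process mapping before the wrapper runs.
from core import WorkloadCLIArgsModel
from main import MainWrapper
from process import WorkloadToProcessMapping  # imported by main.py; definition not shown in this excerpt


class KafkaMainWrapper(MainWrapper):
    """Illustrative subclass; the real workload glue may differ."""

    def __init__(self, args: WorkloadCLIArgsModel, mapping: WorkloadToProcessMapping):
        super().__init__(args)
        # The concrete mapping is built by workload-specific code; its constructor
        # is not part of this excerpt, so a ready-made instance is passed in here.
        self.mapping = mapping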

0 commit comments