docs: add metrics generation validation

fix: windows gitbash support fix: new name found with no group vector_search/vector_store_client.cc 343 fix: rm allowmismatch fix: git bash (windows) compatibility fix: git bash (windows) compatibility Closes scylladb/scylladb#26173
2025-09-21 22:53:35 +01:00
parent b911a643fd
commit 64a65cac55
7 changed files with 246 additions and 33 deletions
--- a/.github/workflows/docs-validate-metrics.yml
+++ b/.github/workflows/docs-validate-metrics.yml
@@ -0,0 +1,34 @@
+name: Docs / Validate metrics
+
+on:
+  pull_request:
+    branches:
+      - master
+      - enterprise
+    paths:
+      - '**/*.cc'
+      - 'scripts/metrics-config.yml' 
+      - 'scripts/get_description.py'
+      - 'docs/_ext/scylladb_metrics.py'
+
+jobs:
+  validate-metrics:
+    runs-on: ubuntu-latest
+    name: Check metrics documentation coverage
+    
+    steps:
+    - name: Checkout code
+      uses: actions/checkout@v4
+      with:
+        submodules: true
+      
+    - name: Set up Python
+      uses: actions/setup-python@v6
+      with:
+        python-version: '3.10'
+        
+    - name: Install dependencies
+      run: pip install PyYAML
+        
+    - name: Validate metrics
+      run: python3 scripts/get_description.py --validate -c scripts/metrics-config.yml
--- a/docs/README-metrics.md
+++ b/docs/README-metrics.md
@@ -0,0 +1,65 @@
+# ScyllaDB metrics docs scripts
+
+The following files extracts metrics from C++ source files and generates documentation:
+
+- **`scripts/get_description.py`** - Metrics parser and extractor
+- **`scripts/metrics-config.yml`** - Configuration for special cases only
+- **`docs/_ext/scylladb_metrics.py`** - Sphinx extension for rendering
+
+## Configuration
+
+The system automatically handles most metrics extraction. You only need configuration in the `metrics-config.yml` file for:
+
+**Complex parameter combinations:**
+```yaml
+"cdc/log.cc":
+  params:
+    part_name;suffix: [["static_row", "total"], ["clustering_row", "failed"]]
+    kind: ["total", "failed"]
+```
+
+**Multiple parameter values:**
+```yaml
+"service/storage_proxy.cc":
+  params:
+    _short_description_prefix: ["total_write_attempts", "write_errors"]
+```
+
+**Complex expressions:**
+```yaml
+"tracing/tracing.cc":
+  params:
+    "max_pending_trace_records + write_event_records_threshold": "max_pending_trace_records + write_event_records_threshold"
+```
+
+**Group assignments:**
+```yaml
+"cql3/query_processor.cc":
+  groups:
+    "80": query_processor
+```
+
+**Skip files:**
+```yaml
+"seastar/tests/unit/metrics_test.cc": skip
+```
+
+## Validation
+
+Use the built-in validation to check all metrics files:
+
+```bash
+# Validate all metrics files
+python scripts/get_description.py --validate -c scripts/metrics-config.yml
+
+# Validate with verbose output
+python scripts/get_description.py --validate -c scripts/metrics-config.yml -v
+```
+
+The GitHub workflow `docs-validate-metrics.yml` automatically runs validation on PRs to `master` that modify `.cc` files or metrics configuration.
+
+## Common fixes
+
+- **"Parameter not found"**: Add parameter mapping to config `params` section
+- **"Could not resolve param"**: Check parameter name matches C++ code exactly
+- **"No group found"**: Add group mapping or verify `add_group()` calls
--- a/docs/_ext/scylladb_metrics.py
+++ b/docs/_ext/scylladb_metrics.py
@@ -32,17 +32,29 @@ class MetricsProcessor:
            content = f.read()
        if self.MARKER in content and not os.path.exists(destination_path):
            try:
-                metrics_file = metrics.get_metrics_from_file(file_path, "scylla", metrics.get_metrics_information(metrics_config_path))
-                with open(destination_path, 'w+', encoding='utf-8') as f:
-                    json.dump(metrics_file, f, indent=4)
-            except SystemExit:
-                LOGGER.info(f'Skipping file: {file_path}')
+                metrics_info = metrics.get_metrics_information(metrics_config_path)
+                
+                # Get relative path to the repo root
+                relative_path = os.path.relpath(file_path, os.path.dirname(os.path.dirname(os.path.dirname(__file__))))
+                repo_root = os.path.dirname(os.path.dirname(os.path.dirname(__file__)))
+                old_cwd = os.getcwd()
+                os.chdir(repo_root)
+                
+                # Get metrics from the file
+                try:
+                    metrics_file = metrics.get_metrics_from_file(relative_path, "scylla_", metrics_info)
+                finally:
+                    os.chdir(old_cwd)
+                
+                if metrics_file:
+                    with open(destination_path, 'w+', encoding='utf-8') as f:
+                        json.dump(metrics_file, f, indent=4)
+                    LOGGER.info(f'Generated {len(metrics_file)} metrics for {file_path}')
+                else:
+                    LOGGER.info(f'No metrics generated for {file_path}')
+                    
            except Exception as error:
-                # Remove [Errno X] prefix from error message
-                error_msg = str(error)
-                if '[Errno' in error_msg:
-                    error_msg = error_msg.split('] ', 1)[1]
-                LOGGER.info(error_msg)
+                LOGGER.info(f'Error processing {file_path}: {str(error)}')

    def _process_metrics_files(self, repo_dir, output_directory, metrics_config_path):
        for root, _, files in os.walk(repo_dir):
@@ -163,7 +175,7 @@ class MetricsDirective(Directive):
        output = []
        try:
            relative_path_from_current_rst = self._get_relative_path(metrics_directory, app, docname)
-            files = os.listdir(metrics_directory)
+            files = sorted(os.listdir(metrics_directory))
            for _, file in enumerate(files):
                output.extend(self._process_file(file, relative_path_from_current_rst))
        except Exception as error:
--- a/docs/_ext/utils.py
+++ b/docs/_ext/utils.py
@@ -29,6 +29,7 @@ def readable_desc_rst(description):

        cleaned_line = cleaned_line.lstrip()
        cleaned_line = cleaned_line.replace('"', '')
+        cleaned_line = cleaned_line.replace('`', '\\`')
        
        if cleaned_line != '':
            cleaned_line = indent + cleaned_line
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -76,7 +76,7 @@ author = u"ScyllaDB Project Contributors"

 # List of patterns, relative to source directory, that match files and
 # directories to ignore when looking for source files.
-exclude_patterns = ['_build', 'Thumbs.db', '.DS_Store', 'lib', 'lib64','**/_common/*', 'README.md', 'index.md', '.git', '.github', '_utils', 'rst_include', 'venv', 'dev', '_data/**']
+exclude_patterns = ['_build', 'Thumbs.db', '.DS_Store', 'lib', 'lib64','**/_common/*', 'README.md', 'README-metrics.md', 'index.md', '.git', '.github', '_utils', 'rst_include', 'venv', 'dev', '_data/**']

 # The name of the Pygments (syntax highlighting) style to use.
 pygments_style = "sphinx"
--- a/scripts/get_description.py
+++ b/scripts/get_description.py
@@ -5,6 +5,7 @@ import re
 import yaml
 import json
 import inspect
+from pathlib import Path

 from encodings import undefined

@@ -150,15 +151,28 @@ def get_metrics_information(config_file):

 def get_metrics_from_file(file_name, prefix, metrics_information, verb=None):
    current_group = ""
-    clean_name = file_name[2:] if file_name.startswith('./') else file_name
+    # Normalize path for cross-platform compatibility
+    # Convert absolute paths to relative and backslashes to forward slashes
+    clean_name = file_name
+    if file_name.startswith('./'):
+        clean_name = file_name[2:]
+    else:
+        # Handle absolute paths (Windows: C:\..., Unix: /...)
+        file_path = Path(file_name)
+        if file_path.is_absolute():
+            try:
+                # Try to make it relative to current directory
+                clean_name = str(file_path.relative_to(Path.cwd()))
+            except ValueError:
+                # If not relative to cwd, just use the name as-is
+                clean_name = file_name
+    # Normalize backslashes to forward slashes for config file compatibility
+    clean_name = clean_name.replace('\\', '/')
    param_mapping = {}
    groups = {}
-    allowmismatch = False
    if clean_name in metrics_information:
        if (isinstance(metrics_information[clean_name], str) and metrics_information[clean_name] == "skip") or "skip" in metrics_information[clean_name]:
            exit(0)
-        if "allowmismatch" in metrics_information[clean_name]:
-            allowmismatch = metrics_information[clean_name]["allowmismatch"]
    param_mapping =  metrics_information[clean_name]["params"] if clean_name in metrics_information and "params" in metrics_information[clean_name] else {}
    groups = metrics_information[clean_name]["groups"] if clean_name in metrics_information and "groups" in metrics_information[clean_name] else {}

@@ -184,11 +198,26 @@ def get_metrics_from_file(file_name, prefix, metrics_information, verb=None):
                serching_group = False
                verbose(verb, "group found on new line", current_group)
            m = metric.match(line)
+            # Check if add_group and metric are on the same line
            if m and not current_group:
-                print("new name found with no group", file_name, line_number, line)
-                exit(-1)
+                gr_match = gr.match(line)
+                if gr_match:
+                    # Extract group from add_group on the same line
+                    current_group = gr_match.group(2)
+                    m_str = string_content.match(current_group)
+                    if m_str:
+                        current_group = m_str.group(1)
+                    else:
+                        m_alt = alternative_name.match(current_group)
+                        if m_alt:
+                            current_group = param_mapping[m_alt.group(1)] if m_alt.group(1) in param_mapping else m_alt.group(1)
+                    verbose(verb, "group found on same line as metric", current_group)
+                else:
+                    print("new name found with no group", file_name, line_number, line)
+                    exit(-1)
            if current_metric or m:
-                if gr.match(line):
+                # Only error if add_group appears after we've started processing a metric
+                if current_metric and gr.match(line):
                    print("add group found unexpectedly", file_name, line_number, line)
                    exit(-1)
                if current_metric and m:
@@ -236,11 +265,10 @@ def get_metrics_from_file(file_name, prefix, metrics_information, verb=None):
                        for idx, base_name in enumerate(name_list):
                            name = prefix + cg + "_" + base_name
                            description = description_list[0].replace('#','"') if len(description_list) == 1 else description_list[idx].replace('#','\\"')
-                            if not allowmismatch and name in metrics and description !=  metrics[name][1]:
-                                print('description problem, different descriptions found', file_name, line_number, names, typ, line, name, metrics[name][1], description)
-                                print(metrics[name][1])
-                                print(description)
-                                exit(-1)
+                            if name in metrics:
+                                if description != metrics[name][1]:
+                                    verbose(verb, f'Note: Multiple descriptions found for {name}, using first one from {metrics[name][4]}')
+                                continue
                            metrics[name] = [typ, description, cg, base_name, file_name + ":" + str(line_number)]
                    current_metric = ""
                    parenthes_count = 0
@@ -274,6 +302,75 @@ def write_metrics_to_file(out_file, metrics, fmt="pipe"):
                fo.write(l.replace('-','_')+'|' +'|'.join(metrics[l])+ '\n')


+def validate_all_metrics(prefix, config_file, verbose=False):
+    """Validate all metrics files and report issues"""
+    
+    print("Validating all metrics files...")
+    
+    # Use pathlib to find all .cc files (cross-platform)
+    try:
+        current_dir = Path('.')
+        all_cc_files = list(current_dir.rglob('*.cc'))
+        
+        # Filter files that contain '::description'
+        metric_files = []
+        for cc_file in all_cc_files:
+            try:
+                with open(cc_file, 'r', encoding='utf-8', errors='ignore') as f:
+                    content = f.read()
+                    if '::description' in content:
+                        # Normalize path to use forward slashes for cross-platform compatibility
+                        normalized_path = str(cc_file).replace('\\', '/')
+                        metric_files.append(normalized_path)
+            except Exception as e:
+                if verbose:
+                    print(f"[WARN] Could not read {cc_file}: {e}")
+                continue
+        
+    except Exception as e:
+        print(f"[ERROR] Error finding metrics files: {e}")
+        return False
+
+    
+    total_files = len(metric_files)
+    
+    print(f"Found {total_files} files with metrics")
+    
+    failed_files = []
+    total_metrics = 0
+    metrics_info = get_metrics_information(config_file)
+    
+    for file_path in metric_files:
+        try:
+            metrics = get_metrics_from_file(file_path, prefix, metrics_info, verbose)
+            metrics_count = len(metrics)
+            total_metrics += metrics_count
+            if verbose:
+                print(f"[OK] {file_path} - {metrics_count} metrics")
+            else:
+                print(f"[OK] {file_path}")
+        except Exception as e:
+            print(f"[ERROR] {file_path}")
+            print(f"   Error: {str(e)}")
+            failed_files.append((file_path, str(e)))
+    
+    
+    if failed_files:
+        print("\n[ERROR] METRICS VALIDATION FAILED")
+        print("Failed files:")
+        for file_path, error in failed_files:
+            print(f"   - {file_path}: {error}")
+        print(f"\nAdd missing parameters to {config_file}")
+        return False
+    else:
+        working_files = total_files - len(failed_files)
+        coverage_pct = (working_files * 100 // total_files) if total_files > 0 else 0
+        
+        print(f"\n[SUCCESS] All metrics files validated successfully")
+        print(f"   Files: {working_files}/{total_files} working ({coverage_pct}% coverage)")
+        print(f"   Metrics: {total_metrics} total processed")
+        return True
+
 if __name__ == '__main__':
    parser = argparse.ArgumentParser(description='get metrics descriptions from file', conflict_handler="resolve")
    parser.add_argument('-p', '--prefix', default="scylla_", help='the prefix added to the metrics names')
@@ -281,8 +378,17 @@ if __name__ == '__main__':
    parser.add_argument('-c', '--config-file', default="metrics-config.yml", help='The configuration file used to add extra data missing in the code')
    parser.add_argument('-v', '--verbose', action='store_true', default=False, help='When set prints verbose information')
    parser.add_argument('-F', '--format', default="pipe", help='Set the output format, can be pipe, or yml')
-    parser.add_argument('file', help='the file to parse')
+    parser.add_argument('--validate', action='store_true', help='Validate all metrics files instead of processing single file')
+    parser.add_argument('file', nargs='?', help='the file to parse (not needed with --validate)')

    args = parser.parse_args()
+    
+    if args.validate:
+        success = validate_all_metrics(args.prefix, args.config_file, args.verbose)
+        exit(0 if success else 1)
+    
+    if not args.file:
+        parser.error('file argument is required when not using --validate')
+    
    metrics = get_metrics_from_file(args.file, args.prefix, get_metrics_information(args.config_file), args.verbose)
    write_metrics_to_file(args.out_file, metrics, args.format)
--- a/scripts/metrics-config.yml
+++ b/scripts/metrics-config.yml
@@ -6,13 +6,10 @@
 "db/commitlog/commitlog.cc":
    params:
        metrics_category_name: ["commitlog", "schema_commitlog"]
-        cfg.max_active_flushes: "cfg.max_active_flushes"
+        "cfg.max_active_flushes": "cfg.max_active_flushes"
 "cql3/query_processor.cc":
    groups:
        "80": query_processor
-    allowmismatch: true
-"raft/server.cc":
-  allowmismatch: true
 "replica/dirty_memory_manager.cc":
  params:
    namestr: ["regular", "system"]
@@ -20,7 +17,6 @@
  params:
    stat_name: ["exclusive_row", "shared_row", "exclusive_partition", "shared_partition"]
 "replica/database.cc":
-  allowmismatch: true
  params:
    "_dirty_memory_manager.throttle_threshold()": "throttle threshold"
 "seastar/apps/metrics_tester/metrics_tester.cc": skip
@@ -32,10 +28,10 @@
    COORDINATOR_STATS_CATEGORY: "storage_proxy_coordinator"
    "storage_proxy_stats::COORDINATOR_STATS_CATEGORY": "storage_proxy_coordinator"
    REPLICA_STATS_CATEGORY: "storage_proxy_replica"
+    "storage_proxy_stats::REPLICA_STATS_CATEGORY": "storage_proxy_replica"
    _short_description_prefix: ["total_write_attempts", "write_errors", "background_replica_writes_failed", "read_repair_write_attempts"]
    _long_description_prefix: ["total number of write requests", "number of write requests that failed", "background_replica_writes_failed", "number of write operations in a read repair context"]
    _category: "storage_proxy_coordinator"
-  allowmismatch: true
 "thrift/server.cc": skip
 "tracing/tracing.cc":
  params:
@@ -44,7 +40,7 @@
  groups:
    "200": transport
  params:
-    _max_request_size: "max_request_size"
+    "_config.max_request_size": "max_request_size"
 "seastar/src/net/dpdk.cc": skip
 "db/hints/manager.cc":
    params:
@@ -67,6 +63,5 @@
        "_queue_name + \"_tx_frags\"": ["queue"]
        "_queue_name + \"_rx_frags\"": ["queue"]
 "alternator/stats.cc":
-  allowmismatch: true
  params:
    group_name: "alternator"