Add test to detect inline comments in Jinja2 expressions within YAML files

This test would have caught the bug reported where inline comments (#) within Jinja2 expressions in YAML task files caused Ansible template errors. The test: - Extracts and validates all Jinja2 expressions from YAML files - Specifically detects inline comments within {{ }} and {% %} blocks - Includes regression test for the exact reported bug pattern - Avoids false positives (# in strings, escaped #, comments outside expressions) - Focuses on the critical inline comment issue The original bug was in roles/strongswan/tasks/openssl.yml where comments like "# Per-deployment UUID..." were placed inside a Jinja2 expression, causing "unexpected char '#'" errors during playbook execution. 🤖 Generated with [Claude Code](https://claude.ai/code) Co-Authored-By: Claude <noreply@anthropic.com>
2025-09-05 19:43:22 +02:00 · 2025-08-07 10:46:35 -07:00 · 2025-08-07 10:46:35 -07:00 · ec4ba30325
commit ec4ba30325
parent 2ab57c3f6a
1 changed files with 379 additions and 0 deletions
--- a/tests/unit/test_yaml_jinja2_expressions.py
+++ b/tests/unit/test_yaml_jinja2_expressions.py
@ -0,0 +1,379 @@
 #!/usr/bin/env python3
 """
 Test that Jinja2 expressions within YAML files are valid.
 This catches issues like inline comments in Jinja2 expressions within YAML task files.
 """
 import re
 import sys
 from pathlib import Path
 import yaml
 from jinja2 import Environment, StrictUndefined, TemplateSyntaxError
 def find_yaml_files_with_jinja2():
    """Find all YAML files that might contain Jinja2 expressions."""
    yaml_files = []
    # Look for YAML files in roles that are likely to have Jinja2
    patterns = [
        'roles/**/tasks/*.yml',
        'roles/**/defaults/*.yml',
        'roles/**/vars/*.yml',
        'playbooks/*.yml',
        '*.yml'
    ]
    skip_dirs = {'.git', '.venv', 'venv', '.env', 'configs'}
    for pattern in patterns:
        for path in Path('.').glob(pattern):
            if not any(skip_dir in path.parts for skip_dir in skip_dirs):
                yaml_files.append(path)
    return sorted(yaml_files)
 def extract_jinja2_expressions(content):
    """Extract all Jinja2 expressions from text content."""
    expressions = []
    # Find {{ ... }} expressions (variable interpolations)
    for match in re.finditer(r'\{\{(.+?)\}\}', content, re.DOTALL):
        expressions.append({
            'type': 'variable',
            'content': match.group(1),
            'full': match.group(0),
            'start': match.start(),
            'end': match.end()
        })
    # Find {% ... %} expressions (control structures)
    for match in re.finditer(r'\{%(.+?)%\}', content, re.DOTALL):
        expressions.append({
            'type': 'control',
            'content': match.group(1),
            'full': match.group(0),
            'start': match.start(),
            'end': match.end()
        })
    return expressions
 def find_line_number(content, position):
    """Find the line number for a given position in content."""
    return content[:position].count('\n') + 1
 def validate_jinja2_expression(expression, context_vars=None):
    """
    Validate a single Jinja2 expression.
    Returns (is_valid, error_message)
    """
    if context_vars is None:
        context_vars = get_test_variables()
    # First check for inline comments - this is the main issue we want to catch
    if '#' in expression['content']:
        # Check if the # is within a list or dict literal
        content = expression['content']
        # Remove strings to avoid false positives
        cleaned = re.sub(r'"[^"]*"', '""', content)
        cleaned = re.sub(r"'[^']*'", "''", cleaned)
        # Look for # that appears to be a comment
        # The # should have something before it (not at start) and something after (the comment text)
        # Also check for # at the start of a line within the expression
        if '#' in cleaned:
            # Check each line in the cleaned expression
            for line in cleaned.split('\n'):
                line = line.strip()
                if '#' in line:
                    # If # appears and it's not escaped (\#)
                    hash_idx = line.find('#')
                    if hash_idx >= 0:
                        # Check if it's escaped
                        if hash_idx == 0 or line[hash_idx-1] != '\\':
                            # This looks like an inline comment
                            return False, "Inline comment (#) found in Jinja2 expression - comments must be outside expressions"
    try:
        env = Environment(undefined=StrictUndefined)
        # Add common Ansible filters (expanded list)
        env.filters['bool'] = lambda x: bool(x)
        env.filters['default'] = lambda x, d='': x if x else d
        env.filters['to_uuid'] = lambda x: 'mock-uuid'
        env.filters['b64encode'] = lambda x: 'mock-base64'
        env.filters['b64decode'] = lambda x: 'mock-decoded'
        env.filters['version'] = lambda x, op: True
        env.filters['ternary'] = lambda x, y, z=None: y if x else (z if z is not None else '')
        env.filters['regex_replace'] = lambda x, p, r: x
        env.filters['difference'] = lambda x, y: list(set(x) - set(y))
        env.filters['strftime'] = lambda fmt, ts: 'mock-timestamp'
        env.filters['int'] = lambda x: int(x) if x else 0
        env.filters['list'] = lambda x: list(x)
        env.filters['map'] = lambda x, *args: x
        env.tests['version'] = lambda x, op: True
        # Wrap the expression in appropriate delimiters for parsing
        if expression['type'] == 'variable':
            template_str = '{{' + expression['content'] + '}}'
        else:
            template_str = '{%' + expression['content'] + '%}'
        # Try to compile the template
        template = env.from_string(template_str)
        # Try to render it with test variables
        # This will catch undefined variables and runtime errors
        template.render(**context_vars)
        return True, None
    except TemplateSyntaxError as e:
        # Check for the specific inline comment issue
        if '#' in expression['content']:
            # Check if the # is within a list or dict literal
            content = expression['content']
            # Remove strings to avoid false positives
            cleaned = re.sub(r'"[^"]*"', '""', content)
            cleaned = re.sub(r"'[^']*'", "''", cleaned)
            # Look for # that appears to be a comment (not in string, not escaped)
            if re.search(r'[^\\\n]#[^\}]', cleaned):
                return False, "Inline comment (#) found in Jinja2 expression - comments must be outside expressions"
        return False, f"Syntax error: {e.message}"
    except Exception as e:
        # Be lenient - we mainly care about inline comments and basic syntax
        # Ignore runtime errors (undefined vars, missing attributes, etc.)
        error_str = str(e).lower()
        if any(ignore in error_str for ignore in ['undefined', 'has no attribute', 'no filter']):
            return True, None  # These are runtime issues, not syntax issues
        return False, f"Error: {str(e)}"
 def get_test_variables():
    """Get a comprehensive set of test variables for expression validation."""
    return {
        # Network configuration
        'IP_subject_alt_name': '10.0.0.1',
        'server_name': 'algo-vpn',
        'wireguard_port': 51820,
        'wireguard_network': '10.19.49.0/24',
        'wireguard_network_ipv6': 'fd9d:bc11:4021::/64',
        'strongswan_network': '10.19.48.0/24',
        'strongswan_network_ipv6': 'fd9d:bc11:4020::/64',
        # Feature flags
        'ipv6_support': True,
        'dns_encryption': True,
        'dns_adblocking': True,
        'wireguard_enabled': True,
        'ipsec_enabled': True,
        # OpenSSL/PKI
        'openssl_constraint_random_id': 'test-uuid-12345',
        'CA_password': 'test-password',
        'p12_export_password': 'test-p12-password',
        'ipsec_pki_path': '/etc/ipsec.d',
        'ipsec_config_path': '/etc/ipsec.d',
        'subjectAltName': 'IP:10.0.0.1,DNS:vpn.example.com',
        'subjectAltName_type': 'IP',
        # Ansible variables
        'ansible_default_ipv4': {'address': '10.0.0.1'},
        'ansible_default_ipv6': {'address': '2600:3c01::f03c:91ff:fedf:3b2a'},
        'ansible_distribution': 'Ubuntu',
        'ansible_distribution_version': '22.04',
        'ansible_date_time': {'epoch': '1234567890'},
        # User management
        'users': ['alice', 'bob', 'charlie'],
        'all_users': ['alice', 'bob', 'charlie', 'david'],
        # Common variables
        'item': 'test-item',
        'algo_provider': 'local',
        'algo_server_name': 'algo-vpn',
        'dns_servers': ['1.1.1.1', '1.0.0.1'],
        # OpenSSL version for conditionals
        'openssl_version': '3.0.0',
        # IPsec configuration
        'certificate_validity_days': 3650,
        'ike_cipher': 'aes128gcm16-prfsha512-ecp256',
        'esp_cipher': 'aes128gcm16-ecp256',
    }
 def validate_yaml_file(yaml_path, check_inline_comments_only=False):
    """
    Validate all Jinja2 expressions in a YAML file.
    Returns (has_inline_comments, list_of_inline_comment_errors, list_of_other_errors)
    """
    inline_comment_errors = []
    other_errors = []
    try:
        with open(yaml_path) as f:
            content = f.read()
        # First, check if it's valid YAML
        try:
            yaml.safe_load(content)
        except yaml.YAMLError:
            # YAML syntax error, not our concern here
            return False, [], []
        # Extract all Jinja2 expressions
        expressions = extract_jinja2_expressions(content)
        if not expressions:
            return False, [], []  # No Jinja2 expressions to validate
        # Validate each expression
        for expr in expressions:
            is_valid, error = validate_jinja2_expression(expr)
            if not is_valid:
                line_num = find_line_number(content, expr['start'])
                error_msg = f"{yaml_path}:{line_num}: {error}"
                # Separate inline comment errors from other errors
                if error and 'inline comment' in error.lower():
                    inline_comment_errors.append(error_msg)
                    # Show context for inline comment errors
                    if len(expr['full']) < 200:
                        inline_comment_errors.append(f"  Expression: {expr['full'][:100]}...")
                elif not check_inline_comments_only:
                    other_errors.append(error_msg)
    except Exception as e:
        if not check_inline_comments_only:
            other_errors.append(f"{yaml_path}: Error reading file: {e}")
    return len(inline_comment_errors) > 0, inline_comment_errors, other_errors
 def test_specific_openssl_expressions():
    """
    Test the specific expressions that had the inline comment bug.
    This is a regression test for the exact issue that was reported.
    """
    print("\n🔬 Testing specific OpenSSL expressions (regression test)...")
    # The problematic expression that was reported
    problematic_expr = """{{ [
  subjectAltName_type + ':' + IP_subject_alt_name + ('/255.255.255.255' if subjectAltName_type == 'IP' else ''),
  'DNS:' + openssl_constraint_random_id,        # Per-deployment UUID prevents cross-deployment reuse
  'email:' + openssl_constraint_random_id       # Unique email domain isolates certificate scope
 ] + (
  ['IP:' + ansible_default_ipv6['address'] + '/128'] if ipv6_support else []
 ) }}"""
    # The fixed expression (without inline comments)
    fixed_expr = """{{ [
  subjectAltName_type + ':' + IP_subject_alt_name + ('/255.255.255.255' if subjectAltName_type == 'IP' else ''),
  'DNS:' + openssl_constraint_random_id,
  'email:' + openssl_constraint_random_id
 ] + (
  ['IP:' + ansible_default_ipv6['address'] + '/128'] if ipv6_support else []
 ) }}"""
    test_cases = [
        ('Problematic (with inline comments)', problematic_expr, False),
        ('Fixed (without inline comments)', fixed_expr, True),
    ]
    errors = []
    for name, expr_content, should_pass in test_cases:
        expr = {
            'type': 'variable',
            'content': expr_content[2:-2],  # Remove {{ }}
            'full': expr_content
        }
        is_valid, error = validate_jinja2_expression(expr)
        if should_pass and not is_valid:
            errors.append(f"❌ {name}: Should have passed but failed with: {error}")
        elif not should_pass and is_valid:
            errors.append(f"❌ {name}: Should have failed but passed")
        else:
            status = "✅" if should_pass else "⚠️"
            result = "passed" if is_valid else f"failed with: {error}"
            print(f"  {status} {name}: {result}")
    if errors:
        print("\n❌ Regression test FAILED:")
        for error in errors:
            print(f"    {error}")
        return False
    else:
        print("  ✅ Regression test passed - would have caught the bug!")
        return True
 def main():
    """Main test function."""
    print("🔍 Validating Jinja2 expressions in YAML files for inline comments...\n")
    # First run the regression test
    regression_passed = test_specific_openssl_expressions()
    # Find all YAML files
    yaml_files = find_yaml_files_with_jinja2()
    print(f"\n📁 Found {len(yaml_files)} YAML files to check")
    all_inline_comment_errors = []
    files_with_inline_comments = []
    files_checked = 0
    # Validate each file - focus on inline comments
    for yaml_file in yaml_files:
        has_inline_comments, inline_errors, other_errors = validate_yaml_file(yaml_file, check_inline_comments_only=True)
        files_checked += 1
        if has_inline_comments:
            files_with_inline_comments.append(yaml_file)
            all_inline_comment_errors.extend(inline_errors)
    # Report results
    print(f"\n✅ Checked {files_checked} YAML files for inline comments in Jinja2 expressions")
    if all_inline_comment_errors:
        print(f"\n❌ Found inline comment issues in {len(files_with_inline_comments)} files:\n")
        # Show all inline comment errors since these are critical
        for error in all_inline_comment_errors:
            print(f"  ERROR: {error}")
    else:
        print("\n✅ No inline comments found in Jinja2 expressions!")
    # Check the specific file that had the bug
    openssl_file = Path('roles/strongswan/tasks/openssl.yml')
    if openssl_file.exists():
        print(f"\n🎯 Checking {openssl_file} specifically...")
        has_inline_comments, inline_errors, other_errors = validate_yaml_file(openssl_file)
        if not has_inline_comments:
            print(f"  ✅ {openssl_file} has no inline comments in Jinja2 expressions")
        else:
            print(f"  ❌ {openssl_file} has inline comments in Jinja2 expressions:")
            for error in inline_errors:
                print(f"    {error}")
    if all_inline_comment_errors or not regression_passed:
        print("\n❌ Found inline comment issues that need to be fixed")
        print("💡 Move comments outside of {{ }} and {% %} expressions")
        return 1
    else:
        print("\n✅ All YAML files are free of inline comments in Jinja2 expressions!")
        return 0
 if __name__ == "__main__":
    sys.exit(main())