nutrient-code-review/claudecode/test_github_action_audit.py at 61ab9df8a15d47048e2c3e58bbe2b0a5b8fa4979 · danielmartin/nutrient-code-review · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
#!/usr/bin/env python3
"""
Pytest tests for GitHub Action audit script components.
"""

import pytest


class TestImports:
    """Test that all required modules can be imported."""

    def test_main_module_import(self):
        """Test that the main module can be imported."""
        from claudecode import github_action_audit
        assert hasattr(github_action_audit, 'GitHubActionClient')
        assert hasattr(github_action_audit, 'SimpleClaudeRunner')
        # SimpleFindingsFilter was removed
        assert hasattr(github_action_audit, 'main')

    def test_component_imports(self):
        """Test that all component modules can be imported."""
        from claudecode.prompts import get_unified_review_prompt
        from claudecode.json_parser import parse_json_with_fallbacks, extract_json_from_text

        # Verify they're callable/usable
        assert callable(get_unified_review_prompt)
        assert callable(parse_json_with_fallbacks)
        assert callable(extract_json_from_text)


class TestHardExclusionRules:
    """Test the HardExclusionRules patterns."""

    def test_dos_patterns(self):
        """Test DOS pattern exclusions."""
        from claudecode.findings_filter import HardExclusionRules

        dos_findings = [
            {'description': 'Potential denial of service vulnerability', 'category': 'security'},
            {'description': 'DOS attack through resource exhaustion', 'category': 'security'},
            {'description': 'Infinite loop causing resource exhaustion', 'category': 'security'},
        ]

        for finding in dos_findings:
            reason = HardExclusionRules.get_exclusion_reason(finding)
            assert reason is not None
            assert 'dos' in reason.lower()

    def test_rate_limiting_patterns(self):
        """Test rate limiting pattern exclusions."""
        from claudecode.findings_filter import HardExclusionRules

        rate_limit_findings = [
            {'description': 'Missing rate limiting on endpoint', 'category': 'security'},
            {'description': 'No rate limit implemented for API', 'category': 'security'},
            {'description': 'Implement rate limiting for this route', 'category': 'security'},
        ]

        for finding in rate_limit_findings:
            reason = HardExclusionRules.get_exclusion_reason(finding)
            assert reason is not None
            assert 'rate limit' in reason.lower()

    def test_open_redirect_patterns(self):
        """Test open redirect pattern exclusions."""
        from claudecode.findings_filter import HardExclusionRules

        redirect_findings = [
            {'description': 'Open redirect vulnerability found', 'category': 'security'},
            {'description': 'Unvalidated redirect in URL parameter', 'category': 'security'},
            {'description': 'Redirect attack possible through user input', 'category': 'security'},
        ]

        for finding in redirect_findings:
            reason = HardExclusionRules.get_exclusion_reason(finding)
            assert reason is not None
            assert 'open redirect' in reason.lower()

    def test_markdown_file_exclusion(self):
        """Test that findings in .md files are excluded."""
        from claudecode.findings_filter import HardExclusionRules

        md_findings = [
            {'file': 'README.md', 'description': 'SQL injection vulnerability', 'category': 'security'},
            {'file': 'docs/security.md', 'description': 'Command injection found', 'category': 'security'},
            {'file': 'CHANGELOG.MD', 'description': 'XSS vulnerability', 'category': 'security'},  # Test case insensitive
            {'file': 'path/to/file.Md', 'description': 'Path traversal', 'category': 'security'},  # Mixed case
        ]

        for finding in md_findings:
            reason = HardExclusionRules.get_exclusion_reason(finding)
            assert reason is not None
            assert 'markdown' in reason.lower()

    def test_non_markdown_files_not_excluded(self):
        """Test that findings in non-.md files are not excluded due to file extension."""
        from claudecode.findings_filter import HardExclusionRules

        non_md_findings = [
            {'file': 'main.py', 'description': 'SQL injection vulnerability'},
            {'file': 'server.js', 'description': 'Command injection found'},
            {'file': 'index.html', 'description': 'XSS vulnerability'},
            {'file': 'config.yml', 'description': 'Hardcoded credentials'},
            {'file': 'README.txt', 'description': 'Path traversal'},
            {'file': 'file.mdx', 'description': 'Security issue'},  # Not .md
        ]

        for finding in non_md_findings:
            reason = HardExclusionRules.get_exclusion_reason(finding)
            # Should not be excluded for being a markdown file
            # (might be excluded for other reasons like DOS patterns)
            if reason:
                assert 'markdown' not in reason.lower()

    def test_keeps_real_vulnerabilities(self):
        """Test that real vulnerabilities are not excluded."""
        from claudecode.findings_filter import HardExclusionRules

        real_vulns = [
            {'file': 'auth.py', 'description': 'SQL injection in user authentication', 'category': 'security'},
            {'file': 'exec.js', 'description': 'Command injection through user input', 'category': 'security'},
            {'file': 'comments.php', 'description': 'Cross-site scripting in comment field', 'category': 'security'},
            {'file': 'upload.go', 'description': 'Path traversal in file upload', 'category': 'security'},
        ]

        for finding in real_vulns:
            reason = HardExclusionRules.get_exclusion_reason(finding)
            assert reason is None


class TestJSONParser:
    """Test JSON parsing utilities."""

    def test_parse_valid_json(self):
        """Test parsing valid JSON."""
        from claudecode.json_parser import parse_json_with_fallbacks

        valid_json = '{"test": "data", "number": 123}'
        success, result = parse_json_with_fallbacks(valid_json, "test")

        assert success is True
        assert result == {"test": "data", "number": 123}

    def test_parse_invalid_json(self):
        """Test parsing invalid JSON."""
        from claudecode.json_parser import parse_json_with_fallbacks

        invalid_json = '{invalid json}'
        success, result = parse_json_with_fallbacks(invalid_json, "test")

        assert success is False
        assert 'error' in result
        assert 'Invalid JSON response' in result['error']

    def test_extract_json_from_text(self):
        """Test extracting JSON from mixed text."""
        from claudecode.json_parser import extract_json_from_text

        mixed_text = 'Some text before {"key": "value"} some text after'
        result = extract_json_from_text(mixed_text)

        assert result == {"key": "value"}

    def test_extract_json_from_text_no_json(self):
        """Test extracting JSON when none exists."""
        from claudecode.json_parser import extract_json_from_text

        plain_text = 'This is just plain text with no JSON'
        result = extract_json_from_text(plain_text)

        assert result is None


class TestPromptsModule:
    """Test the prompts module."""

    def test_get_unified_review_prompt(self):
        """Test unified review prompt generation."""
        from claudecode.prompts import get_unified_review_prompt

        pr_data = {
            'number': 123,
            'title': 'Test PR',
            'body': 'Test description',
            'user': 'testuser',
            'changed_files': 1,
            'additions': 10,
            'deletions': 5,
            'head': {
                'repo': {
                    'full_name': 'owner/repo'
                }
            },
            'files': [
                {
                    'filename': 'test.py',
                    'status': 'modified',
                    'additions': 10,
                    'deletions': 5,
                    'patch': '@@ -1,5 +1,10 @@\n+added line'
                }
            ]
        }

        pr_diff = "diff --git a/test.py b/test.py\n+added line"

        prompt = get_unified_review_prompt(pr_data, pr_diff)

        assert isinstance(prompt, str)
        assert 'security' in prompt.lower()
        assert 'PR #123' in prompt
        assert 'test.py' in prompt


class TestDeploymentPRDetection:
    """Test deployment PR title pattern matching."""

    def test_deployment_pr_patterns(self):
        """Test that deployment PR titles are correctly identified."""
        import re

        deployment_pattern = r'^Deploy\s+[a-f0-9]{6,}\s+to\s+(production|staging|development|production-services)'

        # These should match
        deployment_titles = [
            "Deploy 53f395b0 to production-services",
            "Deploy af179b5b to production",
            "Deploy 1a3cb909 to production",
            "Deploy 49c09ea5 to production-services",
            "Deploy 8e7acc60 to production",
            "Deploy e0b1fe0b to production-services",
            "Deploy c53e6010 to production",
            "Deploy 42c4a061 to production",
            "Deploy 9de55976 to production-services",
            "deploy abcdef123456 to staging",  # lowercase should work
            "DEPLOY ABCDEF01 TO DEVELOPMENT",  # uppercase should work
        ]

        for title in deployment_titles:
            assert re.match(deployment_pattern, title, re.IGNORECASE), f"Failed to match deployment PR: {title}"

    def test_non_deployment_pr_patterns(self):
        """Test that non-deployment PR titles are not matched."""
        import re

        deployment_pattern = r'^Deploy\s+[a-f0-9]{6,}\s+to\s+(production|staging|development|production-services)'

        # These should NOT match
        non_deployment_titles = [
            "Add new feature",
            "Fix bug in deployment script",
            "Update deployment documentation",
            "Deploy new feature to production",  # No commit hash
            "Deploy abc to production",  # Too short hash
            "Deploy 12345g to production",  # Non-hex character
            "Preparing deploy af179b5b to production",  # Doesn't start with Deploy
            "Deploy af179b5b to testing",  # Wrong environment
            "Deploy af179b5b",  # Missing environment
            "af179b5b to production",  # Missing Deploy prefix
        ]

        for title in non_deployment_titles:
            assert not re.match(deployment_pattern, title, re.IGNORECASE), f"Incorrectly matched non-deployment PR: {title}"


class TestBuiltinExclusions:
    """Test built-in file and directory exclusions."""

    def test_builtin_excluded_directories(self):
        """Test that built-in directories are in the exclusion list."""
        from claudecode.github_action_audit import GitHubActionClient

        expected_dirs = [
            'node_modules',
            'vendor',
            'dist',
            'build',
            '.next',
            '__pycache__',
            '.gradle',
            'Pods',
            'DerivedData',
        ]

        for dir_name in expected_dirs:
            assert dir_name in GitHubActionClient.BUILTIN_EXCLUDED_DIRS, f"Missing built-in excluded dir: {dir_name}"

    def test_builtin_excluded_patterns(self):
        """Test that built-in file patterns are in the exclusion list."""
        from claudecode.github_action_audit import GitHubActionClient

        expected_patterns = [
            'package-lock.json',
            'yarn.lock',
            '*.min.js',
            '*.min.css',
            '*.pb.go',
            '*.generated.*',
            '*.png',
            '*.jpg',
            '*.woff2',
            '*.pyc',
        ]

        for pattern in expected_patterns:
            assert pattern in GitHubActionClient.BUILTIN_EXCLUDED_PATTERNS, f"Missing built-in excluded pattern: {pattern}"

    def test_is_excluded_lock_files(self):
        """Test that lock files are excluded."""
        from claudecode.github_action_audit import GitHubActionClient
        from unittest.mock import patch

        with patch.dict('os.environ', {'GITHUB_TOKEN': 'test-token', 'EXCLUDE_DIRECTORIES': ''}):
            client = GitHubActionClient()

            lock_files = [
                'package-lock.json',
                'yarn.lock',
                'Gemfile.lock',
                'poetry.lock',
                'Cargo.lock',
                'go.sum',
                'nested/path/package-lock.json',
            ]

            for filepath in lock_files:
                assert client._is_excluded(filepath), f"Lock file should be excluded: {filepath}"

    def test_is_excluded_generated_files(self):
        """Test that generated files are excluded."""
        from claudecode.github_action_audit import GitHubActionClient
        from unittest.mock import patch

        with patch.dict('os.environ', {'GITHUB_TOKEN': 'test-token', 'EXCLUDE_DIRECTORIES': ''}):
            client = GitHubActionClient()

            generated_files = [
                'app.min.js',
                'styles.min.css',
                'app.bundle.js',
                'main.chunk.js',
                'api.pb.go',
                'models.generated.ts',
                'user.g.dart',
            ]

            for filepath in generated_files:
                assert client._is_excluded(filepath), f"Generated file should be excluded: {filepath}"

    def test_is_excluded_binary_files(self):
        """Test that binary files are excluded."""
        from claudecode.github_action_audit import GitHubActionClient
        from unittest.mock import patch

        with patch.dict('os.environ', {'GITHUB_TOKEN': 'test-token', 'EXCLUDE_DIRECTORIES': ''}):
            client = GitHubActionClient()

            binary_files = [
                'logo.png',
                'photo.jpg',
                'icon.ico',
                'font.woff2',
                'document.pdf',
                'archive.zip',
            ]

            for filepath in binary_files:
                assert client._is_excluded(filepath), f"Binary file should be excluded: {filepath}"

    def test_is_excluded_vendor_directories(self):
        """Test that vendor directories are excluded."""
        from claudecode.github_action_audit import GitHubActionClient
        from unittest.mock import patch

        with patch.dict('os.environ', {'GITHUB_TOKEN': 'test-token', 'EXCLUDE_DIRECTORIES': ''}):
            client = GitHubActionClient()

            vendor_paths = [
                'node_modules/lodash/index.js',
                'vendor/github.com/pkg/errors/errors.go',
                'dist/bundle.js',
                'build/output.js',
                '.next/cache/data.json',
                '__pycache__/module.pyc',
                'Pods/AFNetworking/Source.m',
            ]

            for filepath in vendor_paths:
                assert client._is_excluded(filepath), f"Vendor path should be excluded: {filepath}"

    def test_is_not_excluded_source_files(self):
        """Test that regular source files are NOT excluded."""
        from claudecode.github_action_audit import GitHubActionClient
        from unittest.mock import patch

        with patch.dict('os.environ', {'GITHUB_TOKEN': 'test-token', 'EXCLUDE_DIRECTORIES': ''}):
            client = GitHubActionClient()

            source_files = [
                'src/main.py',
                'lib/utils.js',
                'app/models/user.rb',
                'pkg/handler/api.go',
                'src/components/Button.tsx',
                'tests/test_auth.py',
            ]

            for filepath in source_files:
                assert not client._is_excluded(filepath), f"Source file should NOT be excluded: {filepath}"

    def test_user_exclusions_combined_with_builtin(self):
        """Test that user exclusions are combined with built-in exclusions."""
        from claudecode.github_action_audit import GitHubActionClient
        from unittest.mock import patch

        with patch.dict('os.environ', {'GITHUB_TOKEN': 'test-token', 'EXCLUDE_DIRECTORIES': 'custom_dir,my_vendor'}):
            client = GitHubActionClient()

            # Built-in should still work
            assert client._is_excluded('node_modules/pkg/index.js')
            assert client._is_excluded('vendor/lib/code.go')

            # User exclusions should also work
            assert client._is_excluded('custom_dir/file.py')
            assert client._is_excluded('my_vendor/lib.js')


class TestExtractReviewFindings:
    """Test the _extract_review_findings method."""

    def test_extract_findings_with_pr_summary(self):
        """Test that pr_summary is extracted from Claude output."""
        import json
        from claudecode.github_action_audit import SimpleClaudeRunner

        runner = SimpleClaudeRunner()

        claude_output = {
            'result': json.dumps({
                'findings': [
                    {'file': 'test.py', 'line': 1, 'severity': 'HIGH', 'description': 'Test finding'}
                ],
                'pr_summary': {
                    'overview': 'This PR adds authentication middleware.',
                    'file_changes': [
                        {'label': 'src/auth.py', 'files': ['src/auth.py'], 'changes': 'Added JWT validation'}
                    ]
                }
            })
        }

        result = runner._extract_review_findings(claude_output)

        assert 'pr_summary' in result
        assert result['pr_summary']['overview'] == 'This PR adds authentication middleware.'
        assert len(result['pr_summary']['file_changes']) == 1
        assert result['pr_summary']['file_changes'][0]['files'] == ['src/auth.py']
        assert len(result['findings']) == 1

    def test_extract_findings_from_structured_output(self):
        """Test that structured_output is accepted when result is empty."""
        from claudecode.github_action_audit import SimpleClaudeRunner

        runner = SimpleClaudeRunner()

        claude_output = {
            'result': '',
            'structured_output': {
                'findings': [
                    {'file': 'test.py', 'line': 1, 'severity': 'HIGH', 'description': 'Test finding'}
                ],
                'pr_summary': {
                    'overview': 'This PR adds authentication middleware.',
                    'file_changes': [
                        {'label': 'src/auth.py', 'files': ['src/auth.py'], 'changes': 'Added JWT validation'}
                    ]
                }
            }
        }

        result = runner._extract_review_findings(claude_output)

        assert 'pr_summary' in result
        assert result['pr_summary']['overview'] == 'This PR adds authentication middleware.'
        assert len(result['findings']) == 1

    def test_extract_findings_without_pr_summary(self):
        """Test that missing pr_summary fails instead of degrading silently."""
        import json
        from claudecode.github_action_audit import SimpleClaudeRunner

        runner = SimpleClaudeRunner()

        claude_output = {
            'result': json.dumps({
                'findings': []
            })
        }

        with pytest.raises(ValueError, match="valid review payload"):
            runner._extract_review_findings(claude_output)

    def test_extract_findings_empty_result(self):
        """Test extraction with invalid/empty Claude output."""
        from claudecode.github_action_audit import SimpleClaudeRunner

        runner = SimpleClaudeRunner()

        with pytest.raises(ValueError, match="valid review payload"):
            runner._extract_review_findings({})

    def test_extract_findings_with_grouped_files(self):
        """Test that grouped file_changes are handled correctly."""
        import json
        from claudecode.github_action_audit import SimpleClaudeRunner

        runner = SimpleClaudeRunner()

        claude_output = {
            'result': json.dumps({
                'findings': [],
                'pr_summary': {
                    'overview': 'Test updates.',
                    'file_changes': [
                        {
                            'label': 'tests/test_*.py',
                            'files': ['tests/test_auth.py', 'tests/test_login.py', 'tests/test_session.py'],
                            'changes': 'Unit tests for auth module'
                        }
                    ]
                }
            })
        }

        result = runner._extract_review_findings(claude_output)

        assert 'pr_summary' in result
        file_changes = result['pr_summary']['file_changes']
        assert len(file_changes) == 1
        assert file_changes[0]['label'] == 'tests/test_*.py'
        assert len(file_changes[0]['files']) == 3


class TestDiffSizeLimits:
    """Test diff size limit functionality."""

    def test_diff_line_counting(self):
        """Test that diff lines are counted correctly."""
        sample_diff = """diff --git a/file.py b/file.py
--- a/file.py
+++ b/file.py
@@ -1,5 +1,10 @@
 line 1
+added line 2
+added line 3
 line 4
-removed line 5
+replaced line 5
 line 6"""

        line_count = len(sample_diff.splitlines())
        assert line_count == 11  # Count the actual lines

    def test_max_diff_lines_env_parsing(self):
        """Test that MAX_DIFF_LINES environment variable is parsed correctly."""
        import os
        from unittest.mock import patch

        # Test default value when env var is not set
        with patch.dict('os.environ', {}, clear=False):
            os.environ.pop('MAX_DIFF_LINES', None)
            max_lines_str = os.environ.get('MAX_DIFF_LINES', '5000')
            try:
                max_lines = int(max_lines_str)
            except ValueError:
                max_lines = 5000

        assert max_lines == 5000  # Default when not set

    def test_max_diff_lines_zero_forces_agentic_mode(self):
        """Test that setting MAX_DIFF_LINES to 0 forces agentic file reading mode."""
        import os
        from unittest.mock import patch

        with patch.dict('os.environ', {'MAX_DIFF_LINES': '0'}):
            max_lines_str = os.environ.get('MAX_DIFF_LINES', '5000')
            max_lines = int(max_lines_str)

            # When max_lines is 0, agentic mode is always used
            assert max_lines == 0
            # In the actual code: use_agentic_mode = max_diff_lines == 0 or ...