GeneralizedNotationNotation/src/main.py at main · ActiveInferenceInstitute/GeneralizedNotationNotation · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
#!/usr/bin/env python3
"""
GNN Processing Pipeline

This script orchestrates the 25-step GNN processing pipeline (steps 0-24).
The pipeline transforms GNN specifications into executable simulations, visualizations,
and advanced representations including audio sonification.

Pipeline Steps:
0. Template initialization (0_template.py)
1. Environment setup (1_setup.py)
2. Test suite execution (2_tests.py)
3. GNN file processing (3_gnn.py)
4. Model registry (4_model_registry.py)
5. Type checking (5_type_checker.py)
6. Validation (6_validation.py)
7. Multi-format export (7_export.py)
8. Visualization (8_visualization.py)
9. Advanced visualization (9_advanced_viz.py)
10. Ontology processing (10_ontology.py)
11. Code rendering (11_render.py)
12. Execution (12_execute.py)
13. LLM processing (13_llm.py)
14. ML integration (14_ml_integration.py)
15. Audio processing (15_audio.py)
16. Analysis (16_analysis.py)
17. Integration (17_integration.py)
18. Security (18_security.py)
19. Research (19_research.py)
20. Website generation (20_website.py)
21. Model Context Protocol processing (21_mcp.py)
22. GUI (Interactive GNN Constructor) (22_gui.py)
23. Report generation (23_report.py)
24. Intelligent analysis (24_intelligent_analysis.py)

Usage:
    python src/main.py [options]

Examples:
    # Run full pipeline
    python src/main.py --target-dir input/gnn_files --verbose

    # Run specific steps only
    python src/main.py --only-steps "0,1,2,3" --verbose

    # Skip certain steps
    python src/main.py --skip-steps "15,16" --verbose

For complete usage information, see:
- README.md: Project overview and quick start
- doc/pipeline/README.md: Detailed pipeline documentation
- src/README.md: Pipeline safety and reliability documentation
"""

import argparse
import json
import logging
import os
import re
import sys
import time
from datetime import datetime
from pathlib import Path
from typing import Any, Dict, List, Optional

_module_logger = logging.getLogger(__name__)

# Detect project root and ensure we're working from there
SCRIPT_DIR = Path(__file__).parent  # src/
PROJECT_ROOT = SCRIPT_DIR.parent     # project root (one level up from src/)

# Change working directory to project root if not already there
if Path.cwd() != PROJECT_ROOT:
    os.chdir(PROJECT_ROOT)
    logging.getLogger(__name__).info(f"Changed working directory to project root: {PROJECT_ROOT}")

# Add src to path for imports
sys.path.insert(0, str(SCRIPT_DIR))

from utils.pipeline_template import (
    setup_step_logging as _basic_setup_step_logging,
)

try:
    from utils.logging.logging_utils import log_step_error, log_step_start
except ImportError:
    from utils.logging_utils import log_step_error, log_step_start
from dataclasses import fields

from utils.argument_utils import ArgumentParser, PipelineArguments
from utils.pipeline_config_merge import apply_input_config_defaults
from utils.pipeline_validator import (
    validate_pipeline_step_sequence,
    validate_step_prerequisites,
)
from utils.resource_manager import get_current_memory_usage

# Optional structured logging and visual progress tracking.
# setup_step_logging is resolved here; falls back to the basic version from
# utils.pipeline_template (_basic_setup_step_logging) when unavailable.
try:
    from utils.logging.logging_utils import (
        PipelineLogger,
        PipelineProgressTracker,
        log_pipeline_summary,
        reset_progress_tracker,
        rotate_logs,
        setup_step_logging,  # structured version — preferred
    )
    from utils.visual_logging import (
        VisualConfig,
        VisualLogger,
        create_visual_logger,
        print_completion_summary,
        print_pipeline_banner,
        print_step_summary,
    )
    STRUCTURED_LOGGING_AVAILABLE = True
except ImportError:
    # Fall back to the basic version imported above under its alias.
    setup_step_logging = _basic_setup_step_logging
    STRUCTURED_LOGGING_AVAILABLE = False
    # Provide recovery implementations when visual logging is not available
    from dataclasses import dataclass

    @dataclass
    class VisualConfig:
        """Recovery visual config when visual_logging is not available."""
        enable_colors: bool = True
        enable_progress_bars: bool = True
        enable_emoji: bool = True
        enable_animation: bool = True
        max_width: int = 80
        show_timestamps: bool = False
        show_correlation_ids: bool = True
        compact_mode: bool = False

    class VisualLogger:
        """Recovery visual logger when visual_logging is not available."""
        def __init__(self, name, config=None):
            self.name = name
            self.config = config
            self._correlation_id = None
            self.logger = logging.getLogger(name)

        def set_correlation_id(self, correlation_id: str) -> None:
            self._correlation_id = correlation_id

        def print_progress(self, current: int, total: int, message: str) -> None: self.logger.info(f"[{current}/{total}] {message}")
        def print_step_header(self, step_num: int, description: str, total: int) -> None: self.logger.info(f"\n=== Step {step_num}/{total}: {description} ===")

    def create_visual_logger(name: str, config: Any) -> VisualLogger:
        vl = VisualLogger(name, config)
        return vl

    def print_pipeline_banner(title: str, subtitle: str) -> None:
        logging.getLogger("pipeline").info(f"\n{'='*60}\n{title}\n{subtitle}\n{'='*60}")

    def print_step_summary(step: int, desc: str, status: str, duration: float, stats: Any) -> None:
        logging.getLogger("pipeline").info(f"Step {step}: {desc} - {status} ({duration:.2f}s)")

    def print_completion_summary(success: bool, duration: float, stats: Any) -> None:
        status_msg = 'COMPLETED' if success else 'FAILED'
        logging.getLogger("pipeline").info(f"\n{'='*60}\nPipeline {status_msg} in {duration:.2f}s\n{stats}\n{'='*60}")

def main(override_args: Optional[PipelineArguments] = None, override_config: Optional[Dict[str, Any]] = None) -> int:
    """Main pipeline orchestration function."""
    parsed: Optional[argparse.Namespace] = None
    if override_args is not None:
        args = override_args
    else:
        # Parse arguments
        parser = ArgumentParser.create_main_parser()
        parsed = parser.parse_args()

        # Only pass attributes argparse actually set (SUPPRESS omits unset flags)
        field_names = {f.name for f in fields(PipelineArguments)}
        kwargs = {k: getattr(parsed, k) for k in field_names if hasattr(parsed, k)}
        args = PipelineArguments(**kwargs)

        if getattr(args, "skip_llm", False):
            existing = args.skip_steps or ""
            existing_nums = [s.strip() for s in str(existing).split(",") if s.strip()] if existing else []
            if "13" not in existing_nums:
                existing_nums.append("13")
            args.skip_steps = ",".join(existing_nums)

    # Setup visual logging
    visual_config = VisualConfig(
        enable_colors=True,
        enable_progress_bars=True,
        enable_emoji=True,
        enable_animation=True,
        show_timestamps=args.verbose,
        show_correlation_ids=True,
        compact_mode=False
    )

    visual_logger = create_visual_logger("pipeline", visual_config)

    # Setup logging (use structured if available, recovery to standard)
    if STRUCTURED_LOGGING_AVAILABLE:
        # Prepare log directory
        log_dir = args.output_dir / "00_pipeline_logs"
        log_dir.mkdir(parents=True, exist_ok=True)

        # Rotate existing logs
        rotate_logs(log_dir)

        # Force re-initialization so pipeline.log is always freshly created
        # for this run (prevents stale logs when re-running within same process)
        PipelineLogger._initialized = False
        if PipelineLogger._log_file_handler:
            logging.getLogger().removeHandler(PipelineLogger._log_file_handler)
            PipelineLogger._log_file_handler.close()
            PipelineLogger._log_file_handler = None

        # Initialize with log_dir to create pipeline.log
        PipelineLogger.initialize(log_dir=log_dir, enable_structured=True, log_format=args.log_format)

        # Enable JSON logging (adds pipeline.jsonl handler)
        PipelineLogger.enable_json_logging(log_dir)

        logger = setup_step_logging("pipeline", args.verbose, enable_structured=True, log_format=args.log_format)
        # Reset progress tracker for new pipeline run
        reset_progress_tracker()
    else:
        logger = setup_step_logging("pipeline", args.verbose, log_format=args.log_format if hasattr(args, "log_format") else "human")

    if args.verbose:
        _parts: List[str] = []
        for mod, label in (
            ("jax", "jax"),
            ("jaxlib", "jaxlib"),
            ("torch", "torch"),
            ("numpyro", "numpyro"),
            ("discopy", "discopy"),
        ):
            try:
                m = __import__(mod)
                _parts.append(f"{label}={getattr(m, '__version__', '?')}")
            except ImportError:
                _parts.append(f"{label}=missing")
        logger.info("Step 12 backends: %s", "; ".join(_parts))

    # Set correlation ID for tracking
    import uuid
    correlation_id = str(uuid.uuid4())[:8]
    visual_logger.set_correlation_id(correlation_id)

    # Initialize steps_to_execute outside try block
    steps_to_execute = []

    # Define pipeline steps (outside try block for proper scope)
    pipeline_steps = [
        ("0_template.py", "Template initialization"),
        ("1_setup.py", "Environment setup"),
        ("2_tests.py", "Test suite execution"),
        ("3_gnn.py", "GNN file processing"),
        ("4_model_registry.py", "Model registry"),
        ("5_type_checker.py", "Type checking"),
        ("6_validation.py", "Validation"),
        ("7_export.py", "Multi-format export"),
        ("8_visualization.py", "Visualization"),
        ("9_advanced_viz.py", "Advanced visualization"),
        ("10_ontology.py", "Ontology processing"),
        ("11_render.py", "Code rendering"),
        ("12_execute.py", "Execution"),
        ("13_llm.py", "LLM processing"),
        ("14_ml_integration.py", "ML integration"),
        ("15_audio.py", "Audio processing"),
        ("16_analysis.py", "Analysis"),
        ("17_integration.py", "Integration"),
        ("18_security.py", "Security"),
        ("19_research.py", "Research"),
        ("20_website.py", "Website generation"),
        ("21_mcp.py", "Model Context Protocol processing"),
        ("22_gui.py", "GUI (Interactive GNN Constructor)"),
        ("23_report.py", "Report generation"),
        ("24_intelligent_analysis.py", "Intelligent pipeline analysis")
    ]

    # Load configuration from config.yaml or override context
    full_config = {}
    config_pipeline_settings = {}

    if override_config is not None:
        full_config = override_config
        config_pipeline_settings = full_config.get("pipeline", {})
    else:
        input_config_path = Path("input/config.yaml")
        if input_config_path.exists():
            try:
                import yaml
                with open(input_config_path, "r") as f:
                    full_config = yaml.safe_load(f) or {}
                    config_pipeline_settings = full_config.get("pipeline", {})
            except Exception as e:
                logger.warning(f"Could not load pipeline settings from input/config.yaml: {e}")

    apply_input_config_defaults(args, full_config, parsed)

    # Handle step filtering with automatic dependency resolution
    # Order of precedence: Command line > Config file > All steps

    # 1. Start with full pipeline
    steps_to_execute = pipeline_steps

    # 2. Apply 'only_steps' (Command line preferred over config)
    only_steps_val = args.only_steps or config_pipeline_settings.get("only_steps")
    if only_steps_val:
        requested_step_numbers = parse_step_list(only_steps_val)

        # Automatic dependency resolution
        step_dependencies = {
            11: [3],     # 11_render.py needs 3_gnn.py
            12: [3, 11], # 12_execute.py needs 3_gnn.py and 11_render.py
            8: [3],      # 8_visualization.py needs 3_gnn.py
            9: [3, 8],   # 9_advanced_viz.py needs 3_gnn.py and 8_visualization.py
            13: [3],     # 13_llm.py needs 3_gnn.py
            23: [8, 13], # 23_report.py needs 8_visualization.py and 13_llm.py
            20: [8],     # 20_website.py needs 8_visualization.py
            5: [3],      # 5_type_checker.py needs 3_gnn.py
            6: [3, 5],   # 6_validation.py needs 3_gnn.py and 5_type_checker.py
            7: [3],      # 7_export.py needs 3_gnn.py
            10: [3],     # 10_ontology.py needs 3_gnn.py
            15: [3],     # 15_audio.py needs 3_gnn.py
            16: [3, 7],  # 16_analysis.py needs 3_gnn.py and 7_export.py
            24: [23],    # 24_intelligent_analysis.py needs 23_report.py (and implicitly the summary it generates/pipeline completion)
        }

        # Include dependencies automatically
        resolved_step_numbers = set(requested_step_numbers)
        added_dependencies = []
        for step_num in requested_step_numbers:
            if step_num in step_dependencies:
                for dep in step_dependencies[step_num]:
                    if dep not in resolved_step_numbers:
                        resolved_step_numbers.add(dep)
                        added_dependencies.append(dep)

        if added_dependencies:
            logger.info(f"Auto-including dependency steps: {sorted(added_dependencies)}")

        steps_to_execute = [pipeline_steps[i] for i in sorted(resolved_step_numbers) if 0 <= i < len(pipeline_steps)]
        logger.info(f"Executing steps: {[step[0] for step in steps_to_execute]}")

    # 3. Apply 'skip_steps' (Merge command line and config)
    cmd_skip = parse_step_list(args.skip_steps)
    cfg_skip = parse_step_list(config_pipeline_settings.get("skip_steps"))
    skip_numbers = sorted(set(cmd_skip + cfg_skip))

    if skip_numbers:
        # Map original indices to scripts to avoid losing track if already filtered
        original_indices = {script: i for i, (script, desc) in enumerate(pipeline_steps)}

        filtered_steps = []
        for step in steps_to_execute:
            script_name = step[0]
            original_idx = original_indices.get(script_name, -1)
            if original_idx not in skip_numbers:
                filtered_steps.append(step)

        steps_to_execute = filtered_steps
        logger.info(f"Skipping steps: {[pipeline_steps[i][0] for i in skip_numbers if 0 <= i < len(pipeline_steps)]}")

    # Calculate run hash for content addressability
    from pipeline.hasher import compute_run_hash_with_files, index_run
    run_hash, file_hashes = compute_run_hash_with_files(
        args.target_dir,
        config=config_pipeline_settings,
    )

    # Initialize pipeline execution summary
    pipeline_summary = {
        "run_hash": run_hash,
        "file_hashes": file_hashes,
        "start_time": datetime.now().isoformat(),
        "arguments": args.to_dict(),
        "steps": [],
        "end_time": None,
        "overall_status": "RUNNING",
        "total_duration_seconds": None,
        "environment_info": get_environment_info(),
        "performance_summary": {
            "peak_memory_mb": 0.0,
            "total_steps": len(steps_to_execute),
            "failed_steps": 0,
            "critical_failures": 0,
            "successful_steps": 0,
            "warnings": 0
        }
    }

    try:
        # Project identification banner (displayed at very top)
        print_pipeline_banner(
            "Generalized Notation Notation (GNN)",
            "https://github.com/ActiveInferenceInstitute/GeneralizedNotationNotation | Active Inference Institute"
        )

        # Pipeline start with visual banner
        print_pipeline_banner(
            "🚀 GNN Processing Pipeline",
            f"Starting execution with {len(steps_to_execute)} steps | Correlation ID: {correlation_id}"
        )

        # Visual progress indicator
        visual_logger.print_progress(0, len(steps_to_execute), "Pipeline initialization")

        # Pipeline start logging
        if STRUCTURED_LOGGING_AVAILABLE:
            PipelineLogger.log_structured(
                logger, logging.INFO,
                "🚀 Starting GNN Processing Pipeline",
                 total_steps=len(steps_to_execute),
                target_dir=str(args.target_dir),
                output_dir=str(args.output_dir),
                event_type="pipeline_start"
            )
        else:
            log_step_start(logger, "Starting GNN Processing Pipeline")

        # Update pipeline summary with actual step count
        pipeline_summary["performance_summary"]["total_steps"] = len(steps_to_execute)

        # Initialize progress tracker if enhanced logging is available
        progress_tracker = None
        if STRUCTURED_LOGGING_AVAILABLE:
            progress_tracker = PipelineProgressTracker(len(steps_to_execute))
            # Set global progress tracker so structured logging functions can use it
            from utils.logging.logging_utils import set_global_progress_tracker
            set_global_progress_tracker(progress_tracker)

        # Validate step sequence before execution
        sequence_validation = validate_pipeline_step_sequence(steps_to_execute, logger)
        if sequence_validation["warnings"]:
            for warning in sequence_validation["warnings"]:
                logger.warning(f"Pipeline sequence: {warning}")
        if sequence_validation["recommendations"]:
            for rec in sequence_validation["recommendations"]:
                logger.info(f"Recommendation: {rec}")

        # Execute each step
        for step_index, (script_name, description) in enumerate(steps_to_execute, 0):
            # Use the actual script name as step identifier for clarity
            actual_step_number = step_index + 1
            step_start_time = time.time()
            step_start_datetime = datetime.now()

            # Step start with visual indicators
            visual_logger.print_step_header(actual_step_number, description, len(steps_to_execute))

            # Step start logging with progress tracking
            if STRUCTURED_LOGGING_AVAILABLE and progress_tracker:
                progress_tracker.start_step(actual_step_number, description)
                # Use structured logging functions that support additional parameters
                from utils.logging.logging_utils import (
                    log_step_start as structured_log_step_start,
                )
                structured_log_step_start(logger, f"Starting {description}",
                                      step_number=actual_step_number,
                                      total_steps=len(steps_to_execute),
                                      script_name=script_name)
            else:
                logger.info(f"🔄 Executing step {actual_step_number}: {description}")

            # Write a preliminary pipeline summary before report generation and
            # intelligent analysis so both steps can read current-run data
            if script_name in ("23_report.py", "24_intelligent_analysis.py"):
                try:
                    prelim_summary = dict(pipeline_summary)
                    prelim_end = datetime.now()
                    prelim_start = datetime.fromisoformat(prelim_summary["start_time"])
                    prelim_summary["end_time"] = prelim_end.isoformat()
                    prelim_summary["total_duration_seconds"] = (prelim_end - prelim_start).total_seconds()
                    # All prior steps succeeded if we reached here, so set SUCCESS
                    # The 'preliminary' flag distinguishes this from the final summary
                    prelim_summary["overall_status"] = "SUCCESS"
                    prelim_summary["preliminary"] = True

                    prelim_path = args.output_dir / "00_pipeline_summary" / "pipeline_execution_summary.json"
                    prelim_path.parent.mkdir(parents=True, exist_ok=True)
                    with open(prelim_path, 'w') as f:
                        json.dump(prelim_summary, f, indent=4, default=str)
                    logger.info(f"📝 Preliminary pipeline summary written for intelligent analysis ({len(prelim_summary.get('steps', []))} steps)")
                except Exception as prelim_err:
                    logger.warning(f"Could not write preliminary summary: {prelim_err}")

            # Execute the step
            step_result = execute_pipeline_step(script_name, args, logger)

            # Calculate step duration
            step_end_time = time.time()
            step_duration = step_end_time - step_start_time
            step_end_datetime = datetime.now()

            # Update step result with timing information and enhanced metadata
            step_result.update({
                "step_number": actual_step_number,
                "script_name": script_name,
                "description": description,
                "start_time": step_start_datetime.isoformat(),
                "end_time": step_end_datetime.isoformat(),
                "duration_seconds": step_duration,
                "exit_code": step_result.get("exit_code", 0),
                "retry_count": step_result.get("retry_count", 0),
                "prerequisite_check": step_result.get("prerequisite_check", True),
                "dependency_warnings": step_result.get("dependency_warnings", []),
                "recoverable": step_result.get("recoverable", False),
                "memory_usage_mb": step_result.get("memory_usage_mb", 0.0),
                "peak_memory_mb": step_result.get("peak_memory_mb", 0.0),
                "memory_delta_mb": step_result.get("memory_delta_mb", 0.0)
            })

            # Check for warnings in both stdout and stderr (precise regex matching)
            combined_output = f"{step_result.get('stdout', '')}\n{step_result.get('stderr', '')}"
            # More precise warning detection - look for actual log levels or warning symbols


            # Known safe warnings that should not trigger SUCCESS_WITH_WARNINGS
            safe_warning_patterns = [
                r"matplotlib.*?backend",  # Matplotlib backend selection messages
                r"using agg backend",  # Headless backend in use
                r"no display",  # No display available (expected in CI/headless)
                r"pymdp.*?not available",  # Optional dependency message
                r"optional.*?dependency",  # Optional dependency notifications
                r"plotly.*?not available",  # Optional plotly dependency
                r"numpy.*?not available",  # Optional numpy dependency
                r"seaborn.*?not available",  # Optional seaborn dependency
                r"bokeh.*?not available",  # Optional bokeh dependency
                r"d2.*?not available",  # Optional D2 CLI dependency
                r"d2 cli.*?not available",  # Optional D2 CLI dependency (explicit)
                r"d2 visualizer.*?not available",  # D2 visualizer module
                r"d2 cli.*?install",  # D2 CLI installation instructions
                r"interactive.*?limited",  # Interactive visualization limitations
                r"numeric.*?limited",  # Numeric visualization limitations
                r"warnings: 0",  # Zero warnings count in validation logs
                r"optional test tooling not installed",  # Step 2: cov/xdist optional; INFO line
            ]

            # Combine safe patterns into single regex
            safe_patterns = "|".join(f"({p})" for p in safe_warning_patterns)
            safe_warning_pattern = re.compile(safe_patterns, re.IGNORECASE)

            # Check for warnings but exclude safe patterns
            warning_pattern = re.compile(r"(WARNING|⚠️|warn)", re.IGNORECASE)
            has_warning = bool(warning_pattern.search(combined_output))

            # If warning found, check if it's a "safe" warning
            if has_warning:
                has_warning = not bool(safe_warning_pattern.search(combined_output))

            # Propagate SUCCESS_WITH_WARNINGS status if applicable
            if step_result["status"] == "SUCCESS" and has_warning:
                step_result["status"] = "SUCCESS_WITH_WARNINGS"

            # Add to pipeline summary
            pipeline_summary["steps"].append(step_result)

            # Update performance summary
            if step_result["status"] in ("SUCCESS", "SUCCESS_WITH_WARNINGS", "SKIPPED"):
                pipeline_summary["performance_summary"]["successful_steps"] += 1
            elif step_result["status"] == "FAILED":
                pipeline_summary["performance_summary"]["failed_steps"] += 1
                # Only mark as critical if a core processing step fails
                # Tests, LLM, audio, research, website, GUI, analysis are non-critical
                critical_scripts = {
                    "0_template.py", "1_setup.py", "3_gnn.py",
                    "5_type_checker.py", "6_validation.py", "7_export.py",
                    "11_render.py"
                }
                if script_name in critical_scripts and step_result.get("exit_code", 0) != 0:
                    pipeline_summary["performance_summary"]["critical_failures"] += 1

            # Count warnings
            if has_warning:
                pipeline_summary["performance_summary"]["warnings"] += 1

            # Update peak memory usage with better tracking
            step_memory = step_result.get("memory_usage_mb", 0.0)
            step_peak_memory = step_result.get("peak_memory_mb", 0.0)
            current_peak = pipeline_summary["performance_summary"]["peak_memory_mb"]

            # Use the higher of step memory or peak memory
            new_peak = max(step_memory, step_peak_memory, current_peak)
            pipeline_summary["performance_summary"]["peak_memory_mb"] = new_peak

            # Update total steps count
            pipeline_summary["performance_summary"]["total_steps"] = len(steps_to_execute)

            # Step completion with visual indicators
            status_for_logging = step_result["status"]

            # Visual step completion summary
            step_stats = {
                "Status": status_for_logging,
                "Duration": f"{step_duration:.2f}s",
                "Memory": f"{step_result.get('peak_memory_mb', 0):.1f}MB",
                "Exit Code": step_result.get("exit_code", 0)
            }

            print_step_summary(actual_step_number, description, status_for_logging, step_duration, step_stats)

            # Step completion logging with progress tracking
            if STRUCTURED_LOGGING_AVAILABLE and progress_tracker:
                # Use structured logging functions that support additional parameters
                # These functions will handle progress tracking via the global tracker
                if status_for_logging.startswith("SUCCESS"):
                    from utils.logging.logging_utils import (
                        log_step_success as structured_log_step_success,
                    )
                    structured_log_step_success(logger, f"{description} completed",
                                        step_number=actual_step_number,
                                        duration=step_duration,
                                            status=status_for_logging)
                elif "WARNING" in status_for_logging:
                    from utils.logging.logging_utils import (
                        log_step_warning as structured_log_step_warning,
                    )
                    structured_log_step_warning(logger, f"{description} completed with warnings",
                                        step_number=actual_step_number,
                                        duration=step_duration,
                                            status=status_for_logging)
                else:
                    from utils.logging.logging_utils import (
                        log_step_error as structured_log_step_error,
                    )
                    structured_log_step_error(logger, f"{description} failed",
                                        step_number=actual_step_number,
                                        duration=step_duration,
                                            status=status_for_logging)
            else:
                if str(status_for_logging).startswith("SUCCESS"):
                    logger.info(f"✅ Step {actual_step_number} completed successfully in {step_duration:.2f}s")
                elif status_for_logging == "PARTIAL_SUCCESS" or "WARNING" in status_for_logging:
                    logger.warning(f"⚠️ Step {actual_step_number} completed with warnings in {step_duration:.2f}s")
                else:
                    logger.error(f"❌ Step {actual_step_number} failed with status: {status_for_logging}")

        # Complete pipeline summary
        end_time_dt = datetime.now()
        pipeline_summary["end_time"] = end_time_dt.isoformat()
        start_time_dt = datetime.fromisoformat(pipeline_summary["start_time"])
        pipeline_summary["total_duration_seconds"] = (end_time_dt - start_time_dt).total_seconds()

        # Determine overall status with enhanced logic
        perf_summary = pipeline_summary["performance_summary"]
        if perf_summary["critical_failures"] > 0:
            pipeline_summary["overall_status"] = "FAILED"
        elif perf_summary["failed_steps"] > 0:
            # Check if failures are recoverable vs critical
            total_steps = perf_summary["total_steps"]
            failed_ratio = perf_summary["failed_steps"] / total_steps if total_steps > 0 else 0

            if failed_ratio > 0.5:  # More than half failed
                pipeline_summary["overall_status"] = "FAILED"
            elif failed_ratio > 0.2:  # 20-50% failed
                pipeline_summary["overall_status"] = "PARTIAL_SUCCESS"
            else:  # Less than 20% failed
                pipeline_summary["overall_status"] = "SUCCESS_WITH_WARNINGS"
        else:
            pipeline_summary["overall_status"] = "SUCCESS"

        # Save pipeline summary with validation and error handling
        summary_path = args.output_dir / "00_pipeline_summary" / "pipeline_execution_summary.json"
        summary_path.parent.mkdir(parents=True, exist_ok=True)
        logger.info(f"Saving pipeline summary to: {summary_path}")

        try:
            # Validate summary structure before saving
            validate_pipeline_summary(pipeline_summary, logger)

            with open(summary_path, 'w') as f:
                json.dump(pipeline_summary, f, indent=4, default=str)
            logger.info("Pipeline summary saved successfully")

            # Index completion
            run_hash = pipeline_summary.get("run_hash")
            if run_hash:
                index_run(
                    run_hash=run_hash,
                    summary_path=summary_path,
                    config={"args": args.to_dict(), "pipeline": config_pipeline_settings},
                    file_hashes=pipeline_summary.get("file_hashes")
                )

            # Log summary statistics
            steps = pipeline_summary["steps"]
            successful = sum(1 for step in steps if step["status"] in ("SUCCESS", "SUCCESS_WITH_WARNINGS"))
            failed = sum(1 for step in steps if step["status"] == "FAILED")
            logger.info(f"Summary: {successful}/{len(steps)} steps successful, {failed} failed")

        except Exception as e:
            logger.error(f"Failed to save pipeline summary: {e}")
            # Try to save a minimal summary as recovery
            try:
                minimal_summary = {
                    "start_time": pipeline_summary.get("start_time"),
                    "end_time": datetime.now().isoformat(),
                    "overall_status": "FAILED",
                    "error": str(e),
                    "arguments": pipeline_summary.get("arguments", {}),
                    "steps_count": len(pipeline_summary.get("steps", [])),
                    "performance_summary": pipeline_summary.get("performance_summary", {}),
                    "steps": pipeline_summary.get("steps", [])
                }
                with open(summary_path, 'w') as f:
                    json.dump(minimal_summary, f, indent=4, default=str)
                logger.info("Minimal summary saved as recovery")
            except Exception as fallback_error:
                logger.error(f"Failed to save even minimal summary: {fallback_error}")

        # Final completion summary with visual indicators
        total_duration = pipeline_summary['total_duration_seconds']
        perf_summary = pipeline_summary['performance_summary']

        completion_stats = {
            "Total Steps": len(pipeline_summary.get('steps', [])),
            "Successful": perf_summary['successful_steps'],
            "Failed": perf_summary['failed_steps'],
            "Warnings": perf_summary['warnings'],
            "Peak Memory": f"{perf_summary['peak_memory_mb']:.1f}MB",
            "Duration": f"{total_duration:.1f}s"
        }

        success = pipeline_summary['overall_status'] == "SUCCESS"
        print_completion_summary(success, total_duration, completion_stats)

        # Final status logging
        if STRUCTURED_LOGGING_AVAILABLE:
            # Log overall progress summary
            if progress_tracker:
                overall_progress = progress_tracker.get_overall_progress()
                logger.info(overall_progress)

            # Log detailed pipeline summary
            log_pipeline_summary(logger, pipeline_summary)
        else:
            # Log final status with visual indicators
            if success:
                logger.info(f"🎯 Pipeline completed successfully in {total_duration:.2f}s")
            else:
                logger.info(f"⚠️ Pipeline completed with issues in {total_duration:.2f}s")

        return 0 if pipeline_summary["overall_status"] == "SUCCESS" else 1

    except Exception as e:
        # Update pipeline summary with error
        end_time_dt = datetime.now()
        pipeline_summary["end_time"] = end_time_dt.isoformat()
        pipeline_summary["overall_status"] = "FAILED"
        start_time_dt = datetime.fromisoformat(pipeline_summary["start_time"])
        pipeline_summary["total_duration_seconds"] = (end_time_dt - start_time_dt).total_seconds()

        # Save pipeline summary even on error
        summary_path = args.output_dir / "00_pipeline_summary" / "pipeline_execution_summary.json"
        summary_path.parent.mkdir(parents=True, exist_ok=True)
        with open(summary_path, 'w') as f:
            json.dump(pipeline_summary, f, indent=4)

        log_step_error(logger, f"Pipeline failed: {str(e)}")
        return 1

def execute_pipeline_step(script_name: str, args: PipelineArguments, logger) -> Dict[str, Any]:
    """Execute a single pipeline step with comprehensive monitoring."""
    import os

    # Initialize performance tracking
    start_memory = get_current_memory_usage()
    peak_memory = start_memory

    step_result = {
        "status": "UNKNOWN",
        "stdout": "",
        "stderr": "",
        "memory_usage_mb": 0.0,
        "peak_memory_mb": 0.0,
        "memory_delta_mb": 0.0,
        "exit_code": -1,
        "retry_count": 0,
        "prerequisite_check": True,
        "dependency_warnings": []
    }

    try:
        # Load config.yaml once — used for both skip_steps (prereq validation) and testing_matrix
        config_skip_steps = []
        testing_matrix = {}
        input_config_path = Path("input/config.yaml")
        if input_config_path.exists():
            try:
                import yaml
                with open(input_config_path, "r") as f:
                    _full_cfg = yaml.safe_load(f) or {}
                config_skip_steps = _full_cfg.get("pipeline", {}).get("skip_steps", [])
                testing_matrix = _full_cfg.get("testing_matrix", {})
            except (ImportError, OSError, ValueError, Exception) as e:
                logger.debug(f"Could not parse input/config.yaml: {e}")

        # Validate step prerequisites
        prereq_result = validate_step_prerequisites(script_name, args, logger,
                                                     skip_steps=config_skip_steps)
        step_result["prerequisite_check"] = prereq_result["passed"]
        step_result["dependency_warnings"] = prereq_result.get("warnings", [])

        # Log prerequisite warnings if any
        if prereq_result.get("warnings"):
            for warning in prereq_result["warnings"]:
                logger.warning(f"Prerequisite warning for {script_name}: {warning}")

        # Get script path
        script_path = Path(__file__).parent / script_name

        # Get virtual environment Python path
        project_root = Path(__file__).parent.parent
        venv_python = project_root / ".venv" / "bin" / "python"

        # Use virtual environment Python if available, otherwise fall back to system Python
        python_executable = str(venv_python) if venv_python.exists() else sys.executable

        # Extract step number
        step_num_match = re.match(r"^(\d+)_", script_name)
        step_num = int(step_num_match.group(1)) if step_num_match else -1

        matrix_enabled = testing_matrix.get("enabled", False)
        target_folders = []

        # Check global_steps: if a global step (0, 1, 2) is disabled, skip it entirely
        if matrix_enabled:
            global_steps = testing_matrix.get("global_steps", {})
            script_stem = script_name.replace('.py', '')
            if script_stem in global_steps and not global_steps[script_stem]:
                logger.info(f"⏭️ Skipping {script_name}: disabled in testing_matrix.global_steps")
                step_result["status"] = "SKIPPED"
                step_result["exit_code"] = 0
                step_result["stdout"] = f"Skipped by global_steps config (testing_matrix.global_steps.{script_stem}: false)\n"
                return step_result

        # Only apply folder-matrix logic if enabled and the step is a processing step (>= 3)
        if matrix_enabled and step_num >= 3:
            base_target_dir = args.target_dir
            if base_target_dir.exists() and base_target_dir.is_dir():
                folders_config = testing_matrix.get("folders", {})
                default_steps = testing_matrix.get("default_steps", [])

                # Check all subdirectories in the base target directory
                for item in base_target_dir.iterdir():
                    if item.is_dir() and item.name != "archived_gnn_files":
                        # Determine allowed steps for this folder
                        allowed_steps = folders_config.get(item.name, default_steps)
                        if step_num in allowed_steps:
                            target_folders.append(item)

        from pipeline.step_timeouts import get_step_timeout
        from utils.argument_utils import build_step_command_args
        from utils.execution_utils import execute_command_streaming

        # Prepare environment
        _env = os.environ.copy()
        _env.setdefault("PYTHONUNBUFFERED", "1")
        comprehensive_requested = any("--comprehensive" in str(arg) for arg in sys.argv)
        step_timeout_seconds = get_step_timeout(script_name, comprehensive=comprehensive_requested)

        if matrix_enabled and step_num >= 2 and target_folders:
            # MATRIX MODE: We found specific folders to run for this step
            if args.verbose:
                logger.info(f"Testing matrix enabled. Running step {step_num} on {len(target_folders)} specific folders: {[f.name for f in target_folders]}")

            combined_stdout = ""
            combined_stderr = ""
            worst_exit_code = 0

            for folder in target_folders:
                if args.verbose:
                    logger.info(f"  -> Executing for folder: {folder.name}")

                # Creating a modified args copy to point to the specific subfolder
                import copy
                folder_args = copy.copy(args)
                folder_args.target_dir = folder

                cmd = build_step_command_args(
                    script_name.replace('.py', ''),
                    folder_args,
                    python_executable,
                    script_path
                )

                # We do not use print_stdout=True for every subfolder iteration to avoid extreme terminal spam,
                # but we will print if requested verbose globally
                if args.verbose:
                    logger.info(f"  -> CMD ACTUALLY IS: {' '.join(cmd)}")

                result = execute_command_streaming(
                    cmd,
                    cwd=project_root,
                    env=_env,
                    timeout=step_timeout_seconds,
                    print_stdout=args.verbose,
                    print_stderr=True,
                    capture_output=True
                )

                combined_stdout += f"\n--- Output for {folder.name} ---\n{result.get('stdout', '')}\n"
                if result.get('stderr'):
                    combined_stderr += f"\n--- Stderr for {folder.name} ---\n{result.get('stderr', '')}\n"

                exit_code = result.get('exit_code', -1)
                if exit_code != 0:
                    worst_exit_code = exit_code
                    logger.warning(f"  -> Folder {folder.name} execution returned code {exit_code}")

            end_memory = get_current_memory_usage()
            peak_memory = max(peak_memory, end_memory)

            step_result["stdout"] = combined_stdout
            step_result["stderr"] = combined_stderr
            step_result["exit_code"] = worst_exit_code
            step_result["memory_usage_mb"] = end_memory
            step_result["peak_memory_mb"] = peak_memory
            step_result["memory_delta_mb"] = end_memory - start_memory

        else:
            # STANDARD MODE
            cmd = build_step_command_args(
                script_name.replace('.py', ''),
                args,
                python_executable,
                script_path
            )

            if args.verbose:
                logger.info(f"Executing command: {' '.join(cmd)}")

            result = execute_command_streaming(
                cmd,
                cwd=project_root,
                env=_env,
                timeout=step_timeout_seconds,
                print_stdout=True,
                print_stderr=True,
                capture_output=True
            )

            end_memory = get_current_memory_usage()
            peak_memory = max(peak_memory, end_memory)

            step_result["stdout"] = result.get("stdout", "")
            step_result["stderr"] = result.get("stderr", "")
            step_result["exit_code"] = result.get("exit_code", -1)
            step_result["memory_usage_mb"] = end_memory
            step_result["peak_memory_mb"] = peak_memory
            step_result["memory_delta_mb"] = end_memory - start_memory

            if args.verbose:
                 logger.info("Command completed with exit code: " + str(step_result["exit_code"]))

        # Determine status
        if step_result["exit_code"] == 0:
            step_result["status"] = "SUCCESS"
            # Check for any dependency warnings that might affect downstream steps
            if step_result["dependency_warnings"]:
                step_result["status"] = "SUCCESS_WITH_WARNINGS"
        else:
            # Respect the child process exit code to avoid masking failures
            step_result["status"] = "FAILED"
            # Log detailed failure information
            logger.error(f"Step {script_name} failed with exit code {step_result['exit_code']}")
            if step_result["stderr"]:
                logger.error(f"Error output: {step_result['stderr'][:500]}...")  # Limit to first 500 chars

        # Steps determine their own output directories via get_output_dir_for_script

        # Add recovery status to result
        if not step_result.get("recoverable"):
            step_result["recoverable"] = False

        return step_result

    except Exception as e:
        logger.error(f"Exception in execute_pipeline_step for {script_name}: {e}")
        step_result["status"] = "FAILED"
        step_result["exit_code"] = -1
        step_result["stderr"] = str(e)
        return step_result

def parse_step_list(step_input: Any) -> List[int]:
    """Parse step input (string or list) into list of integers."""
    if step_input is None:
        return []
    if isinstance(step_input, list):
        return [int(s) for s in step_input if str(s).isdigit() or isinstance(s, int)]
    if isinstance(step_input, str):
        try:
            return [int(s.strip()) for s in step_input.split(',') if s.strip()]
        except ValueError:
            _module_logger.debug("Could not parse step list '%s' as comma-separated integers", step_input)
            return []
    return []