aegis-stack/aegis/core/template_generator.py at b036dfbe64eb98a4a523975a73e13d6d2f7e4e64 · lbedner/aegis-stack · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
"""
Template generation and context building for Aegis Stack projects.

This module handles the generation of cookiecutter context and manages
the template rendering process based on selected components.
"""

from pathlib import Path
from typing import Any

from .. import __version__ as aegis_version
from ..config.defaults import DEFAULT_PYTHON_VERSION
from ..constants import (
    AIFrameworks,
    AnswerKeys,
    AuthLevels,
    ComponentNames,
    OllamaMode,
    PaymentProviders,
    StorageBackends,
    WorkerBackends,
)
from .ai_service_parser import is_ai_service_with_options, parse_ai_service_config
from .auth_service_parser import is_auth_service_with_options, parse_auth_service_config
from .component_utils import (
    extract_base_component_name,
    extract_base_service_name,
    extract_engine_info,
)
from .components import COMPONENTS, CORE_COMPONENTS
from .insights_service_parser import (
    is_insights_service_with_options,
    parse_insights_service_config,
)
from .services import SERVICES

# Service names for bracket syntax detection
SERVICE_AI = "ai"
SERVICE_AUTH = "auth"
SERVICE_INSIGHTS = "insights"


class TemplateGenerator:
    """Handles template context generation for cookiecutter."""

    def __init__(
        self,
        project_name: str,
        selected_components: list[str],
        scheduler_backend: str = StorageBackends.MEMORY,
        selected_services: list[str] | None = None,
        python_version: str = DEFAULT_PYTHON_VERSION,
    ):
        """
        Initialize template generator.

        Args:
            project_name: Name of the project being generated
            selected_components: List of component names to include
            scheduler_backend: Scheduler backend: memory, sqlite, or postgres
            selected_services: List of service names to include
            python_version: Python version for generated project (default from pyproject.toml)
        """
        self.project_name = project_name
        self.project_slug = project_name.lower().replace(" ", "-").replace("_", "-")
        self.scheduler_backend = scheduler_backend
        self.selected_services = selected_services or []
        self.python_version = python_version

        # Always include core components
        all_components = CORE_COMPONENTS + selected_components

        # Add required components from selected services
        for service_name in self.selected_services:
            if service_name in SERVICES:
                service_spec = SERVICES[service_name]
                all_components.extend(service_spec.required_components)

        # Remove duplicates, preserve order
        self.components = list(dict.fromkeys(all_components))

        # Extract database engine from database[engine] format for template context
        self.database_engine = None
        for component in self.components:
            if extract_base_component_name(component) == ComponentNames.DATABASE:
                self.database_engine = extract_engine_info(component)
                if self.database_engine:
                    break

        # Extract scheduler backend from scheduler[backend] format or use passed param
        # If scheduler[backend] syntax is used, it overrides the passed parameter
        for component in self.components:
            if extract_base_component_name(component) == ComponentNames.SCHEDULER:
                backend = extract_engine_info(component)
                if backend:
                    self.scheduler_backend = backend
                    break

        # Extract worker backend from worker[backend] format
        self.worker_backend = WorkerBackends.ARQ  # Default to arq
        for component in self.components:
            if extract_base_component_name(component) == ComponentNames.WORKER:
                backend = extract_engine_info(component)
                if backend:
                    self.worker_backend = backend
                    break

        # Extract AI config from ai[framework, backend, providers, rag, voice] format in services
        self.ai_backend = StorageBackends.MEMORY  # Default to memory
        self.ai_framework = AIFrameworks.PYDANTIC_AI  # Default to pydantic-ai
        self.ai_rag = False  # Default to no RAG
        self.ai_voice = False  # Default to no voice
        user_specified_ai_backend = False

        for service in self.selected_services:
            if extract_base_service_name(service) == SERVICE_AI:
                if is_ai_service_with_options(service):
                    ai_config = parse_ai_service_config(service)
                    self.ai_backend = ai_config.backend
                    self.ai_framework = ai_config.framework
                    self.ai_rag = ai_config.rag_enabled
                    self.ai_voice = ai_config.voice_enabled
                    user_specified_ai_backend = True
                break

        # OAuth social login (GitHub + Google) — opt-in via the
        # ``auth[oauth]`` modifier in the bracket syntax (composes with
        # ``auth[rbac,oauth]`` etc.). Defaults off so projects that
        # don't ask for it don't pay for the extra routes and deps.
        self.include_oauth: bool = False

        # Extract auth level (and oauth modifier) from auth[...] format in services
        self.auth_level = AuthLevels.BASIC  # Default to basic
        self._user_specified_auth_level = False
        for service in self.selected_services:
            if extract_base_service_name(service) == SERVICE_AUTH:
                if is_auth_service_with_options(service):
                    auth_config = parse_auth_service_config(service)
                    self.auth_level = auth_config.level
                    self._user_specified_auth_level = True
                    self.include_oauth = auth_config.oauth
                break

        # Extract insights sources from insights[sources] format in services
        from .insights_service_parser import DEFAULT_SOURCES

        self.insights_sources: list[str] = DEFAULT_SOURCES.copy()
        for service in self.selected_services:
            if extract_base_service_name(service) == SERVICE_INSIGHTS:
                if is_insights_service_with_options(service):
                    insights_config = parse_insights_service_config(service)
                    self.insights_sources = insights_config.sources
                break

        # Auto-detect: if AI service selected AND database available AND no explicit backend,
        # use SQLite for persistence (analytics, conversation history, LLM tracking)
        if not user_specified_ai_backend:
            has_ai = any(
                extract_base_service_name(s) == SERVICE_AI
                for s in self.selected_services
            )
            has_database = any(
                extract_base_component_name(c) == ComponentNames.DATABASE
                for c in self.components
            )
            if has_ai and has_database:
                self.ai_backend = StorageBackends.SQLITE

        # Build component specs using base names
        self.component_specs = {}
        for name in self.components:
            base_name = extract_base_component_name(name)
            if base_name in COMPONENTS:
                self.component_specs[base_name] = COMPONENTS[base_name]

    def get_template_context(self) -> dict[str, Any]:
        """
        Generate cookiecutter context from components.

        Returns:
            Dictionary containing all template variables
        """
        # Store the originally selected components (without core)
        selected_only = [c for c in self.components if c not in CORE_COMPONENTS]

        # Check for components using base names
        has_database = any(
            extract_base_component_name(c) == ComponentNames.DATABASE
            for c in self.components
        )

        return {
            "project_name": self.project_name,
            "project_slug": self.project_slug,
            "python_version": self.python_version,
            "aegis_version": aegis_version,
            # Component flags for template conditionals - cookiecutter needs yes/no
            AnswerKeys.REDIS: "yes"
            if ComponentNames.REDIS in self.components
            else "no",
            AnswerKeys.WORKER: "yes"
            if any(c.startswith(ComponentNames.WORKER) for c in self.components)
            else "no",
            AnswerKeys.SCHEDULER: "yes"
            if any(c.startswith(ComponentNames.SCHEDULER) for c in self.components)
            else "no",
            AnswerKeys.DATABASE: "yes" if has_database else "no",
            AnswerKeys.INGRESS: "yes"
            if ComponentNames.INGRESS in self.components
            else "no",
            AnswerKeys.OBSERVABILITY: "yes"
            if ComponentNames.OBSERVABILITY in self.components
            else "no",
            # Database engine selection (sqlite or postgres)
            "database_engine": self.database_engine or StorageBackends.SQLITE,
            # Scheduler backend selection
            AnswerKeys.SCHEDULER_BACKEND: self.scheduler_backend,
            # Worker backend selection
            AnswerKeys.WORKER_BACKEND: self.worker_backend,
            # Legacy scheduler persistence flag for backwards compatibility
            AnswerKeys.SCHEDULER_WITH_PERSISTENCE: (
                "yes" if self.scheduler_backend != StorageBackends.MEMORY else "no"
            ),
            # Derived flags for template logic
            "has_background_infrastructure": any(
                c.startswith(ComponentNames.WORKER)
                or c.startswith(ComponentNames.SCHEDULER)
                for c in self.components
            ),
            "needs_redis": ComponentNames.REDIS in self.components,
            # Service flags for template conditionals
            # Use base name extraction to handle bracket syntax (e.g., ai[langchain, sqlite])
            AnswerKeys.AUTH: "yes"
            if any(
                extract_base_service_name(s) == AnswerKeys.SERVICE_AUTH
                for s in self.selected_services
            )
            else "no",
            # Auth level selection (basic, rbac, or org)
            AnswerKeys.AUTH_LEVEL: (auth_level := self._get_auth_level()),
            # Derived auth level flags for template conditionals
            # Org level implies RBAC (org gets both roles and orgs)
            AnswerKeys.AUTH_RBAC: "yes"
            if auth_level in (AuthLevels.RBAC, AuthLevels.ORG)
            else "no",
            AnswerKeys.AUTH_ORG: "yes" if auth_level == AuthLevels.ORG else "no",
            # OAuth social login (GitHub + Google) — opt-in via the
            # ``auth[oauth]`` modifier in the bracket syntax (composes
            # with ``auth[rbac,oauth]`` etc.). Defaults off so existing
            # flows aren't surprised by extra routes and dependencies.
            AnswerKeys.AUTH_OAUTH: "yes" if self.include_oauth else "no",
            AnswerKeys.AI: "yes"
            if any(
                extract_base_service_name(s) == AnswerKeys.SERVICE_AI
                for s in self.selected_services
            )
            else "no",
            AnswerKeys.COMMS: "yes"
            if any(
                extract_base_service_name(s) == AnswerKeys.SERVICE_COMMS
                for s in self.selected_services
            )
            else "no",
            AnswerKeys.INSIGHTS: "yes"
            if any(
                extract_base_service_name(s) == AnswerKeys.SERVICE_INSIGHTS
                for s in self.selected_services
            )
            else "no",
            AnswerKeys.PAYMENT: "yes"
            if any(
                extract_base_service_name(s) == AnswerKeys.SERVICE_PAYMENT
                for s in self.selected_services
            )
            else "no",
            AnswerKeys.PAYMENT_PROVIDER: PaymentProviders.DEFAULT,
            # Insights source flags
            AnswerKeys.INSIGHTS_GITHUB: "yes"
            if "github" in self.insights_sources
            else "no",
            AnswerKeys.INSIGHTS_PYPI: "yes"
            if "pypi" in self.insights_sources
            else "no",
            AnswerKeys.INSIGHTS_PLAUSIBLE: "yes"
            if "plausible" in self.insights_sources
            else "no",
            AnswerKeys.INSIGHTS_REDDIT: "yes"
            if "reddit" in self.insights_sources
            else "no",
            # AI backend selection for conversation persistence
            AnswerKeys.AI_BACKEND: self.ai_backend,
            # AI persistence flag for backwards compatibility with template conditionals
            AnswerKeys.AI_WITH_PERSISTENCE: (
                "yes" if self.ai_backend != StorageBackends.MEMORY else "no"
            ),
            # AI framework selection (pydantic-ai or langchain)
            AnswerKeys.AI_FRAMEWORK: self._get_ai_framework(),
            # AI provider selection for dynamic dependency generation
            AnswerKeys.AI_PROVIDERS: self._get_ai_providers_string(),
            # AI RAG (Retrieval-Augmented Generation) selection
            AnswerKeys.AI_RAG: "yes" if self.ai_rag else "no",
            # AI Voice (TTS and STT) selection
            AnswerKeys.AI_VOICE: "yes" if self.ai_voice else "no",
            # Ollama deployment mode (host, docker, or none)
            AnswerKeys.OLLAMA_MODE: self._get_ollama_mode(),
            # Dependency lists for templates
            "selected_components": selected_only,  # Original selection for context
            "docker_services": self._get_docker_services(),
            "pyproject_dependencies": self._get_pyproject_deps(),
        }

    def _get_docker_services(self) -> list[str]:
        """
        Collect all docker services needed.

        Returns:
            List of docker service names
        """
        services = []
        for component_name in self.components:
            if component_name in self.component_specs:
                spec = self.component_specs[component_name]
                if spec.docker_services:
                    services.extend(spec.docker_services)
        return list(dict.fromkeys(services))  # Preserve order, remove duplicates

    def _get_pyproject_deps(self) -> list[str]:
        """
        Collect all Python dependencies.

        Returns:
            Sorted list of Python package dependencies
        """
        deps = []
        # Collect component dependencies
        for component_name in self.components:
            base_name = extract_base_component_name(component_name)
            if base_name in self.component_specs:
                spec = self.component_specs[base_name]
                if spec.pyproject_deps:
                    # Handle worker backend-specific dependencies
                    if base_name == ComponentNames.WORKER:
                        if self.worker_backend == WorkerBackends.TASKIQ:
                            deps.extend(["taskiq>=0.11.11", "taskiq-redis>=1.0.2"])
                        elif self.worker_backend == WorkerBackends.DRAMATIQ:
                            deps.append("dramatiq[redis]>=1.17.0")
                        else:
                            deps.extend(spec.pyproject_deps)  # arq deps from spec
                    # Handle database engine-specific dependencies
                    elif base_name == ComponentNames.DATABASE:
                        deps.extend(["sqlmodel>=0.0.14", "sqlalchemy>=2.0.0"])
                        if self.database_engine == StorageBackends.POSTGRES:
                            deps.extend(["asyncpg>=0.29.0", "psycopg2-binary>=2.9.9"])
                        else:
                            deps.append("aiosqlite>=0.19.0")
                    else:
                        deps.extend(spec.pyproject_deps)

        # Collect service dependencies
        for service_name in self.selected_services:
            # Extract base service name for bracket syntax (e.g., "ai[langchain]" → "ai")
            base_service_name = extract_base_service_name(service_name)
            if base_service_name in SERVICES:
                service_spec = SERVICES[base_service_name]
                if service_spec.pyproject_deps:
                    # Process service dependencies with dynamic substitution
                    for dep in service_spec.pyproject_deps:
                        if (
                            base_service_name == AnswerKeys.SERVICE_AI
                            and "{AI_FRAMEWORK_DEPS}" in dep
                        ):
                            # Substitute AI framework + provider deps dynamically
                            ai_deps = self._get_ai_framework_deps()
                            deps.extend(ai_deps)
                        else:
                            deps.append(dep)

        return sorted(set(deps))  # Sort and deduplicate

    def get_template_files(self) -> list[str]:
        """
        Get list of template files that should be included.

        Returns:
            List of template file paths
        """
        files = []
        # Collect component template files
        for component_name in self.components:
            base_name = extract_base_component_name(component_name)
            if base_name in self.component_specs:
                spec = self.component_specs[base_name]
                if spec.template_files:
                    files.extend(spec.template_files)

        # Collect service template files
        for service in self.selected_services:
            base_service = extract_base_service_name(service)
            if base_service in SERVICES:
                service_spec = SERVICES[base_service]
                if service_spec.template_files:
                    files.extend(service_spec.template_files)

        return list(dict.fromkeys(files))  # Preserve order, remove duplicates

    def _get_ai_providers_string(self) -> str:
        """
        Get AI providers as comma-separated string for pydantic-ai-slim dependency.

        Returns:
            Comma-separated string of provider names (e.g., "openai,anthropic,google")
        """
        # Check if AI service is selected (handle bracket syntax)
        has_ai = any(
            extract_base_service_name(s) == AnswerKeys.SERVICE_AI
            for s in self.selected_services
        )
        if not has_ai:
            return "openai"  # Default for PUBLIC provider

        # Import here to avoid circular imports
        from ..cli.interactive import get_ai_provider_selection

        providers = get_ai_provider_selection("ai")
        return ",".join(providers)

    def _get_ai_framework(self) -> str:
        """
        Get AI framework selection (pydantic-ai or langchain).

        Returns:
            Framework name string
        """
        # Check if AI service is selected (handle bracket syntax)
        has_ai = any(
            extract_base_service_name(s) == AnswerKeys.SERVICE_AI
            for s in self.selected_services
        )
        if not has_ai:
            return AIFrameworks.PYDANTIC_AI  # Default

        # Import here to avoid circular imports
        from ..cli.interactive import get_ai_framework_selection

        return get_ai_framework_selection("ai")

    def _get_ollama_mode(self) -> str:
        """
        Get Ollama deployment mode selection (host, docker, or none).

        Returns:
            Ollama mode string
        """
        # Check if AI service is selected (handle bracket syntax)
        has_ai = any(
            extract_base_service_name(s) == AnswerKeys.SERVICE_AI
            for s in self.selected_services
        )
        if not has_ai:
            return OllamaMode.NONE  # Default when AI not selected

        # Import here to avoid circular imports
        from ..cli.interactive import get_ollama_mode_selection

        return get_ollama_mode_selection("ai")

    def _get_auth_level(self) -> str:
        """
        Get auth level selection (basic or rbac).

        Uses the value parsed from bracket syntax in __init__, falling back
        to the interactive global selection.

        Returns:
            Auth level string
        """
        has_auth = any(
            extract_base_service_name(s) == AnswerKeys.SERVICE_AUTH
            for s in self.selected_services
        )
        if not has_auth:
            return AuthLevels.BASIC  # Default

        # If bracket syntax was used, trust the parsed value
        if self._user_specified_auth_level:
            return self.auth_level

        # Fall back to interactive global selection
        from ..cli.interactive import get_auth_level_selection

        return get_auth_level_selection("auth")

    def _get_ai_framework_deps(self) -> list[str]:
        """
        Get AI framework-specific dependencies based on framework and provider selection.

        Returns:
            List of Python package dependency strings
        """
        framework = self._get_ai_framework()
        providers_str = self._get_ai_providers_string()
        providers = providers_str.split(",")

        if framework == AIFrameworks.PYDANTIC_AI:
            # PydanticAI uses a single package with extras
            # Map provider names to pydantic-ai-slim extras
            # Providers using OpenAI-compatible APIs map to "openai" extra
            pydantic_extra_mapping = {
                "public": "openai",  # LLM7.io uses OpenAI-compatible API
                "openrouter": "openai",  # OpenRouter uses OpenAI-compatible API
                # Future OpenAI-compatible providers go here:
                # "together": "openai",
                # "fireworks": "openai",
            }

            pydantic_extras = []
            for provider in providers:
                provider = provider.strip()
                # Map to the correct extra, or use provider name directly
                extra = pydantic_extra_mapping.get(provider, provider)
                if extra not in pydantic_extras:
                    pydantic_extras.append(extra)

            extras_str = ",".join(pydantic_extras) if pydantic_extras else "openai"
            return [
                f"pydantic-ai-slim[{extras_str}]>=1.0.10",
                "httpx>=0.27.0",  # For API providers
            ]
        else:
            # LangChain uses separate packages per provider
            deps = ["langchain-core>=1.1.0"]

            # Map provider names to LangChain packages
            langchain_packages = {
                "openai": "langchain-openai>=1.1.0",
                "anthropic": "langchain-anthropic>=1.2.0",
                "google": "langchain-google-genai>=4.0.0",
                "groq": "langchain-groq>=1.1.0",
                "mistral": "langchain-mistralai>=1.1.0",
                "cohere": "langchain-cohere>=0.5.0",
            }

            for provider in providers:
                provider = provider.strip()
                if provider in langchain_packages:
                    deps.append(langchain_packages[provider])
                elif provider == "public" and "langchain-openai>=1.1.0" not in deps:
                    # Public provider uses OpenAI-compatible endpoint
                    deps.append("langchain-openai>=1.1.0")

            return deps

    def get_entrypoints(self) -> list[str]:
        """
        Get list of entrypoints that will be created.

        Returns:
            List of entrypoint file paths
        """
        entrypoints = ["app/entrypoints/webserver.py"]  # Always included

        # Check component specs for actual entrypoint files
        for component_name in self.components:
            base_name = extract_base_component_name(component_name)
            if base_name in self.component_specs:
                spec = self.component_specs[base_name]
                if spec.template_files:
                    for template_file in spec.template_files:
                        if (
                            template_file.startswith("app/entrypoints/")
                            and template_file not in entrypoints
                        ):
                            entrypoints.append(template_file)

        return entrypoints

    def get_worker_queues(self) -> list[str]:
        """
        Get list of worker queue files that will be created.

        Returns:
            List of worker queue file paths
        """
        queues: list[str] = []

        # Only check if worker component is included
        if not any(c.startswith(ComponentNames.WORKER) for c in self.components):
            return queues

        # Discover queue files from the template directory
        template_root = (
            Path(__file__).parent.parent / "templates" / "copier-aegis-project"
        )
        worker_queues_dir = (
            template_root
            / "{{ project_slug }}"
            / "app"
            / "components"
            / "worker"
            / "queues"
        )

        if worker_queues_dir.exists():
            for queue_file in worker_queues_dir.glob("*.py"):
                if queue_file.stem == "__init__":
                    continue
                # Filter based on worker backend — each backend has _suffix.py files
                # that get renamed to .py by post_gen_tasks
                is_taskiq_file = queue_file.stem.endswith("_taskiq")
                is_dramatiq_file = queue_file.stem.endswith("_dramatiq")
                is_backend_specific = is_taskiq_file or is_dramatiq_file

                if self.worker_backend == WorkerBackends.TASKIQ:
                    if is_taskiq_file:
                        final_name = queue_file.name.replace("_taskiq.py", ".py")
                        queues.append(f"app/components/worker/queues/{final_name}")
                elif self.worker_backend == WorkerBackends.DRAMATIQ:
                    if is_dramatiq_file:
                        final_name = queue_file.name.replace("_dramatiq.py", ".py")
                        queues.append(f"app/components/worker/queues/{final_name}")
                else:
                    # arq (default): show non-backend-specific files
                    if not is_backend_specific:
                        queues.append(f"app/components/worker/queues/{queue_file.name}")

        return sorted(queues)