feat(v3): PR 3 — prompt_layer package (base, video_prompt, search_query, visual_vocabulary)

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-03-29 11:43:15 +09:00
parent 4484fd1cfc
commit 33b0bbd5ee
5 changed files with 369 additions and 0 deletions
@@ -0,0 +1,43 @@
+"""
+bots/prompt_layer/__init__.py
+Unified entry point for all prompt composition.
+
+V3.0 scope: video + search + tts categories
+V3.1+: expand to all categories
+"""
+from .base import ComposedPrompt
+from .video_prompt import KlingPromptFormatter, VeoPromptFormatter
+from .search_query import StockSearchQueryComposer
+
+
+def compose(category: str, input_data: dict, engine: str) -> 'ComposedPrompt':
+    """
+    Unified entry point for all prompt composition.
+
+    category: 'video' | 'search' | 'tts' | 'image' | 'writing' | 'caption'
+    input_data: category-specific dict
+    engine: target engine name
+
+    V3.0 scope: video + search only
+    V3.1+: expand to all categories
+    """
+    composer = _get_composer(category, engine)
+    return composer.compose(input_data, engine)
+
+
+def _get_composer(category: str, engine: str):
+    """Return appropriate composer for category+engine combination."""
+    if category == 'video':
+        if engine in ('kling_free', 'kling_pro'):
+            return KlingPromptFormatter()
+        else:
+            return VeoPromptFormatter()
+    elif category == 'search':
+        return StockSearchQueryComposer()
+    else:
+        # Fallback: return a passthrough composer for unsupported categories
+        from .base import PassthroughComposer
+        return PassthroughComposer()
+
+
+__all__ = ['compose', 'ComposedPrompt']
@@ -0,0 +1,41 @@
+"""
+bots/prompt_layer/base.py
+Base types for the prompt layer.
+"""
+from dataclasses import dataclass, field
+from typing import Optional
+
+@dataclass
+class ComposedPrompt:
+    """
+    Unified prompt container returned by all composers.
+
+    Fields used varies by engine:
+    - Kling: positive + negative
+    - Veo: positive (structured)
+    - Search: queries list
+    - TTS: processed_text
+    """
+    positive: str = ''
+    negative: str = ''
+    queries: list[str] = field(default_factory=list)
+    processed_text: str = ''
+    metadata: dict = field(default_factory=dict)
+
+    def __bool__(self) -> bool:
+        return bool(self.positive or self.queries or self.processed_text)
+
+
+class BaseComposer:
+    """Abstract base for all composers."""
+    def compose(self, input_data: dict, engine: str) -> ComposedPrompt:
+        raise NotImplementedError
+
+
+class PassthroughComposer(BaseComposer):
+    """Returns input as-is for unsupported categories."""
+    def compose(self, input_data: dict, engine: str) -> ComposedPrompt:
+        return ComposedPrompt(
+            positive=input_data.get('text', ''),
+            metadata={'passthrough': True, 'engine': engine}
+        )
@@ -0,0 +1,55 @@
+"""
+bots/prompt_layer/search_query.py
+Compose stock video/image search queries from Korean concepts.
+"""
+from .base import BaseComposer, ComposedPrompt
+from .visual_vocabulary import CONCEPT_TO_VISUAL, VISUAL_STYLE_MODIFIERS
+import re
+
+
+class StockSearchQueryComposer(BaseComposer):
+    """
+    Korean concept -> English visual search terms.
+    Used to search Pexels/Pixabay/Unsplash for stock footage.
+    """
+
+    def compose(self, input_data: dict, engine: str = 'pexels') -> ComposedPrompt:
+        """
+        input_data: {
+            'sentence': str,  # Korean sentence to find visuals for
+            'platform': str,  # 'pexels' | 'pixabay' | 'kling' | 'veo'
+            'count': int,     # number of search queries to return (default 3)
+        }
+        Returns ComposedPrompt with queries list
+        """
+        sentence = input_data.get('sentence', '')
+        count = input_data.get('count', 3)
+
+        queries = self._sentence_to_queries(sentence, count)
+
+        return ComposedPrompt(
+            queries=queries,
+            metadata={'sentence': sentence, 'engine': engine}
+        )
+
+    def _sentence_to_queries(self, sentence: str, count: int) -> list[str]:
+        """Extract Korean concepts from sentence and map to visual search terms."""
+        # Find matching concepts from vocabulary
+        matched_visuals = []
+        for concept, visuals in CONCEPT_TO_VISUAL.items():
+            if concept in sentence:
+                matched_visuals.extend(visuals)
+
+        # If no matches, use generic professional stock footage terms
+        if not matched_visuals:
+            matched_visuals = ['professional business', 'modern lifestyle', 'technology future']
+
+        # Return up to count unique queries
+        seen = set()
+        unique = []
+        for v in matched_visuals:
+            if v not in seen:
+                seen.add(v)
+                unique.append(v)
+
+        return unique[:count]
@@ -0,0 +1,85 @@
+"""
+bots/prompt_layer/video_prompt.py
+Format prompts for video generation engines (Kling, Veo).
+"""
+from .base import BaseComposer, ComposedPrompt
+from .visual_vocabulary import VISUAL_STYLE_MODIFIERS, NEGATIVE_TERMS
+
+
+class KlingPromptFormatter(BaseComposer):
+    """
+    Format prompts for Kling AI video generation.
+    Kling works best with: scene description + movement + mood + negative prompt.
+    """
+
+    def compose(self, input_data: dict, engine: str = 'kling_free') -> ComposedPrompt:
+        """
+        input_data: {
+            'scenes': list[dict],  # [{text, type, image_prompt}, ...]
+            'corner': str,         # content corner/category
+            'duration': float,     # target duration in seconds
+        }
+        """
+        scenes = input_data.get('scenes', [])
+        corner = input_data.get('corner', '')
+
+        # Build positive prompt from scenes
+        scene_texts = []
+        for scene in scenes:
+            prompt = scene.get('image_prompt') or scene.get('text', '')
+            if prompt:
+                scene_texts.append(self._enhance_for_kling(prompt, corner))
+
+        positive = '. '.join(scene_texts[:3])  # Max 3 scenes per prompt
+        if not positive:
+            positive = f'cinematic short video about {corner or "technology"}'
+
+        # Kling negative prompt
+        negative = ', '.join(NEGATIVE_TERMS + ['text overlay', 'subtitles', 'watermark'])
+
+        # Add beat markers for Kling
+        positive = f'{positive}. Camera: smooth movement, vertical 9:16 format. Style: cinematic, vibrant.'
+
+        return ComposedPrompt(
+            positive=positive,
+            negative=negative,
+            metadata={'engine': engine, 'corner': corner}
+        )
+
+    def _enhance_for_kling(self, text: str, corner: str) -> str:
+        """Add cinematic enhancement to prompt."""
+        modifiers = ', '.join(VISUAL_STYLE_MODIFIERS[:3])
+        return f'{text}, {modifiers}'
+
+
+class VeoPromptFormatter(BaseComposer):
+    """
+    Format prompts for Google Veo video generation.
+    Veo works best with structured ingredient list format.
+    """
+
+    def compose(self, input_data: dict, engine: str = 'veo3') -> ComposedPrompt:
+        """
+        input_data: same as KlingPromptFormatter
+        """
+        scenes = input_data.get('scenes', [])
+        corner = input_data.get('corner', '')
+
+        scene_texts = [
+            scene.get('image_prompt') or scene.get('text', '')
+            for scene in scenes if scene.get('image_prompt') or scene.get('text')
+        ]
+
+        # Veo structured format: Subject + Action + Setting + Style
+        subject = scene_texts[0] if scene_texts else f'{corner or "technology"} concept'
+        positive = (
+            f'Subject: {subject}. '
+            f'Format: vertical 9:16 portrait video. '
+            f'Style: cinematic, {", ".join(VISUAL_STYLE_MODIFIERS[:2])}. '
+            f'Camera: smooth pan or zoom. Duration: short clip.'
+        )
+
+        return ComposedPrompt(
+            positive=positive,
+            metadata={'engine': engine, 'corner': corner, 'format': 'veo_structured'}
+        )
@@ -0,0 +1,145 @@
+"""
+bots/prompt_layer/visual_vocabulary.py
+Shared Korean -> English visual concept dictionary.
+Used by search_query.py and video_prompt.py for concept mapping.
+"""
+
+CONCEPT_TO_VISUAL = {
+    # Technology
+    'AI': ['artificial intelligence screen', 'digital interface', 'neural network visualization'],
+    '인공지능': ['robot brain', 'digital mind', 'AI hologram'],
+    '자동화': ['gears mechanism', 'conveyor belt', 'robot arm factory'],
+    '코딩': ['computer code screen', 'programmer keyboard', 'dark terminal code'],
+    '데이터': ['data visualization', 'bar chart analytics', 'network nodes'],
+    '알고리즘': ['flowchart diagram', 'binary code', 'decision tree'],
+    '앱': ['smartphone screen', 'mobile app interface', 'app store'],
+    '소프트웨어': ['software development', 'code editor', 'programming laptop'],
+    # Finance/Money
+    '돈': ['money cash bills', 'coins pile', 'dollar bills'],
+    '수익': ['profit growth chart', 'rising arrow money', 'income cash'],
+    '투자': ['stock market chart', 'investment portfolio', 'financial growth'],
+    '절약': ['piggy bank savings', 'money jar coins', 'budget planning'],
+    '부자': ['luxury lifestyle', 'wealthy business person', 'success achievement'],
+    '무료': ['gift present box', 'unlocked padlock', 'free tag label'],
+    '할인': ['sale discount tag', 'percent off sign', 'price reduction'],
+    # Business
+    '비즈니스': ['business meeting', 'office workspace', 'professional handshake'],
+    '창업': ['startup launch rocket', 'entrepreneur office', 'business idea lightbulb'],
+    '마케팅': ['marketing strategy board', 'social media icons', 'advertising billboard'],
+    '브랜드': ['brand logo design', 'brand identity', 'premium label'],
+    '고객': ['customer service smile', 'client meeting', 'happy customer'],
+    '성공': ['success achievement trophy', 'winner podium', 'goal celebration'],
+    '실패': ['failure mistake frustrated', 'broken plan', 'problem obstacle'],
+    # Health/Lifestyle
+    '건강': ['healthy lifestyle', 'fitness exercise', 'fresh vegetables'],
+    '다이어트': ['diet food salad', 'weight loss scale', 'healthy eating'],
+    '운동': ['gym workout exercise', 'running sport', 'fitness training'],
+    '수면': ['peaceful sleep bedroom', 'sleeping person night', 'rest relaxation'],
+    '스트레스': ['stress anxiety person', 'overwhelmed work', 'headache pressure'],
+    '행복': ['happy smiling person', 'joy celebration', 'positive energy'],
+    # Education
+    '공부': ['studying books desk', 'student learning', 'open textbook'],
+    '독서': ['reading book cozy', 'bookshelf library', 'person reading'],
+    '교육': ['classroom teaching', 'education school', 'learning knowledge'],
+    '자격증': ['certificate diploma award', 'achievement credential', 'professional certification'],
+    # Social/Communication
+    '소통': ['communication talking', 'conversation speech bubble', 'people talking'],
+    '관계': ['relationship people together', 'friendship bond', 'social connection'],
+    '가족': ['family together happy', 'family portrait', 'home family'],
+    '친구': ['friends together laughing', 'friendship bond', 'social gathering'],
+    # Environment/Nature
+    '자연': ['nature landscape scenic', 'green forest trees', 'outdoor beauty'],
+    '환경': ['environment ecology', 'green earth planet', 'sustainability'],
+    '도시': ['city skyline urban', 'modern architecture', 'downtown cityscape'],
+    '여행': ['travel adventure journey', 'wanderlust explore', 'tourism destination'],
+    # Time/Productivity
+    '시간': ['clock time management', 'hourglass countdown', 'calendar schedule'],
+    '생산성': ['productivity work desk', 'efficient workflow', 'organized workspace'],
+    '습관': ['habit routine daily', 'calendar habit tracker', 'consistent practice'],
+    '목표': ['goal target arrow', 'achievement milestone', 'success roadmap'],
+    # Food
+    '음식': ['food meal delicious', 'restaurant dining', 'cooking kitchen'],
+    '커피': ['coffee cup cafe', 'espresso morning', 'coffee shop cozy'],
+    '요리': ['cooking chef kitchen', 'recipe preparation', 'homemade food'],
+    # Digital/Social Media
+    '유튜브': ['youtube play button', 'video content creator', 'streaming platform'],
+    '틱톡': ['social media video', 'short video content', 'viral content'],
+    '인스타그램': ['instagram photo aesthetic', 'social media post', 'influencer lifestyle'],
+    '콘텐츠': ['content creation studio', 'digital content', 'creative media'],
+    # Generic actions
+    '시작': ['starting launch beginning', 'new start fresh', 'launch rocket'],
+    '변화': ['change transformation', 'before after contrast', 'evolution progress'],
+    '성장': ['growth plant sprouting', 'growth chart rising', 'development progress'],
+    '문제': ['problem solving puzzle', 'challenge obstacle', 'issue question mark'],
+    '해결': ['solution lightbulb', 'problem solved checkmark', 'resolution answer'],
+    '비교': ['comparison side by side', 'versus contrast', 'pros cons balance'],
+    '순위': ['ranking top list', 'leaderboard winners', 'chart comparison'],
+    '방법': ['how-to guide steps', 'tutorial instruction', 'method process'],
+    '팁': ['tips tricks advice', 'helpful hints', 'pro tip star'],
+    '비밀': ['secret reveal hidden', 'mystery unlock', 'insider knowledge'],
+    '진실': ['truth reveal facts', 'reality check', 'honest disclosure'],
+    '놀라운': ['surprising amazing wow', 'unexpected revelation', 'shocking discovery'],
+    # Numbers/Stats
+    '1위': ['number one winner', 'first place gold', 'top ranked best'],
+    '100%': ['one hundred percent complete', 'full capacity', 'perfect score'],
+    # Korean culture
+    '한국': ['korea seoul cityscape', 'korean culture', 'hanbok traditional'],
+    '직장': ['office workplace corporate', 'work desk professional', 'business office'],
+    '취업': ['job interview hiring', 'employment opportunity', 'career success'],
+    '부동산': ['real estate property', 'house home investment', 'property market'],
+    # Abstract concepts
+    '가능성': ['possibility open door', 'opportunity horizon', 'potential unlimited'],
+    '미래': ['future technology vision', 'futuristic landscape', 'innovation tomorrow'],
+    '트렌드': ['trend arrow upward', 'trending popular', 'hot topic social'],
+}
+
+# Quality/style modifiers to append to video/image prompts
+VISUAL_STYLE_MODIFIERS = [
+    'cinematic',
+    '4k',
+    'professional',
+    'high quality',
+    'vibrant colors',
+    'sharp focus',
+    'natural lighting',
+    'smooth motion',
+]
+
+# Terms to avoid in video generation prompts
+NEGATIVE_TERMS = [
+    'blurry',
+    'low quality',
+    'watermark',
+    'text overlay',
+    'distorted',
+    'pixelated',
+    'grainy',
+    'overexposed',
+    'underexposed',
+    'shaky camera',
+]
+
+
+if __name__ == '__main__':
+    import sys
+
+    if '--test' in sys.argv:
+        print('=== visual_vocabulary 테스트 시작 ===')
+        print(f'총 개념 수: {len(CONCEPT_TO_VISUAL)}')
+        print(f'스타일 수식어 수: {len(VISUAL_STYLE_MODIFIERS)}')
+        print(f'네거티브 용어 수: {len(NEGATIVE_TERMS)}')
+        print()
+
+        # Test a few lookups
+        test_concepts = ['AI', '미래', '성공', '건강', '코딩']
+        for concept in test_concepts:
+            visuals = CONCEPT_TO_VISUAL.get(concept, [])
+            print(f'  [{concept}] -> {visuals}')
+
+        print()
+        print(f'스타일 수식어: {VISUAL_STYLE_MODIFIERS}')
+        print(f'네거티브 용어: {NEGATIVE_TERMS}')
+        print()
+        print('=== 테스트 완료 ===')
+    else:
+        print('사용법: python -m bots.prompt_layer.visual_vocabulary --test')