diff --git a/scripts/caption_processor.py b/scripts/caption_processor.py index 4655949..11d6223 100644 --- a/scripts/caption_processor.py +++ b/scripts/caption_processor.py @@ -82,9 +82,9 @@ def generate_caption_with_llava( """Generate caption using LLaVA model""" try: # Try to use transformers with LLaVA - from transformers import AutoProcessor, AutoModelForVision2Seq - import torch - from PIL import Image + from transformers import AutoProcessor, AutoModelForVision2Seq # noqa: F401 + import torch # noqa: F401 + from PIL import Image # noqa: F401 # Note: This requires llava-hf/llava-1.5-7b-hf or similar # For now, return a placeholder diff --git a/scripts/story_processor.py b/scripts/story_processor.py index da03d2c..a6ebc09 100644 --- a/scripts/story_processor.py +++ b/scripts/story_processor.py @@ -63,7 +63,7 @@ def generate_parent_child_chunks( asr_segments = asr_data.get("segments", []) cut_scenes = cut_data.get("scenes", []) yolo_frames = yolo_data.get("frames", []) - ocr_frames = ocr_data.get("frames", []) + _ocr_frames = ocr_data.get("frames", []) # Create child chunks from ASR segments asr_child_ids = []