add whisperx support

This commit is contained in:
Mariano Gabriel
2025-12-02 02:33:39 -03:00
parent 118ef04223
commit 7b919beda6
4 changed files with 155 additions and 38 deletions

View File

@@ -32,13 +32,13 @@ def main():
formatter_class=argparse.RawDescriptionHelpFormatter,
epilog="""
Examples:
# Embed images for LLM analysis (recommended - let LLM analyze actual frames)
# Reference frames for LLM analysis (recommended - transcript includes frame paths)
python process_meeting.py samples/meeting.mkv --run-whisper --embed-images --scene-detection
# Embed with custom quality (lower = smaller file size)
# Adjust frame extraction quality (lower = smaller files)
python process_meeting.py samples/meeting.mkv --run-whisper --embed-images --embed-quality 60 --scene-detection
# Hybrid approach: OpenCV + OCR (extracts text, no images)
# Hybrid approach: OpenCV + OCR (extracts text from frames)
python process_meeting.py samples/meeting.mkv --run-whisper --use-hybrid --scene-detection
# Hybrid + LLM cleanup (best for code formatting)
@@ -183,12 +183,12 @@ Examples:
parser.add_argument(
'--embed-images',
action='store_true',
help='Embed frame images (as base64) in enhanced transcript for LLM analysis'
help='Skip OCR/vision analysis and reference frame files directly (faster, lets LLM analyze images)'
)
parser.add_argument(
'--embed-quality',
type=int,
help='JPEG quality for embedded images (default: 80, lower = smaller file)',
help='JPEG quality for extracted frames (default: 80, lower = smaller files)',
default=80
)