sudo apt install python3 python3-venv python3-pip -y
python3 -m venv venv
source venv/bin/activate
pip install --upgrade pip
pip install opencv-python ffmpeg-python librosa pytesseract faster-whisper typer
sudo apt install tesseract-ocr -y
sudo apt install ffmpeg -y
NOTE: Be aware of the "/" vs. "\" path-separator convention on your platform.
CLI: python -m src.main -i "<input folder>"
GUI: python -m src.main
Linux/macOS
make
Windows
nmake /f Makefile.win
- File system (open, rename, text -> filename)
- GUI
- Audio processor
- Get audio
- .mp4
- .braw
- Preprocessing (Noise Reduction)
- Detect slate clap
- Find slate call
- Transcribe
- Get audio
- Video processor
- Get frames
- Preprocessing
- Transcribe
- Additional Parameters
- Rely on video cue only
- Rely on audio cue only
- Accept only above a certain confidence for video
- Accept only above a certain confidence for audio
- Print confidence for each video
- User-set time chunk to check