chore: init

This commit is contained in:
Thiago Sposito 2026-02-04 21:11:16 -03:00
commit edb31d2d31
13 changed files with 531 additions and 0 deletions

19
run.sh Executable file
View file

@@ -0,0 +1,19 @@
#!/usr/bin/env bash
# Full pipeline: extract frames + OCR → heuristic fixes → sew + dedupe → result.csv
#
# Usage: ./run.sh [video] [output_dir]
#   video       input video                         (default: video-data.webm)
#   output_dir  directory for frames and their CSVs (default: frames)
#
# The combined table is always written to result.csv (not configurable).
# The helper scripts and template.svg are referenced by relative path, so this
# script must be started from the directory that contains them.

# Strict mode: abort on command failure, on use of an unset variable, and on a
# failure in any stage of a pipeline.
set -euo pipefail

readonly VIDEO="${1:-video-data.webm}"
readonly OUT_DIR="${2:-frames}"
readonly RESULT="result.csv"
# Named once so the progress messages can never drift from the values that are
# actually handed to the extraction step.
readonly TEMPLATE="template.svg"
readonly FRAME_STEP=10

# Fail fast with a clear message when the input is missing, instead of relying
# on the extraction script to report it. Anything that looks like a URL is let
# through untouched, since it cannot be checked with a file test.
if [[ "$VIDEO" != *://* && ! -e "$VIDEO" ]]; then
  printf 'run.sh: input video not found: %s\n' "$VIDEO" >&2
  exit 1
fi

printf '%s\n' "1. Extract frames (every ${FRAME_STEP}) + OCR with ${TEMPLATE} → ${OUT_DIR}/"
python3 extract_frames_and_tables.py "$OUT_DIR" "$VIDEO" "$TEMPLATE" "$FRAME_STEP"

printf '%s\n' "2. Heuristic fixes on ${OUT_DIR}/*.csv"
python3 fix_all_csvs.py "$OUT_DIR"

printf '%s\n' "3. Sew CSVs + dedupe → ${RESULT}"
python3 sew_csvs.py "$OUT_DIR" "$RESULT"

printf '%s\n' "Done. Output: ${RESULT}"