Initial commit with two utilities: reducepdf and whisper

5 months ago · 541f20eb6e
commit 541f20eb6e
4 changed files with 220 additions and 0 deletions
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1 @@
 markitdown
--- a/README.md
+++ b/README.md
@ -0,0 +1,6 @@
 # My ~/.local/bin collection of convenience scripts
 Currently maintained from my work computer, it contains the following utilities:
 - `reducepdf.sh`: Reduce a PDF file size by reducing the ppi of the images.
 - `whisper.sh`: Transcribe audio and video files directly in the directory they're in.
--- a/reducepdf.sh
+++ b/reducepdf.sh
@ -0,0 +1,83 @@
 #!/bin/bash
 # Print the command-line synopsis and option summary to stdout, then
 # terminate the script with exit status 1.
 usage() {
 	printf '%s\n' \
 		"Usage: $0 input.pdf output.pdf [-r resolution] [-h]" \
 		"" \
 		"Options:" \
 		"-r     Set the image resolution (default is 150ppi)" \
 		"-h     Display this help message"
 	exit 1
 }
 # Default settings
 RESOLUTION=150
 # Parse command-line options.
 # Arguments: the script's argument list ("$@").
 # Globals:   RESOLUTION (written when -r is given), OPTIND (left pointing at
 #            the first non-option argument so the caller can shift).
 # Exits with status 1 on an unknown option, a missing option argument, or a
 # resolution that is not a positive integer; -h delegates to usage().
 parse_options() {
 	local opt
 	while getopts ":r:h" opt; do
 		case ${opt} in
 		r)
 			# The value is handed to Ghostscript verbatim, so reject anything
 			# that is not a plain positive integer before it gets that far.
 			if ! [[ $OPTARG =~ ^[0-9]+$ ]] || ((10#$OPTARG <= 0)); then
 				echo "Invalid resolution: '$OPTARG' (expected a positive integer)" >&2
 				exit 1
 			fi
 			# 10# forces base 10 so a leading zero is not read as octal
 			RESOLUTION=$((10#$OPTARG))
 			;;
 		h)
 			usage
 			;;
 		\?)
 			echo "Invalid option: -$OPTARG" >&2
 			exit 1
 			;;
 		:)
 			echo "Option -$OPTARG requires an argument." >&2
 			exit 1
 			;;
 		esac
 	done
 }
 parse_options "$@"
 # Drop the parsed options so that $1 and $2 are the positional arguments
 shift $((OPTIND - 1))
 # Exactly two positional arguments (input and output) must remain after the
 # options have been shifted away; otherwise show the usage text and exit.
 if [ "$#" -ne 2 ]; then
 	usage
 fi
 INPUT_FILE="$1"
 OUTPUT_FILE="$2"
 # The input must be an existing regular file
 if [ ! -f "$INPUT_FILE" ]; then
 	echo "Input file '$INPUT_FILE' does not exist." >&2
 	exit 1
 fi
 # Refuse in-place conversion: the output would be written over the file that
 # is still being read. -ef compares device and inode, so it also catches
 # different spellings of the same path and hard links.
 if [ "$INPUT_FILE" -ef "$OUTPUT_FILE" ]; then
 	echo "Error: output file must be different from input file '$INPUT_FILE'." >&2
 	exit 1
 fi
 # Split the output path into directory and base name
 OUTPUT_DIR=$(dirname -- "$OUTPUT_FILE")
 OUTPUT_BASENAME=$(basename -- "$OUTPUT_FILE")
 # Create the output directory if needed and stop early when that fails
 if ! mkdir -p -- "$OUTPUT_DIR"; then
 	echo "Error: could not create output directory '$OUTPUT_DIR'." >&2
 	exit 1
 fi
 # Rewrite the PDF with Ghostscript's pdfwrite device, using RESOLUTION as the
 # target resolution for color, gray and mono images.
 # RESOLUTION is quoted so that an unexpected value can never be split into
 # additional Ghostscript arguments.
 # NOTE(review): DownsampleMonoImages is false while MonoImageResolution is
 # still set, and gray downsampling is left to the /prepress preset - confirm
 # this is the intended combination.
 if ! gs \
 	-sDEVICE=pdfwrite \
 	-dCompatibilityLevel=1.7 \
 	-dPDFSETTINGS=/prepress \
 	-dDownsampleMonoImages=false \
 	-dDownsampleColorImages=true \
 	"-dColorImageResolution=$RESOLUTION" \
 	"-dGrayImageResolution=$RESOLUTION" \
 	"-dMonoImageResolution=$RESOLUTION" \
 	-dPreserveOPIRequests=false \
 	-dSubsetFonts=true \
 	-dEmbedAllFonts=true \
 	-sProcessColorModel=DeviceRGB \
 	-dQUIET -dBATCH -dNOPAUSE \
 	"-sOutputFile=$OUTPUT_FILE" "$INPUT_FILE"; then
 	# Diagnostics go to stderr so they are not mixed into captured stdout
 	echo "Error: Ghostscript failed to process the file '$INPUT_FILE'." >&2
 	exit 1
 fi
 echo "Successfully converted '$INPUT_FILE' to '$OUTPUT_BASENAME'"
--- a/whisper.sh
+++ b/whisper.sh
@ -0,0 +1,130 @@
 #!/bin/bash
 # Script that uses `whispercpp` to transcribe audio and video files automatically and writes the results to the current working directory
 # Configuration
 REPO_DIR=~/code/whisper.cpp
 WHISPER_CLI="$REPO_DIR/build/bin/whisper-cli"
 # Scratch directory for the intermediate WAV file
 TEMP_DIR=$(mktemp -d) || {
 	echo "Error: no se pudo crear el directorio temporal" >&2
 	exit 1
 }
 # The directory is created before the arguments are parsed, so remove it on
 # every exit path (usage errors and -u included), not only after a
 # transcription has run.
 trap 'rm -rf -- "$TEMP_DIR"' EXIT
 LANGUAGE="en"
 OUTPUT_FORMAT="txt"
 # Model paths, derived from REPO_DIR so they follow the same checkout as
 # WHISPER_CLI instead of one user's absolute home directory
 MODEL_DIR="$REPO_DIR/models"
 MODEL_LARGE="$MODEL_DIR/ggml-large-v3-turbo.bin"
 MODEL_MEDIUM="$MODEL_DIR/ggml-medium.bin"
 # The "small" choice is backed by the ggml-base model file
 MODEL_SMALL="$MODEL_DIR/ggml-base.bin"
 MODEL_PATH="$MODEL_LARGE" # Default value
 # Print the usage summary and the list of options to stdout, then terminate
 # the script with exit status 1.
 usage() {
 	printf '%s\n' \
 		"Uso: whisper [-u] [-t archivo] [-m modelo] [-l idioma] [-f formato]" \
 		"Opciones:" \
 		"  -u              Actualiza y recompila whispercpp" \
 		"  -t archivo      Transcribe el archivo de video" \
 		"  -m modelo       Especifica el modelo (large, medium, small)" \
 		"  -l idioma       Especifica el idioma (por defecto: en)" \
 		"  -f formato      Especifica el formato de salida (txt, srt, json, vtt, lrc, csv)"
 	exit 1
 }
 # Argument handling.
 # Arguments: the script's argument list ("$@").
 # Globals:   reads REPO_DIR, MODEL_LARGE, MODEL_MEDIUM, MODEL_SMALL;
 #            writes FILE, MODEL_PATH, LANGUAGE, OUTPUT_FORMAT.
 # -u updates and rebuilds the checkout in REPO_DIR and then exits: status 0
 # on success, non-zero as soon as cd, git pull or make fails.
 # Unknown options and missing option arguments end in usage().
 parse_args() {
 	local opt
 	while getopts ":ut:m:l:f:" opt; do
 		case $opt in
 		u)
 			echo "Actualizando whispercpp..."
 			cd "$REPO_DIR" || exit
 			# Stop at the first failing step instead of announcing success
 			if ! git pull; then
 				echo "Error: 'git pull' falló en $REPO_DIR" >&2
 				exit 1
 			fi
 			if ! make; then
 				echo "Error: 'make' falló en $REPO_DIR" >&2
 				exit 1
 			fi
 			echo "Actualización completa."
 			exit 0
 			;;
 		t)
 			FILE="$OPTARG"
 			;;
 		m)
 			case $OPTARG in
 			large)
 				MODEL_PATH="$MODEL_LARGE"
 				;;
 			medium)
 				MODEL_PATH="$MODEL_MEDIUM"
 				;;
 			small)
 				MODEL_PATH="$MODEL_SMALL"
 				;;
 			*)
 				echo "Modelo no válido: $OPTARG. Usando el modelo por defecto (large)." >&2
 				# Make the message true even when an earlier -m already
 				# selected a different model
 				MODEL_PATH="$MODEL_LARGE"
 				;;
 			esac
 			;;
 		l)
 			LANGUAGE="$OPTARG"
 			;;
 		f)
 			OUTPUT_FORMAT="$OPTARG"
 			;;
 		\?)
 			echo "Opción inválida: -$OPTARG" >&2
 			usage
 			;;
 		:)
 			echo "La opción -$OPTARG requiere un argumento." >&2
 			usage
 			;;
 		esac
 	done
 }
 parse_args "$@"
 # A file to transcribe is mandatory; without one, show the usage text (which exits)
 [ -n "$FILE" ] || usage
 # Make sure the whisper-cli binary resolves to something runnable
 command -v "$WHISPER_CLI" >/dev/null 2>&1 || {
 	echo "Error: whisper-cli no se encuentra en $WHISPER_CLI"
 	exit 1
 }
 # Convert the input to a 16-bit PCM, mono, 16 kHz WAV file inside the temp directory.
 # Only a trailing ".mp4" is stripped from the file name; any other extension is kept.
 INPUT_STEM=$(basename "$FILE" .mp4)
 WAV_FILE="$TEMP_DIR/${INPUT_STEM}.wav"
 if ! ffmpeg -i "$FILE" -acodec pcm_s16le -ac 1 -ar 16000 "$WAV_FILE" -y; then
 	echo "Error al convertir a WAV"
 	rm -rf "$TEMP_DIR"
 	exit 1
 fi
 # Output names: <current directory>/<input stem>_<language>
 OUTPUT_DIR="$(pwd)" # Current directory
 OUTPUT_BASE="${INPUT_STEM}_${LANGUAGE}"
 OUTPUT_FILE="$OUTPUT_DIR/$OUTPUT_BASE"
 # Transcribe.
 # Map the requested output format to the whisper-cli flag that selects it;
 # every format uses -o<format> except json, which uses -oj.
 case "$OUTPUT_FORMAT" in
 txt | srt | vtt | lrc | csv)
 	FORMAT_FLAG="-o${OUTPUT_FORMAT}"
 	;;
 json)
 	FORMAT_FLAG="-oj"
 	;;
 *)
 	echo "Formato de salida no soportado: $OUTPUT_FORMAT" >&2
 	rm -rf "$TEMP_DIR"
 	exit 1
 	;;
 esac
 # -of gives whisper-cli the output path without extension; its stdout is
 # shown on the terminal and also saved to <OUTPUT_FILE>_timestamped.txt.
 # WHISPER_CLI is quoted so a path containing spaces still runs.
 "$WHISPER_CLI" -m "$MODEL_PATH" -l "$LANGUAGE" "$FORMAT_FLAG" -of "$OUTPUT_FILE" "$WAV_FILE" |
 	tee "${OUTPUT_FILE}_timestamped.txt"
 # The pipeline's own status is tee's; read whisper-cli's status explicitly so
 # a failed transcription is not reported as a success.
 WHISPER_STATUS=${PIPESTATUS[0]}
 # Clean up temporary files
 rm -rf "$TEMP_DIR"
 if [ "$WHISPER_STATUS" -ne 0 ]; then
 	echo "Error: whisper-cli terminó con código de salida $WHISPER_STATUS" >&2
 	exit 1
 fi
 echo "Transcripción completada. Archivos generados: ${OUTPUT_FILE}_timestamped.txt y ${OUTPUT_FILE}.${OUTPUT_FORMAT}."