#!/bin/bash

# Create the images directory if it doesn't exist
mkdir -p images

# Loop through all PDF files in the current directory
for pdf in *.pdf; do
    # Extract the date from the filename
    date=$(echo "$pdf" | grep -oP '\d{4}-\d{2}-\d{2}')
    
    if [ -z "$date" ]; then
        echo "Skipping $pdf: No date found in filename"
        continue
    fi
    
    # Initialize counter for this PDF
    counter=1
    
    # Use pdfimages to extract images, storing them in a temporary directory
    temp_dir=$(mktemp -d)
    pdfimages -all "$pdf" "$temp_dir/img"
    
    # Move and rename the extracted images
    for img in "$temp_dir"/*; do
        # Get the file extension
        ext="${img##*.}"
        
        # Move and rename the image
        mv "$img" "images/${date}_${counter}.${ext}"
        
        # Increment counter
        ((counter++))
    done
    
    # Remove the temporary directory
    rm -rf "$temp_dir"
    
    echo "Processed $pdf: Extracted $((counter-1)) images"
done

echo "Image extraction complete. All images are in the 'images' directory."