- Tested with Node.js 0.10.38
- Tesseract libs (brew install tesseract on Mac OS X)
- ImageMagick
# Install the npm dependencies of this project.
npm install
# Download the scanned song list. -f makes curl exit non-zero on an HTTP error
# instead of saving the server's error page as book.jpg; -L follows redirects.
curl -fL -o book.jpg 'http://www.arleneslivekaraoke.com/images/songlist-7-15.jpg'
# Convert the scan to grayscale at bit depth 1 and write it as ocr.jpg.
convert book.jpg -colorspace Gray -depth 1 ocr.jpg
# Run index.js on the converted image (presumably the Tesseract OCR step) and
# drop empty lines from its output.
node index.js ocr.jpg | grep -v '^$' > by-title.txt
# by artist
# Each line of by-title.txt is expected to look like "Title - Artist". The
# artist is taken as the text after the LAST " - ", so a title that itself
# contains " - " is kept whole. Lines are rewritten as "Artist - Title" and
# sorted as text (a numeric sort would misplace artists starting with digits).
awk -F ' - ' '
  # No separator on this line: pass it through unchanged.
  NF < 2 { print; next }
  {
    artist = $NF
    # Everything before the final separator (3 characters wide) is the title.
    title = substr($0, 1, length($0) - length(artist) - 3)
    print artist, "-", title
  }
' by-title.txt | sort > by-artist.txt