#!/bin/bash
#
# acroread-iconv - repair text copied out of a PDF whose font uses a legacy
# 8-bit charset.
#
# Save your clipboard to a UTF-8 text file, then convert it with this tool.
# Each character U+00A0..U+00FF in the input is treated as the raw byte
# 0xA0..0xFF (i.e. as if it had been decoded as ISO-8859-1) and is replaced
# by what that byte means in the given charset. All other text is left
# untouched.
#
# Usage: acroread-iconv pdf-font-charset file...
#
# For every FILE the result is written to "${FILE%.txt}_pdfconverted.txt".
# Exit status: 0 on success, 1 if the charset is unsupported or any file
# could not be converted, 2 on a usage error.

# Print a short usage message to stderr.
usage() {
  printf 'Usage: %s pdf-font-charset file...\n' "${0##*/}" >&2
}

#######################################
# Emit (on stdout) a sed script that remaps U+00A0..U+00FF for one charset.
# Arguments: $1 - iconv name of the charset the PDF font really uses
# Returns:   0 on success, 1 if iconv cannot even convert from ISO-8859-1
#
# The script works in two phases so that substitutions cannot cascade:
# phase 1 turns every source character into a unique placeholder
# (SOH + hex byte value + SOH), phase 2 turns each placeholder into the
# target character. With a single list of s/old/new/ rules, a character
# produced by one rule could be rewritten again by a later rule (e.g. CP850:
# 0xA0 -> U+00E1, and U+00E1 is itself the source of the 0xE1 rule).
# Assumes the input text does not already contain SOH-delimited hex pairs.
#######################################
build_sed_script() {
  local charset=$1
  local marker phase1='' phase2=''
  local i hex esc old new

  marker=$(printf '\001')

  for ((i = 160; i < 256; i++)); do
    printf -v hex '%x' "$i"
    printf -v esc '\\0%o' "$i" # e.g. \0240, expanded to a raw byte by %b

    # What the byte looks like in the mis-decoded (Latin-1) input.
    old=$(printf '%b' "$esc" | iconv -f ISO-8859-1 -t UTF-8) || return 1

    # What the byte really means; escape \ / & so the result is safe as the
    # replacement part of an s/// command. iconv's stderr is silenced on
    # purpose: bytes that are undefined in the charset are simply skipped.
    new=$(printf '%b' "$esc" \
      | iconv -f "$charset" -t UTF-8 2>/dev/null \
      | sed 's|[\\/&]|\\&|g')

    # No mapping for this byte: leave the character alone instead of
    # emitting "s/X//g", which would delete it from the text.
    [[ -n $new ]] || continue

    phase1+="s/${old}/${marker}${hex}${marker}/g"$'\n'
    phase2+="s/${marker}${hex}${marker}/${new}/g"$'\n'
  done

  printf '%s%s' "$phase1" "$phase2"
}

#######################################
# Entry point.
# Arguments: $1 - charset of the PDF font, $2... - UTF-8 text files
# Outputs:   one "*_pdfconverted.txt" file per input file
# Returns:   0 on success, 1 on conversion failure, 2 on usage error
#######################################
main() {
  if (($# < 1)); then
    usage
    return 2
  fi

  local charset=$1
  shift

  # Converting empty input succeeds only if iconv exists and knows the
  # charset; without this check every rule would be skipped silently.
  if ! iconv -f "$charset" -t UTF-8 </dev/null >/dev/null 2>&1; then
    printf '%s: unsupported charset: %s\n' "${0##*/}" "$charset" >&2
    return 1
  fi

  local script
  script=$(build_sed_script "$charset") || return 1

  local file status=0
  for file in "$@"; do
    # LC_ALL=C makes sed match the UTF-8 byte sequences literally, so the
    # result does not depend on the caller's locale. The input redirection
    # comes first so a missing input does not create an empty output file.
    LC_ALL=C sed -e "$script" <"$file" >"${file%.txt}_pdfconverted.txt" \
      || status=1
  done

  return "$status"
}

main "$@"