aboutsummaryrefslogtreecommitdiffstats
path: root/obfuscate.sh
blob: 872f23460f2e86f81913010fca57e38ed489ec0d (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
#!/bin/bash

# obfuscate.sh
# obfuscate email addresses in XML/HTML
# Script written (and slight perl modification) by Archaic <archaic AT linuxfromscratch D0T org>
# Modified from "sed -i" to old style "sed -e" by Manuel Canales <manuel AT linuxfromscratch D0T org>
# to prevent hangs on very long files, like nonckunked books.
# Original Perl expression by Anderson Lizardo <lizardo AT linuxfromscratch D0T org>
# Released under the GNU General Public License
#
# This script currently only seeks out mailto: addresses. If those same
# addresses also appear in plaintext, we need to obfuscate those as well.
#
# This script was made for a very specific purpose so I was a bit lazy in
# writing the regex's.
#
# Please send comments, enhancements, etc. to the above address

#set -e  # Bail on all errors

# First, ensure that we are given a file to process
# if [ $# -lt 1 ]; then
#   echo -e "\nYou must provide an input file."
#   exit 1
# fi

# Nothing like a backup plan!
#cp "$1" "$1".bak

for i in `grep -o '"mailto:.*@.*"' ${1} |cut -d\" -f2|sed -e 's|^mailto:||' -e 's|"$||'`; do
  link=`echo $i | perl -pe 's/[^\n]/"\\\&#".ord($&)."\;"/ge'`
  plaintext=`echo $i | sed -e 's|@| AT |' -e 's|\.| D0T |g'`
  cp ${1}{,.tmp}
  sed -e "s|mailto:$i|mailto:$link|" \
      -e "s|$i|$plaintext|" ${1}.tmp > ${1}
  rm ${1}.tmp
done
#rm $FILE.tmp
#exit 0