aboutsummaryrefslogtreecommitdiff
path: root/bin/htmlesc
blob: 0e4c75a8a0d55a29b35cecdc77440e7cadd76d71 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
#!/bin/sh
set -eu


usage() {
	cat <<-'EOF'
		Usage:
		  htmlesc [-e|d] [CONTENT...]
		  htmlesc -h
	EOF
}

help() {
	cat <<-'EOF'

		Options:
		  -e            escape the string (the default action)
		  -d            unescape (de-escape?) the string
		  -h, --help    show this message

		  CONTENT       a literal string to be escaped


		Convert data to/from HTML escaping.  If CONTENT is not given,
		get data from STDIN.


		Examples:

		  Escape HTML control characters in a string:

		    $ htmlesc 'a > 5 && !b'
		    a &gt; 5 &amp;&amp; !b


		  Unescape the content from a file:

		    $ htmlesc -d < file.html
	EOF
}


for flag in "$@"; do
	case "$flag" in
		--)
			break
			;;
		--help)
			usage
			help
			exit
			;;
		*)
			;;
	esac
done

ENCODE=false
DECODE=false
while getopts 'edh' flag; do
	case "$flag" in
		e)
			ENCODE=true
			;;
		d)
			DECODE=true
			;;
		h)
			usage
			help
			exit
			;;
		*)
			usage >&2
			exit 2
			;;
	esac
done
shift $((OPTIND - 1))

if [ "$ENCODE" = true ] && [ "$DECODE" = true ]; then
	printf 'Both -e and -d given.  Pick one.\n' >&2
	usage >&2
	exit 2
fi

decode() {
	sed \
		-e 's|&amp;|\&|g'  \
		-e 's|&lt;|<|g'   \
		-e 's|&gt;|>|g'   \
		-e 's|&quot;|"|g' \
		-e "s|&apos;|'|g"
}

encode() {
	sed \
		-e 's|&|\&amp;|g'  \
		-e 's|<|\&lt;|g'   \
		-e 's|>|\&gt;|g'   \
		-e 's|"|\&quot;|g' \
		-e "s|'|\&apos;|g"
}

if [ "$DECODE" = true ]; then
	FN=decode
else
	FN=encode
fi

if [ $# = 0 ]; then
	"$FN"
else
	for s in "$@"; do
		printf '%s\n' "$s" | "$FN"
	done
fi