-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathwordslengthdist.sh
executable file
·78 lines (71 loc) · 2.12 KB
/
wordslengthdist.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
#!/bin/bash
#######################################
# Print the usage summary for this script and terminate.
# Globals:   none
# Arguments: none
# Outputs:   the usage text, on stdout (the user asked for it, so it is
#            regular output rather than a diagnostic)
# Exits:     0 - a help request is a successful run, not an error
#######################################
display_help() {
  printf '%s\n' \
    "Usage: $0 [option...] " \
    "" \
    " -h, --help Display this help message" \
    " -o, --output-file Specify output file name" \
    " -i, --input-file Specify input file name" \
    ""
  exit 0
}
#######################################
# Parse the command line into the globals OUTPUTFILE and INPUTFILE.
# Globals:   OUTPUTFILE (written) - value following -o / --output-file
#            INPUTFILE  (written) - value following -i / --input-file, or
#                                   any argument that is not a known option
# Arguments: the script's command-line arguments ("$@")
# Outputs:   a diagnostic on stderr when an option is missing its value
# Exits:     1 when -o / -i is the last argument (no value to consume);
#            -h / --help hands over to display_help
#######################################
parse_args() {
  # As long as there is at least one more argument, keep looping.
  while [[ $# -gt 0 ]]; do
    case "$1" in
      -o|--output-file)
        # The option needs a value; without this check an empty name was
        # stored silently and the trailing shift failed.
        if [[ $# -lt 2 ]]; then
          printf '%s: option %s requires a file name\n' "$0" "$1" >&2
          exit 1
        fi
        OUTPUTFILE="$2"
        shift 2 # past the key and its value
        ;;
      -i|--input-file)
        if [[ $# -lt 2 ]]; then
          printf '%s: option %s requires a file name\n' "$0" "$1" >&2
          exit 1
        fi
        INPUTFILE="$2"
        shift 2 # past the key and its value
        ;;
      -h|--help)
        display_help
        # Fallback in case display_help returns instead of exiting.
        exit 0
        ;;
      *)
        # Anything that is not a known option is taken as the input file;
        # if several are given, the last one wins.
        INPUTFILE="$1"
        shift
        ;;
    esac
  done
}

parse_args "$@"
#######################################
# Ask before replacing an existing output file; remove it on "y"/"Y".
# Globals:   INPUTFILE (read) - when empty, the text to analyse arrives on
#                               stdin, so stdin must not be used for the answer
# Arguments: $1 - output file name (may be empty: nothing to do)
# Outputs:   the prompt (shown by `read` only when it reads from a terminal)
#            and a newline on stdout after the single-key answer
# Exits:     1 when the answer is anything other than y / Y
#######################################
confirm_overwrite() {
  local target=$1
  local reply=""

  # Nothing to confirm unless a name was given and it is an existing file.
  [[ -n "$target" && -f "$target" ]] || return 0

  if [[ -z "$INPUTFILE" && ! -t 0 ]]; then
    # stdin carries the data to analyse; reading the answer from it would
    # swallow the first byte of the text. Ask on the controlling terminal
    # instead. If there is none, the redirection fails, reply stays empty
    # and the file is left alone.
    read -p "File exist! Are you sure [y,n]? " -n 1 -r reply </dev/tty
  else
    read -p "File exist! Are you sure [y,n]? " -n 1 -r reply
  fi
  echo

  if [[ "$reply" =~ ^[Yy]$ ]]; then
    # Quoted and preceded by -- so names with spaces or a leading dash work.
    rm -- "$target"
  else
    exit 1
  fi
}

confirm_overwrite "$OUTPUTFILE"
#######################################
# Read text on stdin and print one "count<TAB>length" line per distinct
# word length, ordered by increasing length.
# A word is a run of characters between blanks (spaces or tabs) after every
# character that is neither alphabetic nor blank has been deleted, so
# "don't" counts as the 4-letter word "dont".
# Globals:   none
# Arguments: none
# Outputs:   the distribution on stdout (nothing for input without words)
#######################################
word_length_distribution() {
  # One awk pass replaces the former tr/awk/uniq/sed chain. Iterating over
  # awk fields also splits tab-separated words, which the old
  # space-to-newline translation left glued together.
  awk '
    {
      gsub(/[^[:alpha:][:blank:]]/, "")
      for (i = 1; i <= NF; i++) {
        count[length($i)]++
      }
    }
    END {
      for (len in count) {
        printf "%d\t%d\n", count[len], len
      }
    }
  ' | sort -t $'\t' -k2,2n
}

#######################################
# Print the report: the "f<TAB>wlen" header followed by the distribution.
# Arguments: $1 - input file name; when empty, the text is read from stdin
# Outputs:   the report on stdout
#######################################
write_report() {
  local input=$1

  printf 'f\twlen\n'
  if [[ -n "$input" ]]; then
    word_length_distribution < "$input"
  else
    word_length_distribution
  fi
}

# Send the report to the output file when one was given, else to stdout.
# The name is quoted so that file names containing spaces work.
if [[ -n "$OUTPUTFILE" ]]; then
  write_report "$INPUTFILE" > "$OUTPUTFILE"
else
  write_report "$INPUTFILE"
fi