LDP/LDP/guide/docbook/abs-guide/dict-lookup.sh

#!/bin/bash
# dict-lookup.sh

#  This script looks up definitions in the 1913 Webster's Dictionary.
#  This Public Domain dictionary is available for download
#+ from various sites, including
#+ Project Gutenberg (http://www.gutenberg.org/etext/247).
#
#  Convert it from DOS to UNIX format (with only LF at end of line)
#+ before using it with this script.
#  Store the file in plain, uncompressed ASCII text.
#  Set DEFAULT_DICTFILE variable below to path/filename.


#  Script-wide constants. They are marked readonly so that no later
#+ statement can overwrite them by accident.
readonly E_BADARGS=85                     # Exit status for a missing/invalid word.
readonly MAXCONTEXTLINES=50               # Maximum number of lines to show.
readonly DEFAULT_DICTFILE="/usr/share/dict/webster1913-dict.txt"
                                          # Default dictionary file pathname.
                                          # Change this as necessary.
#  Note:
#  ----
#  This particular edition of the 1913 Webster's
#+ begins each entry with an uppercase letter
#+ (lowercase for the remaining characters).
#  Only the *very first line* of an entry begins this way,
#+ and that's why the search algorithm below works.


#  Must at least specify word to look up, and
#+ it must start with an uppercase letter,
#+ because every dictionary entry begins that way.
#  The test uses the [[:upper:]] class instead of the range [A-Z]:
#+ in some locales A-Z also matches lowercase letters.
#  A shell pattern match also avoids starting a "sed" process
#+ just to inspect one string.
if [[ $1 != [[:upper:]]* ]]
then
  {
    echo "Usage: $(basename -- "$0") Word-to-define [dictionary-file]"
    echo
    echo "Note: Word to look up must start with capital letter,"
    echo "with the rest of the word in lowercase."
    echo "--------------------------------------------"
    echo "Examples: Abandon, Dictionary, Marking, etc."
  } >&2                                   # Usage errors go to stderr.
  exit "$E_BADARGS"
fi


#  An optional second argument names a different dictionary file.
#  When it is missing or empty, fall back to the default pathname.
dictfile=${2:-$DEFAULT_DICTFILE}

# ---------------------------------------------------------
#  lookup_definition WORD DICTFILE [MAXLINES]
#
#  Print the first dictionary entry whose header line contains
#+ the fixed string "WORD \" (definitions are in form "Word \...").
#
#  Arguments:
#    $1 - word to look up.
#    $2 - pathname of the dictionary file.
#    $3 - optional maximum number of lines to print after the header
#         line (defaults to $MAXCONTEXTLINES, or 50 if that is unset).
#  Output:
#    The header line plus the lines that follow it, stopping before
#+   the next line that starts with an uppercase letter (the first
#+   line of the next entry). Blank lines at the end are dropped.
#  Returns:
#    0 - entry found and printed.
#    1 - no entry found (message on stderr).
#    2 - dictionary file cannot be read (message on stderr).
#
#  One "awk" pass replaces the former fgrep/sed pipeline.
#  That pipeline always deleted the last two lines of its output,
#+ which chopped real definition text whenever the entry was the
#+ last one in the file, was longer than the context limit,
#+ or was not followed by a blank line.
lookup_definition ()
{
  local word=$1
  local file=$2
  local max_lines=${3:-${MAXCONTEXTLINES:-50}}
  local status=0

  if [[ ! -r $file || -d $file ]]
  then
    printf 'Cannot read dictionary file: %s\n' "$file" >&2
    return 2
  fi

  #  The search string travels through the environment, not "awk -v",
  #+ because -v would interpret the trailing backslash as an escape.
  #  The file is fed on stdin so that an odd filename (leading "-",
  #+ or one containing "=") is never taken for an awk operand.
  #  LC_ALL=C keeps [A-Z] limited to the ASCII uppercase letters.
  LC_ALL=C DICT_HEAD="$word \\" DICT_MAX="$max_lines" awk '
    BEGIN {
      head = ENVIRON["DICT_HEAD"]
      max  = ENVIRON["DICT_MAX"] + 0
    }
    # Still searching: print the header line once it shows up.
    !found {
      if (index($0, head) > 0) { found = 1; print }
      next
    }
    # First line of the next entry: the definition is complete.
    /^[A-Z]/ { exit }
    # Context limit reached.
    (++shown > max) { exit }
    # Hold blank lines back; they are printed only if more text follows.
    /^[ \t]*$/ { held[++nheld] = $0; next }
    {
      for (i = 1; i <= nheld; i++) print held[i]
      nheld = 0
      print
    }
    END { exit (found ? 0 : 1) }
  ' < "$file" || status=$?

  if (( status == 1 ))
  then
    printf 'No entry found for "%s" in %s\n' "$word" "$file" >&2
  fi

  return "$status"
}

#  Look the word up. The status of this call is the last one set
#+ before the "exit $?" that ends the script.
lookup_definition "$1" "$dictfile"
# ---------------------------------------------------------

#  End the script, passing on the exit status
#+ of the last command run above.
exit $?

# Exercises:
# ---------
# 1)  Modify the script to accept any type of alphabetic input
#   + (uppercase, lowercase, mixed case), and convert it
#   + to an acceptable format for processing.
#
# 2)  Convert the script to a GUI application,
#   + using something like 'gdialog' or 'zenity' . . .
#     The script will then no longer take its argument(s)
#   + from the command-line.
#
# 3)  Modify the script to parse one of the other available
#   + Public Domain Dictionaries, such as the U.S. Census Bureau Gazetteer.
new 2005-03-21 13:52:30 +00:00			`#!/bin/bash`
			`# dict-lookup.sh`

			`# This script looks up definitions in the 1913 Webster's Dictionary.`
			`# This Public Domain dictionary is available for download`
			`#+ from various sites, including`
			`#+ Project Gutenberg (http://www.gutenberg.org/etext/247).`
			`#`
updated 2008-11-23 22:43:47 +00:00			`# Convert it from DOS to UNIX format (with only LF at end of line)`
new 2005-03-21 13:52:30 +00:00			`#+ before using it with this script.`
updated 2008-11-23 22:43:47 +00:00			`# Store the file in plain, uncompressed ASCII text.`
updated 2005-05-08 20:09:31 +00:00			`# Set DEFAULT_DICTFILE variable below to path/filename.`
new 2005-03-21 13:52:30 +00:00

updated 2008-11-23 22:43:47 +00:00			`E_BADARGS=85`
new 2005-03-21 13:52:30 +00:00			`MAXCONTEXTLINES=50 # Maximum number of lines to show.`
updated 2005-05-08 20:09:31 +00:00			`DEFAULT_DICTFILE="/usr/share/dict/webster1913-dict.txt"`
			`# Default dictionary file pathname.`
new 2005-03-21 13:52:30 +00:00			`# Change this as necessary.`
			`# Note:`
			`# ----`
updated 2005-05-08 20:09:31 +00:00			`# This particular edition of the 1913 Webster's`
new 2005-03-21 13:52:30 +00:00			`#+ begins each entry with an uppercase letter`
			`#+ (lowercase for the remaining characters).`
updated 2005-05-08 20:09:31 +00:00			`# Only the very first line of an entry begins this way,`
new 2005-03-21 13:52:30 +00:00			`#+ and that's why the search algorithm below works.`



			`if [[ -z $(echo "$1" \| sed -n '/^[A-Z]/p') ]]`
			`# Must at least specify word to look up, and`
			`#+ it must start with an uppercase letter.`
			`then`
			echo "Usage: `basename $0` Word-to-define [dictionary-file]"
			`echo`
			`echo "Note: Word to look up must start with capital letter,"`
			`echo "with the rest of the word in lowercase."`
			`echo "--------------------------------------------"`
			`echo "Examples: Abandon, Dictionary, Marking, etc."`
			`exit $E_BADARGS`
			`fi`


updated 2005-05-08 20:09:31 +00:00			`if [ -z "$2" ] # May specify different dictionary`
			`#+ as an argument to this script.`
new 2005-03-21 13:52:30 +00:00			`then`
			`dictfile=$DEFAULT_DICTFILE`
			`else`
			`dictfile="$2"`
			`fi`

			`# ---------------------------------------------------------`
			`Definition=$(fgrep -A $MAXCONTEXTLINES "$1 \\" "$dictfile")`
			`# Definitions in form "Word \..."`
			`#`
updated 2005-05-08 20:09:31 +00:00			`# And, yes, "fgrep" is fast enough`
			`#+ to search even a very large text file.`
new 2005-03-21 13:52:30 +00:00

			`# Now, snip out just the definition block.`

			`echo "$Definition" \|`
			`sed -n '1,/^[A-Z]/p' \|`
			`# Print from first line of output`
			`#+ to the first line of the next entry.`
			`sed '$d' \| sed '$d'`
			`# Delete last two lines of output`
			`#+ (blank line and first line of next entry).`
			`# ---------------------------------------------------------`

updated 2008-11-23 22:43:47 +00:00			`exit $?`
new 2005-03-21 13:52:30 +00:00
			`# Exercises:`
			`# ---------`
			`# 1) Modify the script to accept any type of alphabetic input`
			`# + (uppercase, lowercase, mixed case), and convert it`
			`# + to an acceptable format for processing.`
			`#`
			`# 2) Convert the script to a GUI application,`
updated 2008-03-13 13:24:45 +00:00			`# + using something like 'gdialog' or 'zenity' . . .`
new 2005-03-21 13:52:30 +00:00			`# The script will then no longer take its argument(s)`
updated 2008-11-23 22:43:47 +00:00			`# + from the command-line.`
updated 2005-05-08 20:09:31 +00:00			`#`
			`# 3) Modify the script to parse one of the other available`
			`# + Public Domain Dictionaries, such as the U.S. Census Bureau Gazetteer.`