| #!/bin/sh |
| # |
| # find_repeated_words.sh |
| # |
| # A simple script for finding instances of repeated consecutive words |
| # in manual pages -- human inspection can then determine if these |
| # are real errors in the text. |
| # |
| # Usage: sh find_repeated_words.sh [file...] |
| # |
| ###################################################################### |
| # |
| # (C) Copyright 2007 & 2013, Michael Kerrisk |
| # This program is free software; you can redistribute it and/or |
| # modify it under the terms of the GNU General Public License |
| # as published by the Free Software Foundation; either version 2 |
| # of the License, or (at your option) any later version. |
| # |
| # This program is distributed in the hope that it will be useful, |
| # but WITHOUT ANY WARRANTY; without even the implied warranty of |
| # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| # GNU General Public License for more details |
| # (http://www.gnu.org/licenses/gpl-2.0.html). |
| # |
| # |
| |
| for file in "$@" ; do |
| # Do not process files that are redirects. |
| grep -qE "^\.so man.*" "$file" |
| if test $? -ne 0; then |
| words=$(MANWIDTH=2000 man -l "$file" 2> /dev/null | col -b | \ |
| tr ' \008' '\012' | sed -e '/^$/d' | \ |
| sed 's/ *$//' | |
| awk 'BEGIN {p=""} {if (p==$0) print p; p=$0}' | \ |
| grep '[a-zA-Z]' | tr '\012' ' ') |
| if test -n "$words"; then |
| echo "$file: $words" |
| fi |
| fi |
| done |