File: wctabs.sh
   1 #!/bin/sh
   2 
   3 # The MIT License (MIT)
   4 #
   5 # Copyright © 2024 pacman64
   6 #
   7 # Permission is hereby granted, free of charge, to any person obtaining a copy
   8 # of this software and associated documentation files (the “Software”), to deal
   9 # in the Software without restriction, including without limitation the rights
  10 # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  11 # copies of the Software, and to permit persons to whom the Software is
  12 # furnished to do so, subject to the following conditions:
  13 #
  14 # The above copyright notice and this permission notice shall be included in
  15 # all copies or substantial portions of the Software.
  16 #
  17 # THE SOFTWARE IS PROVIDED “AS IS”, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  18 # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  19 # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  20 # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  21 # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  22 # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  23 # SOFTWARE.
  24 
  25 
  26 # wctabs [options...] [filepaths...]
  27 #
  28 # Run `wc` (word-count) with the arguments given, turning its output into
  29 # lines of tab-separated values: this removes output-parsing ambiguities,
  30 # in case of filepaths with spaces in them.
  31 #
  32 # You can run `wc --help` to see all its options, which you can also use
  33 # with this script.
  34 
  35 
  36 # handle help option(s)
  37 case "$1" in
  38     -h|--h|-help|--help)
  39         awk '/^# +wctabs/, /^$/ { gsub(/^# ?/, ""); print }' "$0"
  40         exit 0
  41     ;;
  42 esac
  43 
  44 # avoid testing all permutations of up to 5 single-char options
  45 stats=$(awk '
  46 BEGIN {
  47     for (i = 1; i < ARGC; i++) {
  48         s = ARGV[i]
  49         delete ARGV[i]
  50 
  51         if (s !~ /^-/) continue
  52         if (s ~ /c/ || s == "--bytes") bytes = 1
  53         if (s ~ /m/ || s == "--chars") chars = 1
  54         if (s ~ /l/ || s == "--lines") lines = 1
  55         if (s ~ /w/ || s == "--words") words = 1
  56         if (s ~ /L/ || s == "--max-line-length") maxll = 1
  57     }
  58 
  59     stats = bytes + chars + words + lines + maxll
  60     # `wc` defaults to 3 stats when not explicitly given any option
  61     print (stats == 0) ? 3 : stats
  62 }
  63 ' "$@")
  64 
  65 case "${stats}" in
  66     0) wc "$@" | sed -E -u 's-^ +--; s- +-\t-1; s- +-\t-1; s- +-\t-1';;
  67     1) wc "$@" | sed -E -u 's-^ +--; s- +-\t-1';;
  68     2) wc "$@" | sed -E -u 's-^ +--; s- +-\t-1; s- +-\t-1';;
  69     3) wc "$@" | sed -E -u 's-^ +--; s- +-\t-1; s- +-\t-1; s- +-\t-1';;
  70     4) wc "$@" | sed -E -u 's-^ +--; s- +-\t-1; s- +-\t-1; s- +-\t-1; s- +-\t-1';;
  71     5) wc "$@" | sed -E -u 's-^ +--; s- +-\t-1; s- +-\t-1; s- +-\t-1; s- +-\t-1; s- +-\t-1';;
  72 esac