# Extracting the "best pick" text, without comment lines:
#
#   cat L16-eva/text16e4.evt \
#     | best-pick \
#         -v trcodes="UVZABENOPRSWXYKQLMRJITFGCD" \
#     > vms.evt
#
#   dicio-wc vms.evt
#
#     lines   words     bytes file
#   ------- ------- --------- ------------
#      5146   11130    327816 vms.evt

# The filter below copies "#" lines unchanged, drops empty lines, and
# rewrites every other line as follows before printing it with a "| " prefix:
#   - every digit becomes "N";
#   - a trailing "::" (plus optional spaces) becomes "=";
#   - any remaining "::", and any single ":", ";" or ".", becomes "-";
#   - every space becomes ".", and a "." is appended at end of line;
#   - runs of separators are collapsed to a single one, with "=" winning
#     over "-" and "-" winning over ".";
#   - leading "-", " " and "." characters are removed.

  gawk \
    ' /^[#]/ { print; next; } \
      /./ { \
        str = $0; gsub(/[0-9]/, "N", str); \
        gsub(/[:][:] *$/, "=", str); \
        gsub(/[:][:]/, "-", str); gsub(/[:;.]/, "-", str); \
        gsub(/[ ]/, ".", str); gsub(/$/, ".", str); \
        gsub(/[-.]*[=][-=.]*/, "=", str); gsub(/[.]*[-][-.]*/, "-", str); \
        gsub(/[.][.]*/, ".", str); \
        gsub(/^[- .]*/, "", str); printf "| %s\n", str; \
      } \
    '

Then I numbered pages and lines with the following script:

# Each "## g-" header line starts a new page (pg), resetting the line
# counter (ln) to 0 and the unit counter (un) to 1.  Other "#" lines are
# copied unchanged; blank lines are replaced by a lone "#".  Each "|" line
# gets the next line number; after line 99 the line number restarts at 1
# and the unit counter is incremented.  The "| " prefix is removed and the
# line is printed after a locator built from pg, un and ln.  Lines that
# match none of these patterns are dropped.
#
# NOTE(review): the locator layout "<%d.%d.%d>" in the printf is a
# reconstruction.  The surviving text of these notes had only " %s\n" as
# the format for the four arguments (pg, un, ln, $0), which would print
# just the page number and lose the line text.  Confirm the intended
# locator layout (e.g. zero-padding) against the numbered output file.

  gawk \
    ' BEGIN { pg=0; } \
      /^[#][#] g-/ {pg++; ln=0; un=1; print; next} \
      /^[#]/ {print; next;} \
      /^ *$/ { print "#"; next; } \
      /^[|]/ { \
        ln++; if (ln > 99) { ln=1; un++; } \
        gsub(/^[|][ ]*/, "", $0); \
        printf "<%d.%d.%d> %s\n", pg, un, ln, $0; \
      } \
    '