Commit: 918367feed0cb8046758fcac0f8b77102f58c662
Parent: 72409cf15fce7fe649a677efdbebba3616953722
Author: Randy Palamar
Date: Sat, 28 Aug 2021 14:12:58 -0600

add script for printing kanji in a file to stdout

Diffstat:
A bin/kanji | 10 ++++++++++
1 file changed, 10 insertions(+), 0 deletions(-)
#!/bin/sh

# kanji: print every kanji found in the given UTF-8 files, one per line.
#
# usage: kanji [file ...]
#
# The arguments are handed to cat(1) unchanged, so with no arguments the
# text is read from stdin. Kanji are written to stdout in the order they
# appear in the input; repeated characters are printed again each time.

# Code points treated as kanji, given as whole CJK ideograph blocks:
#   U+3400-U+4DBF    CJK Unified Ideographs Extension A
#   U+4E00-U+9FFF    CJK Unified Ideographs
#   U+F900-U+FAFF    CJK Compatibility Ideographs
#   U+20000-U+2FA1F  Extensions B-F and I, Compatibility Ideographs Supplement
#   U+30000-U+323AF  Extensions G and H
# The blocks outside the BMP are included so that ideographs such as
# U+20B9F are not silently dropped.
# Single quotes keep the backslashes out of the shell's hands.
ranges='\x{3400}-\x{4DBF}\x{4E00}-\x{9FFF}\x{F900}-\x{FAFF}\x{20000}-\x{2FA1F}\x{30000}-\x{323AF}'

# strip everything that is not a kanji (this removes the line's newline too)
regexp="s:[^${ranges}]::g"
# then put each remaining character on a line of its own
regexp="${regexp};"'s:(.):\1\n:g'

# cat joins all inputs onto perl's stdin. -CS makes perl treat stdin and
# stdout as UTF-8; it does not cover files named on perl's own command
# line, which is why the files are not passed to perl directly.
cat "$@" | perl -CS -pe "${regexp}"