From abb8ca2455f3efd6f8f0eed78c54829bf0a9001e Mon Sep 17 00:00:00 2001
From: Felix Janda <felix.janda@posteo.de>
Date: Thu, 8 Nov 2012 11:19:07 -0600
Subject: wc -m only cares about counting characters. Attached is a try on
 implementing it and some test cases for it. The test cases are only for UTF-8
 locales.

---
 scripts/test/wc.test | 26 +++++++++++++++++++++++++-
 1 file changed, 25 insertions(+), 1 deletion(-)
 mode change 100644 => 100755 scripts/test/wc.test

(limited to 'scripts')

diff --git a/scripts/test/wc.test b/scripts/test/wc.test
old mode 100644
new mode 100755
index 1b9a051c..801cd713
--- a/scripts/test/wc.test
+++ b/scripts/test/wc.test
@@ -18,5 +18,29 @@ testing "wc -c" "wc -c file1" "26 file1\n" "" ""
 testing "wc -l" "wc -l file1" "4 file1\n" "" ""
 testing "wc -w" "wc -w file1" "5 file1\n" "" ""
 testing "wc format" "wc file1" "4 5 26 file1\n" "" ""
-testing "wc multiple files" "wc input - file1" "1 2 3 input\n0 2 3 -\n4 5 26 file1\n5 9 32 total\n" "a\nb" "a b"
+testing "wc multiple files" "wc input - file1" \
+        "1 2 3 input\n0 2 3 -\n4 5 26 file1\n5 9 32 total\n" "a\nb" "a b"
+
+#Tests for wc -m
+if printf "%s" "$LANG" | grep -q UTF-8
+then
+
+printf " " > file1
+for i in $(seq 1 8192)
+do
+  printf "ü" >> file1
+done
+testing "wc -m" "wc -m file1" "8193 file1\n" "" ""
+printf " " > file1
+for i in $(seq 1 8192)
+do
+  printf "ü" >> file1
+done
+testing "wc -m (invalid chars)" "wc -m file1" "8193 file1\n" "" ""
+testing "wc -mlw" "wc -mlw input" "1 2 11 input\n" "hello, 世界!\n" ""
+
+else
+printf "skipping tests for wc -m"
+fi
+
 rm file1
-- 
cgit v1.2.3