NetBSD/tests/usr.bin/awk/t_awk.sh

405 lines
8.7 KiB
Bash

# $NetBSD: t_awk.sh,v 1.7 2020/06/26 07:50:11 jruoho Exp $
#
# Copyright (c) 2012 The NetBSD Foundation, Inc.
# All rights reserved.
#
# This code is derived from software contributed to The NetBSD Foundation
# by Christos Zoulas
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
# 1. Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
# 2. Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in the
# documentation and/or other materials provided with the distribution.
#
# THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
# ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
# TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
# PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
# BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
# CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
# POSSIBILITY OF SUCH DAMAGE.
#
awk=awk
h_check()
{
local fname=d_$1
for sfx in in out awk; do
cp -r $(atf_get_srcdir)/$fname.$sfx .
done
shift 1
atf_check -o file:$fname.out -x "awk $@ -f $fname.awk < $fname.in"
}
atf_test_case big_regexp
big_regexp_head() {
atf_set "descr" "Checks matching long regular expressions (PR/33392)"
}
big_regexp_body() {
h_check big_regexp
}
atf_test_case end
end_head() {
atf_set "descr" "Checks that the last line of the input" \
"is available under END pattern (PR/29659)"
}
end_body() {
h_check end1
h_check end2
}
atf_test_case string1
string1_head() {
atf_set "descr" "Checks escaping newlines in string literals"
}
string1_body() {
for sfx in out awk; do
cp -r $(atf_get_srcdir)/d_string1.$sfx .
done
atf_check -o file:d_string1.out awk -f d_string1.awk
}
atf_test_case multibyte
multibyte_head() {
atf_set "descr" "Checks multibyte charsets support" \
"in tolower and toupper (PR/36394)"
}
multibyte_body() {
export LANG=en_US.UTF-8
h_check tolower
h_check toupper
}
atf_test_case period
period_head() {
atf_set "descr" "Checks that the period character is recognised" \
"in awk program regardless of locale (PR bin/42320)"
}
period_body() {
export LANG=ru_RU.KOI8-R
h_check period -v x=0.5
}
atf_test_case assign_NF
assign_NF_head() {
atf_set "descr" 'Checks that assign to NF changes $0 and $n (PR/44063)'
}
assign_NF_body() {
h_check assign_NF
}
atf_test_case single_char_rs
single_char_rs_head() {
atf_set "descr" "Test awk(1) with single character RS"
}
single_char_rs_body() {
atf_check \
-o "inline:1\n2\n\n3\n\n\n4\n\n" \
-x "echo 1a2aa3aaa4 | $awk 1 RS=a"
}
atf_test_case two_char_rs
two_char_rs_head() {
atf_set "descr" "Test awk(1) with two characters RS"
}
two_char_rs_body() {
atf_check \
-o "inline:1\n2\n3\n4\n\n" \
-x "echo 1ab2ab3ab4 | $awk 1 RS=ab"
}
atf_test_case single_char_regex_group_rs
single_char_regex_group_rs_head() {
atf_set "descr" "Test awk(1) with single character regex group RS"
}
single_char_regex_group_rs_body() {
atf_check \
-o "inline:1\n2\n\n3\n\n\n4\n\n" \
-x "echo 1a2aa3aaa4 | $awk 1 RS='[a]'"
}
atf_test_case two_char_regex_group_rs
two_char_regex_group_rs_head() {
atf_set "descr" "Test awk(1) with two characters regex group RS"
}
two_char_regex_group_rs_body() {
atf_check \
-o "inline:1\n2\n\n3\n\n\n4\n\n" \
-x "echo 1a2ab3aba4 | $awk 1 RS='[ab]'"
}
atf_test_case single_char_regex_star_rs
single_char_regex_star_rs_head() {
atf_set "descr" "Test awk(1) with single character regex star RS"
}
single_char_regex_star_rs_body() {
atf_check \
-o "inline:1\n2\n3\n4\n\n" \
-x "echo 1a2aa3aaa4 | $awk 1 RS='a*'"
}
atf_test_case two_char_regex_star_rs
two_char_regex_star_rs_head() {
atf_set "descr" "Test awk(1) with two characters regex star RS"
}
two_char_regex_star_rs_body() {
atf_check \
-o "inline:1\n2\n3\n4\n\n" \
-x "echo 1a2aa3aaa4 | $awk 1 RS='aa*'"
}
atf_test_case regex_two_star_rs
regex_two_star_rs_head() {
atf_set "descr" "Test awk(1) with regex two star RS"
}
regex_two_star_rs_body() {
atf_check \
-o "inline:1\n2\n3\n4\n\n" \
-x "echo 1a2ab3aab4 | $awk 1 RS='aa*b*'"
}
atf_test_case regex_or_1_rs
regex_or_1_rs_head() {
atf_set "descr" "Test awk(1) with regex | case 1 RS"
}
regex_or_1_rs_body() {
atf_check \
-o "inline:1a\nc\n\n" \
-x "echo 1abc | $awk 1 RS='abcde|b'"
}
atf_test_case regex_or_2_rs
regex_or_2_rs_head() {
atf_set "descr" "Test awk(1) with regex | case 2 RS"
}
regex_or_2_rs_body() {
atf_check \
-o "inline:1a\ncdf2\n\n" \
-x "echo 1abcdf2 | $awk 1 RS='abcde|b'"
}
atf_test_case regex_or_3_rs
regex_or_3_rs_head() {
atf_set "descr" "Test awk(1) with regex | case 3 RS"
}
regex_or_3_rs_body() {
atf_check \
-o "inline:1\n\nf2\n\n" \
-x "echo 1abcdebf2 | $awk 1 RS='abcde|b'"
}
atf_test_case regex_or_4_rs
regex_or_4_rs_head() {
atf_set "descr" "Test awk(1) with regex | case 4 RS"
}
regex_or_4_rs_body() {
atf_check \
-o "inline:1\nbcdf2\n\n" \
-x "echo 1abcdf2 | $awk 1 RS='abcde|a'"
}
atf_test_case regex_caret_1_rs
regex_caret_1_rs_head() {
atf_set "descr" "Test awk(1) with regex ^ case 1 RS"
}
regex_caret_1_rs_body() {
atf_check \
-o "inline:\n1a2a3a\n\n" \
-x "echo a1a2a3a | $awk 1 RS='^a'"
}
atf_test_case regex_caret_2_rs
regex_caret_2_rs_head() {
atf_set "descr" "Test awk(1) with regex ^ case 2 RS"
}
regex_caret_2_rs_body() {
atf_check \
-o "inline:\naa1a2a\n\n" \
-x "echo aaa1a2a | $awk 1 RS='^a'"
}
atf_test_case regex_dollar_1_rs
regex_dollar_1_rs_head() {
atf_set "descr" "Test awk(1) with regex $ case 1 RS"
}
regex_dollar_1_rs_body() {
atf_check \
-o "inline:a1a2a3a\n\n" \
-x "echo a1a2a3a | $awk 1 RS='a$'"
}
atf_test_case regex_dollar_2_rs
regex_dollar_2_rs_head() {
atf_set "descr" "Test awk(1) with regex $ case 2 RS"
}
regex_dollar_2_rs_body() {
atf_check \
-o "inline:a1a2aaa\n\n" \
-x "echo a1a2aaa | $awk 1 RS='a$'"
}
atf_test_case regex_reallocation_rs
regex_reallocation_rs_head() {
atf_set "descr" "Test awk(1) with regex reallocation RS"
}
regex_reallocation_rs_body() {
atf_check \
-o "inline:a\na\na\na\na\na\na\na\na\na10000\n\n" \
-x "jot -s a 10000 | $awk 'NR>1' RS='999[0-9]'"
}
atf_test_case empty_rs
empty_rs_head() {
atf_set "descr" "Test awk(1) with empty RS"
}
empty_rs_body() {
atf_check \
-o "inline:foo\n" \
-x "echo foo | $awk 1 RS=''"
}
atf_test_case newline_rs
newline_rs_head() {
atf_set "descr" "Test awk(1) with newline RS"
}
newline_rs_body() {
atf_check \
-o "inline:r1f1:r1f2\nr2f1:r2f2\n" \
-x "printf '\n\n\nr1f1\nr1f2\n\nr2f1\nr2f2\n\n\n' | $awk '{\$1=\$1}1' RS= OFS=:"
}
atf_test_case regex_range
regex_range_head() {
atf_set "descr" "Test awk(1) with regex range"
}
regex_range_body() {
atf_check \
-o "inline:matched\n" \
-x "echo '1 a' | $awk '/[[:digit:]][[:space:]][[:alpha:]]/ { print \"matched\"; }'"
}
atf_test_case regex_repeat
regex_repeat_head() {
atf_set "descr" "Test awk(1) with regex repeat"
}
regex_repeat_body() {
atf_check \
-o "inline:matched\n" \
-x "echo 'aaabbbbcc' | $awk '/a{3}b{4}c{2}/ { print \"matched\"; }'"
}
atf_test_case modify_subsep
modify_subsep_head() {
atf_set "descr" "Test awk(1) SUPSEP modification (PR/47306)"
}
modify_subsep_body() {
atf_check \
-o "inline:1\n1\n1\n" \
-x "printf '1\n1 2\n' | \
$awk '1{ arr[\$1 SUBSEP \$2 SUBSEP ++cnt[\$1]]=1} {for (f in arr) print arr[f];}'"
}
atf_init_test_cases() {
atf_add_test_case big_regexp
atf_add_test_case end
atf_add_test_case string1
atf_add_test_case multibyte
atf_add_test_case period
atf_add_test_case assign_NF
atf_add_test_case single_char_rs
atf_add_test_case two_char_rs
atf_add_test_case single_char_regex_group_rs
atf_add_test_case two_char_regex_group_rs
atf_add_test_case two_char_regex_star_rs
atf_add_test_case single_char_regex_star_rs
atf_add_test_case regex_two_star_rs
atf_add_test_case regex_or_1_rs
atf_add_test_case regex_or_2_rs
atf_add_test_case regex_or_3_rs
atf_add_test_case regex_caret_1_rs
atf_add_test_case regex_caret_2_rs
atf_add_test_case regex_dollar_1_rs
atf_add_test_case regex_dollar_2_rs
atf_add_test_case regex_reallocation_rs
atf_add_test_case empty_rs
atf_add_test_case newline_rs
atf_add_test_case regex_range
atf_add_test_case regex_repeat
atf_add_test_case modify_subsep
}