1
0
mirror of git://git.sv.gnu.org/coreutils.git synced 2026-04-14 07:46:28 +02:00
Files
coreutils/tests/misc/split-lchunk
Chen Guo be107398e5 split: add --number to generate a particular number of files
* src/split.c (usage, long_options, main): New options --number,
--unbuffered, --elide-empty-files.
(set_suffix_length): New function to auto increase suffix length
to handle a specified number of files.
(create): New function.  Refactored from cwrite() and ofile_open().
(bytes_split): Add max_files argument to support byte chunking.
(lines_chunk_split): New function.  Split file into chunks of lines.
(bytes_chunk_extract): New function.  Extract a chunk of file.
(of_info): New struct.  Used by functions lines_rr and ofile_open
to keep track of file descriptors associated with output files.
(ofile_open): New function.  Shuffle file descriptors when there
are more output files than available file descriptors.
(lines_rr): New function to distribute lines round-robin to files.
(chunk_parse): New function.  Parses K/N syntax.
* tests/misc/split-bchunk: New test for byte chunking.
* tests/misc/split-lchunk: New test for line delimited chunking.
* tests/misc/split-rchunk: New test for round-robin chunking.
* tests/Makefile.am: Reference new tests.
* tests/misc/split-fail: Add failure scenarios for new options.
* tests/misc/split-l: Fix a typo. s/ln/split/.
* doc/coreutils.texi (split invocation): Document --number.
* NEWS: Mention the new feature.
* .mailmap: Map new email address for shortlog.

Signed-off-by: Pádraig Brady <P@draigBrady.com>
2010-11-22 01:45:15 +00:00

118 lines
3.3 KiB
Bash
Executable File

#!/bin/sh
# Test splitting into newline-delimited chunks (-n l/...)
# Copyright (C) 2010 Free Software Foundation, Inc.
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
# Pull in the shared test framework.  ${srcdir=.} falls back to (and
# assigns) the current directory when srcdir is not already set.
. "${srcdir=.}/init.sh"
# NOTE(review): path_prepend_ and print_ver_ are not defined in this file;
# presumably init.sh supplies them, putting ../src first in PATH and
# reporting which split binary is under test -- confirm.
path_prepend_ ../src
print_ver_ split
# A chunk count that is not a number ("1o") must be rejected, and the
# diagnostic on stderr must match the expected text exactly.
printf '%s\n' 'split: 1o: invalid number of chunks' > exp
if split -n l/1o 2>err; then
  fail=1
fi
compare err exp || fail=1

# Feeding the input through a pipe is expected to fail too, with split
# reporting that it cannot determine the size of standard input.
printf '%s\n' "split: \`-': cannot determine file size" > exp
if echo | split -n l/1 2>err; then
  fail=1
fi
compare err exp || fail=1
# Asking for more chunks than there are bytes is legal: with empty input
# all 10 output files must be written, each of size 0.  The pipeline
# condenses the per-file sizes into "<count>x<size>".
split -n l/10 /dev/null || fail=1
case $(stat -c %s x* | uniq -c | sed 's/^ *//; s/ /x/') in
  10x0) ;;
  *) fail=1 ;;
esac
rm x??

# With -e (--elide-empty-files) none of those empty files may be created,
# so stat succeeding on any x?? name counts as a failure.
split -e -n l/10 /dev/null || fail=1
if stat x?? 2>/dev/null; then
  fail=1
fi
# Sample input, 80 bytes long; every '~' is turned into a newline when
# the data is written to the file 'in'.
lines='12345~1~12345~1~12345~1~12345~1~12345~~~12345~1~12345~1~12345~1~12345~1~12345~1~'
printf '%s' "$lines" | tr '~' '\n' > in || framework_failure

# Requesting chunk 16 out of 15 must be refused with a diagnostic.
printf '%s\n' 'split: 16: invalid chunk number' > exp
if split -n l/16/15 in 2>err; then
  fail=1
fi
compare err exp || fail=1
# Split 'in' into N line-delimited chunks for several values of N and
# compare the resulting file sizes against a fixed table.
#
# 'out' collects one row per N; 'exp' holds the expected rows, in the
# same order as the loop below (N = 6, 8, 12, 15, 22), so each row has
# exactly N two-digit sizes.
: > out
printf '%s' "\
14 16 09 15 16 10
14 08 08 10 14 08 08 10
06 08 08 02 06 08 08 02 06 08 08 10
06 08 02 06 08 00 08 02 06 08 02 06 08 00 10
06 00 08 00 02 06 00 02 06 00 08 00 01 07 00 02 06 00 08 00 02 16
" > exp || framework_failure

# Note for full testing one should set bufsize to 1,2,5,10,80,100
# at the start of lines_chunk_split(), for each run of this test.

# Leave DEBUGGING empty for normal runs; set it to any non-empty value to
# print a picture of where the chunk boundaries fall for each N.
DEBUGGING=
# When both DEBUGGING and VERBOSE are set, shell tracing is switched off
# for the duration of the loop (presumably to keep the pictures readable)
# and switched back on afterwards.
test "$DEBUGGING" && test "$VERBOSE" && set +x
for N in 6 8 12 15 22; do
  rm -f x*
  # Record a non-zero exit status: a split that fails must not pass just
  # because the files it left behind happen to have the expected sizes.
  split -n l/$N in || fail=1
  # The command substitution is deliberately unquoted so that stat's
  # one-size-per-line output collapses into a single space-separated row.
  echo $(stat -c "%02s" x*) >> out
  if test "$DEBUGGING"; then
    # Output partition pattern
    # (N-1 fields of chunk_size columns and a last one of end_size
    # columns, each closed by ']', cut down to the input length)
    size=$(printf "%s" "$lines" | wc -c)
    chunk_size=$(($size/$N))
    end_size=$(($chunk_size + ($size % $N)))
    {
      yes "$(printf %${chunk_size}s ])" | head -n$(($N-1))
      printf %${end_size}s ]
    } | tr -d '\n' | sed "s/\\(^.\\{1,$size\\}\\).*/\\1/"
    echo
    # Output pattern generated for comparison
    # (one run of '_' or '-' per output file, as long as the file is big;
    # the fill character alternates from one file to the next)
    for s in $(stat -c "%s" x*); do
      #s=0 transitions are not shown
      test "$m" = "_" && m=- || m=_
      printf "%${s}s" '' | tr ' ' $m
    done
    echo
    # Output lines for reference
    echo "$lines"
  fi
done
test "$DEBUGGING" && test "$VERBOSE" && set -x
compare out exp || fail=1
# Check extraction of particular chunks: with l/K/N the K-th of N chunks
# is written to standard output instead of to files.
#
# Each redirection truncates 'out' by itself, so no separate reset is
# needed.  split's exit status is recorded as well, so that a run which
# emits the right bytes but exits non-zero is still reported as a failure.
printf '1\n12345\n' > exp
split -n l/13/15 in > out || fail=1
compare out exp || fail=1

# Chunk 14 of 15 is expected to be empty.
printf '' > exp
split -n l/14/15 in > out || fail=1
compare out exp || fail=1

# The last chunk is expected to hold the remaining three lines.
printf '1\n12345\n1\n' > exp
split -n l/15/15 in > out || fail=1
compare out exp || fail=1
# Test input with no \n at the end: the last of 7 chunks must still
# contain the unterminated final line.  A non-zero exit status from split
# is treated as a failure in its own right.
printf '12\n34\n5' > in
printf '5' > exp
split -n l/7/7 in > out || fail=1
compare out exp || fail=1

# Finish the test, passing on the accumulated status (empty when nothing
# failed).  NOTE(review): Exit is not defined in this file; presumably it
# is the framework's exit wrapper from init.sh -- confirm.
Exit $fail