1
0
mirror of git://git.sv.gnu.org/coreutils.git synced 2026-04-18 17:56:54 +02:00

du: don't miscount duplicate directories or link-count-1 files

* NEWS: Mention this.
* src/du.c (hash_all): New static var.
(process_file): Use it.
(main): Set it.
* tests/du/hard-link: Add a couple of test cases to help make
sure this bug stays squashed.
* tests/du/files0-from: Adjust existing tests to reflect
change in semantics with duplicate arguments.
This commit is contained in:
Paul Eggert
2010-07-02 23:41:08 -07:00
committed by Jim Meyering
parent d27d6d371f
commit efe53cc72b
4 changed files with 50 additions and 18 deletions

5
NEWS
View File

@@ -38,6 +38,11 @@ GNU coreutils NEWS -*- outline -*-
Also errors are no longer suppressed for unsupported file types, and
relative sizes are restricted to supported file types.
** Bug fixes
du no longer multiply counts a file that is a directory or whose
link count is 1, even if the file is reached multiple times by
following symlinks or via multiple arguments.
* Noteworthy changes in release 8.5 (2010-04-23) [stable]

View File

@@ -132,6 +132,9 @@ static bool apparent_size = false;
/* If true, count each hard link of files with multiple links. */
static bool opt_count_all = false;
/* If true, hash all files to look for hard links. */
static bool hash_all;
/* If true, output the NUL byte instead of a newline at the end of each line. */
static bool opt_nul_terminate_output = false;
@@ -518,8 +521,7 @@ process_file (FTS *fts, FTSENT *ent)
via a hard link, then don't let it contribute to the sums. */
if (skip
|| (!opt_count_all
&& ! S_ISDIR (sb->st_mode)
&& 1 < sb->st_nlink
&& (hash_all || (! S_ISDIR (sb->st_mode) && 1 < sb->st_nlink))
&& ! hash_ins (sb->st_ino, sb->st_dev)))
{
/* Note that we must not simply return here.
@@ -937,11 +939,20 @@ main (int argc, char **argv)
quote (files_from));
ai = argv_iter_init_stream (stdin);
/* It's not easy here to count the arguments, so assume the
worst. */
hash_all = true;
}
else
{
char **files = (optind < argc ? argv + optind : cwd_only);
ai = argv_iter_init_argv (files);
/* Hash all dev,ino pairs if there are multiple arguments, or if
following non-command-line symlinks, because in either case a
file with just one hard link might be seen more than once. */
hash_all = (optind + 1 < argc || symlink_deref_bits == FTS_LOGICAL);
}
if (!ai)

View File

@@ -70,15 +70,15 @@ my @Tests =
{IN=>{f=>"g\0"}}, {AUX=>{g=>''}},
{OUT=>"0\tg\n"}, {OUT_SUBST=>'s/^\d+/0/'} ],
# two file names, no final NUL
# two identical file names, no final NUL
['2', '--files0-from=-', '<',
{IN=>{f=>"g\0g"}}, {AUX=>{g=>''}},
{OUT=>"0\tg\n0\tg\n"}, {OUT_SUBST=>'s/^\d+/0/'} ],
{OUT=>"0\tg\n"}, {OUT_SUBST=>'s/^\d+/0/'} ],
# two file names, with final NUL
# two identical file names, with final NUL
['2a', '--files0-from=-', '<',
{IN=>{f=>"g\0g\0"}}, {AUX=>{g=>''}},
{OUT=>"0\tg\n0\tg\n"}, {OUT_SUBST=>'s/^\d+/0/'} ],
{OUT=>"0\tg\n"}, {OUT_SUBST=>'s/^\d+/0/'} ],
# Ensure that $prog processes FILEs following a zero-length name.
['zero-len', '--files0-from=-', '<',

View File

@@ -26,24 +26,40 @@ fi
. $srcdir/test-lib.sh
mkdir -p dir/sub
( cd dir && { echo non-empty > f1; ln f1 f2; echo non-empty > sub/F; } )
( cd dir &&
{ echo non-empty > f1
ln f1 f2
ln -s f1 f3
echo non-empty > sub/F; } )
du -a -L --exclude=sub --count-links dir \
| sed 's/^[0-9][0-9]* //' | sort -r > out || fail=1
# For these tests, transform f1 or f2 or f3 (whichever name is find
# first) to f_. That is necessary because, depending on the type of
# file system, du could encounter any of those linked files first,
# thus listing that one and not the others.
for args in '-L' 'dir' '-L dir'
do
echo === >> out
du -a --exclude=sub $args dir \
| sed 's/^[0-9][0-9]* //' | sed 's/f[123]/f_/' >> out || fail=1
done
# Note that for this first test, we transform f1 or f2
# (whichever name we find first) to f_. That is necessary because,
# depending on the type of file system, du could encounter either of those
# two hard-linked files first, thus listing that one and not the other.
du -a --exclude=sub dir \
| sed 's/^[0-9][0-9]* //' | sed 's/f[12]/f_/' > out || fail=1
echo === >> out
du -a --exclude=sub --count-links dir \
| sed 's/^[0-9][0-9]* //' | sort -r >> out || fail=1
cat <<\EOF > exp
dir/f3
dir/f2
dir/f1
dir
===
dir/f_
dir
===
dir/f2
dir/f1
dir/f_
dir/f_
dir
===
dir/f_
dir
EOF