summaryrefslogtreecommitdiffstats
path: root/contrib/gnu-sort
diff options
context:
space:
mode:
Diffstat (limited to 'contrib/gnu-sort')
-rw-r--r--contrib/gnu-sort/lib/hard-locale.c17
-rw-r--r--contrib/gnu-sort/lib/version-etc.c2
-rw-r--r--contrib/gnu-sort/src/sort.c268
3 files changed, 116 insertions, 171 deletions
diff --git a/contrib/gnu-sort/lib/hard-locale.c b/contrib/gnu-sort/lib/hard-locale.c
index ca584d6..45b7d05 100644
--- a/contrib/gnu-sort/lib/hard-locale.c
+++ b/contrib/gnu-sort/lib/hard-locale.c
@@ -1,6 +1,7 @@
/* hard-locale.c -- Determine whether a locale is hard.
- Copyright (C) 1997, 1998, 1999, 2002, 2003 Free Software Foundation, Inc.
+ Copyright (C) 1997, 1998, 1999, 2002, 2003, 2004 Free Software
+ Foundation, Inc.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
@@ -30,23 +31,23 @@
#include <stdlib.h>
#include <string.h>
-/* Return nonzero if the current CATEGORY locale is hard, i.e. if you
+/* Return true if the current CATEGORY locale is hard, i.e. if you
can't get away with assuming traditional C or POSIX behavior. */
-int
+bool
hard_locale (int category)
{
#if ! HAVE_SETLOCALE
- return 0;
+ return false;
#else
- int hard = 1;
- char const *p = setlocale (category, 0);
+ bool hard = true;
+ char const *p = setlocale (category, NULL);
if (p)
{
# if defined(__FreeBSD__) || (defined __GLIBC__ && 2 <= __GLIBC__)
if (strcmp (p, "C") == 0 || strcmp (p, "POSIX") == 0)
- hard = 0;
+ hard = false;
# else
char *locale = malloc (strlen (p) + 1);
if (locale)
@@ -60,7 +61,7 @@ hard_locale (int category)
&& strcmp (p, locale) == 0)
|| ((p = setlocale (category, "POSIX"))
&& strcmp (p, locale) == 0))
- hard = 0;
+ hard = false;
/* Restore the caller's locale. */
setlocale (category, locale);
diff --git a/contrib/gnu-sort/lib/version-etc.c b/contrib/gnu-sort/lib/version-etc.c
index 3746df4..204d262 100644
--- a/contrib/gnu-sort/lib/version-etc.c
+++ b/contrib/gnu-sort/lib/version-etc.c
@@ -48,7 +48,7 @@ version_etc_va (FILE *stream,
const char *command_name, const char *package,
const char *version, va_list authors)
{
- unsigned int n_authors;
+ size_t n_authors;
/* Count the number of authors. */
{
diff --git a/contrib/gnu-sort/src/sort.c b/contrib/gnu-sort/src/sort.c
index 7481814..0b9d33f 100644
--- a/contrib/gnu-sort/src/sort.c
+++ b/contrib/gnu-sort/src/sort.c
@@ -20,7 +20,7 @@
The author may be reached (Email) at the address mike@gnu.ai.mit.edu,
or (US mail) as Mike Haertel c/o Free Software Foundation.
- Ørn E. Hansen added NLS support in 1997. */
+ Ørn E. Hansen added NLS support in 1997. */
#include <config.h>
@@ -56,6 +56,7 @@
#include "long-options.h"
#include "physmem.h"
#include "posixver.h"
+#include "quote.h"
#include "stdio-safer.h"
#include "xmemcoll.h"
#include "xstrtol.h"
@@ -98,7 +99,6 @@ double strtod ();
#endif
#define UCHAR_LIM (UCHAR_MAX + 1)
-#define UCHAR(c) ((unsigned char) (c))
#ifndef DEFAULT_TMPDIR
# define DEFAULT_TMPDIR "/tmp"
@@ -137,7 +137,7 @@ static bool hard_LC_TIME;
#else
# define decimal_point C_DECIMAL_POINT
-# define IS_THOUSANDS_SEP(x) 0
+# define IS_THOUSANDS_SEP(x) false
#endif
@@ -204,8 +204,8 @@ struct keyfield
size_t echar; /* Additional characters in field. */
bool const *ignore; /* Boolean array of characters to ignore. */
char const *translate; /* Translation applied to characters. */
- bool skipsblanks; /* Skip leading blanks at start. */
- bool skipeblanks; /* Skip trailing blanks at finish. */
+ bool skipsblanks; /* Skip leading blanks when finding start. */
+ bool skipeblanks; /* Skip leading blanks when finding end. */
bool numeric; /* Flag for numeric comparison. Handle
strings of digits with optional decimal
point, but no exponential notation. */
@@ -490,13 +490,14 @@ cleanup (void)
unlink (node->name);
}
-/* Report MESSAGE for FILE, then clean up and exit. */
+/* Report MESSAGE for FILE, then clean up and exit.
+ If FILE is null, it represents standard output. */
static void die (char const *, char const *) ATTRIBUTE_NORETURN;
static void
die (char const *message, char const *file)
{
- error (0, errno, "%s: %s", message, file);
+ error (0, errno, "%s: %s", message, file ? file : _("standard output"));
exit (SORT_FAILURE);
}
@@ -538,20 +539,22 @@ create_temp_file (FILE **pfp)
return file;
}
+/* Return a stream for FILE, opened with mode HOW. A null FILE means
+ standard output; HOW should be "w". When opening for input, "-"
+ means standard input. To avoid confusion, do not return file
+ descriptors 0, 1, or 2. */
+
static FILE *
xfopen (const char *file, const char *how)
{
FILE *fp;
- if (STREQ (file, "-"))
+ if (!file)
+ fp = stdout;
+ else if (STREQ (file, "-") && *how == 'r')
{
- if (*how == 'r')
- {
- have_read_stdin = true;
- fp = stdin;
- }
- else
- fp = stdout;
+ have_read_stdin = true;
+ fp = stdin;
}
else
{
@@ -660,7 +663,7 @@ inittables_uni (void)
monthtab[i].val = i + 1;
for (j = 0; j < s_len; j++)
- name[j] = fold_toupper[UCHAR (s[j])];
+ name[j] = fold_toupper[to_uchar (s[j])];
name[j] = '\0';
}
qsort ((void *) monthtab, MONTHS_PER_YEAR,
@@ -861,7 +864,7 @@ sort_buffer_size (FILE *const *fps, int nfps,
size_t worst_case;
if ((i < nfps ? fstat (fileno (fps[i]), &st)
- : strcmp (files[i], "-") == 0 ? fstat (STDIN_FILENO, &st)
+ : STREQ (files[i], "-") ? fstat (STDIN_FILENO, &st)
: stat (files[i], &st))
!= 0)
die (_("stat failed"), files[i]);
@@ -958,14 +961,14 @@ begfield_uni (const struct line *line, const struct keyfield *key)
else
while (ptr < lim && sword--)
{
- while (ptr < lim && blanks[UCHAR (*ptr)])
+ while (ptr < lim && blanks[to_uchar (*ptr)])
++ptr;
- while (ptr < lim && !blanks[UCHAR (*ptr)])
+ while (ptr < lim && !blanks[to_uchar (*ptr)])
++ptr;
}
if (key->skipsblanks)
- while (ptr < lim && blanks[UCHAR (*ptr)])
+ while (ptr < lim && blanks[to_uchar (*ptr)])
++ptr;
/* Advance PTR by SCHAR (if possible), but no further than LIM. */
@@ -1065,9 +1068,9 @@ limfield_uni (const struct line *line, const struct keyfield *key)
else
while (ptr < lim && eword--)
{
- while (ptr < lim && blanks[UCHAR (*ptr)])
+ while (ptr < lim && blanks[to_uchar (*ptr)])
++ptr;
- while (ptr < lim && !blanks[UCHAR (*ptr)])
+ while (ptr < lim && !blanks[to_uchar (*ptr)])
++ptr;
}
@@ -1114,18 +1117,19 @@ limfield_uni (const struct line *line, const struct keyfield *key)
{
char *newlim;
newlim = ptr;
- while (newlim < lim && blanks[UCHAR (*newlim)])
+ while (newlim < lim && blanks[to_uchar (*newlim)])
++newlim;
- while (newlim < lim && !blanks[UCHAR (*newlim)])
+ while (newlim < lim && !blanks[to_uchar (*newlim)])
++newlim;
lim = newlim;
}
#endif
- /* If we're skipping leading blanks, don't start counting characters
- until after skipping past any leading blanks. */
- if (key->skipsblanks)
- while (ptr < lim && blanks[UCHAR (*ptr)])
+ /* If we're ignoring leading blanks when computing the End
+ of the field, don't start counting bytes until after skipping
+ past any leading blanks. */
+ if (key->skipeblanks)
+ while (ptr < lim && blanks[to_uchar (*ptr)])
++ptr;
/* Advance PTR by ECHAR (if possible), but no further than LIM. */
@@ -1218,7 +1222,7 @@ limfield_mb (const struct line *line, const struct keyfield *key)
/* If we're skipping leading blanks, don't start counting characters
* until after skipping past any leading blanks. */
- if (key->skipsblanks)
+ if (key->skipeblanks)
while (ptr < lim && ismbblank (ptr, lim - ptr, &mblength))
ptr += mblength;
@@ -1239,38 +1243,6 @@ limfield_mb (const struct line *line, const struct keyfield *key)
}
#endif
-/* Return the number of trailing blanks in FIELD, with LEN bytes. */
-
-static size_t
-trailing_blanks (char const *field, size_t len)
-{
-#if HAVE_MBRTOWC
- if (MB_CUR_MAX > 1)
- {
- size_t blanks = 0;
-
- while (len) {
- size_t mblength;
- if (ismbblank (field, len, &mblength))
- blanks++;
- else
- blanks = 0;
-
- field += mblength, len -= mblength;
- }
-
- return blanks;
- }
- else
-#endif
- {
- size_t i;
- for (i = len; 0 < i && blanks[UCHAR (field[i - 1])]; i--)
- continue;
- return len - i;
- }
-}
-
/* Fill BUF reading from FP, moving buf->left bytes from the end
of buf->buf to the beginning first. If EOF is reached and the
file wasn't terminated by a newline, supply one. Set up BUF's line
@@ -1365,17 +1337,12 @@ fillbuf (struct buffer *buf, register FILE *fp, char const *file)
else
#endif
{
- while (blanks[UCHAR (*line_start)])
+ while (blanks[to_uchar (*line_start)])
line_start++;
}
}
line->keybeg = line_start;
}
- if (key->skipeblanks)
- {
- size_t keylen = line->keylim - line->keybeg;
- line->keylim -= trailing_blanks (line->keybeg, keylen);
- }
}
line_start = ptr;
@@ -1473,8 +1440,11 @@ fraccompare (register const char *a, register const char *b)
static int
numcompare (register const char *a, register const char *b)
{
- register int tmpa, tmpb, tmp;
- register size_t log_a, log_b;
+ char tmpa;
+ char tmpb;
+ int tmp;
+ size_t log_a;
+ size_t log_b;
#if HAVE_MBRTOWC
if (MB_CUR_MAX > 1)
@@ -1497,9 +1467,9 @@ numcompare (register const char *a, register const char *b)
tmpa = *a;
tmpb = *b;
- while (blanks[UCHAR (tmpa)])
+ while (blanks[to_uchar (tmpa)])
tmpa = *++a;
- while (blanks[UCHAR (tmpb)])
+ while (blanks[to_uchar (tmpb)])
tmpb = *++b;
}
@@ -1712,7 +1682,7 @@ getmonth_uni (const char *s, size_t len)
register size_t i;
register int lo = 0, hi = MONTHS_PER_YEAR, result;
- while (len > 0 && blanks[UCHAR (*s)])
+ while (len > 0 && blanks[to_uchar (*s)])
{
++s;
--len;
@@ -1723,8 +1693,7 @@ getmonth_uni (const char *s, size_t len)
month = alloca (len + 1);
for (i = 0; i < len; ++i)
- month[i] = fold_toupper[UCHAR (s[i])];
- len -= trailing_blanks (month, len);
+ month[i] = fold_toupper[to_uchar (s[i])];
month[len] = '\0';
do
@@ -1780,14 +1749,8 @@ getmonth_mb (const char *s, size_t len)
assert (wclength != (size_t)-1 && *pp == NULL);
for (i = 0; i < wclength; i++)
- {
month_wcs[i] = towupper(month_wcs[i]);
- if (iswblank (month_wcs[i]))
- {
- month_wcs[i] = L'\0';
- break;
- }
- }
+ month_wcs[i] = L'\0';
wpp = (const wchar_t **)&month_wcs;
@@ -1838,12 +1801,6 @@ keycompare_uni (const struct line *a, const struct line *b)
size_t lena = lima <= texta ? 0 : lima - texta;
size_t lenb = limb <= textb ? 0 : limb - textb;
- if (key->skipeblanks)
- {
- lena -= trailing_blanks (texta, lena);
- lenb -= trailing_blanks (textb, lenb);
- }
-
/* Actually compare the fields. */
if (key->numeric | key->general_numeric)
{
@@ -1872,17 +1829,17 @@ keycompare_uni (const struct line *a, const struct line *b)
if (i < lena)
{
copy_a[new_len_a] = (translate
- ? translate[UCHAR (texta[i])]
+ ? translate[to_uchar (texta[i])]
: texta[i]);
- if (!ignore || !ignore[UCHAR (texta[i])])
+ if (!ignore || !ignore[to_uchar (texta[i])])
++new_len_a;
}
if (i < lenb)
{
copy_b[new_len_b] = (translate
- ? translate[UCHAR (textb[i])]
+ ? translate[to_uchar (textb[i])]
: textb [i]);
- if (!ignore || !ignore[UCHAR (textb[i])])
+ if (!ignore || !ignore[to_uchar (textb[i])])
++new_len_b;
}
}
@@ -1903,13 +1860,13 @@ keycompare_uni (const struct line *a, const struct line *b)
{ \
for (;;) \
{ \
- while (texta < lima && ignore[UCHAR (*texta)]) \
+ while (texta < lima && ignore[to_uchar (*texta)]) \
++texta; \
- while (textb < limb && ignore[UCHAR (*textb)]) \
+ while (textb < limb && ignore[to_uchar (*textb)]) \
++textb; \
if (! (texta < lima && textb < limb)) \
break; \
- diff = UCHAR (A) - UCHAR (B); \
+ diff = to_uchar (A) - to_uchar (B); \
if (diff) \
goto not_equal; \
++texta; \
@@ -1921,8 +1878,8 @@ keycompare_uni (const struct line *a, const struct line *b)
while (0)
if (translate)
- CMP_WITH_IGNORE (translate[UCHAR (*texta)],
- translate[UCHAR (*textb)]);
+ CMP_WITH_IGNORE (translate[to_uchar (*texta)],
+ translate[to_uchar (*textb)]);
else
CMP_WITH_IGNORE (*texta, *textb);
}
@@ -1936,8 +1893,8 @@ keycompare_uni (const struct line *a, const struct line *b)
{
while (texta < lima && textb < limb)
{
- diff = (UCHAR (translate[UCHAR (*texta++)])
- - UCHAR (translate[UCHAR (*textb++)]));
+ diff = (to_uchar (translate[to_uchar (*texta++)])
+ - to_uchar (translate[to_uchar (*textb++)]));
if (diff)
goto not_equal;
}
@@ -1971,9 +1928,9 @@ keycompare_uni (const struct line *a, const struct line *b)
texta = a->text, textb = b->text;
if (key->skipsblanks)
{
- while (texta < lima && blanks[UCHAR (*texta)])
+ while (texta < lima && blanks[to_uchar (*texta)])
++texta;
- while (textb < limb && blanks[UCHAR (*textb)])
+ while (textb < limb && blanks[to_uchar (*textb)])
++textb;
}
}
@@ -2018,16 +1975,6 @@ keycompare_mb (const struct line *a, const struct line *b)
size_t lena = lima <= texta ? 0 : lima - texta;
size_t lenb = limb <= textb ? 0 : limb - textb;
- if (key->skipeblanks)
- {
- char *a_end = texta + lena;
- char *b_end = textb + lenb;
- a_end -= trailing_blanks (texta, lena);
- b_end -= trailing_blanks (textb, lenb);
- lena = a_end - texta;
- lenb = b_end - textb;
- }
-
/* Actually compare the fields. */
if (key->numeric | key->general_numeric)
{
@@ -2291,8 +2238,9 @@ check (char const *file_name)
/* Merge lines from FILES onto OFP. NFILES cannot be greater than
NMERGE. Close input and output files before returning.
- OUTPUT_FILE gives the name of the output file; if OFP is NULL, the
- output file has not been opened yet. */
+ OUTPUT_FILE gives the name of the output file. If it is NULL,
+ the output file is standard output. If OFP is NULL, the output
+ file has not been opened yet (or written to, if standard output). */
static void
mergefps (char **files, register int nfiles,
@@ -2561,9 +2509,17 @@ sortlines_temp (struct line *lines, size_t nlines, struct line *temp)
}
/* Return the index of the first of NFILES FILES that is the same file
- as OUTFILE. If none can be the same, return NFILES. Consider an
- input pipe to be the same as OUTFILE, since the pipe might be the
- output of a command like "cat OUTFILE". */
+ as OUTFILE. If none can be the same, return NFILES.
+
+ This test ensures that an otherwise-erroneous use like
+ "sort -m -o FILE ... FILE ..." copies FILE before writing to it.
+ It's not clear that POSIX requires this nicety.
+ Detect common error cases, but don't try to catch obscure cases like
+ "cat ... FILE ... | sort -m -o FILE"
+ where traditional "sort" doesn't copy the input and where
+ people should know that they're getting into trouble anyway.
+ Catching these obscure cases would slow down performance in
+ common cases. */
static int
first_same_file (char * const *files, int nfiles, char const *outfile)
@@ -2576,15 +2532,15 @@ first_same_file (char * const *files, int nfiles, char const *outfile)
{
bool standard_input = STREQ (files[i], "-");
- if (STREQ (outfile, files[i]) && ! standard_input)
+ if (outfile && STREQ (outfile, files[i]) && ! standard_input)
return i;
if (! got_outstat)
{
got_outstat = true;
- if ((STREQ (outfile, "-")
- ? fstat (STDOUT_FILENO, &outstat)
- : stat (outfile, &outstat))
+ if ((outfile
+ ? stat (outfile, &outstat)
+ : fstat (STDOUT_FILENO, &outstat))
!= 0)
return nfiles;
}
@@ -2593,7 +2549,7 @@ first_same_file (char * const *files, int nfiles, char const *outfile)
? fstat (STDIN_FILENO, &instat)
: stat (files[i], &instat))
== 0)
- && (S_ISFIFO (instat.st_mode) || SAME_INODE (instat, outstat)))
+ && SAME_INODE (instat, outstat))
return i;
}
@@ -2602,7 +2558,7 @@ first_same_file (char * const *files, int nfiles, char const *outfile)
/* Merge NFILES FILES onto OUTPUT_FILE. However, merge at most
MAX_MERGE input files directly onto OUTPUT_FILE. MAX_MERGE cannot
- exceed NMERGE. */
+ exceed NMERGE. A null OUTPUT_FILE stands for standard output. */
static void
merge (char **files, int nfiles, int max_merge, char const *output_file)
@@ -2794,19 +2750,7 @@ sighandler (int sig)
cleanup ();
-#ifdef SA_NOCLDSTOP
- {
- struct sigaction sigact;
-
- sigact.sa_handler = SIG_DFL;
- sigemptyset (&sigact.sa_mask);
- sigact.sa_flags = 0;
- sigaction (sig, &sigact, NULL);
- }
-#else
signal (sig, SIG_DFL);
-#endif
-
raise (sig);
}
@@ -2885,12 +2829,7 @@ main (int argc, char **argv)
? COMMON_SHORT_OPTIONS "y::"
: COMMON_SHORT_OPTIONS "y:");
char *minus = "-", **files;
- char const *outfile = minus;
- static int const sigs[] = { SIGHUP, SIGINT, SIGPIPE, SIGTERM };
- unsigned int nsigs = sizeof sigs / sizeof *sigs;
-#ifdef SA_NOCLDSTOP
- struct sigaction oldact, newact;
-#endif
+ char const *outfile = NULL;
initialize_main (&argc, &argv);
program_name = argv[0];
@@ -2954,32 +2893,34 @@ main (int argc, char **argv)
have_read_stdin = false;
inittables ();
-#ifdef SA_NOCLDSTOP
{
- unsigned int i;
+ int i;
+ static int const sig[] = { SIGHUP, SIGINT, SIGPIPE, SIGTERM };
+ enum { nsigs = sizeof sig / sizeof sig[0] };
+
+#ifdef SA_NOCLDSTOP
+ struct sigaction act;
+
sigemptyset (&caught_signals);
for (i = 0; i < nsigs; i++)
- sigaddset (&caught_signals, sigs[i]);
- newact.sa_handler = sighandler;
- newact.sa_mask = caught_signals;
- newact.sa_flags = 0;
- }
-#endif
+ {
+ sigaction (sig[i], NULL, &act);
+ if (act.sa_handler != SIG_IGN)
+ sigaddset (&caught_signals, sig[i]);
+ }
+
+ act.sa_handler = sighandler;
+ act.sa_mask = caught_signals;
+ act.sa_flags = 0;
- {
- unsigned int i;
for (i = 0; i < nsigs; i++)
- {
- int sig = sigs[i];
-#ifdef SA_NOCLDSTOP
- sigaction (sig, NULL, &oldact);
- if (oldact.sa_handler != SIG_IGN)
- sigaction (sig, &newact, NULL);
+ if (sigismember (&caught_signals, sig[i]))
+ sigaction (sig[i], &act, NULL);
#else
- if (signal (sig, SIG_IGN) != SIG_IGN)
- signal (sig, sighandler);
+ for (i = 0; i < nsigs; i++)
+ if (signal (sig[i], SIG_IGN) != SIG_IGN)
+ signal (sig[i], sighandler);
#endif
- }
}
gkey.sword = gkey.eword = SIZE_MAX;
@@ -3132,7 +3073,7 @@ main (int argc, char **argv)
break;
case 'o':
- if (outfile != minus && strcmp (outfile, optarg) != 0)
+ if (outfile && !STREQ (outfile, optarg))
error (SORT_FAILURE, 0, _("multiple output files specified"));
outfile = optarg;
break;
@@ -3184,7 +3125,7 @@ main (int argc, char **argv)
if (optarg[1])
{
- if (strcmp (optarg, "\\0") == 0)
+ if (STREQ (optarg, "\\0"))
newtab[0] = '\0';
else
{
@@ -3270,8 +3211,11 @@ main (int argc, char **argv)
if (checkonly)
{
if (nfiles > 1)
- error (SORT_FAILURE, 0, _("extra operand `%s' not allowed with -c"),
- files[1]);
+ {
+ error (0, 0, _("extra operand %s not allowed with -c"),
+ quote (files[1]));
+ usage (SORT_FAILURE);
+ }
/* POSIX requires that sort return 1 IFF invoked with -c and the
input is not properly sorted. */
OpenPOWER on IntegriCloud