Update to tcsh 6.18.01.

author: mp <mp@FreeBSD.org> 2012-02-22 03:36:15 +0000
committer: mp <mp@FreeBSD.org> 2012-02-22 03:36:15 +0000
commit: 3ee51a00f36c11a6172d08d787943dfc63f66110 (patch)
tree: 522fd2d4d27770566e466a79d636194e5743d94a /contrib/tcsh/sh.hist.c
parent: d177303078ee8f6069218009d6c3c2b6d9d9ca97 (diff)
parent: 54c5644df8eb87e7a5b1c4c411e349ac329ee04b (diff)
download: FreeBSD-src-3ee51a00f36c11a6172d08d787943dfc63f66110.zip
FreeBSD-src-3ee51a00f36c11a6172d08d787943dfc63f66110.tar.gz
1 files changed, 1003 insertions, 142 deletions
diff --git a/contrib/tcsh/sh.hist.c b/contrib/tcsh/sh.hist.c
index 72b376a..6a12737 100644
--- a/contrib/tcsh/sh.hist.c
+++ b/contrib/tcsh/sh.hist.c
@@ -1,4 +1,4 @@
-/* $Header: /p/tcsh/cvsroot/tcsh/sh.hist.c,v 3.40 2007/03/01 17:14:51 christos Exp $ */
+/* $Header: /p/tcsh/cvsroot/tcsh/sh.hist.c,v 3.53 2011/01/24 18:10:26 christos Exp $ */
 /*
  * sh.hist.c: Shell history expansions and substitutions
  */
@@ -32,8 +32,9 @@
  */
 #include "sh.h"
 
-RCSID("$tcsh: sh.hist.c,v 3.40 2007/03/01 17:14:51 christos Exp $")
+RCSID("$tcsh: sh.hist.c,v 3.53 2011/01/24 18:10:26 christos Exp $")
 
+#include <assert.h>
 #include "tc.h"
 
 extern int histvalid;
@@ -42,8 +43,6 @@ Char HistLit = 0;
 
 static	int	heq	(const struct wordent *, const struct wordent *);
 static	void	hfree	(struct Hist *);
-static	void	dohist1	(struct Hist *, int *, int);
-static	void	phist	(struct Hist *, int);
 
 #define HIST_ONLY	0x01
 #define HIST_SAVE	0x02
@@ -57,10 +56,95 @@ static	void	phist	(struct Hist *, int);
  * C shell
  */
 
-void
-savehist(struct wordent *sp, int mflg)
+/* Static functions don't show up in gprof summaries.  So eliminate "static"
+ * modifier from some frequently called functions. */
+#ifdef PROF
+#define PG_STATIC
+#else
+#define PG_STATIC static
+#endif
+
+/* #define DEBUG_HIST 1 */
+
+static const int fastMergeErase = 1;
+static unsigned histCount = 0;		/* number elements on history list */
+static struct Hist *histTail = NULL;     /* last element on history list */
+static struct Hist *histMerg = NULL;	 /* last element merged by Htime */
+
+static void insertHistHashTable(struct Hist *, unsigned);
+
+
+/* Insert new element (hp) in history list after specified predecessor (pp). */
+static void
+hinsert(struct Hist *hp, struct Hist *pp)
+{
+    struct Hist *fp = pp->Hnext;        /* following element, if any */
+    hp->Hnext = fp, hp->Hprev = pp;
+    pp->Hnext = hp;
+    if (fp)
+        fp->Hprev = hp;
+    else
+        histTail = hp;                  /* meaning hp->Hnext == NULL */
+    histCount++;
+}
+
+/* Remove the entry from the history list. */
+static void
+hremove(struct Hist *hp)
+{
+    struct Hist *pp = hp->Hprev;
+    assert(pp);                         /* elements always have a previous */
+    pp->Hnext = hp->Hnext;
+    if (hp->Hnext)
+        hp->Hnext->Hprev = pp;
+    else
+        histTail = pp;                  /* we must have been last */
+    if (hp == histMerg)			/* deleting this hint from list */
+	histMerg = NULL;
+    assert(histCount > 0);
+    histCount--;
+}
+
+/* Prune length of history list to specified size by history variable. */
+PG_STATIC void
+discardExcess(int histlen)
 {
     struct Hist *hp, *np;
+    if (histTail == NULL) {
+        assert(histCount == 0);
+        return;                         /* no entries on history list */
+    }
+    /* Prune dummy entries from the front, then old entries from the back. If
+     * the list is still too long scan the whole list as before.  But only do a
+     * full scan if the list is more than 6% (1/16th) too long. */
+    while (histCount > (unsigned)histlen && (np = Histlist.Hnext)) {
+        if (eventno - np->Href >= histlen || histlen == 0)
+            hremove(np), hfree(np);
+        else
+            break;
+    }
+    while (histCount > (unsigned)histlen && (np = histTail) != &Histlist) {
+        if (eventno - np->Href >= histlen || histlen == 0)
+            hremove(np), hfree(np);
+        else
+            break;
+    }
+    if (histCount - (histlen >> 4) <= (unsigned)histlen)
+	return;				/* don't bother doing the full scan */
+    for (hp = &Histlist; histCount > (unsigned)histlen &&
+	(np = hp->Hnext) != NULL;)
+        if (eventno - np->Href >= histlen || histlen == 0)
+            hremove(np), hfree(np);
+        else
+            hp = np;
+}
+
+/* Add the command "sp" to the history list. */
+void
+savehist(
+  struct wordent *sp,
+  int mflg)				/* true if -m (merge) specified */
+{
     int histlen = 0;
     Char   *cp;
 
@@ -76,14 +160,445 @@ savehist(struct wordent *sp, int mflg)
 	histlen = histlen * 10 + *cp++ - '0';
     }
     if (sp)
-	(void) enthist(++eventno, sp, 1, mflg);
-    for (hp = &Histlist; (np = hp->Hnext) != NULL;)
-	if (eventno - np->Href >= histlen || histlen == 0)
-	    hp->Hnext = np->Hnext, hfree(np);
-	else
-	    hp = np;
+        (void) enthist(++eventno, sp, 1, mflg, histlen);
+    discardExcess(histlen);
+}
+
+#define USE_JENKINS_HASH 1
+/* #define USE_ONE_AT_A_TIME 1 */
+#undef PRIME_LENGTH			/* no need for good HTL */
+
+#ifdef USE_JENKINS_HASH
+#define hashFcnName "lookup3"
+/* From:
+   lookup3.c, by Bob Jenkins, May 2006, Public Domain.
+   "...  You can use this free for any purpose.  It's in
+    the public domain.  It has no warranty."
+   http://burtleburtle.net/bob/hash/index.html
+ */
+
+#define rot(x,k) (((x)<<(k)) | ((x)>>(32-(k))))
+#define mix(a,b,c) \
+{ \
+  a -= c;  a ^= rot(c, 4);  c += b; \
+  b -= a;  b ^= rot(a, 6);  a += c; \
+  c -= b;  c ^= rot(b, 8);  b += a; \
+  a -= c;  a ^= rot(c,16);  c += b; \
+  b -= a;  b ^= rot(a,19);  a += c; \
+  c -= b;  c ^= rot(b, 4);  b += a; \
+}
+#define final(a,b,c) \
+{ \
+  c ^= b; c -= rot(b,14); \
+  a ^= c; a -= rot(c,11); \
+  b ^= a; b -= rot(a,25); \
+  c ^= b; c -= rot(b,16); \
+  a ^= c; a -= rot(c, 4); \
+  b ^= a; b -= rot(a,14); \
+  c ^= b; c -= rot(b,24); \
 }
 
+struct hashValue		  /* State used to hash a wordend word list. */
+{
+    uint32_t a, b, c;
+};
+
+/* Set up the internal state */
+static void
+initializeHash(struct hashValue *h)
+{
+    h->a = h->b = h->c = 0xdeadbeef;
+}
+
+/* This does a partial hash of the Chars in a single word.  For efficiency we
+ * include 3 versions of the code to pack Chars into 32-bit words for the
+ * mixing function. */
+static void
+addWordToHash(struct hashValue *h, const Char *word)
+{
+    uint32_t a = h->a, b = h->b, c = h->c;
+#ifdef SHORT_STRINGS
+#ifdef WIDE_STRINGS
+    assert(sizeof(Char) >= 4);
+    while (1) {
+	unsigned k;
+	if ((k = (uChar)*word++) == 0) break; a += k;
+	if ((k = (uChar)*word++) == 0) break; b += k;
+	if ((k = (uChar)*word++) == 0) break; c += k;
+	mix(a, b, c);
+    }
+#else
+    assert(sizeof(Char) == 2);
+    while (1) {
+	unsigned k;
+	if ((k = (uChar)*word++) == 0) break; a += k;
+	if ((k = (uChar)*word++) == 0) break; a += k << 16;
+	if ((k = (uChar)*word++) == 0) break; b += k;
+	if ((k = (uChar)*word++) == 0) break; b += k << 16;
+	if ((k = (uChar)*word++) == 0) break; c += k;
+	if ((k = (uChar)*word++) == 0) break; c += k << 16;
+	mix(a, b, c);
+    }
+#endif
+#else
+    assert(sizeof(Char) == 1);
+    while (1) {
+	unsigned k;
+	if ((k = *word++) == 0) break; a += k;
+	if ((k = *word++) == 0) break; a += k << 8;
+	if ((k = *word++) == 0) break; a += k << 16;
+	if ((k = *word++) == 0) break; a += k << 24;
+	if ((k = *word++) == 0) break; b += k;
+	if ((k = *word++) == 0) break; b += k << 8;
+	if ((k = *word++) == 0) break; b += k << 16;
+	if ((k = *word++) == 0) break; b += k << 24;
+	if ((k = *word++) == 0) break; c += k;
+	if ((k = *word++) == 0) break; c += k << 8;
+	if ((k = *word++) == 0) break; c += k << 16;
+	if ((k = *word++) == 0) break; c += k << 24;
+	mix(a, b, c);
+    }
+#endif
+    h->a = a, h->b = b, h->c = c;
+}
+
+static void
+addCharToHash(struct hashValue *h, Char ch)
+{
+    /* The compiler (gcc -O2) seems to do a good job optimizing this without
+     * explicitly extracting into local variables. */
+    h->a += (uChar)ch;
+    mix(h->a, h->b, h->c);
+}
+
+static uint32_t
+finalizeHash(struct hashValue *h)
+{
+    uint32_t a = h->a, b = h->b, c = h->c;
+    final(a, b, c);
+    return c;
+}
+
+#elif USE_ONE_AT_A_TIME
+#define hashFcnName "one-at-a-time"
+/* This one is also from Bob Jenkins, but is slower but simpler than lookup3.
+   "...  The code given here are all public domain."
+   http://burtleburtle.net/bob/hash/doobs.html */
+
+#if 0
+ub4
+one_at_a_time(char *key, ub4 len)
+{
+  ub4   hash, i;
+  for (hash=0, i=0; i<len; ++i)
+  {
+    hash += key[i];
+    hash += (hash << 10);
+    hash ^= (hash >> 6);
+  }
+  hash += (hash << 3);
+  hash ^= (hash >> 11);
+  hash += (hash << 15);
+  return (hash & mask);
+}
+#endif
+
+struct hashValue { uint32_t h; };
+static void
+initializeHash(struct hashValue *h)
+{
+    h->h = 0;
+}
+
+static void
+addWordToHash(struct hashValue *h, const Char *word)
+{
+    unsigned k;
+    uint32_t hash = h->h;
+    while (k = (uChar)*word++)
+	hash += k, hash += hash << 10, hash ^= hash >> 6;
+    h->h = hash;
+}
+
+static void
+addCharToHash(struct hashValue *h, Char c)
+{
+    Char b[2] = { c, 0 };
+    addWordToHash(h, b);
+}
+
+static uint32_t
+finalizeHash(struct hashValue *h)
+{
+    unsigned hash = h->h;
+    hash += (hash << 3);
+    hash ^= (hash >> 11);
+    hash += (hash << 15);
+    return hash;
+}
+
+#else
+#define hashFcnName "add-mul"
+/* Simple multipy and add hash. */
+#define PRIME_LENGTH 1			/* need "good" HTL */
+struct hashValue { uint32_t h; };
+static void
+initializeHash(struct hashValue *h)
+{
+    h->h = 0xe13e2345;
+}
+
+static void
+addWordToHash(struct hashValue *h, const Char *word)
+{
+    unsigned k;
+    uint32_t hash = h->h;
+    while (k = (uChar)*word++)
+	hash = hash * 0x9e4167b9 + k;
+    h->h = hash;
+}
+
+static void
+addCharToHash(struct hashValue *h, Char c)
+{
+    h->h = h->h * 0x9e4167b9 + (uChar)c;
+}
+
+static uint32_t
+finalizeHash(struct hashValue *h)
+{
+    return h->h;
+}
+#endif
+
+static unsigned
+hashhist(struct wordent *h0)
+{
+    struct hashValue s;
+    struct wordent *firstWord = h0->next;
+    struct wordent *h = firstWord;
+    unsigned hash = 0;
+
+    initializeHash(&s);
+    for (; h != h0; h = h->next) {
+        if (h->word[0] == '\n')
+            break;                      /* don't hash newline */
+        if (h != firstWord)
+            addCharToHash(&s, ' ');	/* space between words */
+	addWordToHash(&s, h->word);
+    }
+    hash = finalizeHash(&s);
+    /* Zero means no hash value, so never return zero as a hash value. */
+    return hash ? hash : 0x7fffffff;	/* prime! */
+}
+
+#if 0
+unsigned
+hashStr(Char *str)
+{
+    struct hashValue s;
+    initializeHash(&s);
+    addWordToHash(&s, str);
+    return finalizeHash(&s);
+}
+#endif
+
+#ifdef PRIME_LENGTH			/* need good HTL */
+#define hash2tableIndex(hash, len) ((hash) % len)
+#else
+#define hash2tableIndex(hash, len) ((hash) & (len-1))
+#endif
+
+/* This code can be enabled to test the above hash functions for speed and
+ * collision avoidance.  The testing is enabled by "occasional" calls to
+ * displayHistStats(), see which. */
+#ifdef DEBUG_HIST
+
+#ifdef BSDTIMES
+static double
+doTiming(int start) {
+    static struct timeval beginTime;
+    if (start) {
+	gettimeofday(&beginTime, NULL);
+	return 0.0;
+    } else {
+	struct timeval now;
+	gettimeofday(&now, NULL);
+	return (now.tv_sec-beginTime.tv_sec) +
+	    (now.tv_usec-beginTime.tv_usec)/1e6;
+    }
+}
+#else
+static double
+doTiming(int start) {
+    USE(start);
+    return 0.0;
+}
+#endif
+
+static void
+generateHashes(int nChars, unsigned nWords, unsigned samples, unsigned *hashes,
+    unsigned length)
+{
+    if (nChars < 1)
+	return;
+    nWords = (nWords < 1) ? 1 : (nWords > 4) ? 4 : nWords;
+    Char *number = xmalloc((nChars+nWords)*sizeof(Char));
+    struct wordent word[4];
+    struct wordent base = { NULL, &word[0], &word[0] };
+    word[0].word = number, word[0].next = &base, word[0].prev = &base;
+    unsigned w = 0;			/* word number */
+    /* Generate multiple words of length 2, 3, 5, then all the rest. */
+    unsigned wBoundaries[4] = { 2-1, 2+3-1, 2+3+5-1, 0 };
+    /* Ensure the last word has at least 4 Chars in it. */
+    while (nWords >= 2 && nChars < (wBoundaries[nWords-2]+1) + 4)
+	nWords--;
+    wBoundaries[nWords-1] = 0xffffffff;	/* don't end word past this point */
+    unsigned i;
+    for (i = 0; i<nChars; i++) {
+	/* In deference to the gawd awful add-mul hash, we won't use the worse
+	 * case here (setting all Chars to 1), but assume mostly (or at least
+	 * initially) ASCII data. */
+	number[i+w] = '!';		/* 0x21 = 33 */
+
+	if (i == wBoundaries[w]) {	/* end a word here and move to next */
+	    w++;			/* next word */
+	    number[i+w] = 0;		/* terminate */
+	    word[w].word = &number[i+w+1];
+	    word[w].next = &base, word[w].prev = &word[w-1];
+	    word[w-1].next = &word[w], base.prev = &word[w];
+	}
+    }
+    /* w is the index of the last word actually created. */
+    number[nChars + w] = 0;		/* terminate last word */
+    unsigned timeLimit = !samples;
+    if (samples == 0)
+	samples = 1000000000;
+    doTiming(1);
+    double sec;
+    for (i = 0; i < samples; i++) {
+	/* increment 4 digit base 255 number; last characters vary fastest */
+	unsigned j = nChars-1 + w;
+	while (1) {
+	    if (++number[j] != 0)
+		break;
+	    /* else reset this digit and proceed to next one */
+	    number[j] = 1;
+	    if (&number[j] <= word[w].word)
+		break;			/* stop at beginning of last word */
+	    j--;
+	}
+	if (word[w].word[0] == '\n')
+	    word[w].word[0]++;		/* suppress newline character */
+	unsigned hash = hashhist(&base);
+	hashes[hash2tableIndex(hash, length)]++;
+	if (timeLimit && (i & 0x3ffff) == 0x3ffff) {
+	    sec = doTiming(0);
+	    if (sec > 10)
+		break;
+	}
+    }
+    if (i >= samples)
+	sec = doTiming(0);
+    else
+	samples = i;			/* number we actually did */
+    if (sec > 0.01) {
+	xprintf("Hash %d (%d Char %u words) with %s: %d nsec/hash, %d mcps\n",
+		samples, nChars, w+1, hashFcnName, (int)((sec/samples)*1e9),
+		(int)((double)samples*nChars/sec/1e6));
+    }
+}
+#endif /* DEBUG_HIST */
+
+#ifdef DEBUG_HIST
+static void
+testHash(void)
+{
+    static const Char STRtestHashTimings[] =
+	{ 't','e','s','t','H','a','s','h','T','i','m','i','n','g','s', 0 };
+    struct varent *vp = adrof(STRtestHashTimings);
+    if (vp && vp->vec) {
+	unsigned hashes[4];		/* dummy place to put hashes */
+	Char **vals = vp->vec;
+	while (*vals) {
+	    int length = getn(*vals);
+	    unsigned words =
+		(length < 5) ? 1 : (length < 25) ? 2 : (length < 75) ? 3 : 4;
+	    if (length > 0)
+		generateHashes(length, words, 0, hashes, 4);
+	    vals++;
+	}
+    }
+    unsigned length = 1024;
+#ifdef PRIME_LENGTH			/* need good HTL */
+    length = 1021;
+#endif
+    unsigned *hashes = xmalloc(length*sizeof(unsigned));
+    memset(hashes, 0, length*sizeof(unsigned));
+    /* Compute collision statistics for half full hashes modulo "length". */
+    generateHashes(4, 1, length/2, hashes, length);
+    /* Evaluate collisions by comparing occupancy rates (mean value 0.5).
+     * One bin for each number of hits. */
+    unsigned bins[155];
+    memset(bins, 0, sizeof(bins));
+    unsigned highest = 0;
+    unsigned i;
+    for (i = 0; i<length; i++) {
+	unsigned hits = hashes[i];
+	if (hits >= sizeof(bins)/sizeof(bins[0])) /* clip */
+	    hits = highest = sizeof(bins)/sizeof(bins[0]) - 1;
+	if (hits > highest)
+	    highest = hits;
+	bins[hits]++;
+    }
+    xprintf("Occupancy of %d buckets by %d hashes %d Chars %d word with %s\n",
+	    length, length/2, 4, 1, hashFcnName);
+    for (i = 0; i <= highest; i++) {
+	xprintf(" %d buckets (%d%%) with %d hits\n",
+		bins[i], bins[i]*100/length, i);
+    }
+    /* Count run lengths to evaluate linear rehashing effectiveness.  Estimate
+     * a little corrupted by edge effects. */
+    memset(bins, 0, sizeof(bins));
+    highest = 0;
+    for (i = 0; hashes[i] == 0; i++);	/* find first occupied bucket */
+    unsigned run = 0;
+    unsigned rehashed = 0;
+    for (; i<length; i++) {
+	unsigned hits = hashes[i];
+	if (hits == 0 && rehashed > 0)
+	    hits = 1 && rehashed--;
+	else if (hits > 1)
+	    rehashed += hits-1;
+	if (hits)
+	    run++;
+	else {
+	    /* a real free slot, count it */
+	    if (run >= sizeof(bins)/sizeof(bins[0])) /* clip */
+		run = highest = sizeof(bins)/sizeof(bins[0]) - 1;
+	    if (run > highest)
+		highest = run;
+	    bins[run]++;
+	    run = 0;
+	}
+    }
+    /* Ignore the partial run at end as we ignored the beginning. */
+    double merit = 0.0, entries = 0;
+    for (i = 0; i <= highest; i++) {
+	entries += bins[i]*i;		/* total hashed objects */
+	merit += bins[i]*i*i;
+    }
+    xprintf("Rehash collision figure of merit %u (ideal=100), run lengths:\n",
+	    (int)(100.0*merit/entries));
+    for (i = 0; i <= highest; i++) {
+	if (bins[i] != 0)
+	    xprintf(" %d runs of length %d buckets\n", bins[i], i);
+    }
+    xfree(hashes);
+}
+#endif /* DEBUG_HIST */
+
+/* Compares two word lists for equality. */
 static int
 heq(const struct wordent *a0, const struct wordent *b0)
 {
@@ -98,40 +613,362 @@ heq(const struct wordent *a0, const struct wordent *b0)
 	    return (b == b0) ? 1 : 0;
 	if (b == b0)
 	    return 0;
-    } 
+    }
+}
+
+/* Renumber entries following p, which we will be deleting. */
+PG_STATIC void
+renumberHist(struct Hist *p)
+{
+    int n = p->Href;
+    while ((p = p->Hnext))
+        p->Href = n--;
+}
+
+/* The hash table is implemented as an array of pointers to Hist entries.  Each
+ * entry is located in the table using hash2tableIndex() and checking the
+ * following entries in case of a collision (linear rehash).  Free entries in
+ * the table are zero (0, NULL, emptyHTE).  Deleted entries that cannot yet be
+ * freed are set to one (deletedHTE).  The Hist.Hhash member is non-zero iff
+ * the entry is in the hash table.  When the hash table get too full, it is
+ * reallocated to be approximately twice the history length (see
+ * getHashTableSize). */
+static struct Hist **histHashTable = NULL;
+static unsigned histHashTableLength = 0; /* number of Hist pointers in table */
+
+static struct Hist * const emptyHTE = NULL;
+static struct Hist * const deletedHTE = (struct Hist *)1;
+
+static struct {
+    unsigned insertCount;
+    unsigned removeCount;
+    unsigned rehashes;
+    int deleted;
+} hashStats;
+
+#ifdef DEBUG_HIST
+void
+checkHistHashTable(int print)
+{
+    unsigned occupied = 0;
+    unsigned deleted = 0;
+    unsigned i;
+    for (i = 0; i<histHashTableLength; i++)
+	if (histHashTable[i] == emptyHTE)
+	    continue;
+	else if (histHashTable[i] == deletedHTE)
+	    deleted++;
+	else
+	    occupied++;
+    if (print)
+	xprintf("  found len %u occupied %u deleted %u\n",
+		histHashTableLength, occupied, deleted);
+    assert(deleted == hashStats.deleted);
+}
+
+static int doneTest = 0;
+
+/* Main entry point for displaying history statistics and hash function
+ * behavior. */
+void
+displayHistStats(const char *reason)
+{
+    /* Just hash statistics for now. */
+    xprintf("%s history hash table len %u count %u (deleted %d)\n", reason,
+	    histHashTableLength, histCount, hashStats.deleted);
+    xprintf("  inserts %u rehashes %u%% each\n",
+	    hashStats.insertCount,
+	    (hashStats.insertCount
+	     ? 100*hashStats.rehashes/hashStats.insertCount : 0));
+    xprintf("  removes %u net %u\n",
+	    hashStats.removeCount,
+	    hashStats.insertCount - hashStats.removeCount);
+    assert(hashStats.insertCount >= hashStats.removeCount);
+    checkHistHashTable(1);
+    memset(&hashStats, 0, sizeof(hashStats));
+    if (!doneTest) {
+	testHash();
+	doneTest = 1;
+    }
+}
+#else
+void
+displayHistStats(const char *reason)
+{
+    USE(reason);
+}
+#endif
+
+static void
+discardHistHashTable(void)
+{
+    if (histHashTable == NULL)
+        return;
+    displayHistStats("Discarding");
+    xfree(histHashTable);
+    histHashTable = NULL;
+}
+
+/* Computes a new hash table size, when the current one is too small. */
+static unsigned
+getHashTableSize(int histlen)
+{
+    unsigned target = histlen * 2;
+    unsigned e = 5;
+    unsigned size;
+    while ((size = 1<<e) < target)
+	e++;
+#ifdef PRIME_LENGTH			/* need good HTL */
+    /* Not all prime, but most are and none have factors smaller than 11. */
+    return size+15;
+#else
+    assert((size & (size-1)) == 0);	/* must be a power of two */
+    return size;
+#endif
+}
+
+/* Create the hash table or resize, if necessary. */
+static void
+createHistHashTable(int histlen)
+{
+    if (histlen == 0) {
+	discardHistHashTable();
+        return;
+    }
+    if (histlen < 0) {
+        histlen = getn(varval(STRhistory));
+	if (histlen == 0)
+	    return;			/* no need for hash table */
+	assert(histlen > 0);
+    }
+    if (histHashTable != NULL) {
+	if (histCount < histHashTableLength * 3 / 4)
+	    return;			/* good enough for now */
+	discardHistHashTable();		/* too small */
+    }
+    histHashTableLength = getHashTableSize(
+	histlen > (int)histCount ? histlen : (int)histCount);
+    histHashTable = xmalloc(histHashTableLength * sizeof(struct Hist *));
+    memset(histHashTable, 0, histHashTableLength * sizeof(struct Hist *));
+    assert(histHashTable[0] == emptyHTE);
+
+    /* Now insert all the entries on the history list into the hash table. */
+    {
+        struct Hist *hp;
+        for (hp = &Histlist; (hp = hp->Hnext) != NULL;) {
+            unsigned lpHash = hashhist(&hp->Hlex);
+            assert(!hp->Hhash || hp->Hhash == lpHash);
+            hp->Hhash = 0;              /* force insert to new hash table */
+            insertHistHashTable(hp, lpHash);
+        }
+    }
+}
+
+/* Insert np into the hash table.  We assume that np is already on the
+ * Histlist.  The specified hashval matches the new Hist entry but has not yet
+ * been assigned to Hhash (or the element is already on the hash table). */
+static void
+insertHistHashTable(struct Hist *np, unsigned hashval)
+{
+    unsigned rehashes = 0;
+    unsigned hi = 0;
+    if (!histHashTable)
+	return;
+    if (np->Hhash != 0) {
+        /* already in hash table */
+        assert(hashval == np->Hhash);
+        return;
+    }
+    assert(np != deletedHTE);
+    /* Find a free (empty or deleted) slot, using linear rehash. */
+    assert(histHashTable);
+    for (rehashes = 0;
+         ((hi = hash2tableIndex(hashval + rehashes, histHashTableLength)),
+          histHashTable[hi] != emptyHTE && histHashTable[hi] != deletedHTE);
+         rehashes++) {
+        assert(np != histHashTable[hi]);
+        if (rehashes >= histHashTableLength / 10) {
+            /* Hash table is full, so grow it.  We assume the create function
+             * will roughly double the size we give it.  Create initializes the
+             * new table with everything on the Histlist, so we are done when
+             * it returns.  */
+#ifdef DEBUG_HIST
+	    xprintf("Growing history hash table from %d ...",
+		histHashTableLength);
+	    flush();
+#endif
+            discardHistHashTable();
+            createHistHashTable(histHashTableLength);
+#ifdef DEBUG_HIST
+	    xprintf("to %d.\n", histHashTableLength);
+#endif
+            return;
+        }
+    }
+    /* Might be sensible to grow hash table if rehashes is "too big" here. */
+    if (histHashTable[hi] == deletedHTE)
+	hashStats.deleted--;
+    histHashTable[hi] = np;
+    np->Hhash = hashval;
+    hashStats.insertCount++;
+    hashStats.rehashes += rehashes;
+}
+
+/* Remove the 'np' entry from the hash table. */
+static void
+removeHistHashTable(struct Hist *np)
+{
+    unsigned hi = np->Hhash;
+    if (!histHashTable || !hi)
+        return;                         /* no hash table or not on it */
+    /* find desired entry */
+    while ((hi = hash2tableIndex(hi, histHashTableLength)),
+           histHashTable[hi] != emptyHTE) {
+        if (np == histHashTable[hi]) {
+	    unsigned i;
+	    unsigned deletes = 0;
+	    histHashTable[hi] = deletedHTE; /* dummy, but non-zero entry */
+	    /* now peek ahead to see if the dummies are really necessary. */
+	    i = 1;
+	    while (histHashTable[hash2tableIndex(hi+i, histHashTableLength)] ==
+		   deletedHTE)
+		i++;
+	    if (histHashTable[hash2tableIndex(hi+i, histHashTableLength)] ==
+		emptyHTE) {
+		/* dummies are no longer necessary placeholders. */
+		deletes = i;
+		while (i-- > 0) {
+		    histHashTable[hash2tableIndex(hi+i, histHashTableLength)] =
+			emptyHTE;
+		}
+	    }
+	    hashStats.deleted += 1 - deletes; /* delta deleted entries */
+	    hashStats.removeCount++;
+            return;
+        }
+        hi++;                           /* linear rehash */
+    }
+    assert(!"Hist entry not found in hash table");
 }
 
+/* Search the history hash table for a command matching lp, using hashval as
+ * its hash value. */
+static struct Hist *
+findHistHashTable(struct wordent *lp, unsigned hashval)
+{
+    unsigned deleted = 0;		/* number of deleted entries skipped */
+    unsigned hi = hashval;
+    struct Hist *hp;
+    if (!histHashTable)
+	return NULL;
+    while ((hi = hash2tableIndex(hi, histHashTableLength)),
+           (hp = histHashTable[hi]) != emptyHTE) {
+        if (hp == deletedHTE)
+	    deleted++;
+	else if (hp->Hhash == hashval && heq(lp, &(hp->Hlex)))
+            return hp;
+	if (deleted > (histHashTableLength>>4)) {
+	    /* lots of deletes, so we need a sparser table. */
+            discardHistHashTable();
+            createHistHashTable(histHashTableLength);
+	    return findHistHashTable(lp, hashval);
+	}
+        hi++;                           /* linear rehash */
+    }
+    return NULL;
+}
+
+/* When merge semantics are in use, find the approximate predecessor for the
+ * new entry, so that the Htime entries are decreasing.  Return the entry just
+ * before the first entry with equal times, so the caller can check for
+ * duplicates.  When pTime is not NULL, use it as a starting point for search,
+ * otherwise search from beginning (largest time value) of history list. */
+PG_STATIC struct Hist *
+mergeInsertionPoint(
+    struct Hist *np,                      /* new entry to be inserted */
+    struct Hist *pTime)                   /* hint about where to insert */
+{
+    struct Hist *pp, *p;
+    if (histTail && histTail->Htime >= np->Htime)
+	pTime = histTail;		/* new entry goes at the end */
+    if (histMerg && histMerg != &Histlist && histMerg != Histlist.Hnext) {
+	/* Check above and below previous insertion point, in case we're adding
+	 * sequential times in the middle of the list (e.g. history -M). */
+	if (histMerg->Htime >= np->Htime)
+	    pTime = histMerg;
+	else if (histMerg->Hprev->Htime >= np->Htime)
+	    pTime = histMerg->Hprev;
+    }
+    if (pTime) {
+        /* With hint, search up the list until Htime is greater.  We skip past
+         * the equal ones, too, so our caller can elide duplicates. */
+        pp = pTime;
+        while (pp != &Histlist && pp->Htime <= np->Htime)
+            pp = pp->Hprev;
+    } else
+        pp = &Histlist;
+    /* Search down the list while current entry's time is too large. */
+    while ((p = pp->Hnext) && (p->Htime > np->Htime))
+            pp = p;                     /* advance insertion point */
+    /* Remember recent position as hint for next time */
+    histMerg = pp;
+    return pp;
+}
+
+/* Bubble Hnum & Href in new entry down to pp through earlier part of list. */
+PG_STATIC void bubbleHnumHrefDown(struct Hist *np, struct Hist *pp)
+{
+    struct Hist *p;
+    for (p = Histlist.Hnext; p != pp->Hnext; p = p->Hnext) {
+        /* swap Hnum & Href values of p and np. */
+        int n = p->Hnum, r = p->Href;
+        p->Hnum = np->Hnum; p->Href = np->Href;
+        np->Hnum = n; np->Href = r;
+    }
+}
 
+/* Enter new command into the history list according to current settings. */
 struct Hist *
-enthist(int event, struct wordent *lp, int docopy, int mflg)
+enthist(
+  int event,				/* newly incremented global eventno */
+  struct wordent *lp,
+  int docopy,
+  int mflg,				/* true if merge requested */
+  int histlen)				/* -1 if unknown */
 {
-    struct Hist *p = NULL, *pp = &Histlist;
-    int n, r;
+    struct Hist *p = NULL, *pp = &Histlist, *pTime = NULL;
     struct Hist *np;
     const Char *dp;
-    
+    unsigned lpHash = 0;                /* non-zero if hashing entries */
+
     if ((dp = varval(STRhistdup)) != STRNULL) {
 	if (eq(dp, STRerase)) {
 	    /* masaoki@akebono.tky.hp.com (Kobayashi Masaoki) */
-	    struct Hist *px;
-	    for (p = pp; (px = p, p = p->Hnext) != NULL;)
-		if (heq(lp, &(p->Hlex))){
-		    px->Hnext = p->Hnext;
-		    if (Htime != 0 && p->Htime > Htime)
-			Htime = p->Htime;
-		    n = p->Href;
-		    hfree(p);
-		    for (p = px->Hnext; p != NULL; p = p->Hnext)
-			p->Href = n--;
-		    break;
-		}
+            createHistHashTable(histlen);
+            lpHash = hashhist(lp);
+            assert(lpHash != 0);
+            p = findHistHashTable(lp, lpHash);
+            if (p) {
+		if (Htime != 0 && p->Htime > Htime)
+		    Htime = p->Htime;
+                /* If we are merging, and the old entry is at the place we want
+                 * to insert the new entry, then remember the place. */
+                if (mflg && Htime != 0 && p->Hprev->Htime >= Htime)
+                    pTime = p->Hprev;
+		if (!fastMergeErase)
+		    renumberHist(p);	/* Reset Href of subsequent entries */
+                hremove(p);
+		hfree(p);
+                p = NULL;               /* so new entry is allocated below */
+	    }
 	}
 	else if (eq(dp, STRall)) {
-	    for (p = pp; (p = p->Hnext) != NULL;)
-		if (heq(lp, &(p->Hlex))) {
-		    eventno--;
-		    break;
-		}
+            createHistHashTable(histlen);
+            lpHash = hashhist(lp);
+            assert(lpHash != 0);
+            p = findHistHashTable(lp, lpHash);
+	    if (p)   /* p!=NULL, only update this entry's Htime below */
+		eventno--;		/* not adding a new event */
 	}
 	else if (eq(dp, STRprev)) {
 	    if (pp->Hnext && heq(lp, &(pp->Hnext->Hlex))) {
@@ -149,14 +986,15 @@ enthist(int event, struct wordent *lp, int docopy, int mflg)
 	Htime = 0;
     }
     else
-	(void) time(&(np->Htime));
+        (void) time(&(np->Htime));
 
     if (p == np)
-	return np;
+        return np;                      /* reused existing entry */
 
+    /* Initialize the new entry. */
     np->Hnum = np->Href = event;
     if (docopy) {
-	copylex(&np->Hlex, lp);
+        copylex(&np->Hlex, lp);
 	if (histvalid)
 	    np->histline = Strsave(histline.s);
 	else
@@ -166,46 +1004,127 @@ enthist(int event, struct wordent *lp, int docopy, int mflg)
 	np->Hlex.next = lp->next;
 	lp->next->prev = &np->Hlex;
 	np->Hlex.prev = lp->prev;
-	lp->prev->next = &np->Hlex;
-	np->histline = NULL;
-    }
-    if (mflg)
-      {
-        while ((p = pp->Hnext) && (p->Htime > np->Htime))
-	  pp = p;
-	while (p && p->Htime == np->Htime)
-	  {
-	    if (heq(&p->Hlex, &np->Hlex))
-	      {
-	        eventno--;
-		hfree(np);
-	        return (p);
-	      }
-	    pp = p;
-	    p = p->Hnext;
-	  }
-	for (p = Histlist.Hnext; p != pp->Hnext; p = p->Hnext)
-	  {
-	    n = p->Hnum; r = p->Href;
-	    p->Hnum = np->Hnum; p->Href = np->Href;
-	    np->Hnum = n; np->Href = r;
-	  }
-      }
-    np->Hnext = pp->Hnext;
-    pp->Hnext = np;
+        lp->prev->next = &np->Hlex;
+        np->histline = NULL;
+    }
+    np->Hhash = 0;
+
+    /* The head of history list is the default insertion point.
+       If merging, advance insertion point, in pp, according to Htime. */
+    /* XXX -- In histdup=all, Htime values can be non-monotonic. */
+    if (mflg) {                         /* merge according to np->Htime */
+        pp = mergeInsertionPoint(np, pTime);
+        for (p = pp->Hnext; p && p->Htime == np->Htime; pp = p, p = p->Hnext) {
+            if (heq(&p->Hlex, &np->Hlex)) {
+                eventno--;              /* duplicate, so don't add new event */
+                hfree(np);
+                return (p);
+              }
+          }
+        /* pp is now the last entry with time >= to np. */
+	if (!fastMergeErase) {		/* renumber at end of loadhist */
+	    /* Before inserting np after pp, bubble its Hnum & Href values down
+	     * through the earlier part of list. */
+	    bubbleHnumHrefDown(np, pp);
+	}
+    }
+    else
+        pp = &Histlist;                 /* insert at beginning of history */
+    hinsert(np, pp);
+    if (lpHash && histlen != 0)		/* erase & all modes use hash table */
+        insertHistHashTable(np, lpHash);
+    else
+        discardHistHashTable();
     return (np);
 }
 
 static void
 hfree(struct Hist *hp)
 {
-
+    assert(hp != histMerg);
+    if (hp->Hhash)
+        removeHistHashTable(hp);
     freelex(&hp->Hlex);
     if (hp->histline)
-	xfree(hp->histline);
+        xfree(hp->histline);
     xfree(hp);
 }
 
+PG_STATIC void
+phist(struct Hist *hp, int hflg)
+{
+    if (hflg & HIST_ONLY) {
+	int old_output_raw;
+
+       /*
+        * Control characters have to be written as is (output_raw).
+        * This way one can preserve special characters (like tab) in
+        * the history file.
+        * From: mveksler@vnet.ibm.com (Veksler Michael)
+        */
+	old_output_raw = output_raw;
+        output_raw = 1;
+	cleanup_push(&old_output_raw, output_raw_restore);
+	if (hflg & HIST_TIME)
+	    /* 
+	     * Make file entry with history time in format:
+	     * "+NNNNNNNNNN" (10 digits, left padded with ascii '0') 
+	     */
+
+	    xprintf("#+%010lu\n", (unsigned long)hp->Htime);
+
+	if (HistLit && hp->histline)
+	    xprintf("%S\n", hp->histline);
+	else
+	    prlex(&hp->Hlex);
+        cleanup_until(&old_output_raw);
+    }
+    else {
+	Char   *cp = str2short("%h\t%T\t%R\n");
+	Char *p;
+	struct varent *vp = adrof(STRhistory);
+
+	if (vp && vp->vec != NULL && vp->vec[0] && vp->vec[1])
+	    cp = vp->vec[1];
+
+	p = tprintf(FMT_HISTORY, cp, NULL, hp->Htime, hp);
+	cleanup_push(p, xfree);
+	for (cp = p; *cp;)
+	    xputwchar(*cp++);
+	cleanup_until(p);
+    }
+}
+
+PG_STATIC void
+dophist(int n, int hflg)
+{
+    struct Hist *hp;
+    if (setintr) {
+	int old_pintr_disabled;
+
+	pintr_push_enable(&old_pintr_disabled);
+	cleanup_until(&old_pintr_disabled);
+    }
+    if ((hflg & HIST_REV) == 0) {
+	/* Since the history list is stored most recent first, non-reversing
+	 * print needs to print (backwards) up the list. */
+	if ((unsigned)n >= histCount)
+	    hp = histTail;
+	else {
+	    for (hp = Histlist.Hnext;
+		 --n > 0 && hp->Hnext != NULL;
+		 hp = hp->Hnext)
+		;
+	}
+	if (hp == NULL)
+	    return;			/* nothing to print */
+	for (; hp != &Histlist; hp = hp->Hprev)
+	    phist(hp, hflg);
+    } else {
+	for (hp = Histlist.Hnext; n-- > 0 && hp != NULL; hp = hp->Hnext)
+	    phist(hp, hflg);
+    }
+}
 
 /*ARGSUSED*/
 void
@@ -247,11 +1166,10 @@ dohist(Char **vp, struct command *c)
 		break;
 	    }
     }
-
     if (hflg & HIST_CLEAR) {
-	struct Hist *np, *hp;
-	for (hp = &Histlist; (np = hp->Hnext) != NULL;)
-	    hp->Hnext = np->Hnext, hfree(np);
+        struct Hist *np, *hp;
+        for (hp = &Histlist; (np = hp->Hnext) != NULL;)
+            hremove(np), hfree(np);
     }
 
     if (hflg & (HIST_LOAD | HIST_MERGE))
@@ -264,76 +1182,7 @@ dohist(Char **vp, struct command *c)
 	else {
 	    n = getn(varval(STRhistory));
 	}
-	dohist1(Histlist.Hnext, &n, hflg);
-    }
-}
-
-static void
-dohist1(struct Hist *hp, int *np, int hflg)
-{
-    int    print = (*np) > 0;
-
-    for (; hp != 0; hp = hp->Hnext) {
-	if (setintr) {
-	    int old_pintr_disabled;
-
-	    pintr_push_enable(&old_pintr_disabled);
-	    cleanup_until(&old_pintr_disabled);
-	}
-	(*np)--;
-	if ((hflg & HIST_REV) == 0) {
-	    dohist1(hp->Hnext, np, hflg);
-	    if (print)
-		phist(hp, hflg);
-	    return;
-	}
-	if (*np >= 0)
-	    phist(hp, hflg);
-    }
-}
-
-static void
-phist(struct Hist *hp, int hflg)
-{
-    if (hflg & HIST_ONLY) {
-	int old_output_raw;
-
-       /*
-        * Control characters have to be written as is (output_raw).
-        * This way one can preserve special characters (like tab) in
-        * the history file.
-        * From: mveksler@vnet.ibm.com (Veksler Michael)
-        */
-	old_output_raw = output_raw;
-        output_raw = 1;
-	cleanup_push(&old_output_raw, output_raw_restore);
-	if (hflg & HIST_TIME)
-	    /* 
-	     * Make file entry with history time in format:
-	     * "+NNNNNNNNNN" (10 digits, left padded with ascii '0') 
-	     */
-
-	    xprintf("#+%010lu\n", (unsigned long)hp->Htime);
-
-	if (HistLit && hp->histline)
-	    xprintf("%S\n", hp->histline);
-	else
-	    prlex(&hp->Hlex);
-        cleanup_until(&old_output_raw);
-    }
-    else {
-	Char   *cp = str2short("%h\t%T\t%R\n");
-	Char *p;
-	struct varent *vp = adrof(STRhistory);
-
-	if (vp && vp->vec != NULL && vp->vec[0] && vp->vec[1])
-	    cp = vp->vec[1];
-
-	p = tprintf(FMT_HISTORY, cp, NULL, hp->Htime, hp);
-	cleanup_push(p, xfree);
-	for (cp = p; *cp;)
-	    xputwchar(*cp++);
-	cleanup_until(p);
+	dophist(n, hflg);
     }
 }
 
@@ -371,6 +1220,7 @@ fmthist(int fmt, ptr_t ptr)
     }
 }
 
+/* Save history before exiting the shell. */
 void
 rechist(Char *fname, int ref)
 {
@@ -424,10 +1274,11 @@ rechist(Char *fname, int ref)
     if ((shist = adrof(STRsavehist)) != NULL && shist->vec != NULL)
 	if (shist->vec[1] && eq(shist->vec[1], STRmerge))
 	    loadhist(fname, 1);
+
     fp = xcreat(short2str(fname), 0600);
+    cleanup_until(fname);
     if (fp == -1) {
 	didfds = oldidfds;
-	cleanup_until(fname);
 	return;
     }
     ftmp = SHOUT;
@@ -437,10 +1288,10 @@ rechist(Char *fname, int ref)
     xclose(fp);
     SHOUT = ftmp;
     didfds = oldidfds;
-    cleanup_until(fname);
 }
 
 
+/* This is the entry point for loading history data from a file. */
 void
 loadhist(Char *fname, int mflg)
 {
@@ -455,4 +1306,14 @@ loadhist(Char *fname, int mflg)
 	loadhist_cmd[2] = STRtildothist;
 
     dosource(loadhist_cmd, NULL);
+
+    /* During history merging (enthist sees mflg set), we disable management of
+     * Hnum and Href (because fastMergeErase is true).  So now reset all the
+     * values based on the final ordering of the history list. */
+    if (mflg) {
+	int n = eventno;
+        struct Hist *hp = &Histlist;
+        while ((hp = hp->Hnext))
+	    hp->Hnum = hp->Href = n--;
+    }
 }
author	mp <mp@FreeBSD.org>	2012-02-22 03:36:15 +0000
committer	mp <mp@FreeBSD.org>	2012-02-22 03:36:15 +0000
commit	3ee51a00f36c11a6172d08d787943dfc63f66110 (patch)
tree	522fd2d4d27770566e466a79d636194e5743d94a /contrib/tcsh/sh.hist.c
parent	d177303078ee8f6069218009d6c3c2b6d9d9ca97 (diff)
parent	54c5644df8eb87e7a5b1c4c411e349ac329ee04b (diff)
download	FreeBSD-src-3ee51a00f36c11a6172d08d787943dfc63f66110.zip FreeBSD-src-3ee51a00f36c11a6172d08d787943dfc63f66110.tar.gz