X-Git-Url: http://jsfdemo.indexdata.com/?a=blobdiff_plain;f=src%2Ftermlists.c;h=ea93130a6c40229bb2b5c9944ecd8c677bc5a0b2;hb=512a11133b1ccc4a44d6e971c8a446865136bb15;hp=fdfc7f0ea81067e27c5defeb3b658afe3f293c93;hpb=ed47c2d4ce54cc225c063f56792ef7bb30705f22;p=pazpar2-moved-to-github.git diff --git a/src/termlists.c b/src/termlists.c index fdfc7f0..ea93130 100644 --- a/src/termlists.c +++ b/src/termlists.c @@ -1,5 +1,5 @@ /* This file is part of Pazpar2. - Copyright (C) 2006-2010 Index Data + Copyright (C) 2006-2012 Index Data Pazpar2 is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free @@ -107,23 +107,25 @@ static void update_highscore(struct termlist *tl, struct termlist_score *t) } } -void termlist_insert(struct termlist *tl, const char *term, int freq) +void termlist_insert(struct termlist *tl, const char *display_term, + const char *norm_term, int freq) { unsigned int bucket; struct termlist_bucket **p; char buf[256], *cp; - if (strlen(term) > 255) + if (strlen(norm_term) > 255) return; - strcpy(buf, term); + strcpy(buf, norm_term); /* chop right */ + /* for (cp = buf + strlen(buf); cp != buf && strchr(",. -", cp[-1]); cp--) cp[-1] = '\0'; - + */ bucket = jenkins_hash((unsigned char *)buf) % tl->hash_size; for (p = &tl->hashtable[bucket]; *p; p = &(*p)->next) { - if (!strcmp(buf, (*p)->term.term)) + if (!strcmp(buf, (*p)->term.norm_term)) { (*p)->term.frequency += freq; update_highscore(tl, &((*p)->term)); @@ -134,7 +136,9 @@ void termlist_insert(struct termlist *tl, const char *term, int freq) { struct termlist_bucket *new = nmem_malloc(tl->nmem, sizeof(struct termlist_bucket)); - new->term.term = nmem_strdup(tl->nmem, buf); + new->term.norm_term = nmem_strdup(tl->nmem, buf); + new->term.display_term = *display_term ? + nmem_strdup(tl->nmem, display_term) : new->term.norm_term; new->term.frequency = freq; new->next = 0; *p = new; @@ -144,8 +148,12 @@ void termlist_insert(struct termlist *tl, const char *term, int freq) static int compare(const void *s1, const void *s2) { - struct termlist_score **p1 = (struct termlist_score**) s1, **p2 = (struct termlist_score **) s2; - return (*p2)->frequency - (*p1)->frequency; + struct termlist_score **p1 = (struct termlist_score **) s1; + struct termlist_score **p2 = (struct termlist_score **) s2; + int d = (*p2)->frequency - (*p1)->frequency; + if (d) + return d; + return strcmp((*p1)->display_term, (*p2)->display_term); } struct termlist_score **termlist_highscore(struct termlist *tl, int *len)