1 /* $Id: test_relevance.c,v 1.9 2007-04-25 07:00:33 marc Exp $
2 Copyright (c) 2006-2007, Index Data.
4 This file is part of Pazpar2.
6 Pazpar2 is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 2, or (at your option) any later
11 Pazpar2 is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 You should have received a copy of the GNU General Public License
17 along with Pazpar2; see the file LICENSE. If not, write to the
18 Free Software Foundation, 59 Temple Place - Suite 330, Boston, MA
28 #include <yaz/timing.h>
35 #include "relevance.h"
40 void test_relevance(int argc, char **argv)
42 NMEM nmem = nmem_create();
45 const char * queryterms[] =
47 // {"ål", "økologi", "æble", 0};
49 //struct record_cluster *cluster = 0;
50 struct conf_service *service = 0;
51 struct reclist *list = 0;
52 struct record *record = 0;
53 //const char *mergekey = "amergekey";
56 struct relevance *rel = 0;
57 //struct client *client = 0;
60 rel = relevance_create(nmem, queryterms, numrecs);
63 list = reclist_create(nmem, numrecs);
66 service = conf_service_create(nmem, 4, 3);
69 YAZ_CHECK(conf_service_add_metadata(nmem, service, 0, "title",
70 Metadata_type_generic, Metadata_merge_unique,
73 YAZ_CHECK(conf_service_add_metadata(nmem, service, 1, "author",
74 Metadata_type_generic, Metadata_merge_longest,
77 YAZ_CHECK(conf_service_add_metadata(nmem, service, 2, "isbn",
78 Metadata_type_number, Metadata_merge_no,
81 YAZ_CHECK(conf_service_add_metadata(nmem, service, 3, "year",
82 Metadata_type_year, Metadata_merge_range,
85 YAZ_CHECK(conf_service_add_sortkey(nmem, service, 0, "relevance",
86 Metadata_sortkey_relevance));
88 YAZ_CHECK(conf_service_add_sortkey(nmem, service, 1, "title",
89 Metadata_sortkey_string));
91 YAZ_CHECK(conf_service_add_sortkey(nmem, service, 2, "year",
92 Metadata_sortkey_numeric));
97 // testing record things
98 record = record_create(nmem, 4, 3);
101 // why on earth do we have a client dangeling from the record ??
102 // record->client = client;
104 char * bla = "blabla";
105 union data_types data_text;
106 data_text.text = bla;
109 union data_types data_num;
110 data_num.number.min = 2;
111 data_num.number.max = 5;
113 struct record_metadata * tmp_md = 0;
114 tmp_md = record_metadata_insert(nmem, &(record->metadata[0]), data_text);
116 tmp_md = record_metadata_insert(nmem, &tmp_md, data_text);
119 YAZ_CHECK(record_add_metadata_field_id(nmem, record, 3, data_num));
120 YAZ_CHECK(record_add_metadata_field_id(nmem, record, 3, data_num));
122 YAZ_CHECK(record_add_metadata(nmem, record, service, "author", data_text));
123 YAZ_CHECK(record_add_metadata(nmem, record, service, "author", data_text));
126 YAZ_CHECK(record_assign_sortkey_field_id(nmem, record, 0, data_text));
127 YAZ_CHECK(record_assign_sortkey_field_id(nmem, record, 1, data_text));
128 YAZ_CHECK(record_assign_sortkey_field_id(nmem, record, 2, data_num));
130 YAZ_CHECK(record_assign_sortkey(nmem, record, service, "relevance", data_text));
131 YAZ_CHECK(record_assign_sortkey(nmem, record, service, "title", data_text));
132 YAZ_CHECK(record_assign_sortkey(nmem, record, service, "year", data_num));
140 // now we need to put some actual data into the record ... how ??
141 // there is a hell of a lot spagetti code in logic.c ingest_record()
142 // line 694 ff snippet from there:
143 // this code needs to be analyzed and the fundamental stuff extracted
146 service->metadata[imeta].name;
147 md = &service->metadata[imeta];
148 if (md->sortkey_offset >= 0)
149 sk = &service->sortkeys[md->sortkey_offset];
152 // Find out where we are putting it if (md->merge == Metadata_merge_no)
153 wheretoput = &res->metadata[imeta];
155 wheretoput = &cluster->metadata[imeta];
159 newm = nmem_malloc(se->nmem, sizeof(struct record_metadata));
161 if (md->type == Metadata_type_generic)
164 for (p = (char *) value; *p && isspace(*p); p++)
166 for (pe = p + strlen(p) - 1;
167 pe > p && strchr(" ,/.:([", *pe); pe--)
169 newm->data.text = nmem_strdup(se->nmem, p);
172 else if (md->type == Metadata_type_year)
174 if (extract_years((char *) value, &first, &last) < 0)
179 yaz_log(YLOG_WARN, "Unknown type in metadata element %s", type);
182 if (md->type == Metadata_type_year && md->merge != Metadata_merge_range)
184 yaz_log(YLOG_WARN, "Only range merging supported for years");
187 if (md->merge == Metadata_merge_unique)
189 struct record_metadata *mnode;
190 for (mnode = *wheretoput; mnode; mnode = mnode->next)
191 if (!strcmp((const char *) mnode->data.text, newm->data.text))
195 newm->next = *wheretoput;
199 else if (md->merge == Metadata_merge_longest)
202 strlen(newm->data.text) > strlen((*wheretoput)->data.text))
207 char *s = nmem_strdup(se->nmem, newm->data.text);
208 if (!cluster->sortkeys[md->sortkey_offset])
209 cluster->sortkeys[md->sortkey_offset] =
210 nmem_malloc(se->nmem, sizeof(union data_types));
211 normalize_mergekey(s,
212 (sk->type == Metadata_sortkey_skiparticle));
213 cluster->sortkeys[md->sortkey_offset]->text = s;
217 else if (md->merge == Metadata_merge_all || md->merge == Metadata_merge_no)
219 newm->next = *wheretoput;
222 else if (md->merge == Metadata_merge_range)
224 assert(md->type == Metadata_type_year);
228 (*wheretoput)->data.number.min = first;
229 (*wheretoput)->data.number.max = last;
231 cluster->sortkeys[md->sortkey_offset] = &newm->data;
235 if (first < (*wheretoput)->data.number.min)
236 (*wheretoput)->data.number.min = first;
237 if (last > (*wheretoput)->data.number.max)
238 (*wheretoput)->data.number.max = last;
241 relevance_countwords(se->relevance, cluster,
242 (char *) value, md->rank);
245 if (md->type == Metadata_type_year)
248 sprintf(year, "%d", last);
249 add_facet(se, (char *) type, year);
252 sprintf(year, "%d", first);
253 add_facet(se, (char *) type, year);
257 add_facet(se, (char *) type, (char *) value);
261 //mergekey_norm = (xmlChar *) nmem_strdup(se->nmem, (char*) mergekey);
262 //normalize_mergekey((char *) mergekey_norm, 0);
266 // insert one record into recordlist/cluster - what's a cluster, exactly??
267 cluster = reclist_insert(list, service, record, (char *)mergekey, &total);
268 relevance_newrec(rel, cluster);
276 //relevance_prepare_read(rel, list);
279 //relevance_donerecord(rel, cluster);
280 // relevance_countwords(se->rel, cluster,
281 // (char *) value, service->metadata->rank);
288 //YAZ_CHECK_EQ(0, 1);
292 int main(int argc, char **argv)
294 YAZ_CHECK_INIT(argc, argv);
298 test_relevance(argc, argv);
310 * indent-tabs-mode: nil
312 * vim: shiftwidth=4 tabstop=8 expandtab