X-Git-Url: http://sru.miketaylor.org.uk/?a=blobdiff_plain;f=index%2Fmod_dom.c;h=a2e83c73b45c337d0371013a31805fefb457c5f7;hb=800fb31d00e78000dd2229231401ee67d03ed78d;hp=fca04eb75ce2c6812a49a48b8af6184080a8a4e2;hpb=7bc692d5bc6971008fc2e1e37d63c080383d6a3e;p=idzebra-moved-to-github.git diff --git a/index/mod_dom.c b/index/mod_dom.c index fca04eb..a2e83c7 100644 --- a/index/mod_dom.c +++ b/index/mod_dom.c @@ -1,4 +1,5 @@ -/* $Id: mod_dom.c,v 1.26 2007-03-03 21:39:10 adam Exp $ + +/* $Id: mod_dom.c,v 1.27 2007-03-05 13:02:11 marc Exp $ Copyright (C) 1995-2007 Index Data ApS @@ -1057,7 +1058,6 @@ static void extract_dom_doc_node(struct filter_info *tinfo, RecWord recword; (*extctr->init)(extctr, &recword); - tinfo->record_info_invoked = 0; process_xml_element_node(tinfo, extctr, &recword, (xmlNodePtr)doc); } @@ -1076,6 +1076,14 @@ static int convert_extract_doc(struct filter_info *tinfo, xsltStylesheetPtr last_xsp = 0; xmlDocPtr store_doc = 0; + /* per default do not ingest record */ + tinfo->record_info_invoked = 0; + + /* exit if empty document given */ + if (!doc) + return RECCTRL_EXTRACT_SKIP; + + /* we actuallu have a document which needs to be processed further */ params[0] = 0; set_param_str(params, "schema", zebra_dom_ns, tinfo->odr_record); @@ -1090,14 +1098,12 @@ static int convert_extract_doc(struct filter_info *tinfo, params, &store_doc, &last_xsp); } + /* saving either store doc or original doc in case no store doc exists */ if (last_xsp) xsltSaveResultToString(&buf_out, &len_out, store_doc ? store_doc : doc, last_xsp); else xmlDocDumpMemory(store_doc ? store_doc : doc, &buf_out, &len_out); - - /* if (p->flagShowRecords) - fwrite(buf_out, len_out, 1, stdout); */ (*p->setStoreData)(p, buf_out, len_out); xmlFree(buf_out); @@ -1108,15 +1114,17 @@ static int convert_extract_doc(struct filter_info *tinfo, /* extract conversion */ perform_convert(tinfo, p, tinfo->extract->convert, params, &doc, 0); + /* finally, do the indexing */ - if (doc) + if (doc){ extract_dom_doc_node(tinfo, p, doc); - - if (doc) xmlFreeDoc(doc); - + } + + /* there was nothing to index, so there is no inserted/updated record */ if (tinfo->record_info_invoked == 0) return RECCTRL_EXTRACT_SKIP; + return RECCTRL_EXTRACT_OK; } @@ -1145,13 +1153,20 @@ static int extract_xml_split(struct filter_info *tinfo, { int type = xmlTextReaderNodeType(input->u.xmlreader.reader); int depth = xmlTextReaderDepth(input->u.xmlreader.reader); + if (type == XML_READER_TYPE_ELEMENT && input->u.xmlreader.split_level == depth) { - xmlNodePtr ptr + /* per default do not ingest record */ + tinfo->record_info_invoked = 0; + + xmlNodePtr ptr = xmlTextReaderExpand(input->u.xmlreader.reader); + if (ptr) - { + { + /* we have a new document */ + xmlNodePtr ptr2 = xmlCopyNode(ptr, 1); xmlDocPtr doc = xmlNewDoc((const xmlChar*) "1.0");