X-Git-Url: http://git.nguyen.vg/gitweb/?a=blobdiff_plain;f=OCamlDriver.cpp;h=e3b5f445c26efb890aac5c3e8c3932cdc7da6e86;hb=f84dd2f6de7d5da16da729dc2e91cbdeb3585d75;hp=48925b6cb3f117a7a22524acb2a3a3b2c5080a14;hpb=3623eefccfb5fc69e19ad975a3669f51a2a8b276;p=SXSI%2Fxpathcomp.git diff --git a/OCamlDriver.cpp b/OCamlDriver.cpp index 48925b6..e3b5f44 100644 --- a/OCamlDriver.cpp +++ b/OCamlDriver.cpp @@ -15,23 +15,54 @@ extern "C" { #include #include #include +#include + + } //extern C +//#include "TextCollection/TextCollection.h" #include "XMLDocShredder.h" +#include "XMLTree.h" +#include "Utils.h" + #define CAMLRAISECPP(e) (caml_failwith( ((e).what()))) -#define NOT_IMPLEMENTED (caml_failwith("Not Implemented!!!")) +#define NOT_IMPLEMENTED(s) (caml_failwith(s)) +#define XMLTREE(x) ((XMLTree *)(* (XMLTree**) Data_custom_val(x))) +#define TEXTCOLLECTION(x) +#define TREENODEVAL(i) ((treeNode) (Int_val(i))) + +extern "C" { + static struct custom_operations ops; + static bool initialized = false; +} +extern "C" void caml_xml_tree_finalize(value tree){ + delete XMLTREE(tree); + return; +} + +extern "C" void caml_init_ops () { + + if (initialized) + return; + ops.identifier = (char*) "XMLTree"; + ops.finalize = caml_xml_tree_finalize; + return; +} -extern "C" CAMLprim value caml_call_shredder_uri(value uri){ +extern "C" CAMLprim value caml_call_shredder_uri(value uri,value sf, value iet, value dtc){ CAMLparam1(uri); CAMLlocal1(doc); char *fn = String_val(uri); try { - XMLDocShredder shredder(fn); + XMLDocShredder shredder(fn,Int_val(sf),Bool_val(iet),Bool_val(dtc)); + XMLTree * tree; shredder.processStartDocument(fn); shredder.parse(); shredder.processEndDocument(); - doc = (value) shredder.storageIfc_->returnDocument(); - + caml_init_ops(); + doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2); + tree = (XMLTree *) shredder.storageIfc_->returnDocument(); + memcpy(Data_custom_val(doc),&tree,sizeof(XMLTree*)); CAMLreturn(doc); } catch (const std::exception& e){ @@ -40,19 +71,22 @@ extern "C" CAMLprim value caml_call_shredder_uri(value uri){ } -extern "C" CAMLprim value caml_call_shredder_string(value data){ +extern "C" CAMLprim value caml_call_shredder_string(value data,value sf, value iet, value dtc){ CAMLparam1(data); CAMLlocal1(doc); unsigned int ln = string_length(data); unsigned char *fn = (unsigned char*) String_val(data); try { - XMLDocShredder shredder(fn,ln); + XMLDocShredder shredder(fn,ln,Int_val(sf),Bool_val(iet),Bool_val(dtc)); + XMLTree* tree; shredder.processStartDocument(""); shredder.parse(); shredder.processEndDocument(); - doc = (value) shredder.storageIfc_->returnDocument(); - + caml_init_ops(); + doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2); + tree = (XMLTree *) shredder.storageIfc_->returnDocument(); + memcpy(Data_custom_val(doc),&tree,sizeof(XMLTree*)); CAMLreturn(doc); } catch (const std::exception& e) { @@ -60,75 +94,194 @@ extern "C" CAMLprim value caml_call_shredder_string(value data){ }; } +void traversal_rec(XMLTree* tree, treeNode id){ + DocID tid; + if (id == NULLT) + return; + // int tag = tree->Tag(id); + if (id) { + tid = tree->PrevText(id); + char * data = (char *) (tree->getTextCollection())->GetText(tid); + if (tree->IsLeaf(id)){ + tid = tree->MyText(id); + + data = (char*) (tree->getTextCollection())->GetText(tid); + }; + + if (tree->NextSibling(id) == NULLT){ + tid = tree->NextText(id); + data = (char*) (tree->getTextCollection())->GetText(tid); + }; + }; + traversal_rec(tree,tree->FirstChild(id)); + traversal_rec(tree,tree->NextSibling(id)); + return; +} + +extern "C" CAMLprim value caml_cpp_traversal(value tree){ + CAMLparam1(tree); + traversal_rec(XMLTREE(tree),XMLTREE(tree)->Root()); + CAMLreturn(Val_unit); +} + extern "C" CAMLprim value caml_text_collection_get_text(value tree, value id){ CAMLparam2(tree,id); + CAMLlocal1(str); + uchar* txt = XMLTREE(tree)->GetText((DocID) Int_val(id)); + str = caml_copy_string((const char*)txt); + delete (txt); + CAMLreturn (str); +} +extern "C" CAMLprim value caml_text_collection_empty_text(value tree,value id){ + CAMLparam2(tree,id); + CAMLreturn ( Val_int((XMLTREE(tree))->EmptyText((DocID) Int_val(id)))); +} - NOT_IMPLEMENTED; - CAMLreturn (Val_unit); +extern "C" CAMLprim value caml_text_collection_is_contains(value tree,value str){ + CAMLparam2(tree,str); + uchar * cstr = (uchar *) String_val(str); + CAMLreturn ( Val_bool((int) XMLTREE(tree)->IsContains(cstr))); +} + +extern "C" CAMLprim value caml_text_collection_count_contains(value tree,value str){ + CAMLparam2(tree,str); + uchar * cstr = (uchar *) String_val(str); + CAMLreturn (Val_int((XMLTREE(tree)->CountContains(cstr)))); + +} + +extern "C" CAMLprim value caml_text_collection_contains(value tree,value str){ + CAMLparam2(tree,str); + CAMLlocal1(resarray); + uchar * cstr = (uchar *) String_val(str); + std::vector results; + results = XMLTREE(tree)->Contains(cstr); + //free(cstr); + resarray = caml_alloc_tuple(results.size()); + + for (unsigned int i=0; iRoot())); } -extern "C" CAMLprim value caml_xml_tree_text_collection(value tree, value id){ +extern "C" CAMLprim value caml_xml_tree_text_collection(value tree){ + CAMLparam1(tree); + CAMLreturn((value) XMLTREE(tree)->getTextCollection()); +} +extern "C" CAMLprim value caml_xml_tree_parent(value tree, value id){ CAMLparam2(tree,id); - - NOT_IMPLEMENTED; - CAMLreturn (Val_unit); + CAMLreturn(Val_int (XMLTREE(tree)->Parent(TREENODEVAL(id)))); } -extern "C" CAMLprim value caml_xml_tree_next_sibling(value tree, value id){ +extern "C" CAMLprim value caml_xml_tree_parent_doc(value tree, value id){ CAMLparam2(tree,id); + CAMLreturn(Val_int (XMLTREE(tree)->ParentNode((DocID) Int_val(id)))); +} - NOT_IMPLEMENTED; - CAMLreturn (Val_unit); +extern "C" CAMLprim value caml_xml_tree_is_ancestor(value tree,value id1, value id2) { + CAMLparam3(tree,id1,id2); + CAMLreturn(Val_bool (XMLTREE(tree)->IsAncestor(TREENODEVAL(id1),TREENODEVAL(id2)))); +} + +extern "C" CAMLprim value caml_xml_tree_serialize(value tree, value filename){ + CAMLparam2(tree,filename); + NOT_IMPLEMENTED("caml_xml_tree_serialize"); + CAMLreturn(Val_unit); +} + +extern "C" CAMLprim value caml_xml_tree_unserialize(value filename){ + CAMLparam1(filename); + NOT_IMPLEMENTED("caml_xml_tree_unserialize"); + CAMLreturn(Val_unit); } + + extern "C" CAMLprim value caml_xml_tree_first_child(value tree, value id){ CAMLparam2(tree,id); + CAMLreturn(Val_int (XMLTREE(tree)->FirstChild(TREENODEVAL(id)))); +} - NOT_IMPLEMENTED; - CAMLreturn (Val_unit); +extern "C" CAMLprim value caml_xml_tree_is_leaf(value tree, value id){ + CAMLparam2(tree,id); + CAMLreturn(Val_bool (XMLTREE(tree)->IsLeaf(TREENODEVAL(id)))); } -extern "C" CAMLprim value caml_xml_tree_prev_text(value tree, value id){ + +extern "C" CAMLprim value caml_xml_tree_next_sibling(value tree, value id){ CAMLparam2(tree,id); + CAMLreturn(Val_int (XMLTREE(tree)->NextSibling(TREENODEVAL(id)))); +} - NOT_IMPLEMENTED; - CAMLreturn (Val_unit); +extern "C" CAMLprim value caml_xml_tree_prev_text(value tree, value id){ + CAMLparam2(tree,id); + CAMLlocal1(res); + CAMLreturn(Val_int((XMLTREE(tree)->PrevText(TREENODEVAL(id))))); + CAMLreturn(res); } extern "C" CAMLprim value caml_xml_tree_next_text(value tree, value id){ CAMLparam2(tree,id); - - NOT_IMPLEMENTED; - CAMLreturn (Val_unit); + CAMLreturn(Val_int((XMLTREE(tree)->NextText(TREENODEVAL(id))))); } extern "C" CAMLprim value caml_xml_tree_my_text(value tree, value id){ CAMLparam2(tree,id); - - NOT_IMPLEMENTED; - CAMLreturn (Val_unit); + CAMLreturn(Val_int((XMLTREE(tree)->MyText(TREENODEVAL(id))))); } extern "C" CAMLprim value caml_xml_tree_text_xml_id(value tree, value id){ CAMLparam2(tree,id); - - NOT_IMPLEMENTED; - CAMLreturn (Val_unit); + CAMLreturn(Val_int((XMLTREE(tree)->TextXMLId(TREENODEVAL(id))))); } extern "C" CAMLprim value caml_xml_tree_node_xml_id(value tree, value id){ CAMLparam2(tree,id); + CAMLreturn(Val_int((XMLTREE(tree)->NodeXMLId(TREENODEVAL(id))))); +} - NOT_IMPLEMENTED; - CAMLreturn (Val_unit); +extern "C" CAMLprim value caml_xml_tree_tag_name(value tree, value tagid){ + CAMLparam2(tree,tagid); + CAMLlocal1(str); + char* tag; + tag = (char*) XMLTREE(tree)->GetTagNameByRef((TagType) (Int_val(tagid))); + str = caml_copy_string((const char*) tag); + CAMLreturn (str); } -extern "C" CAMLprim value caml_xml_tree_tag(value tree, value id){ - CAMLparam2(tree,id); - NOT_IMPLEMENTED; - CAMLreturn (Val_unit); + +extern "C" CAMLprim value caml_xml_tree_tag_id(value tree,value id){ + CAMLparam2(tree,id); + CAMLreturn (Val_int(XMLTREE(tree)->Tag(TREENODEVAL(id)))); } + +extern "C" CAMLprim value caml_xml_tree_register_tag(value tree,value str){ + CAMLparam2(tree,str); + CAMLlocal1(id); + unsigned char* tag; + tag = (unsigned char*) (String_val(str)); + id = Val_int(XMLTREE(tree)->RegisterTag(tag)); + CAMLreturn (id); +} + extern "C" CAMLprim value caml_xml_tree_nullt(value unit){ CAMLparam1(unit); - CAMLreturn (Val_int(-1)); + CAMLreturn (NULLT); +} +extern "C" CAMLprim value caml_xml_tree_save(value tree,value filename){ + CAMLparam2(tree,filename); + XMLTREE(tree)->Save((unsigned char *) String_val(filename)); + CAMLreturn (Val_unit); +} + +extern "C" CAMLprim value caml_xml_tree_load(value filename,value samplerate){ + CAMLparam2(filename,samplerate); + CAMLlocal1(doc); + XMLTree * tree; + tree = XMLTree::Load((unsigned char *) String_val(filename),Int_val(samplerate)); + caml_init_ops(); + doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2); + memcpy(Data_custom_val(doc),&tree,sizeof(XMLTree*)); + CAMLreturn(doc); }