#include <caml/memory.h>
#include <caml/callback.h>
#include <caml/fail.h>
+#include <caml/custom.h>
+
+
} //extern C
+//#include "TextCollection/TextCollection.h"
#include "XMLDocShredder.h"
#include "XMLTree.h"
-#include "TextCollection/TextCollection.h"
#include "Utils.h"
#define CAMLRAISECPP(e) (caml_failwith( ((e).what())))
#define NOT_IMPLEMENTED(s) (caml_failwith(s))
-#define XMLTREE(x) ((XMLTree *)(x))
+#define XMLTREE(x) ((XMLTree *)(* (XMLTree**) Data_custom_val(x)))
#define TEXTCOLLECTION(x)
#define TREENODEVAL(i) ((treeNode) (Int_val(i)))
-extern "C" CAMLprim value caml_call_shredder_uri(value uri){
+extern "C" {
+ static struct custom_operations ops; // operations table handed to caml_alloc_custom for XMLTree custom blocks
+ static bool initialized = false; // guard tested by caml_init_ops before it fills in ops
+}
+/* Custom-block finalizer: destroys the XMLTree whose pointer is stored in
+ * the payload of `tree`. Registered as ops.finalize by caml_init_ops. */
+extern "C" void caml_xml_tree_finalize(value tree){
+  XMLTree *owned = XMLTREE(tree);
+  delete owned;
+}
+
+/* Populates the shared custom_operations table used for XMLTree custom
+ * blocks. Safe to call repeatedly: the table is filled in on the first
+ * call only and later calls return immediately. */
+extern "C" void caml_init_ops () {
+  if (initialized)
+    return;
+  ops.identifier = (char*) "XMLTree";
+  ops.finalize = caml_xml_tree_finalize;
+  /* Spell out the remaining hooks instead of relying on the zero-initialised static. */
+  ops.compare = custom_compare_default;
+  ops.hash = custom_hash_default;
+  ops.serialize = custom_serialize_default;
+  ops.deserialize = custom_deserialize_default;
+  /* Record completion; without this the guard above never short-circuits. */
+  initialized = true;
+}
+
+extern "C" CAMLprim value caml_call_shredder_uri(value uri,value sf, value iet, value dtc){
CAMLparam1(uri);
CAMLlocal1(doc);
char *fn = String_val(uri);
try {
- XMLDocShredder shredder(fn);
+ XMLDocShredder shredder(fn,Int_val(sf),Bool_val(iet),Bool_val(dtc));
+ XMLTree * tree;
shredder.processStartDocument(fn);
shredder.parse();
shredder.processEndDocument();
- doc = (value) shredder.storageIfc_->returnDocument();
-
+ caml_init_ops();
+ doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2);
+ tree = (XMLTree *) shredder.storageIfc_->returnDocument();
+ memcpy(Data_custom_val(doc),&tree,sizeof(XMLTree*));
CAMLreturn(doc);
}
catch (const std::exception& e){
}
-extern "C" CAMLprim value caml_call_shredder_string(value data){
+extern "C" CAMLprim value caml_call_shredder_string(value data,value sf, value iet, value dtc){ // OCaml stub: shreds an in-memory XML string and returns the XMLTree in a custom block
 CAMLparam1(data);
 CAMLlocal1(doc);
 unsigned int ln = string_length(data);
 unsigned char *fn = (unsigned char*) String_val(data); // points into the OCaml string; no copy is made
 try {
- XMLDocShredder shredder(fn,ln);
+ XMLDocShredder shredder(fn,ln,Int_val(sf),Bool_val(iet),Bool_val(dtc));
+ XMLTree* tree;
 shredder.processStartDocument("");
 shredder.parse();
 shredder.processEndDocument();
- doc = (value) shredder.storageIfc_->returnDocument();
-
+ caml_init_ops(); // make sure ops is populated before it is used for allocation
+ doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2); // payload is exactly one XMLTree* slot
+ tree = (XMLTree *) shredder.storageIfc_->returnDocument(); // NOTE(review): if this throws, doc's payload is still uninitialised when the finalizer later runs - confirm
+ memcpy(Data_custom_val(doc),&tree,sizeof(XMLTree*)); // store the pointer where the XMLTREE() macro reads it back
 CAMLreturn(doc);
 }
 catch (const std::exception& e) {
 };
}
-extern "C" CAMLprim value caml_text_collection_get_text(value tc, value id){
- CAMLparam2(tc,id);
+void traversal_rec(XMLTree* tree, treeNode id){ // recursive walk over id, then its first child, then its next sibling
+ DocID tid;
+ if (id == NULLT) // recursion stops at the NULLT sentinel
+ return;
+ // int tag = tree->Tag(id);
+ if (id) { // text lookups are skipped when id is 0
+ tid = tree->PrevText(id);
+ char * data = (char *) (tree->getTextCollection())->GetText(tid); // data is only assigned, never read, in this function
+ if (tree->IsLeaf(id)){
+ tid = tree->MyText(id);
+
+ data = (char*) (tree->getTextCollection())->GetText(tid);
+ };
- const char* txt = (const char*) ((TextCollection*) tc)->GetText((DocID) Int_val(id));
- CAMLreturn (caml_copy_string(txt));
+ if (tree->NextSibling(id) == NULLT){ // no next sibling: also fetch the text given by NextText
+ tid = tree->NextText(id);
+ data = (char*) (tree->getTextCollection())->GetText(tid);
+ };
+ };
+ traversal_rec(tree,tree->FirstChild(id));
+ traversal_rec(tree,tree->NextSibling(id));
+ return;
+}
+
+/* OCaml stub: runs traversal_rec over the wrapped XMLTree, starting from
+ * its root node. Always returns unit. */
+extern "C" CAMLprim value caml_cpp_traversal(value tree){
+  CAMLparam1(tree);
+  XMLTree *doc = XMLTREE(tree);
+  traversal_rec(doc, doc->Root());
+  CAMLreturn(Val_unit);
}
+/* OCaml stub: fetches text `id` from the wrapped XMLTree via GetText and
+ * returns a copy of it as an OCaml string. */
+extern "C" CAMLprim value caml_text_collection_get_text(value tree, value id){
+  CAMLparam2(tree,id);
+  CAMLlocal1(str);
+  const DocID doc_id = (DocID) Int_val(id);
+  uchar *buffer = XMLTREE(tree)->GetText(doc_id);
+  /* Copy into the OCaml heap first; the C++ buffer is released afterwards. */
+  str = caml_copy_string((const char*) buffer);
+  /* NOTE(review): scalar delete kept as in the original; confirm GetText does not allocate with new[]. */
+  delete buffer;
+  CAMLreturn (str);
+}
+/* OCaml stub: forwards to XMLTree::EmptyText for text `id` and returns the
+ * result converted with Val_int. */
+extern "C" CAMLprim value caml_text_collection_empty_text(value tree,value id){
+  CAMLparam2(tree,id);
+  const DocID doc_id = (DocID) Int_val(id);
+  CAMLreturn ( Val_int(XMLTREE(tree)->EmptyText(doc_id)));
+}
+
+/* OCaml stub: passes the bytes of `str` to XMLTree::IsContains and returns
+ * the answer as an OCaml bool. */
+extern "C" CAMLprim value caml_text_collection_is_contains(value tree,value str){
+  CAMLparam2(tree,str);
+  uchar *pattern = (uchar *) String_val(str);
+  const int found = (int) XMLTREE(tree)->IsContains(pattern);
+  CAMLreturn ( Val_bool(found));
+}
+
+/* OCaml stub: passes the bytes of `str` to XMLTree::CountContains and
+ * returns the count as an OCaml int. */
+extern "C" CAMLprim value caml_text_collection_count_contains(value tree,value str){
+  CAMLparam2(tree,str);
+  uchar *pattern = (uchar *) String_val(str);
+  CAMLreturn (Val_int(XMLTREE(tree)->CountContains(pattern)));
+}
+
+/* OCaml stub: passes the bytes of `str` to XMLTree::Contains and returns
+ * the resulting DocIDs as an OCaml block with one int field per result. */
+extern "C" CAMLprim value caml_text_collection_contains(value tree,value str){
+  CAMLparam2(tree,str);
+  CAMLlocal1(resarray);
+  /* The pattern points into the OCaml string, so it must not be freed here. */
+  uchar *pattern = (uchar *) String_val(str);
+  std::vector<DocID> hits;
+  hits = XMLTREE(tree)->Contains(pattern);
+  resarray = caml_alloc_tuple(hits.size());
+  unsigned int slot = 0;
+  while (slot < hits.size()){
+    caml_initialize(&Field(resarray,slot),Val_int(hits[slot]));
+    ++slot;
+  }
+  CAMLreturn (resarray);
+}
+
+
extern "C" CAMLprim value caml_xml_tree_root(value tree){ // OCaml stub: returns the result of XMLTree::Root for the wrapped tree
 CAMLparam1(tree);
 CAMLreturn (TREENODEVAL(XMLTREE(tree)->Root())); // NOTE(review): TREENODEVAL applies Int_val, while the other node-returning stubs wrap with Val_int - confirm this is intended
}
extern "C" CAMLprim value caml_xml_tree_text_collection(value tree){ // OCaml stub: exposes the wrapped tree's text collection
 CAMLparam1(tree);
- CAMLreturn((value) XMLTREE(tree)->GetTextCollection());
+ CAMLreturn((value) XMLTREE(tree)->getTextCollection()); // the getter's result is cast straight to value, not wrapped in a custom block
+}
+/* OCaml stub: forwards node `id` to XMLTree::Parent and returns the result
+ * as an OCaml int. */
+extern "C" CAMLprim value caml_xml_tree_parent(value tree, value id){
+  CAMLparam2(tree,id);
+  const treeNode node = TREENODEVAL(id);
+  CAMLreturn(Val_int (XMLTREE(tree)->Parent(node)));
+}
+/* OCaml stub: forwards text identifier `id` to XMLTree::ParentNode and
+ * returns the result as an OCaml int. */
+extern "C" CAMLprim value caml_xml_tree_parent_doc(value tree, value id){
+  CAMLparam2(tree,id);
+  const DocID doc_id = (DocID) Int_val(id);
+  CAMLreturn(Val_int (XMLTREE(tree)->ParentNode(doc_id)));
+}
+
+/* OCaml stub: forwards (id1, id2) to XMLTree::IsAncestor and returns the
+ * answer as an OCaml bool. */
+extern "C" CAMLprim value caml_xml_tree_is_ancestor(value tree,value id1, value id2) {
+  CAMLparam3(tree,id1,id2);
+  const treeNode first = TREENODEVAL(id1);
+  const treeNode second = TREENODEVAL(id2);
+  CAMLreturn(Val_bool (XMLTREE(tree)->IsAncestor(first,second)));
}
+/* OCaml stub placeholder: always raises Failure "caml_xml_tree_serialize". */
+extern "C" CAMLprim value caml_xml_tree_serialize(value tree, value filename){
+  CAMLparam2(tree,filename);
+  /* Same call the NOT_IMPLEMENTED macro expands to. */
+  (caml_failwith("caml_xml_tree_serialize"));
+  /* Kept from the original; sits after the raising call. */
+  CAMLreturn(Val_unit);
+}
+
+/* OCaml stub placeholder: always raises Failure "caml_xml_tree_unserialize". */
+extern "C" CAMLprim value caml_xml_tree_unserialize(value filename){
+  CAMLparam1(filename);
+  /* Same call the NOT_IMPLEMENTED macro expands to. */
+  (caml_failwith("caml_xml_tree_unserialize"));
+  /* Kept from the original; sits after the raising call. */
+  CAMLreturn(Val_unit);
+}
+
+
extern "C" CAMLprim value caml_xml_tree_first_child(value tree, value id){
CAMLparam2(tree,id);
CAMLreturn(Val_int (XMLTREE(tree)->FirstChild(TREENODEVAL(id))));
CAMLreturn(Val_bool (XMLTREE(tree)->IsLeaf(TREENODEVAL(id))));
}
+/* OCaml stub: forwards (node, tag) to XMLTree::TaggedDesc and returns the
+ * result as an OCaml int. */
+extern "C" CAMLprim value caml_xml_tree_tagged_desc(value tree, value id, value tag){
+  CAMLparam3(tree,id,tag);
+  const treeNode node = TREENODEVAL(id);
+  const TagType wanted = (TagType) Int_val(tag);
+  CAMLreturn(Val_int (XMLTREE(tree)->TaggedDesc(node,wanted)));
+}
+
+/* OCaml stub: forwards (node, tag) to XMLTree::TaggedNext and returns the
+ * result as an OCaml int. */
+extern "C" CAMLprim value caml_xml_tree_tagged_next(value tree, value id, value tag){
+  CAMLparam3(tree,id,tag);
+  const treeNode node = TREENODEVAL(id);
+  const TagType wanted = (TagType) Int_val(tag);
+  CAMLreturn(Val_int (XMLTREE(tree)->TaggedNext(node,wanted)));
+}
+
+
+
+
+/* OCaml stub: forwards (node, tag) to XMLTree::TaggedFoll and returns the
+ * result as an OCaml int. */
+extern "C" CAMLprim value caml_xml_tree_tagged_foll(value tree, value id, value tag){
+  CAMLparam3(tree,id,tag);
+  const treeNode node = TREENODEVAL(id);
+  const TagType wanted = (TagType) Int_val(tag);
+  CAMLreturn(Val_int (XMLTREE(tree)->TaggedFoll(node,wanted)));
+}
+
+
extern "C" CAMLprim value caml_xml_tree_next_sibling(value tree, value id){
CAMLparam2(tree,id);
CAMLreturn(Val_int (XMLTREE(tree)->NextSibling(TREENODEVAL(id))));
extern "C" CAMLprim value caml_xml_tree_text_xml_id(value tree, value id){ // OCaml stub: forwards to XMLTree::TextXMLId
 CAMLparam2(tree,id);
-
- NOT_IMPLEMENTED("caml_xml_tree_text_xml_id");
- CAMLreturn (Val_unit);
+ CAMLreturn(Val_int((XMLTREE(tree)->TextXMLId(TREENODEVAL(id))))); // replaces the removed not-implemented failure; result is returned as an OCaml int
}
extern "C" CAMLprim value caml_xml_tree_node_xml_id(value tree, value id){ // OCaml stub: forwards to XMLTree::NodeXMLId
 CAMLparam2(tree,id);
+ CAMLreturn(Val_int((XMLTREE(tree)->NodeXMLId(TREENODEVAL(id))))); // replaces the removed not-implemented failure; result is returned as an OCaml int
+}
- NOT_IMPLEMENTED("caml_xml_tree_node_xml_id");
- CAMLreturn (Val_unit);
+/* OCaml stub: looks up tag `tagid` with XMLTree::GetTagNameByRef and
+ * returns a copy of the name as an OCaml string. */
+extern "C" CAMLprim value caml_xml_tree_tag_name(value tree, value tagid){
+  CAMLparam2(tree,tagid);
+  CAMLlocal1(str);
+  const TagType tag_ref = (TagType) (Int_val(tagid));
+  const char *name = (const char*) XMLTREE(tree)->GetTagNameByRef(tag_ref);
+  str = caml_copy_string(name);
+  CAMLreturn (str);
}
-extern "C" CAMLprim value caml_xml_tree_tag(value tree, value id){
- CAMLparam2(tree,id);
- const char* tag;
- tag =(const char*) XMLTREE(tree)->GetTagName(XMLTREE(tree)->Tag(TREENODEVAL(id)));
- CAMLreturn (caml_copy_string(tag));
+
+/* OCaml stub: forwards node `id` to XMLTree::Tag and returns the result as
+ * an OCaml int. */
+extern "C" CAMLprim value caml_xml_tree_tag_id(value tree,value id){
+  CAMLparam2(tree,id);
+  const treeNode node = TREENODEVAL(id);
+  CAMLreturn (Val_int(XMLTREE(tree)->Tag(node)));
+}
+
+/* OCaml stub: forwards (node, tag) to XMLTree::SubtreeTags and returns the
+ * result as an OCaml int. */
+extern "C" CAMLprim value caml_xml_tree_subtree_tags(value tree,value id,value tag){
+  CAMLparam3(tree,id,tag);
+  const treeNode node = TREENODEVAL(id);
+  const int tag_id = Int_val(tag);
+  CAMLreturn (Val_int(XMLTREE(tree)->SubtreeTags(node,tag_id)));
+}
+
+
+/* OCaml stub: passes the bytes of `str` to XMLTree::RegisterTag and
+ * returns the result as an OCaml int. */
+extern "C" CAMLprim value caml_xml_tree_register_tag(value tree,value str){
+  CAMLparam2(tree,str);
+  CAMLlocal1(id);
+  unsigned char *name = (unsigned char*) (String_val(str));
+  id = Val_int(XMLTREE(tree)->RegisterTag(name));
+  CAMLreturn (id);
}
+
extern "C" CAMLprim value caml_xml_tree_nullt(value unit){ // OCaml stub: exposes the NULLT constant to OCaml
 CAMLparam1(unit);
 CAMLreturn (NULLT); // NOTE(review): returned without Val_int, unlike the other stubs - confirm NULLT is already a valid OCaml immediate
}
+
+/* OCaml stub: calls XMLTree::Save on the wrapped tree with the bytes of
+ * `filename`. Returns unit. */
+extern "C" CAMLprim value caml_xml_tree_save(value tree,value filename){
+  CAMLparam2(tree,filename);
+  unsigned char *path = (unsigned char *) String_val(filename);
+  XMLTREE(tree)->Save(path);
+  CAMLreturn (Val_unit);
+}
+
+/* OCaml stub: calls XMLTree::Load with the bytes of `filename` and the
+ * integer `samplerate`, then returns the resulting XMLTree pointer inside
+ * a freshly allocated custom block. */
+extern "C" CAMLprim value caml_xml_tree_load(value filename,value samplerate){
+  CAMLparam2(filename,samplerate);
+  CAMLlocal1(doc);
+  unsigned char *path = (unsigned char *) String_val(filename);
+  XMLTree *loaded = XMLTree::Load(path,Int_val(samplerate));
+  caml_init_ops();
+  doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2);
+  /* Write the pointer into the payload slot that the XMLTREE() macro reads back. */
+  *((XMLTree**) Data_custom_val(doc)) = loaded;
+  CAMLreturn(doc);
+}