1 /**************************************
4 * A test OCaml driver which calls the C++ methods and
5 * exposes them to OCaml code through a C wrapper interface.
11 /* OCaml memory management */
13 #include <caml/mlvalues.h>
14 #include <caml/alloc.h>
15 #include <caml/memory.h>
16 #include <caml/callback.h>
17 #include <caml/fail.h>
18 #include <caml/custom.h>
23 //#include "TextCollection/TextCollection.h"
24 #include "XMLDocShredder.h"
// Raise an OCaml Failure exception whose message is the what() string of the
// C++ exception `e` (expands to caml_failwith).
28 #define CAMLRAISECPP(e) (caml_failwith( ((e).what())))
// Raise an OCaml Failure exception with message `s`; used by the stubs in this
// file that have no implementation yet.
29 #define NOT_IMPLEMENTED(s) (caml_failwith(s))
// Read back the XMLTree* stored in the data area of the custom block `x`.
30 #define XMLTREE(x) ((XMLTree *)(* (XMLTree**) Data_custom_val(x)))
// NOTE(review): expands to nothing, and no use is visible in this excerpt.
31 #define TEXTCOLLECTION(x)
// Convert an OCaml integer value `i` into a C++ treeNode (OCaml -> C direction,
// via Int_val).
32 #define TREENODEVAL(i) ((treeNode) (Int_val(i)))
// Custom-block operations table handed to caml_alloc_custom for XMLTree handles.
35 static struct custom_operations ops;
// NOTE(review): presumably guards one-time setup of `ops`; none of its uses are
// visible in this excerpt -- confirm.
36 static bool initialized = false;
// Finalizer for XMLTree custom blocks; caml_init_ops installs it as ops.finalize.
// NOTE(review): the body is not visible in this excerpt; presumably it releases
// the XMLTree referenced by `tree` -- confirm.
38 extern "C" void caml_xml_tree_finalize(value tree){
// Populate the file-level custom_operations table `ops` used for XMLTree
// handles. The visible assignments set its identifier to "XMLTree" and its
// finalizer to caml_xml_tree_finalize.
// NOTE(review): the remaining fields of `ops` and any use of `initialized` are
// not visible in this excerpt.
43 extern "C" void caml_init_ops () {
47 ops.identifier = (char*) "XMLTree";
48 ops.finalize = caml_xml_tree_finalize;
// OCaml stub: run an XMLDocShredder over the document named by `uri` and wrap
// the resulting XMLTree pointer in a custom block.
//   uri      - OCaml string; passed to the shredder constructor and to
//              processStartDocument.
//   sf       - OCaml int (read with Int_val), forwarded to the constructor.
//   iet, dtc - OCaml bools (read with Bool_val), forwarded to the constructor.
// A std::exception is caught at the end; the handler body is not visible in
// this excerpt.
52 extern "C" CAMLprim value caml_call_shredder_uri(value uri,value sf, value iet, value dtc){
// NOTE(review): recent OCaml headers type String_val as const char*; this
// non-const binding may need adjusting -- confirm against the OCaml version used.
55 char *fn = String_val(uri);
57 XMLDocShredder shredder(fn,Int_val(sf),Bool_val(iet),Bool_val(dtc));
59 shredder.processStartDocument(fn);
61 shredder.processEndDocument();
// Custom block whose data area holds a single XMLTree*; the trailing 1,2 are
// the resource-accounting arguments of caml_alloc_custom.
63 doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2);
64 tree = (XMLTree *) shredder.storageIfc_->returnDocument();
// Store the pointer in the block's data area, where XMLTREE() reads it back.
65 memcpy(Data_custom_val(doc),&tree,sizeof(XMLTree*));
68 catch (const std::exception& e){
// OCaml stub: run an XMLDocShredder over the in-memory buffer held by the
// OCaml string `data` and wrap the resulting XMLTree pointer in a custom block.
//   data     - OCaml string; its bytes and length are passed to the constructor.
//   sf       - OCaml int (read with Int_val), forwarded to the constructor.
//   iet, dtc - OCaml bools (read with Bool_val), forwarded to the constructor.
// A std::exception is caught at the end; the handler body is not visible in
// this excerpt.
74 extern "C" CAMLprim value caml_call_shredder_string(value data,value sf, value iet, value dtc){
// NOTE(review): string_length looks like the unprefixed legacy spelling of
// caml_string_length, which needs the OCaml compatibility names -- confirm.
77 unsigned int ln = string_length(data);
78 unsigned char *fn = (unsigned char*) String_val(data);
81 XMLDocShredder shredder(fn,ln,Int_val(sf),Bool_val(iet),Bool_val(dtc));
// An empty document name is passed because the input is a buffer, not a file.
83 shredder.processStartDocument("");
85 shredder.processEndDocument();
// Custom block whose data area holds a single XMLTree*; the trailing 1,2 are
// the resource-accounting arguments of caml_alloc_custom.
87 doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2);
88 tree = (XMLTree *) shredder.storageIfc_->returnDocument();
// Store the pointer in the block's data area, where XMLTREE() reads it back.
89 memcpy(Data_custom_val(doc),&tree,sizeof(XMLTree*));
92 catch (const std::exception& e) {
// Recursive walk over `tree` starting at node `id`. At each node it looks up
// the preceding text, the node's own text when the node is a leaf, and the
// following text when the node has no next sibling, then recurses into the
// first child and the next sibling.
// The fetched `data` pointers are not used by any line visible here.
// NOTE(review): the termination test (presumably on NULLT) and the declaration
// of `tid` are not visible in this excerpt -- confirm.
97 void traversal_rec(XMLTree* tree, treeNode id){
101 // int tag = tree->Tag(id);
103 tid = tree->PrevText(id);
104 char * data = (char *) (tree->getTextCollection())->GetText(tid);
105 if (tree->IsLeaf(id)){
106 tid = tree->MyText(id);
108 data = (char*) (tree->getTextCollection())->GetText(tid);
// No next sibling: also fetch the text that follows this node.
111 if (tree->NextSibling(id) == NULLT){
112 tid = tree->NextText(id);
113 data = (char*) (tree->getTextCollection())->GetText(tid);
116 traversal_rec(tree,tree->FirstChild(id));
117 traversal_rec(tree,tree->NextSibling(id));
// OCaml stub: run traversal_rec over the whole XMLTree held by `tree`,
// starting from its Root(). Returns unit.
121 extern "C" CAMLprim value caml_cpp_traversal(value tree){
123 traversal_rec(XMLTREE(tree),XMLTREE(tree)->Root());
124 CAMLreturn(Val_unit);
// OCaml stub: fetch the text with document id `id` (OCaml int) from the tree
// and copy it into a fresh OCaml string.
// NOTE(review): caml_copy_string copies the bytes; if GetText returns a buffer
// owned by the caller it should be released afterwards, and a null result
// would need guarding -- confirm GetText's contract.
127 extern "C" CAMLprim value caml_text_collection_get_text(value tree, value id){
130 uchar* txt = XMLTREE(tree)->GetText((DocID) Int_val(id));
131 str = caml_copy_string((const char*)txt);
// OCaml stub: fetch the text with document id `id` (OCaml int) through
// GetCachedText and copy it into a fresh OCaml string.
// NOTE(review): a null result from GetCachedText would need guarding before
// caml_copy_string -- confirm its contract.
136 extern "C" CAMLprim value caml_text_collection_get_cached_text(value tree, value id){
139 char* txt = (char*) XMLTREE(tree)->GetCachedText((DocID) Int_val(id));
140 str = caml_copy_string(txt);
// OCaml stub: not implemented. Always raises an OCaml Failure with the message
// "text_collection_size".
145 extern "C" CAMLprim value caml_text_collection_size(value tree){
147 // CAMLreturn (Val_int( XMLTREE(tree)->CachedText.size()));
148 NOT_IMPLEMENTED("text_collection_size");
// Not reached: caml_failwith does not return.
149 CAMLreturn (Val_unit);
// OCaml stub: return the result of EmptyText for document id `id` (OCaml int),
// encoded with Val_int.
154 extern "C" CAMLprim value caml_text_collection_empty_text(value tree,value id){
156 CAMLreturn ( Val_int((XMLTREE(tree))->EmptyText((DocID) Int_val(id))));
// OCaml stub: pass the OCaml string `str` to IsContains on the tree and return
// the result as an OCaml bool.
159 extern "C" CAMLprim value caml_text_collection_is_contains(value tree,value str){
160 CAMLparam2(tree,str);
161 uchar * cstr = (uchar *) String_val(str);
162 CAMLreturn ( Val_bool((int) XMLTREE(tree)->IsContains(cstr)));
// OCaml stub: pass the OCaml string `str` to CountContains on the tree and
// return the result as an OCaml int.
165 extern "C" CAMLprim value caml_text_collection_count_contains(value tree,value str){
166 CAMLparam2(tree,str);
167 uchar * cstr = (uchar *) String_val(str);
168 CAMLreturn (Val_int((XMLTREE(tree)->CountContains(cstr))));
// OCaml stub: not implemented. Always raises an OCaml Failure with the message
// "text_collection_count".
171 extern "C" CAMLprim value caml_text_collection_count(value tree,value str){
172 CAMLparam2(tree,str);
173 //uchar * cstr = (uchar *) String_val(str);
174 NOT_IMPLEMENTED("text_collection_count");
// Not reached: caml_failwith does not return.
175 CAMLreturn (Val_unit);
// OCaml stub: pass the OCaml string `str` to Contains on the tree and return
// the resulting DocIDs as an OCaml block with one integer field per result.
179 extern "C" CAMLprim value caml_text_collection_contains(value tree,value str){
180 CAMLparam2(tree,str);
181 CAMLlocal1(resarray);
182 uchar * cstr = (uchar *) String_val(str);
183 std::vector<DocID> results;
184 results = XMLTREE(tree)->Contains(cstr);
// Allocate the OCaml block only after the C++ search has finished.
186 resarray = caml_alloc_tuple(results.size());
188 for (unsigned int i=0; i<results.size();i++){
// Each DocID is stored as an immediate OCaml int.
189 caml_initialize(&Field(resarray,i),Val_int(results[i]));
191 CAMLreturn (resarray);
// OCaml stub: return the root node of the tree.
// NOTE(review): the result is wrapped with TREENODEVAL, which expands to
// Int_val (OCaml -> C), whereas sibling stubs such as caml_xml_tree_parent wrap
// their treeNode results with Val_int (C -> OCaml). This looks like it should
// be Val_int -- confirm.
195 extern "C" CAMLprim value caml_xml_tree_root(value tree){
197 CAMLreturn (TREENODEVAL(XMLTREE(tree)->Root()));
// OCaml stub: return the tree's text collection pointer, cast directly to an
// OCaml value.
// NOTE(review): the pointer is not wrapped in a custom block, so the OCaml side
// receives a raw out-of-heap pointer; check this is acceptable for the OCaml
// runtime version in use.
199 extern "C" CAMLprim value caml_xml_tree_text_collection(value tree){
201 CAMLreturn((value) XMLTREE(tree)->getTextCollection());
// OCaml stub: return Parent of node `id` (OCaml int) as an OCaml int.
203 extern "C" CAMLprim value caml_xml_tree_parent(value tree, value id){
205 CAMLreturn(Val_int (XMLTREE(tree)->Parent(TREENODEVAL(id))));
// OCaml stub: return ParentNode of the text with document id `id` (OCaml int)
// as an OCaml int.
207 extern "C" CAMLprim value caml_xml_tree_parent_doc(value tree, value id){
209 CAMLreturn(Val_int (XMLTREE(tree)->ParentNode((DocID) Int_val(id))));
// OCaml stub: return the result of IsAncestor(id1, id2) on the tree as an
// OCaml bool; both ids are OCaml ints converted to treeNode.
212 extern "C" CAMLprim value caml_xml_tree_is_ancestor(value tree,value id1, value id2) {
213 CAMLparam3(tree,id1,id2);
214 CAMLreturn(Val_bool (XMLTREE(tree)->IsAncestor(TREENODEVAL(id1),TREENODEVAL(id2))));
// OCaml stub: not implemented. Always raises an OCaml Failure with the message
// "caml_xml_tree_serialize".
217 extern "C" CAMLprim value caml_xml_tree_serialize(value tree, value filename){
218 CAMLparam2(tree,filename);
219 NOT_IMPLEMENTED("caml_xml_tree_serialize");
// Not reached: caml_failwith does not return.
220 CAMLreturn(Val_unit);
// OCaml stub: not implemented. Always raises an OCaml Failure with the message
// "caml_xml_tree_unserialize".
223 extern "C" CAMLprim value caml_xml_tree_unserialize(value filename){
224 CAMLparam1(filename);
225 NOT_IMPLEMENTED("caml_xml_tree_unserialize");
// Not reached: caml_failwith does not return.
226 CAMLreturn(Val_unit);
// OCaml stub: return FirstChild of node `id` (OCaml int) as an OCaml int.
230 extern "C" CAMLprim value caml_xml_tree_first_child(value tree, value id){
232 CAMLreturn(Val_int (XMLTREE(tree)->FirstChild(TREENODEVAL(id))));
// OCaml stub: return the result of IsLeaf for node `id` (OCaml int) as an
// OCaml bool.
235 extern "C" CAMLprim value caml_xml_tree_is_leaf(value tree, value id){
237 CAMLreturn(Val_bool (XMLTREE(tree)->IsLeaf(TREENODEVAL(id))));
// OCaml stub: return TaggedDesc(id, tag) on the tree as an OCaml int; `id` is
// converted to treeNode and `tag` to TagType.
240 extern "C" CAMLprim value caml_xml_tree_tagged_desc(value tree, value id, value tag){
241 CAMLparam3(tree,id,tag);
242 CAMLreturn(Val_int (XMLTREE(tree)->TaggedDesc(TREENODEVAL(id),(TagType) Int_val(tag))));
// OCaml stub: return TaggedNext(id, tag) on the tree as an OCaml int; `id` is
// converted to treeNode and `tag` to TagType.
245 extern "C" CAMLprim value caml_xml_tree_tagged_next(value tree, value id, value tag){
246 CAMLparam3(tree,id,tag);
247 CAMLreturn(Val_int (XMLTREE(tree)->TaggedNext(TREENODEVAL(id),(TagType) Int_val(tag))));
// OCaml stub: return TaggedFoll(id, tag) on the tree as an OCaml int; `id` is
// converted to treeNode and `tag` to TagType.
253 extern "C" CAMLprim value caml_xml_tree_tagged_foll(value tree, value id, value tag){
254 CAMLparam3(tree,id,tag);
255 CAMLreturn(Val_int (XMLTREE(tree)->TaggedFoll(TREENODEVAL(id),(TagType) Int_val(tag))));
// OCaml stub: return NextSibling of node `id` (OCaml int) as an OCaml int.
259 extern "C" CAMLprim value caml_xml_tree_next_sibling(value tree, value id){
261 CAMLreturn(Val_int (XMLTREE(tree)->NextSibling(TREENODEVAL(id))));
// OCaml stub: return PrevText of node `id` (OCaml int) as an OCaml int.
264 extern "C" CAMLprim value caml_xml_tree_prev_text(value tree, value id){
267 CAMLreturn(Val_int((XMLTREE(tree)->PrevText(TREENODEVAL(id)))));
// OCaml stub: return NextText of node `id` (OCaml int) as an OCaml int.
270 extern "C" CAMLprim value caml_xml_tree_next_text(value tree, value id){
272 CAMLreturn(Val_int((XMLTREE(tree)->NextText(TREENODEVAL(id)))));
// OCaml stub: return MyText of node `id` (OCaml int) as an OCaml int.
274 extern "C" CAMLprim value caml_xml_tree_my_text(value tree, value id){
276 CAMLreturn(Val_int((XMLTREE(tree)->MyText(TREENODEVAL(id)))));
// OCaml stub: return TextXMLId for `id` as an OCaml int.
// NOTE(review): `id` is converted with TREENODEVAL although the name suggests
// a text id -- confirm the expected argument type of TextXMLId.
279 extern "C" CAMLprim value caml_xml_tree_text_xml_id(value tree, value id){
281 CAMLreturn(Val_int((XMLTREE(tree)->TextXMLId(TREENODEVAL(id)))));
// OCaml stub: return NodeXMLId of node `id` (OCaml int) as an OCaml int.
283 extern "C" CAMLprim value caml_xml_tree_node_xml_id(value tree, value id){
285 CAMLreturn(Val_int((XMLTREE(tree)->NodeXMLId(TREENODEVAL(id)))));
// OCaml stub: look up the name of tag `tagid` (OCaml int) with GetTagNameByRef
// and copy it into a fresh OCaml string.
// NOTE(review): a null result from GetTagNameByRef would need guarding before
// caml_copy_string -- confirm its contract.
288 extern "C" CAMLprim value caml_xml_tree_tag_name(value tree, value tagid){
289 CAMLparam2(tree,tagid);
292 tag = (char*) XMLTREE(tree)->GetTagNameByRef((TagType) (Int_val(tagid)));
293 str = caml_copy_string((const char*) tag);
// OCaml stub: return Tag of node `id` (OCaml int) as an OCaml int.
298 extern "C" CAMLprim value caml_xml_tree_tag_id(value tree,value id){
300 CAMLreturn (Val_int(XMLTREE(tree)->Tag(TREENODEVAL(id))));
// OCaml stub: return SubtreeTags(id, tag) on the tree as an OCaml int; `id` is
// converted to treeNode and `tag` is read with Int_val.
303 extern "C" CAMLprim value caml_xml_tree_subtree_tags(value tree,value id,value tag){
304 CAMLparam3(tree,id,tag);
305 CAMLreturn (Val_int(XMLTREE(tree)->SubtreeTags(TREENODEVAL(id),Int_val(tag))));
// OCaml stub: pass the OCaml string `str` to RegisterTag on the tree and keep
// the result, encoded as an OCaml int, in `id`.
// NOTE(review): the declarations of `tag` and `id` and the return statement
// are not visible in this excerpt.
309 extern "C" CAMLprim value caml_xml_tree_register_tag(value tree,value str){
310 CAMLparam2(tree,str);
313 tag = (unsigned char*) (String_val(str));
314 id = Val_int(XMLTREE(tree)->RegisterTag(tag));
// OCaml stub taking a unit argument.
// NOTE(review): the body is not visible in this excerpt; presumably it returns
// the NULLT node constant as an OCaml int -- confirm.
318 extern "C" CAMLprim value caml_xml_tree_nullt(value unit){
// OCaml stub: call Save on the tree with the OCaml string `filename`.
// Returns unit.
323 extern "C" CAMLprim value caml_xml_tree_save(value tree,value filename){
324 CAMLparam2(tree,filename);
325 XMLTREE(tree)->Save((unsigned char *) String_val(filename));
326 CAMLreturn (Val_unit);
329 extern "C" CAMLprim value caml_xml_tree_load(value filename,value samplerate){
330 CAMLparam2(filename,samplerate);
333 tree = XMLTree::Load((unsigned char *) String_val(filename),Int_val(samplerate));
335 doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2);
336 memcpy(Data_custom_val(doc),&tree,sizeof(XMLTree*));