1 /**************************************
4 * A Test Ocaml Driver which calls the C++ methods and
5 * adds a C wrapper interface with OCaml code.
11 /* OCaml memory management */
13 #include <caml/mlvalues.h>
14 #include <caml/alloc.h>
15 #include <caml/memory.h>
16 #include <caml/callback.h>
17 #include <caml/fail.h>
18 #include <caml/custom.h>
23 //#include "TextCollection/TextCollection.h"
24 #include "XMLDocShredder.h"
// Raise an OCaml Failure exception whose message is the what() of C++ exception `e`.
28 #define CAMLRAISECPP(e) (caml_failwith( ((e).what())))
// Raise an OCaml Failure exception with message `s`; used by stubs that are not implemented.
29 #define NOT_IMPLEMENTED(s) (caml_failwith(s))
// Read back the XMLTree* stored in the data area of custom block `x`.
30 #define XMLTREE(x) ((XMLTree *)(* (XMLTree**) Data_custom_val(x)))
// NOTE(review): expands to nothing; no use of it is visible in this part of the file.
31 #define TEXTCOLLECTION(x)
// Convert an OCaml integer value `i` to a native treeNode.
32 #define TREENODEVAL(i) ((treeNode) (Int_val(i)))
// Custom-block operations table passed to caml_alloc_custom for XMLTree wrappers.
35 static struct custom_operations ops;
// NOTE(review): presumably records whether `ops` has been filled in; the code
// that reads or sets this flag is not visible here.
36 static bool initialized = false;
// Finalizer for XMLTree custom blocks; caml_init_ops installs it as ops.finalize.
// NOTE(review): the body is not visible in this excerpt.
38 extern "C" void caml_xml_tree_finalize(value tree){
// Fills in the custom-operations table `ops`: the identifier "XMLTree" and
// caml_xml_tree_finalize as the finalizer.
// NOTE(review): other fields of `ops` may be set on lines not shown here.
43 extern "C" void caml_init_ops () {
47 ops.identifier = (char*) "XMLTree";
48 ops.finalize = caml_xml_tree_finalize;
// Runs an XMLDocShredder on the document named by `uri` and returns the
// resulting XMLTree pointer wrapped in a custom block.
//   uri : OCaml string, passed to the shredder constructor and to processStartDocument.
//   sf  : OCaml int; iet, dtc : OCaml bools; all forwarded to the shredder constructor.
// A std::exception is caught below.
// NOTE(review): the handler body is not visible; presumably it raises through
// CAMLRAISECPP. Confirm, and check that raising from inside the handler does
// not skip C++ cleanup of `shredder`.
53 extern "C" CAMLprim value caml_call_shredder_uri(value uri,value sf, value iet, value dtc){
56 char *fn = String_val(uri);
58 XMLDocShredder shredder(fn,Int_val(sf),Bool_val(iet),Bool_val(dtc));
60 shredder.processStartDocument(fn);
62 shredder.processEndDocument();
64 doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2);
65 tree = (XMLTree *) shredder.storageIfc_->returnDocument();
// Store the raw pointer in the custom block's data area (read back by XMLTREE).
66 memcpy(Data_custom_val(doc),&tree,sizeof(XMLTree*));
69 catch (const std::exception& e){
// Same as caml_call_shredder_uri, but the input is the in-memory OCaml string
// `data`: its buffer and its length (from string_length) are handed to the
// XMLDocShredder constructor, and processStartDocument is called with "".
//   sf : OCaml int; iet, dtc : OCaml bools; all forwarded to the shredder constructor.
// A std::exception is caught below.
// NOTE(review): the handler body is not visible; presumably it raises through
// CAMLRAISECPP. Confirm.
75 extern "C" CAMLprim value caml_call_shredder_string(value data,value sf, value iet, value dtc){
78 unsigned int ln = string_length(data);
79 unsigned char *fn = (unsigned char*) String_val(data);
82 XMLDocShredder shredder(fn,ln,Int_val(sf),Bool_val(iet),Bool_val(dtc));
84 shredder.processStartDocument("");
86 shredder.processEndDocument();
88 doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2);
89 tree = (XMLTree *) shredder.storageIfc_->returnDocument();
// Store the raw pointer in the custom block's data area (read back by XMLTREE).
90 memcpy(Data_custom_val(doc),&tree,sizeof(XMLTree*));
93 catch (const std::exception& e) {
// Recursive walk of `tree` starting at node `id`. For the current node it
// fetches the text before it (PrevText), its own text when it is a leaf
// (MyText), and the text after it when it has no next sibling (NextText),
// then recurses on the first child and on the next sibling.
// NOTE(review): `data` is not used on any visible line, and the condition that
// stops the recursion is on lines not shown here.
101 void traversal_rec(XMLTree* tree, treeNode id){
105 //int tag = tree->Tag(id);
107 tid = tree->PrevText(id);
108 char * data = (char *) (tree->getTextCollection())->GetText(tid);
109 if (tree->IsLeaf(id)){
110 tid = tree->MyText(id);
112 data = (char*) (tree->getTextCollection())->GetText(tid);
115 if (tree->NextSibling(id) == NULLT){
116 tid = tree->NextText(id);
117 data = (char*) (tree->getTextCollection())->GetText(tid);
120 traversal_rec(tree,tree->FirstChild(id));
121 traversal_rec(tree,tree->NextSibling(id));
// OCaml entry point: runs traversal_rec from the root of the wrapped XMLTree
// and returns unit.
125 extern "C" CAMLprim value caml_cpp_traversal(value tree){
127 traversal_rec(XMLTREE(tree),XMLTREE(tree)->Root());
128 CAMLreturn(Val_unit);
// Copies the text that XMLTree::GetText yields for document id `id` into a
// fresh OCaml string.
// NOTE(review): ownership of `txt` is not visible here; confirm whether it must
// be released after caml_copy_string.
131 extern "C" CAMLprim value caml_text_collection_get_text(value tree, value id){
134 uchar* txt = XMLTREE(tree)->GetText((DocID) Int_val(id));
135 str = caml_copy_string((const char*)txt);
// Copies the text that XMLTree::GetCachedText yields for document id `id` into
// a fresh OCaml string.
140 extern "C" CAMLprim value caml_text_collection_get_cached_text(value tree, value id){
143 char* txt = (char*) XMLTREE(tree)->GetCachedText((DocID) Int_val(id));
144 str = caml_copy_string(txt);
// Not implemented: raises Failure "text_collection_size" through
// NOT_IMPLEMENTED, so the CAMLreturn below is never reached.
149 extern "C" CAMLprim value caml_text_collection_size(value tree){
151 // CAMLreturn (Val_int( XMLTREE(tree)->CachedText.size()));
152 NOT_IMPLEMENTED("text_collection_size");
153 CAMLreturn (Val_unit);
// Returns the result of XMLTree::EmptyText for document id `id`, converted
// with Val_int.
158 extern "C" CAMLprim value caml_text_collection_empty_text(value tree,value id){
160 CAMLreturn ( Val_int((XMLTREE(tree))->EmptyText((DocID) Int_val(id))));
163 extern "C" CAMLprim value caml_text_collection_is_contains(value tree,value str){
164 CAMLparam2(tree,str);
165 uchar * cstr = (uchar *) String_val(str);
166 CAMLreturn ( Val_bool((int) XMLTREE(tree)->IsContains(cstr)));
169 extern "C" CAMLprim value caml_text_collection_count_contains(value tree,value str){
170 CAMLparam2(tree,str);
171 uchar * cstr = (uchar *) String_val(str);
172 CAMLreturn (Val_int((XMLTREE(tree)->CountContains(cstr))));
175 extern "C" CAMLprim value caml_text_collection_count(value tree,value str){
176 CAMLparam2(tree,str);
177 uchar * cstr = (uchar *) String_val(str);
178 CAMLreturn (Val_int((XMLTREE(tree)->Count(cstr))));
179 CAMLreturn (Val_unit);
183 extern "C" CAMLprim value caml_text_collection_contains(value tree,value str){
184 CAMLparam2(tree,str);
185 CAMLlocal1(resarray);
186 uchar * cstr = (uchar *) String_val(str);
187 std::vector<DocID> results;
188 results = XMLTREE(tree)->Contains(cstr);
190 resarray = caml_alloc_tuple(results.size());
192 for (unsigned int i=0; i<results.size();i++){
193 caml_initialize(&Field(resarray,i),Val_int(results[i]));
195 CAMLreturn (resarray);
199 extern "C" CAMLprim value caml_xml_tree_root(value tree){
201 CAMLreturn (Val_int(TREENODEVAL(XMLTREE(tree)->Root())));
// Returns the pointer from XMLTree::getTextCollection() cast directly to an
// OCaml value (it is not wrapped in a custom block here).
203 extern "C" CAMLprim value caml_xml_tree_text_collection(value tree){
205 CAMLreturn((value) XMLTREE(tree)->getTextCollection());
// Returns XMLTree::Parent of node `id` as an OCaml int.
207 extern "C" CAMLprim value caml_xml_tree_parent(value tree, value id){
209 CAMLreturn(Val_int (XMLTREE(tree)->Parent(TREENODEVAL(id))));
// Returns XMLTree::PrevSibling of node `id` as an OCaml int.
211 extern "C" CAMLprim value caml_xml_tree_prev_sibling(value tree, value id){
213 CAMLreturn(Val_int (XMLTREE(tree)->PrevSibling(TREENODEVAL(id))));
// Returns XMLTree::ParentNode for document id `id` as an OCaml int.
216 extern "C" CAMLprim value caml_xml_tree_parent_doc(value tree, value id){
218 CAMLreturn(Val_int (XMLTREE(tree)->ParentNode((DocID) Int_val(id))));
// Returns XMLTree::PrevNode for document id `id` as an OCaml int.
221 extern "C" CAMLprim value caml_xml_tree_prev_doc(value tree, value id){
223 CAMLreturn(Val_int (XMLTREE(tree)->PrevNode((DocID) Int_val(id))));
226 extern "C" CAMLprim value caml_xml_tree_is_ancestor(value tree,value id1, value id2) {
227 CAMLparam3(tree,id1,id2);
228 CAMLreturn(Val_bool (XMLTREE(tree)->IsAncestor(TREENODEVAL(id1),TREENODEVAL(id2))));
231 extern "C" CAMLprim value caml_xml_tree_serialize(value tree, value filename){
232 CAMLparam2(tree,filename);
233 NOT_IMPLEMENTED("caml_xml_tree_serialize");
234 CAMLreturn(Val_unit);
237 extern "C" CAMLprim value caml_xml_tree_unserialize(value filename){
238 CAMLparam1(filename);
239 NOT_IMPLEMENTED("caml_xml_tree_unserialize");
240 CAMLreturn(Val_unit);
// Returns XMLTree::FirstChild of node `id` as an OCaml int.
244 extern "C" CAMLprim value caml_xml_tree_first_child(value tree, value id){
246 CAMLreturn(Val_int (XMLTREE(tree)->FirstChild(TREENODEVAL(id))));
// Returns XMLTree::IsLeaf of node `id` as an OCaml bool.
249 extern "C" CAMLprim value caml_xml_tree_is_leaf(value tree, value id){
251 CAMLreturn(Val_bool (XMLTREE(tree)->IsLeaf(TREENODEVAL(id))));
254 extern "C" CAMLprim value caml_xml_tree_tagged_desc(value tree, value id, value tag){
255 CAMLparam3(tree,id,tag);
256 CAMLreturn(Val_int (XMLTREE(tree)->TaggedDesc(TREENODEVAL(id),(TagType) Int_val(tag))));
260 extern "C" CAMLprim value caml_xml_tree_tagged_foll(value tree, value id, value tag){
261 CAMLparam3(tree,id,tag);
262 CAMLreturn(Val_int (XMLTREE(tree)->TaggedFoll(TREENODEVAL(id),(TagType) Int_val(tag))));
264 extern "C" CAMLprim value caml_xml_tree_tagged_foll_below(value tree, value id, value tag,value root){
265 CAMLparam4(tree,id,tag,root);
266 CAMLreturn(Val_int (XMLTREE(tree)->TaggedFollBelow(TREENODEVAL(id),(TagType) Int_val(tag),TREENODEVAL(root))));
// Returns XMLTree::NextSibling of node `id` as an OCaml int.
270 extern "C" CAMLprim value caml_xml_tree_next_sibling(value tree, value id){
272 CAMLreturn(Val_int (XMLTREE(tree)->NextSibling(TREENODEVAL(id))));
// Returns XMLTree::PrevText of node `id` as an OCaml int.
275 extern "C" CAMLprim value caml_xml_tree_prev_text(value tree, value id){
278 CAMLreturn(Val_int((XMLTREE(tree)->PrevText(TREENODEVAL(id)))));
// Returns XMLTree::NextText of node `id` as an OCaml int.
281 extern "C" CAMLprim value caml_xml_tree_next_text(value tree, value id){
283 CAMLreturn(Val_int((XMLTREE(tree)->NextText(TREENODEVAL(id)))));
// Returns XMLTree::MyText of node `id` as an OCaml int.
285 extern "C" CAMLprim value caml_xml_tree_my_text(value tree, value id){
287 CAMLreturn(Val_int((XMLTREE(tree)->MyText(TREENODEVAL(id)))));
// Returns XMLTree::TextXMLId of `id` as an OCaml int.
// NOTE(review): `id` is converted with TREENODEVAL here, whereas other
// text-related stubs convert with (DocID); confirm which type TextXMLId expects.
290 extern "C" CAMLprim value caml_xml_tree_text_xml_id(value tree, value id){
292 CAMLreturn(Val_int((XMLTREE(tree)->TextXMLId(TREENODEVAL(id)))));
// Returns XMLTree::NodeXMLId of node `id` as an OCaml int.
294 extern "C" CAMLprim value caml_xml_tree_node_xml_id(value tree, value id){
296 CAMLreturn(Val_int((XMLTREE(tree)->NodeXMLId(TREENODEVAL(id)))));
// Copies the tag name that XMLTree::GetTagNameByRef yields for tag id `tagid`
// into a fresh OCaml string.
// NOTE(review): the declarations of `tag` and `str` and the return are on lines
// not shown here.
299 extern "C" CAMLprim value caml_xml_tree_tag_name(value tree, value tagid){
300 CAMLparam2(tree,tagid);
303 tag = (char*) XMLTREE(tree)->GetTagNameByRef((TagType) (Int_val(tagid)));
304 str = caml_copy_string((const char*) tag);
// Returns XMLTree::Tag of node `id` as an OCaml int.
309 extern "C" CAMLprim value caml_xml_tree_tag_id(value tree,value id){
311 CAMLreturn (Val_int(XMLTREE(tree)->Tag(TREENODEVAL(id))));
314 extern "C" CAMLprim value caml_xml_tree_subtree_tags(value tree,value id,value tag){
315 CAMLparam3(tree,id,tag);
316 CAMLreturn (Val_int(XMLTREE(tree)->SubtreeTags(TREENODEVAL(id),Int_val(tag))));
// Passes the OCaml string `str` to XMLTree::RegisterTag and stores the result,
// converted with Val_int, in `id`.
// NOTE(review): the declarations of `tag` and `id` and the return are on lines
// not shown here.
320 extern "C" CAMLprim value caml_xml_tree_register_tag(value tree,value str){
321 CAMLparam2(tree,str);
324 tag = (unsigned char*) (String_val(str));
325 id = Val_int(XMLTREE(tree)->RegisterTag(tag));
// NOTE(review): body not visible in this excerpt; presumably returns the NULLT
// node constant as an OCaml int. Confirm.
329 extern "C" CAMLprim value caml_xml_tree_nullt(value unit){
334 extern "C" CAMLprim value caml_xml_tree_save(value tree,value filename){
335 CAMLparam2(tree,filename);
336 XMLTREE(tree)->Save((unsigned char *) String_val(filename));
337 CAMLreturn (Val_unit);
// Calls XMLTree::Load with the buffer of OCaml string `filename` and the OCaml
// int `samplerate`, then wraps the returned pointer in a custom block
// allocated with `ops`.
// NOTE(review): the declarations of `tree` and `doc` and the return are on
// lines not shown here.
340 extern "C" CAMLprim value caml_xml_tree_load(value filename,value samplerate){
341 CAMLparam2(filename,samplerate);
344 tree = XMLTree::Load((unsigned char *) String_val(filename),Int_val(samplerate));
346 doc = caml_alloc_custom(&ops,sizeof(XMLTree*),1,2);
// Store the raw pointer in the custom block's data area (read back by XMLTREE).
347 memcpy(Data_custom_val(doc),&tree,sizeof(XMLTree*));
// Shared empty int vector: a single slot holding the value 0. The other
// int-vector stubs keep the length in slot 0.
352 static int caml_empty_vector[] = { 0 };
// Returns the address of caml_empty_vector cast directly to an OCaml value.
355 extern "C" CAMLprim value caml_int_vector_empty(value unit){
357 CAMLreturn ((value) caml_empty_vector);
360 extern "C" CAMLprim value caml_int_vector_length(value vec){
362 CAMLreturn (Val_int( ((int*) caml_empty_vector)[0] ));
364 extern "C" CAMLprim value caml_int_vector_alloc(value len){
366 int * vec = (int *) malloc(sizeof(int)*(Int_val(len)+1));
367 vec[0] = Int_val(len);
368 CAMLreturn ((value) vec);
// Stores Int_val(v) as element `i` of the raw int vector `vec` and returns
// unit. Elements start at slot 1 because caml_int_vector_alloc keeps the length
// in slot 0. No bounds check is performed on the visible lines.
371 extern "C" CAMLprim value caml_int_vector_set(value vec, value i, value v){
374 ((int*) vec)[Int_val(i)+1] = Int_val(v);
375 CAMLreturn (Val_unit);
// View an OCaml value as a raw int* (the int-vector representation).
379 #define VECT(x) ((int*) (x))
// Returns, as an OCaml int, the result of XMLTree::TaggedBelow starting at `node`.
// NOTE(review): the remaining call arguments (presumably derived from `ctags`
// and `dtags`) are on lines not shown here.
380 extern "C" CAMLprim value caml_xml_tree_tagged_below(value tree, value node, value ctags, value dtags){
381 CAMLparam4(tree,node,ctags,dtags);
383 CAMLreturn (Val_int (
384 (XMLTREE(tree)->TaggedBelow(TREENODEVAL(node),
// Returns, as an OCaml int, the result of XMLTree::TaggedNext starting at
// `node`, with `root` converted to a treeNode as the last argument.
// NOTE(review): the middle call arguments (presumably derived from `ctags` and
// `ftags`) are on lines not shown here.
391 extern "C" CAMLprim value caml_xml_tree_tagged_next(value tree, value node, value ctags, value ftags,value root){
392 CAMLparam5(tree,node,ctags,ftags,root);
393 CAMLreturn (Val_int (
394 (XMLTREE(tree)->TaggedNext(TREENODEVAL(node),
399 TREENODEVAL(root)))));
// Returns, as an OCaml int, the result of XMLTree::TaggedDescOnly starting at `node`.
// NOTE(review): the remaining call arguments (presumably derived from `dtags`)
// are on lines not shown here.
402 extern "C" CAMLprim value caml_xml_tree_tagged_desc_only(value tree, value node,value dtags){
403 CAMLparam3(tree,node,dtags);
405 CAMLreturn (Val_int (
406 (XMLTREE(tree)->TaggedDescOnly(TREENODEVAL(node),
// Returns, as an OCaml int, the result of XMLTree::TaggedFollOnly starting at
// `node`, with `root` converted to a treeNode as the last argument.
// NOTE(review): the middle call arguments (presumably derived from `ftags`) are
// on lines not shown here.
411 extern "C" CAMLprim value caml_xml_tree_tagged_foll_only(value tree, value node, value ftags,value root){
412 CAMLparam4(tree,node,ftags,root);
413 CAMLreturn (Val_int (
414 (XMLTREE(tree)->TaggedFollOnly(TREENODEVAL(node),
417 TREENODEVAL(root)))));
// Returns, as an OCaml int, the result of XMLTree::TaggedDescOrFollOnly
// starting at `node`, with `root` converted to a treeNode as the last argument.
// NOTE(review): the middle call arguments (presumably derived from `ftags`) are
// on lines not shown here.
420 extern "C" CAMLprim value caml_xml_tree_tagged_desc_or_foll_only(value tree, value node, value ftags,value root){
421 CAMLparam4(tree,node,ftags,root);
422 CAMLreturn (Val_int (
423 (XMLTREE(tree)->TaggedDescOrFollOnly(TREENODEVAL(node),
426 TREENODEVAL(root)))));
429 extern "C" CAMLprim value caml_xml_tree_doc_ids(value tree, value node){
430 CAMLparam2(tree,node);
432 tuple = caml_alloc_tuple(2);
433 range r = (XMLTREE(tree)->DocIds(TREENODEVAL(node)));
434 caml_initialize(&Field(tuple,0),Val_int(r.min));
435 caml_initialize(&Field(tuple,1),Val_int(r.max));