(** Evaluation entry points. Each one takes an automaton ([Ata.t]) and an
    input, and returns a [result_set]. The enclosing signature header is not
    visible in this excerpt. *)

(** [top_down_run auto tree root] evaluates [auto] over [tree] starting from
    the node [root]. *)
9 val top_down_run : Ata.t -> Tree.t -> Tree.node -> result_set
(** [bottom_up_run auto tree (query, pat)] evaluates [auto] over [tree]
    starting from the nodes returned by a full-text query for [pat]. *)
10 val bottom_up_run : Ata.t -> Tree.t -> Compile.text_query * string -> result_set
(** [grammar_run auto g ()] evaluates [auto] over the grammar [g]
    (a [Grammar2.t]) instead of a [Tree.t]. *)
11 val grammar_run : Ata.t -> Grammar2.t -> unit -> result_set
(* Functor producing an implementation of [S] from a result-set JIT module
   [U : ResJIT.S]. The exported [result_set] is exactly [U.NS.t]. *)
15 module Make (U : ResJIT.S) : S with type result_set = U.NS.t =
(* Concrete result-set type, equal to the node-set type of [U]. *)
18 type result_set = U.NS.t;;
(* [eval_form auto s1 s2 f] evaluates the formula [f] against the state set
   [s1] (used for `Left atoms) and [s2] (used for `Right atoms).
   It returns a pair: the resulting formula and a list of ResJIT instructions.
   NOTE(review): the arms below call [loop], whose binding line is not visible
   in this excerpt; presumably a local [let rec loop f = ...] wraps the match. *)
20 let eval_form auto s1 s2 f =
22 match Formula.expr f with
(* Constants and predicates are returned unchanged, with no instruction. *)
23 | Formula.False | Formula.True | Formula.Pred _ -> f, []
(* A `Left atom holds when the polarity [b] equals the membership of [q] in
   [s1]. A LEFT instruction is emitted only for a positive atom whose state
   is one of [auto.topdown_marking_states]. *)
24 | Formula.Atom(`Left, b, q) ->
25 Formula.of_bool (b == (StateSet.mem q s1)),
26 if b && StateSet.mem q auto.topdown_marking_states then [ResJIT.LEFT q] else []
(* Same as the `Left case, but against [s2] and emitting RIGHT. *)
27 | Formula.Atom (`Right, b, q) ->
28 Formula.of_bool(b == (StateSet.mem q s2)),
29 if b && StateSet.mem q auto.topdown_marking_states then [ResJIT.RIGHT q] else []
(* `Epsilon atoms are treated as impossible here: reaching this arm raises
   Assert_failure. *)
30 | Formula.Atom (`Epsilon, _, _) -> assert false
(* Disjunction: both operands are always evaluated (no short-circuit) and
   their instruction lists are concatenated. *)
32 | Formula.Or(f1, f2) ->
33 let b1, i1 = loop f1 in
34 let b2, i2 = loop f2 in
35 Formula.or_pred b1 b2, i1 @ i2
(* Conjunction: same shape as the disjunction, combined with [and_pred]. *)
36 | Formula.And(f1, f2) ->
37 let b1, i1 = loop f1 in
38 let b2, i2 = loop f2 in
39 Formula.and_pred b1 b2, i1 @ i2
(* [eval_trans auto s1 s2 trans] folds over the transitions in [trans],
   starting from [(StateSet.empty, [], [])], and accumulates a triple
   [(a_st, a_op, a_todo)].
   NOTE(review): the line holding the fold call itself, and the header of the
   arm that produces line 52, are not visible in this excerpt. *)
44 let eval_trans auto s1 s2 trans =
46 (fun t ((a_st, a_op, a_todo) as acc)->
(* [q] is the transition state, [m] a flag that adds a SELF instruction below,
   and [f] the formula to evaluate; the second component is ignored. *)
47 let q, _, m, f = Transition.node t in
48 let form, ops = eval_form auto s1 s2 f in
49 match Formula.expr form with
(* Instruction entry for [q]; SELF is prepended when [m] is set. *)
52 (q, (if m then (ResJIT.SELF() :: ops) else ops)):: a_op,
(* A transition whose formula evaluates to False contributes nothing. *)
54 | Formula.False -> acc
(* A residual predicate cannot be decided here: it is recorded in [a_todo]
   together with its state and the instructions to run if it holds. *)
55 | Formula.Pred p -> a_st, a_op,
56 (p.Tree.Predicate.node, q, [(q,(if m then (ResJIT.SELF() :: ops) else ops))]) :: a_todo
58 ) trans (StateSet.empty, [], [])
(* A compiled level-3 operation. Judging from [gen_code], the arguments are:
   the shared empty slot, the left slot, the right slot, the tree and the
   current node; the result is a state set paired with a slot.
   NOTE(review): [t] on this line refers to a type defined before this
   excerpt (it is rebound on the next line) - presumably the slot type. *)
65 type opcode = (t -> t -> t -> Tree.t -> Tree.node -> StateSet.t * t)
(* Three-level cache from integer keys to compiled opcodes. *)
67 type t = opcode Cache.Lvl3.t
(* Sentinel opcode stored in empty cache cells. Callers detect it with
   physical equality; calling it raises Failure. *)
69 let dummy _ _ _ _ _ = failwith "Uninitialized L3JIT"
(* Fresh cache created with size argument 1024 and [dummy] as default value. *)
71 let create () = Cache.Lvl3.create 1024 dummy
(* [find t tlist s1 s2] looks up the opcode cached for the transition list
   [tlist] and the state sets [s1], [s2].
   The key is built from the integer ids, in the order s2, s1, tlist.
   NOTE(review): the line with the actual lookup call is not visible in this
   excerpt; presumably Cache.Lvl3.find on [t]. *)
72 let find t tlist s1 s2 =
74 (Uid.to_int s2.StateSet.Node.id)
75 (Uid.to_int s1.StateSet.Node.id)
76 (Uid.to_int tlist.Translist.Node.id)
(* [add t tlist s1 s2 v] stores [v] in the cache under the same key layout as
   [find]: ids of s2, s1, then tlist.
   NOTE(review): the line with the actual insertion call is not visible in
   this excerpt; presumably Cache.Lvl3.add on [t]. *)
80 let add t tlist s1 s2 v =
82 (Uid.to_int s2.StateSet.Node.id)
83 (Uid.to_int s1.StateSet.Node.id)
84 (Uid.to_int tlist.Translist.Node.id)
(* [compile auto trl s1 s2] turns the transition list [trl], evaluated against
   the state sets [s1] and [s2], into a tuple
   [(res, code, todo_notmarking, todo_code)] bound to [opcode] on the last
   visible line (the final [in opcode] is presumably on a line not shown). *)
87 let compile auto trl s1 s2 =
(* Collect the states mentioned on each side by the formulas of [trl];
   the third component of each half of [Formula.st] is used. *)
88 let orig_s1, orig_s2 =
89 Translist.fold (fun t (a1, a2) ->
90 let _, _, _, f = Transition.node t in
91 let (_, _, fs1), (_, _, fs2) = Formula.st f in
92 (StateSet.union a1 fs1, StateSet.union a2 fs2)
93 ) trl (StateSet.empty, StateSet.empty)
(* Restrict the incoming sets to the states the formulas actually mention. *)
95 let ns1 = StateSet.inter s1 orig_s1
96 and ns2 = StateSet.inter s2 orig_s2 in
97 let res, ops, todo = eval_trans auto ns1 ns2 trl in
98 let code, not_marking = ResJIT.compile ops in
(* Compile the instructions attached to each pending predicate. The boolean
   starts from [not_marking] and is and-ed with the flag of every entry, so it
   stays true only if the main code and all pending entries report true. *)
99 let todo_code, todo_notmarking =
100 List.fold_left (fun (l, b) (p, q, o) -> let c, b' = ResJIT.compile o in
101 (p, q, c)::l, b && b')
102 ([], not_marking) todo
104 let opcode = res, code, todo_notmarking, todo_code in
(* [gen_code auto tlist s1 s2] compiles the transition list and returns a
   closure of type [opcode] specialised on the compilation result. Three
   closures exist: no pending predicate and not marking, no pending predicate
   and marking, and at least one pending predicate.
   Slot emptiness is tested by physical equality with [empty_slot].
   NOTE(review): several lines of each closure (the binding of [sl] and the
   returned pair) are not visible in this excerpt. *)
107 let gen_code auto tlist s1 s2 =
108 let res, code, not_marking, todo_code = compile auto tlist s1 s2 in
(* Physical comparison with the empty list; [] is an immediate value. *)
110 if todo_code == [] then
(* Variant 1: the tree argument is ignored. *)
111 if not_marking then begin fun empty_slot sl1 sl2 _ node ->
112 let slot1_empty = sl1 == empty_slot
113 and slot2_empty = sl2 == empty_slot in
(* Both inputs empty: return [res] with the (empty) right slot untouched. *)
114 if slot1_empty && slot2_empty then res,sl2
(* A fresh slot is obtained by copying the shared empty slot. *)
119 Array.copy empty_slot
123 U.exec sl sl1 sl2 node code;
126 else (* marking *) begin fun empty_slot sl1 sl2 _ node ->
128 if sl2 == empty_slot then
129 if sl1 == empty_slot then
130 Array.copy empty_slot
134 U.exec sl sl1 sl2 node code;
137 else (* todo != [] *)
(* Variant 3: this is the only closure that reads its tree argument. *)
138 begin fun empty_slot sl1 sl2 tree node ->
140 if sl2 == empty_slot then
141 if sl1 == empty_slot then
142 Array.copy empty_slot
146 U.exec sl sl1 sl2 node code;
(* Fold over the pending predicates with [res] as the initial accumulator.
   [p] is a reference to a predicate function applied to the tree and node;
   when it holds, the attached code runs unless it is ResJIT.Nil. *)
148 (fun ares (p, q, code) ->
149 if !p tree node then begin
150 if code != ResJIT.Nil then U.exec sl sl1 sl2 node code;
153 else ares) res todo_code, sl
(* [cache_apply cache auto tlist s1 s2] generates the opcode for
   [(tlist, s1, s2)], records it in [cache] and returns it. A trace message is
   emitted through the TRACE macro before the insertion. *)
159 let cache_apply cache auto tlist s1 s2 =
160 let f = gen_code auto tlist s1 s2 in
161 TRACE("grammar", 2, __ "Inserting: %i, %a, %a\n%!"
162 (Uid.to_int tlist.Translist.Node.id) StateSet.print s1 StateSet.print s2);
163 add cache tlist s1 s2 f; f
(* Macro [LOOP (t, states, ctx)]: visit node [t] with [states] in context
   [ctx]. The expansion refers to [tree], [nil_res] and [cache2], which must
   be in scope at the use site. If the node is Tree.nil the result is
   [nil_res]; otherwise the tag of the node is read and the level-2 opcode
   cached for (tag, states) is passed on.
   NOTE(review): presumably a camlp4 macro definition; the lines binding [_t]
   and naming the function applied on line 178 are not visible in this
   excerpt. *)
166 DEFINE LOOP (t, states, ctx) = (
168 TRACE("top-down-run", 3,
169 __ "Entering node %i with loop (tag %s, context %i) with states %a\n%!"
171 (Tag.to_string (Tree.tag tree _t))
173 (StateSet.print) (states));
174 if _t == Tree.nil then nil_res
176 let tag = Tree.tag tree _t in
178 _t tag (states) (ctx) (L2JIT.find cache2 tag (states))
(* Macro [LOOP_TAG (t, states, tag, ctx)]: same as LOOP, except that the tag
   is supplied by the caller instead of being read from the tree.
   The expansion refers to [nil_res] and [cache2] from the use site.
   NOTE(review): the line naming the function applied on line 192 is not
   visible in this excerpt. *)
181 DEFINE LOOP_TAG (t, states, tag, ctx) = (
182 let _t = (t) in (* to avoid duplicating expression t *)
183 TRACE("top-down-run", 3,
184 __ "Entering node %i with loop_tag (tag %s, context %i) with states %a\n%!"
186 (Tag.to_string (tag))
188 (StateSet.print) (states));
189 if _t == Tree.nil then nil_res
192 _t (tag) (states) (ctx) (L2JIT.find cache2 (tag) (states)))
(* [top_down_run auto tree root states ctx] runs the automaton top-down from
   [root] with the initial state set [states]; [ctx] is forwarded to the
   *_before tree navigation functions and to recursive visits.
   The traversal is driven by two caches: level-2 opcodes chosen per
   (tag, states) and level-3 opcodes chosen per (transition list, s1, s2).
   NOTE(review): many lines of this definition are not visible in this
   excerpt, including the match headers and the final result expression. *)
195 let top_down_run auto tree root states ctx =
(* One slot cell per state index, from 0 up to the largest state. *)
196 let res_len = StateSet.max_elt auto.states + 1 in
(* Shared empty slot. Generated opcodes recognise it by physical equality, and
   the visible code copies it before writing (see the SUBTREE arms).
   NOTE(review): Array.create is the legacy name of Array.make. *)
197 let empty_slot = Array.create res_len U.NS.empty in
(* Result used for absent nodes: bottom states with the shared empty slot. *)
198 let nil_res = auto.bottom_states, empty_slot in
199 let cache3 = L3JIT.create () in
(* Run the level-3 opcode for (trl, s1, s2) on node [t], generating and
   caching it first when the cache still holds the sentinel. *)
201 let l3jit_dispatch trl s1 s2 t sl1 sl2 =
202 let f = L3JIT.find cache3 trl s1 s2 in
203 if f == L3JIT.dummy then (L3JIT.cache_apply cache3 auto trl s1 s2) empty_slot sl1 sl2 tree t
204 else f empty_slot sl1 sl2 tree t
207 let cache2 = L2JIT.create () in
(* Interpret a level-2 opcode for node [t]. *)
210 let rec l2jit_dispatch t tag states ctx opcode =
212 | L2JIT.RETURN -> nil_res
(* Compile the opcode for (tag, states), then dispatch again on it.
   NOTE(review): the arm header for this case is not visible; presumably it
   is the cache-miss case. *)
214 let opcode = L2JIT.compile cache2 auto tree tag states in
215 l2jit_dispatch t tag states ctx opcode
(* LEFT: one sub-run whose context is the closing position of [t]; the right
   side is substituted by bottom states and the empty slot. *)
217 | L2JIT.LEFT (tr_list, instr) ->
219 l2jit_dispatch_instr t tag states (Tree.closing tree t) instr
221 l3jit_dispatch tr_list res1 auto.bottom_states t slot1 empty_slot
(* RIGHT: one sub-run that keeps the incoming context; the left side is
   substituted by bottom states and the empty slot. *)
223 | L2JIT.RIGHT (tr_list, instr) ->
224 let res2, slot2 = l2jit_dispatch_instr t tag states ctx instr in
225 l3jit_dispatch tr_list auto.bottom_states res2 t empty_slot slot2
(* BOTH: the first sub-run is bounded by the closing position of [t], the
   second keeps the incoming context; the two results are then combined. *)
227 | L2JIT.BOTH (tr_list, instr1, instr2) ->
229 l2jit_dispatch_instr t tag states (Tree.closing tree t) instr1
231 let res2, slot2 = l2jit_dispatch_instr t tag states ctx instr2 in
232 l3jit_dispatch tr_list res1 res2 t slot1 slot2
(* Execute one navigation instruction from node [t]: each arm moves to another
   node with the matching Tree function and continues through LOOP or
   LOOP_TAG with the state set carried by the instruction. *)
234 and l2jit_dispatch_instr t tag states ctx instr =
236 | L2JIT.NOP () -> nil_res
237 | L2JIT.FIRST_CHILD s -> LOOP ((Tree.first_child tree t), s, ctx)
238 | L2JIT.NEXT_SIBLING s -> LOOP ((Tree.next_sibling tree t), s, ctx)
240 | L2JIT.FIRST_ELEMENT s -> LOOP ((Tree.first_element tree t), s, ctx)
241 | L2JIT.NEXT_ELEMENT s -> LOOP ((Tree.next_element tree t), s, ctx)
243 | L2JIT.TAGGED_DESCENDANT (s, tag) ->
244 LOOP_TAG ((Tree.tagged_descendant tree t tag), s, tag, ctx)
(* The *_before variants also receive [ctx]. *)
246 | L2JIT.TAGGED_FOLLOWING (s, tag) ->
247 LOOP_TAG((Tree.tagged_following_before tree t tag ctx), s, tag, ctx)
249 | L2JIT.SELECT_DESCENDANT (s, _, us) ->
250 LOOP((Tree.select_descendant tree t us), s, ctx)
(* NOTE(review): [pt] is bound but not used in the visible code; the sibling
   arms use a wildcard in that position. *)
252 | L2JIT.SELECT_FOLLOWING (s, pt, us) ->
253 LOOP ((Tree.select_following_before tree t us ctx), s, ctx)
255 | L2JIT.TAGGED_CHILD (s, tag) ->
256 LOOP_TAG((Tree.tagged_child tree t tag), s, tag, ctx)
258 | L2JIT.TAGGED_FOLLOWING_SIBLING (s, tag) ->
259 LOOP_TAG((Tree.tagged_following_sibling tree t tag), s, tag, ctx)
261 | L2JIT.SELECT_CHILD (s, _, us) ->
262 LOOP ((Tree.select_child tree t us), s, ctx)
264 | L2JIT.SELECT_FOLLOWING_SIBLING (s, _, us) ->
265 LOOP ((Tree.select_following_sibling tree t us), s, ctx)
(* Subtree shortcut: the result set is obtained directly from
   U.NS.subtree_tags and, when not the empty set (physical comparison), stored
   at index [auto.last] of a fresh copy of the empty slot. The returned value
   is on lines not visible in this excerpt. *)
267 | L2JIT.TAGGED_SUBTREE(s, tag) ->
269 let count = U.NS.subtree_tags tree t tag in
270 if count != U.NS.empty then
271 let r = Array.copy empty_slot in
272 r.(auto.last) <- count;
(* Same shortcut for all elements of the subtree, without a tag filter. *)
277 | L2JIT.ELEMENT_SUBTREE(s) ->
279 let count = U.NS.subtree_elements tree t in
280 if count != U.NS.empty then
281 let r = Array.copy empty_slot in
282 r.(auto.last) <- count;
(* Start the traversal at [root]. *)
288 let r = LOOP (root, states, ctx) in
289 (*L3JIT.stats err_formatter cache3; *)
(* [full_top_down_run auto states tree root] runs the five-argument
   [top_down_run] from [root] with [states], using the closing position of
   [root] as context. Note the argument order differs from [top_down_run]. *)
292 let full_top_down_run auto states tree root =
294 top_down_run auto tree root states (Tree.closing tree root)
(* Public [top_down_run auto tree root]: shadows the five-argument version.
   It runs from [root] with the initial states [auto.init] and returns the
   slot cell of the smallest state in [auto.topdown_marking_states].
   NOTE(review): StateSet.min_elt presumably fails on an empty set, so this
   assumes at least one marking state - confirm. *)
296 let top_down_run auto tree root =
298 let res, slot = full_top_down_run auto auto.init tree root in
300 slot.(StateSet.min_elt auto.topdown_marking_states)
303 (*** Bottom-up evaluation function **)
(* Printer body that writes a node set to the formatter [fmt] as an opening
   brace, each node followed by a space, then a closing brace.
   NOTE(review): the header of this definition is not visible in this
   excerpt; [slot_print] calls a printer named [ns_print], which is presumably
   this one. *)
306 Format.fprintf fmt "{ ";
307 U.NS.iter begin fun node ->
308 Format.fprintf fmt "%a " Node.print node;
310 Format.fprintf fmt "}"
(* [slot_print fmt t] prints one line per cell of the slot array, pairing the
   state index with its node set.
   NOTE(review): the body writes through Format.eprintf, so the [fmt]
   argument is not the formatter receiving the state line; Format.fprintf fmt
   looks intended - confirm before changing. The closing lines of the
   iteration are not visible in this excerpt. *)
312 let slot_print fmt t =
313 Array.iteri begin fun state ns ->
314 Format.eprintf "%a -> %a\n" State.print state ns_print ns;
(* Unimplemented stub: any call raises Assert_failure. No call to it appears
   in the visible code that follows. *)
318 let eval_trans auto tree parent res1 res2 = assert false
(* [bottom_up_run auto tree (query, pat)] evaluates the automaton bottom-up,
   starting from the nodes returned by the full-text query and moving towards
   the root. Subtrees below a starting node are evaluated with
   [full_top_down_run]. The result is the slot cell of the smallest state in
   [auto.topdown_marking_states].
   NOTE(review): many lines of the three mutually recursive helpers are not
   visible in this excerpt. *)
321 let bottom_up_run auto tree (query, pat) =
322 let leaves = Array.to_list (Tree.full_text_query query tree pat) in
323 let states = auto.states in
324 let res_len = (StateSet.max_elt states) + 1 in
(* NOTE(review): Array.create is the legacy name of Array.make. *)
325 let empty_slot = Array.create res_len U.NS.empty in
326 let nil_res = auto.bottom_states, empty_slot in
(* Local opcode cache. It is keyed by (tag, id of s1, id of s2) below, which
   differs from the key layout used by L3JIT.find and L3JIT.add. *)
327 let cache = Cache.Lvl3.create 1024 L3JIT.dummy in
(* Consume the list of starting nodes. *)
328 let rec loop_leaves l acc =
(* Process one node up to the top (stop = Tree.nil). *)
332 let res, lll = bottom_up_next node ll Tree.nil in
(* Diagnostic only: report on stderr when starting nodes remain unconsumed. *)
333 if (lll <> []) then Printf.eprintf "Leftover elements\n%!";
(* Evaluate what lies below [node], then climb until [stop]. *)
336 and bottom_up_next node rest stop =
337 let fs = Tree.first_child tree node in
(* No first child: nothing to evaluate below; otherwise run top-down on it
   with the full state set. *)
339 if fs == Tree.nil then nil_res
340 else full_top_down_run auto states tree fs
342 move_up node res1 true rest stop
(* Climb from [node] carrying [res]; [is_left] tells whether [res] is fed to
   the left input of the opcode at [node] (see the match on [rest] below). *)
344 and move_up node res is_left rest stop =
345 if node == stop then res, rest
347 let prev_sibling = Tree.prev_sibling tree node in
(* A node without previous sibling is the first child of its parent. *)
348 let is_left' = prev_sibling == Tree.nil in
349 let real_parent = Tree.parent tree node in
(* Next node to visit: the parent when [node] is a first child; otherwise the
   larger of the first child of the parent and [stop].
   NOTE(review): [max] is the polymorphic comparison; this assumes node
   handles compare in a meaningful order - confirm. *)
351 if is_left' then real_parent else max (Tree.first_child tree real_parent) stop
353 (* let parent = if is_left' then Tree.parent tree node else prev_sibling in *)
(* Determine both inputs of the opcode at [node]. When arriving from the left,
   the next pending starting node is evaluated as the right input only if it
   is a right descendant of [node]; otherwise the right input is [nil_res]. *)
354 let (s1, sl1), (s2, sl2), rest' =
355 if is_left then match rest with
356 [] -> res, nil_res, rest
358 if Tree.is_right_descendant tree node next
360 let res2, rest' = bottom_up_next next rest' node in
362 else res, nil_res, rest
366 let tag = Tree.tag tree node in
367 let id1 = Uid.to_int s1.StateSet.Node.id in
368 let id2 = Uid.to_int s2.StateSet.Node.id in
370 let code = Cache.Lvl3.find cache tag id1 id2 in
(* Cache miss: gather the transitions whose label set is TagSet.any or
   contains [tag], compile them and store the opcode. *)
371 if code == L3JIT.dummy then
375 List.fold_left (fun acc' (labels, tr) ->
376 if labels == TagSet.any || TagSet.mem tag labels
377 then Translist.cons tr acc' else acc')
379 (Hashtbl.find auto.trans q)
384 let code = L3JIT.gen_code auto trl s1 s2 in
385 Cache.Lvl3.add cache tag id1 id2 code; code
388 let res' = code empty_slot sl1 sl2 tree node in
389 move_up parent res' is_left' rest' stop
391 let _, slot = loop_leaves leaves (nil_res) in
392 slot.(StateSet.min_elt auto.topdown_marking_states)
(* [get_trans g auto tag states] collects, for every state of [states], the
   transitions of [auto] applicable to [tag]. It returns a triple: the union
   of states mentioned on the left of the selected formulas, the same for the
   right, and the list of selected transitions.
   NOTE(review): the inner fold call and the branch taken for attribute tags
   are on lines not visible in this excerpt. *)
394 let get_trans g auto tag states =
395 StateSet.fold (fun q tr_acc ->
397 (fun ((lstates, rstates, tacc) as acc) (ts, trs) ->
(* The label set is tested against the translated tag. *)
398 if TagSet.mem (Tag.translate tag) ts then
(* Special case: [tag] is an attribute in the grammar but the label set does
   not contain Tag.attribute. *)
399 if not (TagSet.mem Tag.attribute ts) && Grammar2.is_attribute g tag
402 let _, _, _, phi = Transition.node trs in
403 let (_,_,l), (_,_,r) = Formula.st phi in
404 (StateSet.union l lstates,
405 StateSet.union r rstates,
406 Translist.cons trs tacc)
408 tr_acc (Hashtbl.find auto.trans q)
409 ) states (StateSet.empty, StateSet.empty, Translist.nil)
(* [dispatch_param0 conf id2 y0 y1] builds the first parameter passed to the
   callee of a rule, according to the rule configuration [conf]:
   either a node around [id2] with zero, one or two of the incoming
   parameters, or [y0] itself.
   NOTE(review): the match header line is not visible in this excerpt. *)
412 let dispatch_param0 conf id2 y0 y1 =
414 | Grammar2.C0 | Grammar2.C2 -> Grammar2.Node0 id2
415 | Grammar2.C1 | Grammar2.C5 -> Grammar2.Node1(id2,y0)
416 | Grammar2.C3 | Grammar2.C6 -> y0
417 | Grammar2.C4 -> Grammar2.Node2(id2, y0, y1)
(* [dispatch_param1 conf id2 y0 y1] builds the second parameter passed to the
   callee of a rule. Configurations without a visible arm fall through to
   [Grammar2.dummy_param].
   NOTE(review): the match header and at least one arm are on lines not
   visible in this excerpt. *)
419 let dispatch_param1 conf id2 y0 y1 =
422 | Grammar2.C3 -> Grammar2.Node0 id2
424 | Grammar2.C6 -> Grammar2.Node1(id2, y1)
425 | _ -> Grammar2.dummy_param
(* Hash key for the downward cache: a non-terminal symbol with a state set. *)
427 module K_down = struct
428 type t = Grammar2.n_symbol * StateSet.t
(* Hash combines the integer of the symbol with the id of the state set. *)
429 let hash (x,y) = HASHINT2(Node.to_int x, Uid.to_int y.StateSet.Node.id)
(* Physical equality on both components.
   NOTE(review): presumably sound because state sets are hash-consed (they
   carry a unique id) - confirm. *)
430 let equal (x1,y1) (x2,y2) = x1 == x2 && y1 == y2
(* Hash key for the upward cache: a non-terminal symbol with three state sets.
   NOTE(review): the module header and the [hash] binding line are not visible
   in this excerpt; [UCache] is built from a module named K_up. *)
434 type t = Grammar2.n_symbol * StateSet.t * StateSet.t * StateSet.t
(* Hash combines the integer of the symbol with the ids of the three sets. *)
436 HASHINT4 (Node.to_int a,
437 Uid.to_int b.StateSet.Node.id,
438 Uid.to_int c.StateSet.Node.id,
439 Uid.to_int d.StateSet.Node.id)
(* Physical equality on all four components. *)
440 let equal (a1, b1, c1, d1) (a2, b2, c2, d2) =
441 a1 == a2 && b1 == b2 && c1 == c2 && d1 == d2
(* Downward cache: a hash table keyed by K_down, extended with a sentinel.
   NOTE(review): the module header and the definition containing line 454 are
   not visible in this excerpt. *)
446 include Hashtbl.Make(K_down)
(* Sentinel state set marking a cell that has not been filled yet. *)
447 let dummy = StateSet.singleton State.dummy
(* An entry counts as not found when both of its cells still hold the
   sentinel (physical comparison). *)
448 let notfound l = l.(0) == dummy && l.(1) == dummy
(* Fresh two-cell entry initialised with the sentinel.
   NOTE(review): presumably part of a [find] that inserts and returns this
   array on a miss - confirm. *)
454 let a = [| dummy; dummy |] in
(* Upward cache: a hash table keyed by K_up. *)
458 module UCache = Hashtbl.Make(K_up)
(* Fragments of the result record used by [grammar_run] and of its
   constructors. Visible fields: [out0], [out1] and [main], each a state set
   paired with a [U.t]; the constructors also set [in0] and [in1].
   NOTE(review): the type header, the remaining fields and the constructor
   headers are not visible in this excerpt; [grammar_run] calls [mk_nil] and
   [mk_empty], which are presumably defined here. *)
462 out0 : StateSet.t * U.t;
463 out1 : StateSet.t * U.t;
464 main : StateSet.t * U.t
(* Constructor fragment: both input state sets start empty. *)
467 { in0 = StateSet.empty;
468 in1 = StateSet.empty;
(* Constructor fragment: both outputs pair the empty state set with [v]. *)
476 out0 = StateSet.empty,v;
477 out1 = StateSet.empty,v;
(* [grammar_run auto g ()] evaluates the automaton over the grammar [g].
   Evaluation starts at [start_loop Node.null auto.init] and returns the slot
   cell of the smallest state in [auto.topdown_marking_states].
   Five mutually recursive functions cooperate: [start_loop] (start symbols),
   [rule_loop] (non-terminals, memoised through dcache and ucache),
   [dispatch_loop], [terminal_loop] (runs a level-3 opcode) and
   [partial_loop] (evaluates a parameter).
   NOTE(review): many lines of this definition are not visible in this
   excerpt, including several branch headers and record constructions. *)
480 let grammar_run auto g () =
481 let dummy_leaf = Grammar2.dummy_param in
(* Sentinel state set, tested below with physical equality.
   NOTE(review): it is built separately from DCache.dummy; the tests line up
   with values read from dcache only if StateSet.singleton returns a shared
   value - confirm. *)
482 let dummy_set = StateSet.singleton State.dummy in
483 let res_len = (StateSet.max_elt auto.states) + 1 in
(* NOTE(review): Array.create is the legacy name of Array.make. *)
484 let empty_slot = Array.create res_len U.NS.empty in
485 let nil_res = mk_nil auto.bottom_states empty_slot in
486 let empty_res = mk_empty (StateSet.empty, empty_slot) in
487 let cache3 = L3JIT.create () in
(* Default value of the transition cache. *)
488 let dummy2 = (StateSet.empty, StateSet.empty, Translist.nil) in
489 let cache2 = Cache.Lvl2.create 512 dummy2 in
490 let rule_counter = ref 0 in
(* Counter used to number terminals in the order they are evaluated. *)
491 let preorder_counter = ref 0 in
492 let dcache = DCache.create 1023 in
493 let ucache = UCache.create 1023 in
494 let term_array = [| StateSet.empty; StateSet.empty |] in
(* Cached wrapper around the top-level [get_trans], keyed by the tag and the
   id of the state set. The miss test is on a line not visible here. *)
495 let get_trans tag states =
496 let c = Cache.Lvl2.find cache2 tag (Uid.to_int states.StateSet.Node.id) in
498 let c = get_trans g auto tag states in
500 Cache.Lvl2.add cache2 tag (Uid.to_int states.StateSet.Node.id) c;
505 let lambda = ref 0 in
(* Evaluate the start symbol at grammar position [idx]. *)
506 let rec start_loop idx states =
507 TRACE("grammar", 2, __ "Node %i\n%!" (Node.to_int idx));
508 if states == dummy_set then nil_res else
509 if idx < Node.null then nil_res
511 let symbol = Grammar2.start_tag g idx in
512 let fc = Grammar2.start_first_child g idx in
513 let ns = Grammar2.start_next_sibling g fc in
(* Terminal start symbol: its two parameters are leaves pointing at the first
   child and the next sibling, with -1 as first component. *)
514 if Grammar2.is_terminal g symbol then
515 let t = Grammar2.terminal symbol in
516 terminal_loop t states (Grammar2.Leaf (~-1,0,term_array, fc)) (Grammar2.Leaf (~-1,1,term_array, ns))
(* Non-terminal start symbol: the leaves carry the current value of [lambda]
   as first component. *)
518 let nt = Grammar2.non_terminal symbol in
520 let lmbd = !lambda in
521 let y0 = (Grammar2.Leaf (lmbd,0, term_array, fc))
522 and y1 = (Grammar2.Leaf (lmbd,1, term_array, ns)) in
523 rule_loop nt states y0 y1
(* Evaluate the non-terminal [t] with parameters [y0] and [y1]. *)
525 and rule_loop (t : Grammar2.n_symbol) states y0 y1 =
526 if t = Node.nil || states == dummy_set then nil_res else
527 let () = incr rule_counter in
(* Request a minor collection once every 65536 calls. *)
528 if !rule_counter land 65535 == 0 then begin Gc.minor() end;
529 let k = (t, states) in
530 let pstates = DCache.find dcache k in
531 let notfound = DCache.notfound pstates in
532 let rhs = Grammar2.get_rule g t in
533 let id1 = Grammar2.get_id1 rhs in
534 let id2 = Grammar2.get_id2 rhs in
535 let conf = Grammar2.get_conf rhs in
(* Direct evaluation of the rule body: build the callee parameters from
   [conf], run the callee, then record the resulting input state sets in the
   dcache entry.
   NOTE(review): the condition selecting this path is not visible; presumably
   it is [notfound]. *)
537 let ny0 = dispatch_param0 conf id2 y0 y1 in
538 let ny1 = dispatch_param1 conf id2 y0 y1 in
539 let res = dispatch_loop id1 states ny0 ny1 in
540 pstates.(0) <- res.in0;
541 pstates.(1) <- res.in1;
543 UCache.add ucache (t, states, fst res.out0, fst res.out1)
(* Bind every cell of the two output slots under the keys (0, i) and (1, i),
   then close the main slot over that table with U.close. *)
545 let h = Hashtbl.create 7 in
546 for i = 0 to res_len - 1 do
547 Hashtbl.add h (0, i) (snd res.out0).(i);
548 Hashtbl.add h (1, i) (snd res.out1).(i);
551 main = ((fst res.main), (U.close h (snd res.main)));
(* Memoised path: evaluate both parameters with the state sets recorded in
   dcache and look the rule up in ucache by the resulting state sets. *)
555 let res0 = partial_loop y0 pstates.(0) in
556 let res1 = partial_loop y1 pstates.(1) in
557 let k2 = (t, states, fst res0.main, fst res1.main) in
560 UCache.find ucache k2
(* On an ucache miss (handler line not visible), re-run the body with the
   parameter results replaced by the variables U.var 0 and U.var 1, and cache
   the main result under [k2]. *)
563 let ores0 = { res0 with main = fst res0.main, U.var 0 (snd res0.main) }
564 and ores1 = { res1 with main = fst res1.main, U.var 1 (snd res1.main) }
566 let res = dispatch_loop id1 states (Grammar2.Cache (0,ores0)) (Grammar2.Cache (1, ores1)) in
567 UCache.add ucache k2 res.main;
(* Bind the actual parameter results under (0, i) and (1, i) and close the
   result slot over them. *)
570 let h = Hashtbl.create 7 in
571 for i = 0 to res_len - 1 do
572 Hashtbl.add h (0, i) (snd res0.main).(i);
573 Hashtbl.add h (1, i) (snd res1.main).(i);
579 main = s, U.close h r;
(* Route to [rule_loop] or [terminal_loop] depending on the kind of [id1]. *)
582 and dispatch_loop id1 states ny0 ny1 =
583 if Grammar2.is_non_terminal g id1 then
584 rule_loop (Grammar2.non_terminal id1) states ny0 ny1
586 terminal_loop (Grammar2.terminal id1) states ny0 ny1
(* Evaluate a terminal: fetch its transitions, evaluate both parameters with
   the left and right state sets, then run the level-3 opcode. *)
588 and terminal_loop (symbol : Grammar2.t_symbol) states y0 y1 =
590 if symbol == Grammar2.nil_symbol || symbol = Node.nil || states == dummy_set then nil_res else begin
591 let tag = Grammar2.tag symbol in
592 let lst, rst, trans = get_trans tag states in
593 let res0 = partial_loop y0 lst in
594 let res1 = partial_loop y1 rst in
595 let s1, slot1 = res0.main
596 and s2, slot2 = res1.main in
597 let opcode = L3JIT.find cache3 trans s1 s2 in
(* The node handed to the opcode is synthesised from the running counter. *)
598 let node = Node.of_int !preorder_counter in
599 incr preorder_counter;
(* NOTE(review): Obj.magic () is passed where the opcode expects the tree.
   The opcodes built by gen_code ignore that argument unless pending
   predicates exist, in which case the predicate is applied to it; this is
   only safe if no predicate reaches that path here - confirm. *)
601 if opcode == L3JIT.dummy then
602 (L3JIT.cache_apply cache3 auto trans s1 s2) empty_slot slot1 slot2 (Obj.magic ()) node
604 opcode empty_slot slot1 slot2 (Obj.magic()) (node)
(* Evaluate a parameter [l] with [states], according to its shape. *)
613 and partial_loop l states =
614 if l == dummy_leaf then nil_res else
(* A cached parameter is returned as is. *)
616 | Grammar2.Cache (_, r) -> r
617 | Grammar2.Leaf (_,_, _, id) -> start_loop id states
618 | Grammar2.Node0 id ->
619 if (Grammar2.terminal id) == Grammar2.nil_symbol then nil_res
621 rule_loop (Grammar2.non_terminal id) states dummy_leaf dummy_leaf
623 | Grammar2.Node1 (id, y0) ->
624 rule_loop (Grammar2.non_terminal id) states y0 dummy_leaf
625 | Grammar2.Node2 (id, y0, y1) ->
626 if Grammar2.is_terminal g id then
627 terminal_loop (Grammar2.terminal id) states y0 y1
629 rule_loop (Grammar2.non_terminal id) states y0 y1
(* Entry point: start at Node.null with the initial states. *)
632 let (_, slot) = (start_loop (Node.null) auto.init).main in
633 slot.(StateSet.min_elt auto.topdown_marking_states)