(* ------------------------------------------------------------------ *)
(* Global settings filled in while the command line is parsed.         *)
(* ------------------------------------------------------------------ *)

(** Whether empty texts are indexed; cleared by the [-ne] option. *)
let index_empty_texts : bool ref = ref true

(** Sample factor; overridden by the [-f] option. *)
let sample_factor : int ref = ref 64

(** Set by the [-d] option to disable the text collection. *)
let disable_text_collection : bool ref = ref false

(** Threshold with a default of 60000. No option visible in this file
    changes it. *)
let tc_threshold : int ref = ref 60000

(** First positional argument. *)
let input_file : string ref = ref ""

(** Optional third positional argument; [None] until one is given. *)
let output_file : string option ref = ref None

(** File name given with the [-s] option. *)
let save_file : string ref = ref ""

(** Set by the [-c] option. *)
let count_only : bool ref = ref false

(** Set by the [-b] option. *)
let bottom_up : bool ref = ref false

(** Set by the [-nj] option. *)
let no_jump : bool ref = ref false

(** Set by the [-v] option. *)
let verbose : bool ref = ref false

(** Numeric code of the text index; written by [set_index_type]
    (0, 1 or 2). *)
let text_index_type : int ref = ref 0

(** Set by the [-p] option. *)
let do_perf : bool ref = ref false

(** Set by the [-two] option. *)
let twopass : bool ref = ref false

(** Set by the [-doc-stats] option. *)
let docstats : bool ref = ref false
(** [set_index_type name] stores in [text_index_type] the numeric code of
    the text index called [name]: ["default"] is 0, ["swcsa"] is 1 and
    ["rlcsa"] is 2.
    @raise Arg.Bad carrying [name] when it is none of those three. *)
let set_index_type name =
  let code =
    match name with
    | "default" -> 0
    | "swcsa" -> 1
    | "rlcsa" -> 2
    | _ -> raise (Arg.Bad name)
  in
  text_index_type := code
(** Usage banner shown by [Arg]: the name the program was invoked with,
    followed by a summary of the expected arguments. *)
let usage_msg =
  let program = Sys.argv.(0) in
  Printf.sprintf "%s [options] <input.{xml|srx}> 'query' [output]" program
(* Handler for positional (non-option) arguments. The counter [pos] holds
   the number of positional arguments consumed so far and selects where the
   next one is stored; it is incremented after each accepted argument.
   NOTE(review): presumably this is the body of [anon_fun], which
   [parse_cmdline] passes to [Arg.parse]; the lines that name the function
   and create [pos] are not part of this listing -- confirm against the
   full file. *)
34 fun s -> match !pos with
(* first positional argument: the input file *)
35 | 0 -> input_file:= s;incr pos
(* second positional argument: the query *)
36 | 1 -> query := s; incr pos
(* third positional argument: the optional output file *)
37 | 2 -> output_file := Some s; incr pos
(* any further positional argument is rejected *)
38 | _ -> raise (Arg.Bad(s))
(* Fragment of a logger-specification parser: the argument [s] is split on
   ',' and each piece [t] is split on ':'.
   NOTE(review): presumably this is [set_logger], the callback of the "-log"
   option; the enclosing definition and the match arm that binds [tr] and
   [lvl] are not part of this listing -- confirm against the full file. *)
44 match String.explode t ':' with
(* The level must be an integer, otherwise the level text is reported
   through Arg.Bad.
   NOTE(review): [with _] also swallows exceptions unrelated to the
   conversion; [int_of_string] itself only raises [Failure]. *)
46 let l = try int_of_string lvl with _ -> raise (Arg.Bad (lvl)) in
(* Activate the logger only if the Logger module knows its name;
   otherwise reject the whole piece [t]. *)
47 if Logger.is_logger tr then Logger.activate tr l
48 else raise (Arg.Bad (t))
(* Any other shape of piece is rejected. *)
49 | _ -> raise (Arg.Bad (t))
50 ) (String.explode s ',')
(* [pretty_loggers ()] returns a string built from [Logger.available ()];
   it is appended to the help text of the "-log" option.
   NOTE(review): the call that receives the printer and the list below is
   not part of this listing, so the exact layout and separator cannot be
   stated from here. [flush_str_formatter] and [fprintf] are unqualified --
   presumably the Format module is opened; confirm. *)
52 let pretty_loggers () =
(* Discard the current contents of the string formatter before printing. *)
53 ignore(flush_str_formatter());
(* Printer for a single element: writes the string unchanged. *)
56 (fun f s -> fprintf f "%s" s)
(* The values to print. *)
58 (Logger.available ());
(* Return what has been printed to the string formatter. *)
59 flush_str_formatter ()
(* Command-line option table: each entry is (key, action, help text).
   NOTE(review): presumably this is the value [spec] that [parse_cmdline]
   passes to [Arg.parse] and [Arg.usage]; the binding line is not part of
   this listing -- confirm against the full file.
   NOTE(review): several help texts start with a space and others with a
   "<...>" placeholder, which looks like the convention used by [Arg.align]
   -- confirm that the table is aligned that way. *)
62 [ "-c", Arg.Set(count_only),
63 " counting only (don't materialize the result set)";
65 "-two", Arg.Set(twopass),
66 " Use twopass algorithm";
68 "-f", Arg.Set_int(sample_factor),
69 "<n> sample factor [default=64]";
(* -ne clears a flag that defaults to true. *)
71 "-ne", Arg.Clear(index_empty_texts),
72 " don't index empty texts [default=index]";
74 "-d", Arg.Set(disable_text_collection),
75 " disable text collection[default=false]";
77 "-s", Arg.Set_string(save_file),
78 "<save_file> save the intermediate representation into file.srx";
80 "-b", Arg.Set(bottom_up), " real bottom up run";
82 "-nj", Arg.Set(no_jump), " disable jumping";
84 "-p", Arg.Set(do_perf), " dump perf counters (Linux only)";
(* Arg.Symbol restricts the accepted values to the listed names.
   NOTE(review): the callback that completes this entry is not part of this
   listing -- presumably [set_index_type]; confirm. *)
86 "-index-type", Arg.Symbol ([ "default"; "swcsa"; "rlcsa" ],
88 " choose text index type";
(* NOTE(review): [repeat] is not defined in the visible part of the file. *)
90 "-r", Arg.Set_int(repeat),
91 " repeat query execution n time (benchmarking only, default 1)";
93 "-doc-stats", Arg.Set(docstats),
94 " Compute document statistics (performs full traversal)";
97 "-v", Arg.Set(verbose), " verbose mode"; ] @
(* The help text of -log is completed with the result of
   [pretty_loggers ()]. *)
100 "-log", Arg.String (set_logger),
101 "<logger1:l1,...,loggern:ln> enable logging with the specified level. Valid loggers are: "
102 ^ (pretty_loggers ())
(* [parse_cmdline ()] parses the program arguments with [Arg.parse], using
   the option table [spec], the positional-argument handler [anon_fun] and
   the banner [usage_msg], then validates the number of positional
   arguments recorded in [pos].
   NOTE(review): the line between the [let _ = ...] binding and the [if]
   is not part of this listing, and the function may continue after the
   last visible line -- confirm against the full file. *)
108 let parse_cmdline() =
109 let _ = Arg.parse spec anon_fun usage_msg
(* Fewer than two or more than three positional arguments: print the usage
   text and terminate with exit status 1. *)
111 if (!pos > 3 || !pos < 2)
112 then begin Arg.usage spec usage_msg; exit 1 end