diff options
Diffstat (limited to 'lib/analysers/query.ml')
-rw-r--r-- | lib/analysers/query.ml | 310 |
1 files changed, 19 insertions, 291 deletions
diff --git a/lib/analysers/query.ml b/lib/analysers/query.ml index bcf4a72..e24da78 100644 --- a/lib/analysers/query.ml +++ b/lib/analysers/query.ml @@ -2,58 +2,8 @@ open StdLabels module Expression = ImportExpression module Q = Expression.Query module Syntax = ImportConf.Syntax -module Table = ImportConf.Table -module Path = ImportConf.Path - -let truncate buffer n = Buffer.truncate buffer (Buffer.length buffer - n) - -(** The module allow to create fragment in the query which keep together the - binderd parameters and the text of the query.contents. - - This is used a lot in order to create the CTE, where you need the create - fragment used both in the main request and partially in the CTE itself. - - The content is mutable and all the functions are returning [unit]. *) -module Chunk = struct - type t = { - b : Buffer.t; - parameters : ImportCSV.DataType.t Queue.t; - } - - let create : unit -> t = - fun () -> { b = Buffer.create 16; parameters = Queue.create () } - - let create' : Buffer.t -> ImportCSV.DataType.t Queue.t -> t = - fun b parameters -> { b; parameters } - - (* Append the element from [tail] at the end of [head] - - Tail is destroyed during the operation. - *) - let append : head:t -> tail:t -> unit = - fun ~head ~tail -> - match Buffer.length tail.b with - | 0 -> () - | _ -> - Buffer.add_buffer head.b tail.b; - Queue.transfer tail.parameters head.parameters; - () - - (** Add a litteral string in the sequence *) - let add_string : t -> string -> unit = fun t v -> Buffer.add_string t.b v - - let copy : t -> t = - fun t -> - let b = Buffer.create 16 and parameters = Queue.copy t.parameters in - Buffer.add_buffer b t.b; - { b; parameters } - - let add_parameters : t -> ImportCSV.DataType.t Seq.t -> unit = - fun t p -> Queue.add_seq t.parameters p -end - -let prepare_key : f:(Format.formatter -> unit) -> Format.formatter -> unit = - fun ~f formatter -> Format.fprintf formatter "rtrim(upper(%t))" f +module Table = ImportDataTypes.Table +module Path = ImportDataTypes.Path (* Collect all the tables pointed by the expression. *) let pointed_tables : Syntax.t -> 'a Expression.T.t -> (Table.t * string) list = @@ -64,11 +14,6 @@ let pointed_tables : Syntax.t -> 'a Expression.T.t -> (Table.t * string) list = (table, table_name) :: acc) |> List.sort_uniq ~cmp:Stdlib.compare -(** Represent a column in a safe way in a query *) -let print_column : Table.t -> string -> string = - fun table column -> - String.concat ~sep:"" [ "'"; table.Table.name; "'.'"; column; "'" ] - let create_table : Dependency.t -> string = fun mapping -> let b = Buffer.create 64 in @@ -90,184 +35,6 @@ let create_table : Dependency.t -> string = Buffer.contents b -let show_path : conf:Syntax.t -> Format.formatter -> Path.t -> unit = - fun ~conf buffer { alias; column } -> - let table = ImportConf.get_table_for_name conf alias in - let table_name = table.Table.name in - Format.fprintf buffer "'%s'.col_%d" table_name column - -(** Extract the informations from the dependancies. We get two informations here - : - - - the join query in order to load the data from the external column - - the column corresponding to the key in order to identify the missing links - later. *) -let query_of_external : - conf:Syntax.t -> join_buffer:Chunk.t -> Syntax.Extern.t -> unit = - fun ~conf ~join_buffer external_ -> - let extern_table = Table.name external_.target in - - let formatter = Format.formatter_of_buffer join_buffer.b in - Format.fprintf formatter "\nLEFT JOIN '%s' AS '%s' ON %t = %s" extern_table - external_.target.name - (prepare_key ~f:(fun f -> - let q = - Q.query_of_expression Q.BindParam f (show_path ~conf) - external_.intern_key - in - - Chunk.add_parameters join_buffer (Queue.to_seq q))) - (print_column external_.Syntax.Extern.target - ("key_" ^ external_.Syntax.Extern.target.name)); - - Format.pp_print_flush formatter () - -(** Create the from part of the query, adding all the reuired externals. - - SQLite is able to optimize the query and do not load the table not used in - the select clause. *) -let create_from_chunck : Syntax.t -> Chunk.t -> unit = - fun conf c -> - Chunk.add_string c "\nFROM '"; - Chunk.add_string c (Table.name conf.source); - Chunk.add_string c "' AS '"; - Chunk.add_string c conf.source.name; - Chunk.add_string c "'"; - - (* Add the externals in the query *) - List.iter conf.externals ~f:(query_of_external ~conf ~join_buffer:c) - -(** Build a CTE query in order to use any group function inside the query. - Return the binded parameters used in the expression. The buffer given in - argument is also modified during the construction. - - If filters is not None, the clauses are added to the CTE. *) -let build_cte : - Syntax.t -> - expression:'a Expression.T.t -> - filters:Chunk.t option -> - Chunk.t = - fun conf ~expression ~filters -> - (* The binded parameters queue will be used later in the full query *) - let cte_chunk = Chunk.create () in - - Chunk.add_string cte_chunk "WITH cte AS (SELECT "; - Chunk.add_string cte_chunk conf.source.name; - Chunk.add_string cte_chunk ".id, "; - - let formatter = Format.formatter_of_buffer cte_chunk.b in - - let p = - Q.query_of_expression Q.BindParam formatter (show_path ~conf) expression - in - Format.pp_print_flush formatter (); - Chunk.add_parameters cte_chunk (Queue.to_seq p); - (* The name is hardcoded here, and used in [Expression.Filters.window] *) - Chunk.add_string cte_chunk " AS group0"; - - let () = create_from_chunck conf cte_chunk in - let () = - match filters with - | None -> () - | Some filters_chunk -> - Chunk.append ~head:cte_chunk ~tail:(Chunk.copy filters_chunk) - in - - Chunk.add_string cte_chunk ")\n"; - cte_chunk - -type filter_evaluation = { - content : Buffer.t; - parameters : ImportCSV.DataType.t Seq.t; - cte : (string * Chunk.t) option; -} -(** Build the filters to apply in the query. We make the difference here between - the predicates to apply directly in the query, and the filters associated - with a group, which are required to be transformed into a CTE in SQL, and - are evaluated before. *) - -(** Evaluate the filters on the query *) -let eval_filters : Syntax.t -> filter_evaluation = - fun conf -> - match conf.filters with - | [] -> - let empty_buffer = Buffer.create 0 in - { content = empty_buffer; parameters = Seq.empty; cte = None } - | filters -> ( - (* Create a new queue in order to accumulate all the parameters to bind. - This filter will be given to both the CTE if any, or reused in the - main query when there is no CTE. - *) - let chunk_filters = Chunk.create () in - Chunk.add_string chunk_filters "\nWHERE "; - - let group = Chunk.create () in - - let with_cte, with_exr = - List.fold_left filters ~init:(None, false) - ~f:(fun (with_cte, with_exr) column -> - (* The function will return an option in second position which is - None when no Group function where found, and Some Expression - otherwise *) - let b = Buffer.create 16 in - - let formatter = Format.formatter_of_buffer b in - let queue, group_found = - Expression.Filters.query_of_expression Q.BindParam formatter - (show_path ~conf) column - in - Format.pp_print_flush formatter (); - let clause = Chunk.create' b queue in - - match (group_found, with_cte) with - | None, _ -> - Chunk.append ~head:chunk_filters ~tail:clause; - Chunk.add_string chunk_filters "\nAND "; - (with_cte, true) - | (Some _ as group'), None -> - (* We have a group here, we do not add it into the - filter_buffer right now. - - This can occur only once, the second one will raise - an error. *) - Chunk.append ~head:group ~tail:clause; - (group', with_exr) - | Some _, Some _ -> raise ImportErrors.MisplacedWindow) - in - - match with_cte with - | None -> - let content = chunk_filters.b in - truncate content 5; - { - (* There is no group clause in the query *) - content; - parameters = Queue.to_seq chunk_filters.parameters; - cte = None; - } - | Some expression -> - let filters = - if with_exr then ( - (* If we have additionnals filters from the group clause, we - have to report them in the CTE instead of the main query. *) - let c' = Chunk.copy chunk_filters in - truncate c'.b 5; - Some c') - else None - in - - (* Create the common expression table *) - let cte_parameters = build_cte conf ~expression ~filters in - Chunk.append ~head:chunk_filters ~tail:group; - - { - content = chunk_filters.b; - parameters = Queue.to_seq chunk_filters.parameters; - (* The name is hardcoded here, and used in - [Expression.Filters.window] *) - cte = Some ("cte", cte_parameters); - }) - type query = { q : string; parameters : ImportCSV.DataType.t Seq.t; @@ -323,23 +90,12 @@ let clean_window : find which source is pointed by this alias. *) let select : Syntax.t -> query * Path.t ImportExpression.T.t array = fun conf -> - (* If the filters contains a group expression, we need to transform this into - a CTE, which have to be evaluated before the main query. That’s why we are - evaluating the filters right now.*) - let filters = eval_filters conf in - let b = Buffer.create 256 in - let parameters = Queue.create () in - - Option.iter - (fun (_, (cte : Chunk.t)) -> - Buffer.add_buffer b cte.b; - Queue.add_seq parameters (Queue.to_seq cte.parameters)) - filters.cte; + let filter = ImportConf.CTE.of_filters conf.filters in (* For each column in the configuration file, add the corresponding element in the query. - The Sqlite driver return the elements in an array, we create an array to + The Sqlite driver return the elements in an array, we create an array too in order to manage the elements together. *) let headers = Array.make (List.length conf.columns) (Obj.magic None) in @@ -355,6 +111,10 @@ let select : Syntax.t -> query * Path.t ImportExpression.T.t array = let expression = c in (i, clean_window ~prefix:conf.uniq expression)) in + let filters = Chunk.create () in + let request_header = Filters.generate_sql ~conf filter filters in + let b = request_header.Chunk.b + and parameters = request_header.Chunk.parameters in let formatter = Format.formatter_of_buffer b in let () = Format.fprintf formatter "SELECT %a" @@ -363,7 +123,7 @@ let select : Syntax.t -> query * Path.t ImportExpression.T.t array = (fun formatter (i, column) -> Array.set headers i column; let p = - Q.query_of_expression Q.BindParam formatter (show_path ~conf) + Q.query_of_expression Q.BindParam formatter (Printers.path ~conf) column in Queue.transfer p parameters; @@ -372,26 +132,8 @@ let select : Syntax.t -> query * Path.t ImportExpression.T.t array = in Format.pp_print_flush formatter (); - let () = create_from_chunck conf (Chunk.create' b parameters) in - - (* If the query has a CTE, link it as well. We use an INNER JOIN here because - we want to be sure to get all the rows fetched by the CTE - *) - let () = - match filters.cte with - | None -> () - | Some (name, _) -> - Buffer.add_string b "\nINNER JOIN '"; - Buffer.add_string b name; - Buffer.add_string b "' ON "; - Buffer.add_string b name; - Buffer.add_string b ".id = "; - Buffer.add_string b conf.source.name; - Buffer.add_string b ".id" - in - - Buffer.add_buffer b filters.content; - Queue.add_seq parameters filters.parameters; + let () = Chunk.create_from_statement_of_chunck conf request_header in + Chunk.append ~head:request_header ~tail:filters; let formatter = Format.formatter_of_buffer b in (match conf.Syntax.uniq with @@ -402,7 +144,7 @@ let select : Syntax.t -> query * Path.t ImportExpression.T.t array = ~pp_sep:(fun f () -> Format.fprintf f ", ") (fun formatter column -> let seq = - Q.query_of_expression Q.BindParam formatter (show_path ~conf) + Q.query_of_expression Q.BindParam formatter (Printers.path ~conf) column in Queue.transfer seq parameters)) @@ -415,7 +157,7 @@ let select : Syntax.t -> query * Path.t ImportExpression.T.t array = ~pp_sep:(fun f () -> Format.fprintf f ", ") (fun formatter column -> let seq = - Q.query_of_expression Q.BindParam formatter (show_path ~conf) + Q.query_of_expression Q.BindParam formatter (Printers.path ~conf) column in Queue.transfer seq parameters)) @@ -426,20 +168,12 @@ let select : Syntax.t -> query * Path.t ImportExpression.T.t array = let check_external : Syntax.t -> Syntax.Extern.t -> query = fun conf external_ -> - let internal_chunk = - let internal_key_buffer = Buffer.create 16 in - let formatter = Format.formatter_of_buffer internal_key_buffer in - let internal_key_seq = - Q.query_of_expression Q.BindParam formatter (show_path ~conf) - external_.Syntax.Extern.intern_key - in - Format.pp_print_flush formatter (); - Chunk.create' internal_key_buffer (Queue.copy internal_key_seq) - in + let internal_chunk = Chunk.create () in + Chunk.add_expression ~conf internal_chunk external_.Syntax.Extern.intern_key; let external_key_buffer = Buffer.create 16 in Buffer.add_string external_key_buffer - (print_column external_.Syntax.Extern.target + (Table.print_column external_.Syntax.Extern.target ("key_" ^ external_.Syntax.Extern.target.name)); let pointed_tables = pointed_tables conf external_.intern_key in @@ -495,18 +229,12 @@ let check_external : Syntax.t -> Syntax.Extern.t -> query = Chunk.add_string request "-1" | (table, _name) :: _ -> (* If we have a single source, extract the row number. *) - Chunk.add_string request (print_column table "id") + Chunk.add_string request (Table.print_column table "id") in Chunk.add_string request ", "; Chunk.append ~head:request ~tail:(Chunk.copy internal_chunk); - Chunk.add_string request " FROM\n'"; - Chunk.add_string request (Table.name conf.source); - Chunk.add_string request "' AS '"; - Chunk.add_string request conf.source.name; - Chunk.add_string request "'"; - (* Add the externals in the query *) - List.iter dependencies ~f:(query_of_external ~conf ~join_buffer:request); + Chunk.create_from_statement_of_chunck ~externals:dependencies conf request; Chunk.add_string request " WHERE "; Chunk.add_string request join_content; Chunk.add_string request " IS NULL AND "; @@ -526,7 +254,7 @@ let build_key_insert : Buffer.t -> Dependency.key -> unit = let formatter = Format.formatter_of_buffer buffer in let () = - prepare_key formatter ~f:(fun formatter -> + Printers.prepare_key formatter ~f:(fun formatter -> Q.query_of_expression Q.NoParam formatter show_column expression) in |