summaryrefslogtreecommitdiff
path: root/compiler/ExtractBuiltin.ml
diff options
context:
space:
mode:
authorSon Ho2023-12-05 17:34:13 +0100
committerSon Ho2023-12-05 17:34:13 +0100
commit726db4911add81a853aafcec3936b457aaeff5b4 (patch)
tree2663915767c3558203990ed14f8d5604b7fd21d1 /compiler/ExtractBuiltin.ml
parent92887b89e35607e99bae2f19e4c5b2f162683d02 (diff)
parent4795e5f823bc89504855d8eb946b111d9314f4d5 (diff)
Merge branch 'main' into son_fixes2
Diffstat (limited to '')
-rw-r--r--compiler/ExtractBuiltin.ml579
1 files changed, 579 insertions, 0 deletions
diff --git a/compiler/ExtractBuiltin.ml b/compiler/ExtractBuiltin.ml
new file mode 100644
index 00000000..24d16dca
--- /dev/null
+++ b/compiler/ExtractBuiltin.ml
@@ -0,0 +1,579 @@
+(** This file declares external identifiers that we catch to map them to
+ definitions coming from the standard libraries in our backends.
+
+ TODO: there misses trait **implementations**
+ *)
+
+open Config
+open Charon.NameMatcher (* TODO: include? *)
+include ExtractName (* TODO: only open? *)
+
+let log = Logging.builtin_log
+
+(** Small utility to memoize some computations *)
+let mk_memoized (f : unit -> 'a) : unit -> 'a =
+ let r = ref None in
+ let g () =
+ match !r with
+ | Some x -> x
+ | None ->
+ let x = f () in
+ r := Some x;
+ x
+ in
+ g
+
+let split_on_separator (s : string) : string list =
+ Str.split (Str.regexp "\\(::\\|\\.\\)") s
+
+let flatten_name (name : string list) : string =
+ match !backend with
+ | FStar | Coq | HOL4 -> String.concat "_" name
+ | Lean -> String.concat "." name
+
+let () =
+ assert (split_on_separator "x::y::z" = [ "x"; "y"; "z" ]);
+ assert (split_on_separator "x.y.z" = [ "x"; "y"; "z" ])
+
+(** Switch between two values depending on the target backend.
+
+ We often compute the same value (typically: a name) if the target
+ is F*, Coq or HOL4, and a different value if the target is Lean.
+ *)
+let backend_choice (fstar_coq_hol4 : 'a) (lean : 'a) : 'a =
+ match !backend with Coq | FStar | HOL4 -> fstar_coq_hol4 | Lean -> lean
+
+let builtin_globals : (string * string) list =
+ [
+ (* Min *)
+ ("core::num::{usize}::MIN", "core_usize_min");
+ ("core::num::{u8}::MIN", "core_u8_min");
+ ("core::num::{u16}::MIN", "core_u16_min");
+ ("core::num::{u32}::MIN", "core_u32_min");
+ ("core::num::{u64}::MIN", "core_u64_min");
+ ("core::num::{u128}::MIN", "core_u128_min");
+ ("core::num::{isize}::MIN", "core_isize_min");
+ ("core::num::{i8}::MIN", "core_i8_min");
+ ("core::num::{i16}::MIN", "core_i16_min");
+ ("core::num::{i32}::MIN", "core_i32_min");
+ ("core::num::{i64}::MIN", "core_i64_min");
+ ("core::num::{i128}::MIN", "core_i128_min");
+ (* Max *)
+ ("core::num::{usize}::MAX", "core_usize_max");
+ ("core::num::{u8}::MAX", "core_u8_max");
+ ("core::num::{u16}::MAX", "core_u16_max");
+ ("core::num::{u32}::MAX", "core_u32_max");
+ ("core::num::{u64}::MAX", "core_u64_max");
+ ("core::num::{u128}::MAX", "core_u128_max");
+ ("core::num::{isize}::MAX", "core_isize_max");
+ ("core::num::{i8}::MAX", "core_i8_max");
+ ("core::num::{i16}::MAX", "core_i16_max");
+ ("core::num::{i32}::MAX", "core_i32_max");
+ ("core::num::{i64}::MAX", "core_i64_max");
+ ("core::num::{i128}::MAX", "core_i128_max");
+ ]
+
+let builtin_globals_map : string NameMatcherMap.t =
+ NameMatcherMap.of_list
+ (List.map (fun (x, y) -> (parse_pattern x, y)) builtin_globals)
+
+type builtin_variant_info = { fields : (string * string) list }
+[@@deriving show]
+
+type builtin_enum_variant_info = {
+ rust_variant_name : string;
+ extract_variant_name : string;
+ fields : string list option;
+}
+[@@deriving show]
+
+type builtin_type_body_info =
+ | Struct of string * (string * string) list
+ (* The constructor name and the map for the field names *)
+ | Enum of builtin_enum_variant_info list
+(* For every variant, a map for the field names *)
+[@@deriving show]
+
+type builtin_type_info = {
+ rust_name : pattern;
+ extract_name : string;
+ keep_params : bool list option;
+ (** We might want to filter some of the type parameters.
+
+ For instance, `Vec` type takes a type parameter for the allocator,
+ which we want to ignore.
+ *)
+ body_info : builtin_type_body_info option;
+}
+[@@deriving show]
+
+type type_variant_kind =
+ | KOpaque
+ | KStruct of (string * string) list
+ (* TODO: handle the tuple case *)
+ | KEnum (* TODO *)
+
+let mk_struct_constructor (type_name : string) : string =
+ let prefix =
+ match !backend with FStar -> "Mk" | Coq | HOL4 -> "mk" | Lean -> ""
+ in
+ let suffix = match !backend with FStar | Coq | HOL4 -> "" | Lean -> ".mk" in
+ prefix ^ type_name ^ suffix
+
+(** The assumed types.
+
+ The optional list of booleans is filtering information for the type
+ parameters. For instance, in the case of the `Vec` functions, there is
+ a type parameter for the allocator to use, which we want to filter.
+ *)
+let builtin_types () : builtin_type_info list =
+ let mk_type (rust_name : string) ?(custom_name : string option = None)
+ ?(keep_params : bool list option = None)
+ ?(kind : type_variant_kind = KOpaque) () : builtin_type_info =
+ let rust_name = parse_pattern rust_name in
+ let extract_name =
+ match custom_name with
+ | None -> flatten_name (pattern_to_type_extract_name rust_name)
+ | Some name -> flatten_name (split_on_separator name)
+ in
+ let body_info : builtin_type_body_info option =
+ match kind with
+ | KOpaque -> None
+ | KStruct fields ->
+ let fields =
+ List.map
+ (fun (rname, name) ->
+ ( rname,
+ match !backend with
+ | FStar | Lean -> name
+ | Coq | HOL4 -> extract_name ^ "_" ^ name ))
+ fields
+ in
+ let constructor = mk_struct_constructor extract_name in
+ Some (Struct (constructor, fields))
+ | KEnum -> raise (Failure "TODO")
+ in
+ { rust_name; extract_name; keep_params; body_info }
+ in
+
+ [
+ (* Alloc *)
+ mk_type "alloc::alloc::Global" ();
+ (* String *)
+ mk_type "alloc::string::String"
+ ~custom_name:(Some (backend_choice "string" "String"))
+ ();
+ (* Vec *)
+ mk_type "alloc::vec::Vec" ~keep_params:(Some [ true; false ]) ();
+ (* Range *)
+ mk_type "core::ops::range::Range"
+ ~kind:(KStruct [ ("start", "start"); ("end", "end_") ])
+ ();
+ (* Option
+
+ This one is more custom because we use the standard "option" type from
+ the target backend.
+ *)
+ {
+ rust_name = parse_pattern "core::option::Option";
+ extract_name =
+ (match !backend with
+ | Lean -> "Option"
+ | Coq | FStar | HOL4 -> "option");
+ keep_params = None;
+ body_info =
+ Some
+ (Enum
+ [
+ {
+ rust_variant_name = "None";
+ extract_variant_name =
+ (match !backend with
+ | FStar | Coq -> "None"
+ | Lean -> "none"
+ | HOL4 -> "NONE");
+ fields = None;
+ };
+ {
+ rust_variant_name = "Some";
+ extract_variant_name =
+ (match !backend with
+ | FStar | Coq -> "Some"
+ | Lean -> "some"
+ | HOL4 -> "SOME");
+ fields = None;
+ };
+ ]);
+ };
+ ]
+
+let mk_builtin_types_map () =
+ NameMatcherMap.of_list
+ (List.map (fun info -> (info.rust_name, info)) (builtin_types ()))
+
+let builtin_types_map = mk_memoized mk_builtin_types_map
+
+type builtin_fun_info = {
+ rg : Types.RegionGroupId.id option;
+ extract_name : string;
+}
+[@@deriving show]
+
+(** The assumed functions.
+
+ The optional list of booleans is filtering information for the type
+ parameters. For instance, in the case of the `Vec` functions, there is
+ a type parameter for the allocator to use, which we want to filter.
+ *)
+let builtin_funs () : (pattern * bool list option * builtin_fun_info list) list
+ =
+ let rg0 = Some Types.RegionGroupId.zero in
+ (* Small utility *)
+ let mk_fun (rust_name : string) (extract_name : string option)
+ (filter : bool list option) (with_back : bool) (back_no_suffix : bool) :
+ pattern * bool list option * builtin_fun_info list =
+ let rust_name =
+ try parse_pattern rust_name
+ with Failure _ ->
+ raise (Failure ("Could not parse pattern: " ^ rust_name))
+ in
+ let extract_name =
+ match extract_name with
+ | None -> pattern_to_fun_extract_name rust_name
+ | Some name -> split_on_separator name
+ in
+ let basename = flatten_name extract_name in
+ let fwd_suffix = if with_back && back_no_suffix then "_fwd" else "" in
+ let fwd = [ { rg = None; extract_name = basename ^ fwd_suffix } ] in
+ let back_suffix = if with_back && back_no_suffix then "" else "_back" in
+ let back =
+ if with_back then [ { rg = rg0; extract_name = basename ^ back_suffix } ]
+ else []
+ in
+ (rust_name, filter, fwd @ back)
+ in
+ [
+ mk_fun "core::mem::replace" None None true false;
+ mk_fun "core::slice::{[@T]}::len"
+ (Some (backend_choice "slice::len" "Slice::len"))
+ None true false;
+ mk_fun "alloc::vec::{alloc::vec::Vec<@T, alloc::alloc::Global>}::new"
+ (Some "alloc::vec::Vec::new") None false false;
+ mk_fun "alloc::vec::{alloc::vec::Vec<@T, @A>}::push" None
+ (Some [ true; false ])
+ true true;
+ mk_fun "alloc::vec::{alloc::vec::Vec<@T, @A>}::insert" None
+ (Some [ true; false ])
+ true true;
+ mk_fun "alloc::vec::{alloc::vec::Vec<@T, @A>}::len" None
+ (Some [ true; false ])
+ true false;
+ mk_fun "alloc::vec::{alloc::vec::Vec<@T, @A>}::index" None
+ (Some [ true; true; false ])
+ true false;
+ mk_fun "alloc::vec::{alloc::vec::Vec<@T, @A>}::index_mut" None
+ (Some [ true; true; false ])
+ true false;
+ mk_fun "alloc::boxed::{Box<@T>}::deref" None
+ (Some [ true; false ])
+ true false;
+ mk_fun "alloc::boxed::{Box<@T>}::deref_mut" None
+ (Some [ true; false ])
+ true false;
+ mk_fun "core::slice::index::{[@T]}::index" None None true false;
+ mk_fun "core::slice::index::{[@T]}::index_mut" None None true false;
+ mk_fun "core::array::{[@T; @C]}::index" None None true false;
+ mk_fun "core::array::{[@T; @C]}::index_mut" None None true false;
+ mk_fun "core::slice::index::{core::ops::range::Range<usize>}::get"
+ (Some "core::slice::index::RangeUsize::get") None true false;
+ mk_fun "core::slice::index::{core::ops::range::Range<usize>}::get_mut"
+ (Some "core::slice::index::RangeUsize::get_mut") None true false;
+ mk_fun "core::slice::index::{core::ops::range::Range<usize>}::index"
+ (Some "core::slice::index::RangeUsize::index") None true false;
+ mk_fun "core::slice::index::{core::ops::range::Range<usize>}::index_mut"
+ (Some "core::slice::index::RangeUsize::index_mut") None true false;
+ mk_fun "core::slice::index::{core::ops::range::Range<usize>}::get_unchecked"
+ (Some "core::slice::index::RangeUsize::get_unchecked") None false false;
+ mk_fun
+ "core::slice::index::{core::ops::range::Range<usize>}::get_unchecked_mut"
+ (Some "core::slice::index::RangeUsize::get_unchecked_mut") None false
+ false;
+ mk_fun "core::slice::index::{usize}::get" None None true false;
+ mk_fun "core::slice::index::{usize}::get_mut" None None true false;
+ mk_fun "core::slice::index::{usize}::get_unchecked" None None false false;
+ mk_fun "core::slice::index::{usize}::get_unchecked_mut" None None false
+ false;
+ mk_fun "core::slice::index::{usize}::index" None None true false;
+ mk_fun "core::slice::index::{usize}::index_mut" None None true false;
+ ]
+
+let mk_builtin_funs_map () =
+ let m =
+ NameMatcherMap.of_list
+ (List.map
+ (fun (name, filter, info) -> (name, (filter, info)))
+ (builtin_funs ()))
+ in
+ log#ldebug
+ (lazy ("builtin_funs_map:\n" ^ NameMatcherMap.to_string (fun _ -> "...") m));
+ m
+
+let builtin_funs_map = mk_memoized mk_builtin_funs_map
+
+type effect_info = { can_fail : bool; stateful : bool }
+
+let builtin_fun_effects =
+ let int_names =
+ [
+ "usize";
+ "u8";
+ "u16";
+ "u32";
+ "u64";
+ "u128";
+ "isize";
+ "i8";
+ "i16";
+ "i32";
+ "i64";
+ "i128";
+ ]
+ in
+ let int_ops =
+ [ "wrapping_add"; "wrapping_sub"; "rotate_left"; "rotate_right" ]
+ in
+ let int_funs =
+ List.map
+ (fun int_name ->
+ List.map
+ (fun op ->
+ "core::num::" ^ "{"
+ ^ StringUtils.capitalize_first_letter int_name
+ ^ "}::" ^ op)
+ int_ops)
+ int_names
+ in
+ let int_funs = List.concat int_funs in
+ let no_fail_no_state_funs =
+ [
+ (* TODO: redundancy with the funs information above *)
+ "core::slice::{[@T]}::len";
+ "alloc::vec::{alloc::vec::Vec<@T, alloc::alloc::Global>}::new";
+ "alloc::vec::{alloc::vec::Vec<@T, @A>}::len";
+ "core::mem::replace";
+ "core::mem::take";
+ ]
+ @ int_funs
+ in
+ let no_fail_no_state_funs =
+ List.map
+ (fun n -> (n, { can_fail = false; stateful = false }))
+ no_fail_no_state_funs
+ in
+ let no_state_funs =
+ [
+ (* TODO: redundancy with the funs information above *)
+ "alloc::vec::{alloc::vec::Vec<@T, @A>}::push";
+ "alloc::vec::{alloc::vec::Vec<@T, @A>}::index";
+ "alloc::vec::{alloc::vec::Vec<@T, @A>}::index_mut";
+ "alloc::vec::{alloc::vec::Vec<@T, @A>}::index_mut_back";
+ ]
+ in
+ let no_state_funs =
+ List.map (fun n -> (n, { can_fail = true; stateful = false })) no_state_funs
+ in
+ no_fail_no_state_funs @ no_state_funs
+
+let builtin_fun_effects_map =
+ NameMatcherMap.of_list
+ (List.map (fun (n, x) -> (parse_pattern n, x)) builtin_fun_effects)
+
+type builtin_trait_decl_info = {
+ rust_name : pattern;
+ extract_name : string;
+ constructor : string;
+ parent_clauses : string list;
+ consts : (string * string) list;
+ types : (string * (string * string list)) list;
+ (** Every type has:
+ - a Rust name
+ - an extraction name
+ - a list of clauses *)
+ methods : (string * builtin_fun_info list) list;
+}
+[@@deriving show]
+
+let builtin_trait_decls_info () =
+ let rg0 = Some Types.RegionGroupId.zero in
+ let mk_trait (rust_name : string) ?(extract_name : string option = None)
+ ?(parent_clauses : string list = []) ?(types : string list = [])
+ ?(methods : (string * bool) list = []) () : builtin_trait_decl_info =
+ let rust_name = parse_pattern rust_name in
+ let extract_name =
+ match extract_name with
+ | Some n -> n
+ | None ->
+ let rust_name = pattern_to_fun_extract_name rust_name in
+ flatten_name rust_name
+ in
+ let constructor = mk_struct_constructor extract_name in
+ let consts = [] in
+ let types =
+ let mk_type item_name =
+ let type_name =
+ if !record_fields_short_names then item_name
+ else extract_name ^ "_" ^ item_name
+ in
+ let type_name =
+ match !backend with
+ | FStar | Coq | HOL4 -> StringUtils.lowercase_first_letter type_name
+ | Lean -> type_name
+ in
+ let clauses = [] in
+ (item_name, (type_name, clauses))
+ in
+ List.map mk_type types
+ in
+ let methods =
+ let mk_method (item_name, with_back) =
+ (* TODO: factor out with builtin_funs_info *)
+ let basename =
+ if !record_fields_short_names then item_name
+ else extract_name ^ "_" ^ item_name
+ in
+ let back_no_suffix = false in
+ let fwd_suffix = if with_back && back_no_suffix then "_fwd" else "" in
+ let fwd = [ { rg = None; extract_name = basename ^ fwd_suffix } ] in
+ let back_suffix = if with_back && back_no_suffix then "" else "_back" in
+ let back =
+ if with_back then
+ [ { rg = rg0; extract_name = basename ^ back_suffix } ]
+ else []
+ in
+ (item_name, fwd @ back)
+ in
+ List.map mk_method methods
+ in
+ {
+ rust_name;
+ extract_name;
+ constructor;
+ parent_clauses;
+ consts;
+ types;
+ methods;
+ }
+ in
+ [
+ (* Deref *)
+ mk_trait "core::ops::deref::Deref" ~types:[ "Target" ]
+ ~methods:[ ("deref", true) ]
+ ();
+ (* DerefMut *)
+ mk_trait "core::ops::deref::DerefMut" ~parent_clauses:[ "derefInst" ]
+ ~methods:[ ("deref_mut", true) ]
+ ();
+ (* Index *)
+ mk_trait "core::ops::index::Index" ~types:[ "Output" ]
+ ~methods:[ ("index", true) ]
+ ();
+ (* IndexMut *)
+ mk_trait "core::ops::index::IndexMut" ~parent_clauses:[ "indexInst" ]
+ ~methods:[ ("index_mut", true) ]
+ ();
+ (* Sealed *)
+ mk_trait "core::slice::index::private_slice_index::Sealed" ();
+ (* SliceIndex *)
+ mk_trait "core::slice::index::SliceIndex" ~parent_clauses:[ "sealedInst" ]
+ ~types:[ "Output" ]
+ ~methods:
+ [
+ ("get", true);
+ ("get_mut", true);
+ ("get_unchecked", false);
+ ("get_unchecked_mut", false);
+ ("index", true);
+ ("index_mut", true);
+ ]
+ ();
+ ]
+
+let mk_builtin_trait_decls_map () =
+ NameMatcherMap.of_list
+ (List.map
+ (fun info -> (info.rust_name, info))
+ (builtin_trait_decls_info ()))
+
+let builtin_trait_decls_map = mk_memoized mk_builtin_trait_decls_map
+
+let builtin_trait_impls_info () : (pattern * (bool list option * string)) list =
+ let fmt (rust_name : string) ?(extract_name : string option = None)
+ ?(filter : bool list option = None) () :
+ pattern * (bool list option * string) =
+ let rust_name = parse_pattern rust_name in
+ let name =
+ let name =
+ match extract_name with
+ | None -> pattern_to_trait_impl_extract_name rust_name
+ | Some name -> split_on_separator name
+ in
+ flatten_name name
+ in
+ (rust_name, (filter, name))
+ in
+ [
+ (* core::ops::Deref<alloc::boxed::Box<T>> *)
+ fmt "core::ops::deref::Deref<Box<@T>>"
+ ~extract_name:(Some "alloc::boxed::Box::coreopsDerefInst") ();
+ (* core::ops::DerefMut<alloc::boxed::Box<T>> *)
+ fmt "core::ops::deref::DerefMut<Box<@T>>"
+ ~extract_name:(Some "alloc::boxed::Box::coreopsDerefMutInst") ();
+ (* core::ops::index::Index<[T], I> *)
+ fmt "core::ops::index::Index<[@T], @I>"
+ ~extract_name:(Some "core::ops::index::IndexSliceTIInst") ();
+ (* core::ops::index::IndexMut<[T], I> *)
+ fmt "core::ops::index::IndexMut<[@T], @I>"
+ ~extract_name:(Some "core::ops::index::IndexMutSliceTIInst") ();
+ (* core::slice::index::private_slice_index::Sealed<Range<usize>> *)
+ fmt
+ "core::slice::index::private_slice_index::Sealed<core::ops::range::Range<usize>>"
+ ~extract_name:
+ (Some "core.slice.index.private_slice_index.SealedRangeUsizeInst") ();
+ (* core::slice::index::SliceIndex<Range<usize>, [T]> *)
+ fmt "core::slice::index::SliceIndex<core::ops::range::Range<usize>, [@T]>"
+ ~extract_name:(Some "core::slice::index::SliceIndexRangeUsizeSliceTInst")
+ ();
+ (* core::ops::index::Index<[T; N], I> *)
+ fmt "core::ops::index::Index<[@T; @N], @I>"
+ ~extract_name:(Some "core::ops::index::IndexArrayInst") ();
+ (* core::ops::index::IndexMut<[T; N], I> *)
+ fmt "core::ops::index::IndexMut<[@T; @N], @I>"
+ ~extract_name:(Some "core::ops::index::IndexMutArrayIInst") ();
+ (* core::slice::index::private_slice_index::Sealed<usize> *)
+ fmt "core::slice::index::private_slice_index::Sealed<usize>"
+ ~extract_name:
+ (Some "core::slice::index::private_slice_index::SealedUsizeInst") ();
+ (* core::slice::index::SliceIndex<usize, [T]> *)
+ fmt "core::slice::index::SliceIndex<usize, [@T]>"
+ ~extract_name:(Some "core::slice::index::SliceIndexUsizeSliceTInst") ();
+ (* core::ops::index::Index<alloc::vec::Vec<T>, T> *)
+ fmt "core::ops::index::Index<alloc::vec::Vec<@T, @A>, @T>"
+ ~extract_name:(Some "alloc::vec::Vec::coreopsindexIndexInst")
+ ~filter:(Some [ true; true; false ])
+ ();
+ (* core::ops::index::IndexMut<alloc::vec::Vec<T>, T> *)
+ fmt "core::ops::index::IndexMut<alloc::vec::Vec<@T, @A>, @T>"
+ ~extract_name:(Some "alloc::vec::Vec::coreopsindexIndexMutInst")
+ ~filter:(Some [ true; true; false ])
+ ();
+ ]
+
+let mk_builtin_trait_impls_map () =
+ let m = NameMatcherMap.of_list (builtin_trait_impls_info ()) in
+ log#ldebug
+ (lazy
+ ("builtin_trait_impls_map:\n"
+ ^ NameMatcherMap.to_string (fun _ -> "...") m));
+ m
+
+let builtin_trait_impls_map = mk_memoized mk_builtin_trait_impls_map