src/heap/sharedMem.ml

(*
 * Copyright (c) Meta Platforms, Inc. and affiliates.
 *
 * This source code is licensed under the MIT license found in the
 * LICENSE file in the root directory of this source tree.
 *)

(* Don't change the ordering of this record without updating hh_shared_init in
 * hh_shared.c, which indexes into config objects *)
type config = {
  heap_size: int;
  hash_table_pow: int;
  log_level: int;
}

type handle = Unix.file_descr

type table_stats = {
  nonempty_slots: int;
  used_slots: int;
  slots: int;
}

type buf = (char, Bigarray.int8_unsigned_elt, Bigarray.c_layout) Bigarray.Array1.t

(* Phantom type parameter provides type-safety to callers of this API.
 * Internally, these are all just ints, so be careful! *)
type +'k addr = int

(* The integer values corresponding to these tags are encoded in the low byte
 * of object headers. Any changes made here must be kept in sync with
 * hh_shared.c -- e.g., the should_scan function. *)
type tag =
  | Entity_tag (* 0 *)
  | Addr_tbl_tag
  | Untyped_tag
  | Typed_tag
  | Source_file_tag
  | Json_file_tag
  | Resource_file_tag
  | Lib_file_tag
  | Haste_module_tag
  | File_module_tag
  (* tags defined below this point are scanned for pointers *)
  | String_tag (* 10 *)
  | Int64_tag
  | Docblock_tag
  | ALoc_table_tag
  | Type_sig_tag
  (* tags defined above this point are serialized+compressed *)
  | Serialized_tag (* 15 *)
  | Serialized_resolved_requires_tag
  | Serialized_ast_tag
  | Serialized_file_sig_tag
  | Serialized_exports_tag

let heap_ref : buf option ref = ref None

(* constant constructors are integers *)
let tag_val : tag -> int = Obj.magic

(* double-check integer values are consistent with hh_shared.c *)
let () =
  assert (tag_val Entity_tag = 0);
  assert (tag_val String_tag = 10);
  assert (tag_val Serialized_tag = 15)

exception Out_of_shared_memory

exception Hash_table_full

exception Heap_full

exception Failed_memfd_init of Unix.error

let () =
  Callback.register_exception "out_of_shared_memory" Out_of_shared_memory;
  Callback.register_exception "hash_table_full" Hash_table_full;
  Callback.register_exception "heap_full" Heap_full;
  Callback.register_exception "failed_memfd_init" (Failed_memfd_init Unix.EINVAL)

(*****************************************************************************)
(* Initializes the shared memory. Must be called before forking. *)
(*****************************************************************************)
external init : config -> num_workers:int -> buf * handle = "hh_shared_init"

let init config ~num_workers =
  try
    let (heap, handle) = init config ~num_workers in
    heap_ref := Some heap;
    Ok handle
  with
  | Failed_memfd_init _ -> Error ()

external connect : handle -> worker_id:int -> buf = "hh_connect"

let connect handle ~worker_id =
  let heap = connect handle ~worker_id in
  heap_ref := Some heap
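
(* Usage sketch (illustrative, not part of this module): a server process
 * initializes shared memory before forking workers, which then connect. The
 * config values here are arbitrary assumptions.
 *
 *   let config = { heap_size = 1024 * 1024 * 1024; hash_table_pow = 19; log_level = 0 } in
 *   match init config ~num_workers:4 with
 *   | Error () -> failwith "shared memory init failed"
 *   | Ok handle ->
 *     (* after Unix.fork, in worker number i: *)
 *     connect handle ~worker_id:i
 *)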

(*****************************************************************************)
(* The current state of the incremental GC. *)
(*****************************************************************************)
type gc_phase =
  | Phase_idle
  | Phase_mark
  | Phase_sweep

external gc_phase : unit -> gc_phase = "hh_gc_phase"

(*****************************************************************************)
(* The size of the dynamically allocated shared memory section *)
(*****************************************************************************)
external heap_size : unit -> int = "hh_used_heap_size"

(*****************************************************************************)
(* The size of any new allocations since the previous full collection cycle *)
(*****************************************************************************)
external new_alloc_size : unit -> int = "hh_new_alloc_size"

(*****************************************************************************)
(* The size of all free space in shared memory *)
(*****************************************************************************)
external free_size : unit -> int = "hh_free_heap_size"

(*****************************************************************************)
(* Force a new GC cycle to start. Precondition: gc_phase must be Phase_idle *)
(*****************************************************************************)
external start_cycle : unit -> unit = "hh_start_cycle"

(*****************************************************************************)
(* Perform a fixed amount of marking work. The return value is the unused
 * work budget. If marking completed within the given budget, the returned
 * value will be greater than 0. Precondition: gc_phase must be Phase_mark. *)
(*****************************************************************************)
external mark_slice : int -> int = "hh_mark_slice"

(*****************************************************************************)
(* Perform a fixed amount of sweeping work. The return value is the unused
 * work budget. If sweeping completed within the given budget, the returned
 * value will be greater than 0. Precondition: gc_phase must be Phase_sweep. *)
(*****************************************************************************)
external sweep_slice : int -> int = "hh_sweep_slice"

(*****************************************************************************)
(* Compact the heap, sliding objects "to the left" over any free objects
 * discovered during the previous full mark and sweep. Precondition: gc_phase
 * must be Phase_idle. *)
(*****************************************************************************)
external hh_compact : unit -> unit = "hh_compact"

(*****************************************************************************)
(* The logging level for shared memory statistics *)
(* 0 = nothing *)
(* 1 = log totals, averages, min, max bytes marshalled and unmarshalled *)
(*****************************************************************************)
external hh_log_level : unit -> int = "hh_log_level"

(*****************************************************************************)
(* The total number of slots in our hashtable *)
(*****************************************************************************)
external hash_stats : unit -> table_stats = "hh_hash_stats"

external get_next_version : unit -> int = "hh_next_version" [@@noalloc]

(* Any entities which were advanced since the last commit will be committed
 * after this. Committing the transaction requires synchronization with
 * readers and writers. *)
external commit_transaction : unit -> unit = "hh_commit_transaction"

(* Iterate the shared hash table. *)
external hh_iter : (_ addr -> unit) -> unit = "hh_iter"

let on_compact = ref (fun _ _ -> ())

let compact_helper () =
  let k = !on_compact () in
  hh_compact ();
  k ()

(* GC will attempt to keep the overhead of garbage to no more than 20%. Before
 * we actually mark and sweep, however, we don't know how much garbage there
 * is, so we estimate.
 *
 * To estimate the amount of garbage, we consider all "new" allocations --
 * allocations since the previous mark+sweep -- to be garbage. We add that
 * number to the known free space. If that is at least 20% of the total space,
 * we will kick off a new mark and sweep pass. *)
let should_collect () =
  let estimated_garbage = free_size () + new_alloc_size () in
  estimated_garbage * 5 >= heap_size ()

(* After a full mark and sweep, we want to compact the heap if the amount of
 * free space is 20% of the scanned heap. *)
let should_compact () =
  let scanned_size = heap_size () - new_alloc_size () in
  free_size () * 5 >= scanned_size

(* Perform an incremental "slice" of GC work. The caller can control the
 * amount of work performed by passing in a smaller or larger "work" budget.
 * This function returns `true` when the GC phase was completed, and `false`
 * if there is still more work to do. *)
let collect_slice ?(force = false) work =
  let work = ref work in
  while !work > 0 do
    match gc_phase () with
    | Phase_idle ->
      if force || should_collect () then
        start_cycle ()
      else
        work := 0
    | Phase_mark -> work := mark_slice !work
    | Phase_sweep ->
      ignore (sweep_slice !work);
      work := 0
  done;
  let is_idle = gc_phase () = Phase_idle in
  (* The GC will be in idle phase under two conditions: (1) we started in idle
   * and did not start a new collect cycle, or (2) we just finished a sweep.
   * In condition (1) should_compact should return false, so we will only
   * possibly compact in condition (2), assuming 20% of the scanned heap is
   * free. *)
  if is_idle && should_compact () then compact_helper ();
  is_idle

(* Perform a full GC pass, or complete an in-progress GC pass. This call
 * bypasses the `should_collect` heuristic and will instead always trigger a
 * new mark and sweep pass if the GC is currently idle. *)
let collect_full () = while not (collect_slice ~force:true max_int) do () done

let finish_cycle () =
  while gc_phase () == Phase_mark do
    ignore (mark_slice max_int)
  done;
  while gc_phase () == Phase_sweep do
    ignore (sweep_slice max_int)
  done

(* Perform a full compaction of shared memory, such that no heap space is
 * wasted. We finish the current cycle, if one is in progress, then perform a
 * full mark and sweep pass before compacting. This ensures that any "floating
 * garbage" from a previous GC pass is also collected. *)
let compact () =
  finish_cycle ();
  start_cycle ();
  finish_cycle ();
  compact_helper ()
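
(* Usage sketch (illustrative, not part of this module): a long-running
 * process might drive the incremental GC from its main loop, spending a
 * bounded work budget per iteration so collection interleaves with real
 * work. The budget of 10000 and `serve_one_request` are assumptions.
 *
 *   let rec loop () =
 *     serve_one_request ();
 *     ignore (collect_slice 10000);
 *     loop ()
 *)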

(* Compute size of values in the garbage-collected heap *)
let value_size r =
  let w = Obj.reachable_words r in
  w * (Sys.word_size / 8)

let debug_value_size = value_size

module type Key = sig
  type t

  val to_string : t -> string

  val compare : t -> t -> int
end

module type Value = sig
  type t

  val description : string
end

module type AddrValue = sig
  type t
end

(* The shared memory segment contains a single shared hash table. This functor
 * creates modules that give the illusion of multiple hash tables by adding a
 * prefix to each key. *)
module HashtblSegment (Key : Key) = struct
  type hash = string

  external hh_add : hash -> 'k addr -> 'k addr = "hh_add"

  external hh_mem : hash -> bool = "hh_mem"

  external hh_get : hash -> _ addr = "hh_get"

  external hh_remove : hash -> unit = "hh_remove"

  external hh_move : hash -> hash -> unit = "hh_move"

  let hh_add x y = WorkerCancel.with_worker_exit (fun () -> hh_add x y)

  let hh_mem x = WorkerCancel.with_worker_exit (fun () -> hh_mem x)

  let hh_get x = WorkerCancel.with_worker_exit (fun () -> hh_get x)

  (* The hash table supports a kind of versioning, where a key can be
   * "oldified" temporarily while a new value for the same key is written. The
   * oldified key can then be revived or removed. We ensure that the new and
   * old entries occupy distinct hash table slots by giving them distinct
   * prefixes. *)
  let new_prefix = Prefix.make ()

  let old_prefix = Prefix.make ()

  let new_hash_of_key k = Digest.string (Prefix.make_key new_prefix (Key.to_string k))

  let old_hash_of_key k = Digest.string (Prefix.make_key old_prefix (Key.to_string k))

  let add k addr = hh_add (new_hash_of_key k) addr

  let mem k = hh_mem (new_hash_of_key k)

  let mem_old k = hh_mem (old_hash_of_key k)

  let get_hash hash =
    if hh_mem hash then
      Some (hh_get hash)
    else
      None

  let get k = get_hash (new_hash_of_key k)

  let get_old k = get_hash (old_hash_of_key k)

  let remove k =
    let new_hash = new_hash_of_key k in
    if hh_mem new_hash then hh_remove new_hash

  (* We oldify entries that might be changed by an operation, which involves
   * moving the address of the current heap value from the "new" key to the
   * "old" key. The operation might then write an updated value to the "new"
   * key.
   *
   * This function is strange, though. Why, if a new entry does not exist, do
   * we try to remove an extant old entry? Why should an old entry even exist
   * at this point? I was not able to find a clear justification for this
   * behavior from source control history... *)
  let oldify k =
    let new_hash = new_hash_of_key k in
    let old_hash = old_hash_of_key k in
    if hh_mem new_hash then
      hh_move new_hash old_hash
    else if hh_mem old_hash then
      hh_remove old_hash

  (* After an operation which first oldified some values, we might decide that
   * the original values are still good enough. In this case we can move the
   * old key back into the new slot.
   *
   * hh_move expects the destination slot to be empty, but the operation might
   * have written a new value before deciding to roll back, so we first check
   * for and remove any new key. *)
  let revive k =
    let new_hash = new_hash_of_key k in
    let old_hash = old_hash_of_key k in
    if hh_mem new_hash then hh_remove new_hash;
    if hh_mem old_hash then hh_move old_hash new_hash

  (* After an operation which first oldified some values, if we decide to
   * commit those changes, we can remove the old key. Generally the hash table
   * entry keeps the corresponding heap object alive, so removing this
   * reference will allow the GC to clean up the old value in the heap. *)
  let remove_old k =
    let old_hash = old_hash_of_key k in
    if hh_mem old_hash then hh_remove old_hash
end
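
(* Usage sketch (illustrative, not part of this module): the intended
 * oldify/revive/remove_old protocol for a speculative update, where `Tbl` is
 * an instantiation of this functor and `new_addr` points at freshly written
 * heap data.
 *
 *   Tbl.oldify k;          (* stash the current value under the old key *)
 *   ignore (Tbl.add k new_addr);   (* tentatively write the new value *)
 *   if success then
 *     Tbl.remove_old k     (* commit: drop the stashed value *)
 *   else
 *     Tbl.revive k         (* roll back: restore the stashed value *)
 *)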

(*****************************************************************************)
(* All the caches are functors returning a module of the following signature *)
(*****************************************************************************)
module type DebugCacheType = sig
  val get_size : unit -> int
end

module type CacheType = sig
  include DebugCacheType

  type key

  type value

  val add : key -> value -> unit

  val get : key -> value option

  val remove : key -> unit

  val clear : unit -> unit
end

(*****************************************************************************)
(* The signatures of what we are actually going to expose to the user *)
(*****************************************************************************)
module type NoCache = sig
  type key

  type value

  module KeySet : Flow_set.S with type elt = key

  val add : key -> value -> unit

  val get : key -> value option

  val get_old : key -> value option

  val remove_old_batch : KeySet.t -> unit

  val remove : key -> unit

  val remove_batch : KeySet.t -> unit

  val mem : key -> bool

  val mem_old : key -> bool

  val oldify : key -> unit

  val oldify_batch : KeySet.t -> unit

  val revive_batch : KeySet.t -> unit
end

module type LocalCache = sig
  module DebugL1 : DebugCacheType

  module DebugL2 : DebugCacheType

  type key

  type value

  val add : key -> value -> unit

  val get : key -> value option

  val remove : key -> unit

  val clear : unit -> unit
end

module type WithCache = sig
  include NoCache

  val write_around : key -> value -> unit

  val get_no_cache : key -> value option

  module DebugCache : LocalCache with type key = key and type value = value
end

(*****************************************************************************)
(* A functor returning an implementation of the S module without caching. *)
(*****************************************************************************)
module NoCache (Key : Key) (Value : Value) :
  NoCache
    with type key = Key.t
     and type value = Value.t
     and module KeySet = Flow_set.Make(Key) = struct
  module Tbl = HashtblSegment (Key)
  module KeySet = Flow_set.Make (Key)

  type key = Key.t

  type value = Value.t

  (* Returns address into the heap, alloc size, and orig size *)
  external hh_store : Value.t -> int -> _ addr * int * int = "hh_store_ocaml"

  external hh_deserialize : _ addr -> Value.t = "hh_deserialize"

  external hh_get_size : _ addr -> int = "hh_get_size"

  let hh_store x = WorkerCancel.with_worker_exit (fun () -> hh_store x (tag_val Serialized_tag))

  let hh_deserialize x = WorkerCancel.with_worker_exit (fun () -> hh_deserialize x)

  let log_serialize compressed original =
    let compressed = float compressed in
    let original = float original in
    let saved = original -. compressed in
    let ratio = compressed /. original in
    Measure.sample (Value.description ^ " (bytes serialized into shared heap)") compressed;
    Measure.sample "ALL bytes serialized into shared heap" compressed;
    Measure.sample (Value.description ^ " (bytes saved in shared heap due to compression)") saved;
    Measure.sample "ALL bytes saved in shared heap due to compression" saved;
    Measure.sample (Value.description ^ " (shared heap compression ratio)") ratio;
    Measure.sample "ALL bytes shared heap compression ratio" ratio

  let log_deserialize l r =
    let sharedheap = float l in
    Measure.sample (Value.description ^ " (bytes deserialized from shared heap)") sharedheap;
    Measure.sample "ALL bytes deserialized from shared heap" sharedheap;
    if hh_log_level () > 1 then (
      (* value_size is a bit expensive to call this often, so only run with
       * log levels >= 2 *)
      let localheap = float (value_size r) in
      Measure.sample (Value.description ^ " (bytes allocated for deserialized value)") localheap;
      Measure.sample "ALL bytes allocated for deserialized value" localheap
    )

  let add key value =
    let (addr, compressed_size, original_size) = hh_store value in
    ignore (Tbl.add key addr);
    if hh_log_level () > 0 && compressed_size > 0 then
      log_serialize compressed_size original_size

  let mem = Tbl.mem

  let mem_old = Tbl.mem_old

  let deserialize addr =
    let value = hh_deserialize addr in
    if hh_log_level () > 0 then log_deserialize (hh_get_size addr) (Obj.repr value);
    value

  let get key =
    match Tbl.get key with
    | None -> None
    | Some addr -> Some (deserialize addr)

  let get_old key =
    match Tbl.get_old key with
    | None -> None
    | Some addr -> Some (deserialize addr)

  let remove = Tbl.remove

  let remove_batch keys = KeySet.iter remove keys

  let oldify = Tbl.oldify

  let oldify_batch keys = KeySet.iter oldify keys

  let revive_batch keys = KeySet.iter Tbl.revive keys

  let remove_old_batch keys = KeySet.iter Tbl.remove_old keys
end

module NoCacheAddr (Key : Key) (Value : AddrValue) = struct
  module Tbl = HashtblSegment (Key)
  module KeySet = Flow_set.Make (Key)

  type key = Key.t

  type value = Value.t addr

  let add = Tbl.add

  let mem = Tbl.mem

  let mem_old = Tbl.mem_old

  let get = Tbl.get

  let get_old = Tbl.get_old

  let remove = Tbl.remove

  let remove_batch keys = KeySet.iter remove keys

  let oldify = Tbl.oldify

  let oldify_batch keys = KeySet.iter oldify keys

  let revive_batch keys = KeySet.iter Tbl.revive keys

  let remove_old_batch keys = KeySet.iter Tbl.remove_old keys
end

(*****************************************************************************)
(* All the caches are configured by a module of type CacheConfig *)
(*****************************************************************************)
module type CacheConfig = sig
  type key

  type value

  (* The capacity of the cache *)
  val capacity : int
end

(*****************************************************************************)
(* A cache keeping the most frequently used objects. *)
(*****************************************************************************)
module FreqCache (Config : CacheConfig) :
  CacheType with type key := Config.key and type value := Config.value = struct
  (* The cache itself *)
  let (cache : (Config.key, int ref * Config.value) Hashtbl.t) =
    Hashtbl.create (2 * Config.capacity)

  let size = ref 0

  let get_size () = !size

  let clear () =
    Hashtbl.clear cache;
    size := 0

  (* The collection function is called when we reach twice original capacity
   * in size. When the collection is triggered, we only keep the most
   * frequently used objects.
   * So before collection: size = 2 * capacity
   * After collection: size = capacity (with the most frequently used
   * objects) *)
  let collect () =
    if !size < 2 * Config.capacity then
      ()
    else
      let l = ref [] in
      Hashtbl.iter
        begin
          fun key (freq, v) ->
            l := (key, !freq, v) :: !l
        end
        cache;
      Hashtbl.clear cache;
      l := Base.List.sort ~compare:(fun (_, x, _) (_, y, _) -> y - x) !l;
      let i = ref 0 in
      while !i < Config.capacity do
        match !l with
        | [] -> i := Config.capacity
        | (k, _freq, v) :: rl ->
          Hashtbl.replace cache k (ref 0, v);
          l := rl;
          incr i
      done;
      size := Config.capacity;
      ()

  let add x y =
    collect ();
    try
      let (freq, y') = Hashtbl.find cache x in
      incr freq;
      if y' == y then
        ()
      else
        Hashtbl.replace cache x (freq, y)
    with
    | Not_found ->
      incr size;
      let elt = (ref 0, y) in
      Hashtbl.replace cache x elt;
      ()

  let find x =
    let (freq, value) = Hashtbl.find cache x in
    incr freq;
    value

  let get x =
    try Some (find x) with
    | Not_found -> None

  let remove x =
    if Hashtbl.mem cache x then decr size;
    Hashtbl.remove cache x
end

(*****************************************************************************)
(* An ordered cache keeps the most recently used objects *)
(*****************************************************************************)
module OrderedCache (Config : CacheConfig) :
  CacheType with type key := Config.key and type value := Config.value = struct
  let (cache : (Config.key, Config.value) Hashtbl.t) = Hashtbl.create Config.capacity

  let queue = Queue.create ()

  let size = ref 0

  let get_size () = !size

  let clear () =
    Hashtbl.clear cache;
    size := 0;
    Queue.clear queue;
    ()

  let add x y =
    ( if !size >= Config.capacity then
      (* Remove oldest element - if it's still around. *)
      let elt = Queue.pop queue in
      if Hashtbl.mem cache elt then (
        decr size;
        Hashtbl.remove cache elt
      )
    );
    (* Add the new element, but bump the size only if it's a new addition. *)
    Queue.push x queue;
    if not (Hashtbl.mem cache x) then incr size;
    Hashtbl.replace cache x y

  let find x = Hashtbl.find cache x

  let get x =
    try Some (find x) with
    | Not_found -> None

  let remove x =
    try
      if Hashtbl.mem cache x then decr size;
      Hashtbl.remove cache x
    with
    | Not_found -> ()
end

(*****************************************************************************)
(* Every time we create a new cache, a function that knows how to clear the
 * cache is registered in the "invalidate_callback_list" global. *)
(*****************************************************************************)
let invalidate_callback_list = ref []

module LocalCache (Config : CacheConfig) = struct
  type key = Config.key

  type value = Config.value

  (* Young values cache *)
  module L1 = OrderedCache (Config)

  (* Frequent values cache *)
  module L2 = FreqCache (Config)

  (* These are exposed only for tests *)
  module DebugL1 = L1
  module DebugL2 = L2

  let add x y =
    L1.add x y;
    L2.add x y

  let get x =
    match L1.get x with
    | None ->
      (match L2.get x with
      | None -> None
      | Some v as result ->
        L1.add x v;
        result)
    | Some v as result ->
      L2.add x v;
      result

  let remove x =
    L1.remove x;
    L2.remove x

  let clear () =
    L1.clear ();
    L2.clear ()
end
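
(* Usage sketch (illustrative, not part of this module): instantiating the
 * two-level cache directly. The key/value types and capacity here are
 * arbitrary assumptions.
 *
 *   module IntCache = LocalCache (struct
 *     type key = int
 *
 *     type value = string
 *
 *     let capacity = 100
 *   end)
 *
 *   let () =
 *     IntCache.add 1 "one";
 *     assert (IntCache.get 1 = Some "one")
 *)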

(*****************************************************************************)
(* A functor returning an implementation of the S module with caching.
 * We need to avoid constantly deserializing types, because it costs us too
 * much time. The caches keep a deserialized version of the types. *)
(*****************************************************************************)
module WithCache (Key : Key) (Value : Value) :
  WithCache
    with type key = Key.t
     and type value = Value.t
     and module KeySet = Flow_set.Make(Key) = struct
  module Direct = NoCache (Key) (Value)

  type key = Direct.key

  type value = Direct.value

  module KeySet = Direct.KeySet

  module Cache = LocalCache (struct
    type nonrec key = key

    type nonrec value = value

    let capacity = 1000
  end)

  (* This is exposed for tests *)
  module DebugCache = Cache

  let add x y =
    Direct.add x y;
    Cache.add x y

  let get_no_cache = Direct.get

  let write_around x y =
    (* Note that we do not need to do any cache invalidation here because
     * Direct.add is a no-op if the key already exists. *)
    Direct.add x y

  let log_hit_rate ~hit =
    Measure.sample
      (Value.description ^ " (cache hit rate)")
      ( if hit then
        1.
      else
        0.
      );
    Measure.sample
      "(ALL cache hit rate)"
      ( if hit then
        1.
      else
        0.
      )

  let get x =
    match Cache.get x with
    | None ->
      let result =
        match Direct.get x with
        | None -> None
        | Some v as result ->
          Cache.add x v;
          result
      in
      if hh_log_level () > 0 then log_hit_rate ~hit:false;
      result
    | Some _ as result ->
      if hh_log_level () > 0 then log_hit_rate ~hit:true;
      result

  (* We don't cache old objects, they are not accessed often enough. *)
  let get_old = Direct.get_old

  let mem_old = Direct.mem_old

  let mem x =
    match get x with
    | None -> false
    | Some _ -> true

  let oldify key =
    Direct.oldify key;
    Cache.remove key

  let oldify_batch keys =
    Direct.oldify_batch keys;
    KeySet.iter Cache.remove keys

  let revive_batch keys =
    Direct.revive_batch keys;
    KeySet.iter Cache.remove keys

  let remove x =
    Direct.remove x;
    Cache.remove x

  let remove_batch xs = KeySet.iter remove xs

  let () =
    invalidate_callback_list :=
      begin
        fun () -> Cache.clear ()
      end
      :: !invalidate_callback_list

  let remove_old_batch = Direct.remove_old_batch
end

module NewAPI = struct
  type chunk = {
    heap: buf;
    mutable next_addr: int;
    mutable remaining_size: int;
  }

  type heap_string

  type heap_int64

  type 'a entity

  type 'a addr_tbl

  type ast

  type docblock

  type aloc_table

  type type_sig

  type file_sig

  type exports

  type resolved_requires

  type +'a parse

  type file

  type haste_module

  type file_module

  type size = int

  let bsize_wsize bsize = bsize * Sys.word_size / 8

  let addr_offset addr size = addr + bsize_wsize size

  let get_heap () =
    match !heap_ref with
    | None -> failwith "get_heap: not connected"
    | Some heap -> heap

  external alloc : size -> _ addr = "hh_ml_alloc"

  let alloc size f =
    let addr = alloc size in
    let chunk = { heap = get_heap (); next_addr = addr; remaining_size = size } in
    let x = f chunk in
    (* Ensure allocated space was initialized. *)
    assert (chunk.remaining_size = 0);
    assert (chunk.next_addr = addr_offset addr size);
    x

  (** Primitives

      These low-level functions write to and read from the shared heap
      directly. Prefer using interfaces based on the `chunk` APIs, which
      ensure that the destination has been allocated. Also prefer higher-level
      APIs below. *)

  external buf_read_int8 : buf -> int -> int = "%caml_ba_ref_1"

  external buf_write_int8 : buf -> int -> int -> unit = "%caml_ba_set_1"

  external buf_read_int64 : buf -> int -> int64 = "%caml_bigstring_get64"

  external buf_write_int64 : buf -> int -> int64 -> unit = "%caml_bigstring_set64"

  (* Read a string from the heap at the specified address with the specified
   * size (in words). This read is not bounds checked or type checked; the
   * caller must ensure that the given destination contains string data. *)
  external unsafe_read_string : _ addr -> int -> string = "hh_read_string"

  (* Write a string at the specified address in the heap. This write is not
   * bounds checked; the caller must ensure the given destination has already
   * been allocated. *)
  external unsafe_write_string_at : _ addr -> string -> unit = "hh_write_string" [@@noalloc]

  external unsafe_write_bytes_at : _ addr -> bytes -> pos:int -> len:int -> unit = "hh_write_bytes"
    [@@noalloc]

  external compare_exchange_weak : _ addr -> int -> int -> bool = "hh_compare_exchange_weak"
    [@@noalloc]

  (** Addresses *)

  let addr_size = 1

  (* Addresses are relative to the hashtbl pointer, so the null address
   * actually points to the hash field of the first hashtbl entry, which is
   * never a meaningful address, so we can use it to represent "missing" or
   * similar.
   *
   * Naturally, we need to be careful not to dereference the null addr! Any
   * internal use of null should be hidden from callers of this module. *)
  let null_addr = 0

  (* Write an address at a specified address in the heap. The caller must
   * ensure the given destination has already been allocated. *)
  let unsafe_write_addr_at heap dst addr = buf_write_int64 heap dst (Int64.of_int addr)

  (* Write an address into the given chunk and advance the chunk address. This
   * write is not bounds checked; the caller must ensure the given destination
   * has already been allocated. *)
  let unsafe_write_addr chunk addr =
    unsafe_write_addr_at chunk.heap chunk.next_addr addr;
    chunk.next_addr <- addr_offset chunk.next_addr addr_size

  (* Read an address from the heap. *)
  let read_addr heap addr =
    let addr64 = buf_read_int64 heap addr in
    (* double-check that the data looks like an address *)
    assert (Int64.logand addr64 1L = 0L);
    Int64.to_int addr64

  (** Headers *)

  let header_size = 1

  let with_header_size f x = header_size + f x

  (* Write a header at a specified address in the heap. The caller must ensure
   * the given destination has already been allocated.
   *
   * The low byte of the header includes a 6-bit tag and 2 GC bits, initially
   * 0b01, or "white." See hh_shared.c for more about the GC. The size of the
   * object in words is stored in the remaining space. *)
  let unsafe_write_header_at heap dst tag obj_size =
    let tag = Int64.of_int (tag_val tag) in
    let obj_size = Int64.of_int obj_size in
    let ( lsl ) = Int64.shift_left in
    let ( lor ) = Int64.logor in
    let hd = (obj_size lsl 8) lor (tag lsl 2) lor 1L in
    buf_write_int64 heap dst hd

  (* Consume space in the chunk for the object described by the given header,
   * write the header, advance the chunk address, and return the address of
   * the header. This function should be called before writing any heap
   * object. *)
  let write_header chunk tag obj_size =
    let size = header_size + obj_size in
    chunk.remaining_size <- chunk.remaining_size - size;
    assert (chunk.remaining_size >= 0);
    let addr = chunk.next_addr in
    unsafe_write_header_at chunk.heap addr tag obj_size;
    chunk.next_addr <- addr_offset addr header_size;
    addr
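
  (* Worked example (illustrative): the header word for a 2-word String_tag
   * object. With obj_size = 2 and tag_val String_tag = 10:
   *
   *   (2 lsl 8) lor (10 lsl 2) lor 0b01 = 0x200 lor 0x28 lor 0x1 = 0x229
   *
   * The low two bits hold the GC color (initially 0b01, so the lsb is set),
   * bits 2-7 hold the 6-bit tag, and the object size in words occupies the
   * remaining bits. *)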

  (* Similar to `unsafe_write_header_at` above, but the header format is
   * different.
   *
   * The low byte contains the same 6-bit tag and 2 GC bits, but the remaining
   * space contains two sizes: the size of the object in words as well as the
   * size (in words) of the buffer needed to hold the decompressed data.
   *
   * Is 56 bits enough space to store the serialized size and decompress
   * capacity?
   *
   * In the worst case, we try to compress uncompressible input of
   * LZ4_MAX_INPUT_SIZE, consuming the entire compress bound. That would be
   * 0x7E7E7E8E bytes compressed size.
   *
   * NOTE: The compressed size might actually be bigger than the serialized
   * size, in a worst case scenario where the input is not compressible. This
   * shouldn't happen in practice, but we account for it in the worst case.
   *
   * If we store the size in words instead of bytes, the max size is 0xFCFCFD2
   * words, which fits in 2^28, so we can fit both sizes (in words) in 56
   * bits.
   *
   * All this is somewhat academic, since we have bigger problems if we're
   * trying to store 2 gig entries. *)
  let unsafe_write_serialized_header_at heap dst tag obj_size decompress_capacity =
    let tag = Int64.of_int (tag_val tag) in
    let obj_size = Int64.of_int obj_size in
    let decompress_capacity = Int64.of_int decompress_capacity in

    (* Just in case the math above doesn't check out *)
    assert (obj_size < 0x10000000L);
    assert (decompress_capacity < 0x10000000L);

    let ( lsl ) = Int64.shift_left in
    let ( lor ) = Int64.logor in
    let hd = (obj_size lsl 36) lor (decompress_capacity lsl 8) lor (tag lsl 2) lor 1L in
    buf_write_int64 heap dst hd

  (* See `write_header` above *)
  let write_serialized_header chunk tag obj_size decompress_capacity =
    let size = header_size + obj_size in
    chunk.remaining_size <- chunk.remaining_size - size;
    assert (chunk.remaining_size >= 0);
    let addr = chunk.next_addr in
    unsafe_write_serialized_header_at chunk.heap addr tag obj_size decompress_capacity;
    chunk.next_addr <- addr_offset addr header_size;
    addr

  (* Read a header from the heap. The low 2 bits of the header are reserved
   * for GC and not used in OCaml. *)
  let read_header heap addr =
    let hd64 = buf_read_int64 heap addr in
    (* Double-check that the data looks like a header. All reachable headers
     * will have the lsb set. *)
    assert (Int64.(logand hd64 1L = 1L));
    Int64.(to_int (shift_right_logical hd64 2))

  let obj_tag hd = hd land 0x3F

  let obj_size hd = hd lsr 6

  let assert_tag hd tag = assert (obj_tag hd = tag_val tag)

  let read_header_checked heap tag addr =
    let hd = read_header heap addr in
    assert_tag hd tag;
    hd

  (** Strings *)

  (* Obj used as an efficient way to get at the word size of an OCaml string
   * directly from the block header, since that's the size we need. *)
  let string_size s = Obj.size (Obj.repr s)

  (* Write a string into the given chunk and advance the chunk address. This
   * write is not bounds checked; the caller must ensure the given destination
   * has already been allocated. *)
  let unsafe_write_string chunk s =
    unsafe_write_string_at chunk.next_addr s;
    chunk.next_addr <- addr_offset chunk.next_addr (string_size s)

  let write_string chunk s =
    let heap_string = write_header chunk String_tag (string_size s) in
    unsafe_write_string chunk s;
    heap_string

  let read_string_generic tag addr offset =
    let hd = read_header_checked (get_heap ()) tag addr in
    let str_addr = addr_offset addr (header_size + offset) in
    let str_size = obj_size hd - offset in
    unsafe_read_string str_addr str_size

  let read_string addr = read_string_generic String_tag addr 0
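
  (* Usage sketch (illustrative, not part of this module): allocating exactly
   * enough space for one string object and reading it back.
   *
   *   let store_string s =
   *     alloc (with_header_size string_size s) (fun chunk -> write_string chunk s)
   *
   *   let roundtrip s = assert (read_string (store_string s) = s)
   *)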

  (** Int64 *)

  let int64_size = 1

  (* Write an int64 into the given chunk and advance the chunk address. *)
  let unsafe_write_int64 chunk n =
    buf_write_int64 chunk.heap chunk.next_addr n;
    chunk.next_addr <- addr_offset chunk.next_addr int64_size

  let write_int64 chunk n =
    let addr = write_header chunk Int64_tag int64_size in
    unsafe_write_int64 chunk n;
    addr

  let read_int64 addr =
    let heap = get_heap () in
    let _ = read_header_checked heap Int64_tag addr in
    buf_read_int64 heap (addr_offset addr header_size)

  (** Address tables *)

  let addr_tbl_size xs = addr_size * Array.length xs

  let write_addr_tbl f chunk xs =
    if Array.length xs = 0 then
      null_addr
    else
      let size = addr_tbl_size xs in
      let map = write_header chunk Addr_tbl_tag size in
      chunk.next_addr <- addr_offset chunk.next_addr size;
      Array.iteri
        (fun i x ->
          let addr = f chunk x in
          unsafe_write_addr_at chunk.heap (addr_offset map (header_size + i)) addr)
        xs;
      map

  let read_addr_tbl_generic f addr init =
    if addr = null_addr then
      init 0 (fun _ -> failwith "empty")
    else
      let heap = get_heap () in
      let hd = read_header_checked heap Addr_tbl_tag addr in
      init (obj_size hd) (fun i -> f (read_addr heap (addr_offset addr (header_size + i))))

  let read_addr_tbl f addr = read_addr_tbl_generic f addr Array.init

  (** Optionals *)

  let opt_none = null_addr

  let is_none addr = addr == opt_none

  let read_opt addr =
    if is_none addr then
      None
    else
      Some addr
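
  (* Usage sketch (illustrative, not part of this module): storing a non-empty
   * array of strings as an address table. The caller budgets for the table
   * itself plus every element written through the callback.
   *
   *   let store_strings xs =
   *     let size =
   *       with_header_size addr_tbl_size xs
   *       + Array.fold_left (fun acc s -> acc + with_header_size string_size s) 0 xs
   *     in
   *     alloc size (fun chunk -> write_addr_tbl write_string chunk xs)
   *
   * Note the sketch assumes a non-empty `xs`: for an empty array,
   * write_addr_tbl returns null_addr without consuming any space, so the
   * alloc assertion would fail. *)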

  (** Entities
   *
   * We often want to represent some entity, like a file, where we can write
   * new data while keeping the old data around. For example, during a recheck
   * we process updates and write new data while serving IDE requests from the
   * committed data.
   *
   * Entities are a versioned data structure that supports storing up to two
   * versions at any point in time: a "committed" and a "latest" version.
   *
   * Each entity stores its version number. There is also a global version
   * counter. Each version corresponds to a "slot" which is either 0 or 1. We
   * compute the slot from the version by taking the least significant bit.
   *
   * Entities support reading committed data concurrently with updates without
   * synchronization. The global version counter can not be updated
   * concurrently, however. *)

  let version_size = 1

  let entity_size = (2 * addr_size) + version_size

  let version_addr entity = addr_offset entity 3

  let write_entity_data heap entity_addr slot data =
    let data_addr = addr_offset entity_addr (header_size + slot) in
    let data = Option.value data ~default:null_addr in
    unsafe_write_addr_at heap data_addr data

  let write_entity chunk data =
    let addr = write_header chunk Entity_tag entity_size in
    unsafe_write_addr chunk null_addr;
    unsafe_write_addr chunk null_addr;
    let version = get_next_version () in
    unsafe_write_int64 chunk (Int64.of_int version);
    let slot = version land 1 in
    write_entity_data chunk.heap addr slot data;
    addr

  let get_entity_version heap entity = Int64.to_int (buf_read_int64 heap (version_addr entity))

  (* To write new data for an entity, we advance its version, then write the
   * new data to the appropriate slot. To support concurrent readers, we do
   * this somewhat carefully.
   *
   * A concurrent reader might observe the entity version either before we
   * write a new version or after. In either case, the reader will compute the
   * same slot value -- the committed data has not moved.
   *
   * Two concurrent writers are not supported, but could be if there is a
   * need. As is, nothing will go wrong, except that writers will race to
   * write into the data slot.
   *
   * Advancing an entity which has already been advanced to the latest version
   * will simply overwrite the previous latest data. *)
  let entity_advance entity data =
    let heap = get_heap () in
    let version = get_next_version () in
    let entity_version = get_entity_version heap entity in
    let slot =
      if entity_version >= version then
        entity_version land 1
      else
        let slot = lnot entity_version land 1 in
        let new_version = version lor slot in
        buf_write_int64 heap (version_addr entity) (Int64.of_int new_version);
        slot
    in
    write_entity_data heap entity slot data

  let entity_read_committed entity =
    let heap = get_heap () in
    let next_version = get_next_version () in
    let v = ref (get_entity_version heap entity) in
    if !v >= next_version then v := lnot !v;
    let slot = !v land 1 in
    let data = addr_offset entity (header_size + slot) in
    read_opt (read_addr heap data)

  let entity_read_latest entity =
    let heap = get_heap () in
    let entity_version = get_entity_version heap entity in
    let slot = entity_version land 1 in
    let data = addr_offset entity (header_size + slot) in
    read_opt (read_addr heap data)

  (* The next version is always an even number. Entities written to the
   * transaction for the next version will have an entity version that is
   * either equal or exactly 1 greater (see entity_advance).
   *
   * To roll back, we change the entity version to be less than the next
   * version while also alternating the slot. *)
  let entity_rollback entity =
    let heap = get_heap () in
    let next_version = get_next_version () in
    let entity_version = get_entity_version heap entity in
    let diff =
      if entity_version == next_version then
        1
      else if entity_version > next_version then
        3
      else
        0
    in
    if diff > 0 then
      let new_version = entity_version - diff in
      buf_write_int64 heap (version_addr entity) (Int64.of_int new_version)

  let entity_changed entity =
    let version = get_next_version () in
    let entity_version = get_entity_version (get_heap ()) entity in
    entity_version >= version
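
  (* Worked example (illustrative): suppose the global next version is 4 and
   * `ent` was committed at version 2, so readers compute slot 0.
   *
   *   entity_advance ent (Some new_data);
   *
   * advances ent's version to 5 (= 4 lor 1) and writes to slot 1, while
   * entity_read_committed still computes slot 0 and sees the old data. A
   * subsequent entity_rollback drops the version by 3, back to 2, making
   * slot 0 current again, whereas commit_transaction would publish slot 1. *)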

  (** Compressed OCaml values

      We store OCaml values as serialized+compressed blobs in the heap. The
      object header stores both the compressed size (in words) and the size
      (in words) of the buffer needed to hold the decompressed value.

      LZ4 decompression requires the precise compressed size in bytes. To
      recover the precise byte size, we use a trick lifted from OCaml's
      representation of strings. The last byte of the block stores a value
      which we can use to recover the byte size from the word size. If the
      value is exactly word sized, we add another word to hold this final
      byte. *)

  let prepare_write_compressed tag serialized =
    let serialized_bsize = String.length serialized in
    let compress_bound = Lz4.compress_bound serialized_bsize in
    if compress_bound = 0 then invalid_arg "value larger than max input size";
    let compressed = Bytes.create compress_bound in
    let compressed_bsize = Lz4.compress_default serialized compressed in
    let compressed_wsize = (compressed_bsize + 8) / 8 in
    let decompress_capacity = (serialized_bsize + 7) / 8 in
    let write chunk =
      let addr = write_serialized_header chunk tag compressed_wsize decompress_capacity in
      unsafe_write_bytes_at chunk.next_addr compressed ~pos:0 ~len:compressed_bsize;
      let offset_index = bsize_wsize compressed_wsize - 1 in
      buf_write_int8 chunk.heap (chunk.next_addr + offset_index) (offset_index - compressed_bsize);
      chunk.next_addr <- addr_offset chunk.next_addr compressed_wsize;
      addr
    in
    (compressed_wsize, write)

  let read_compressed tag addr =
    let heap = get_heap () in
    let hd = read_header_checked heap tag addr in
    let compressed_wsize = hd lsr 34 in
    let offset_index = bsize_wsize compressed_wsize - 1 in
    let compressed_bsize =
      offset_index - buf_read_int8 heap (addr_offset addr header_size + offset_index)
    in
    let buf = Bigarray.Array1.sub heap (addr_offset addr header_size) compressed_bsize in
    let decompress_capacity = bsize_wsize ((hd lsr 6) land 0xFFFFFFF) in
    let decompressed = Bytes.create decompress_capacity in
    let serialized_bsize = Lz4.decompress_safe buf decompressed in
    Bytes.sub_string decompressed 0 serialized_bsize

  (** ASTs *)

  let prepare_write_ast ast = prepare_write_compressed Serialized_ast_tag ast

  let read_ast addr = read_compressed Serialized_ast_tag addr

  (** Docblocks *)

  let docblock_size = string_size

  let read_docblock addr = read_string_generic Docblock_tag addr 0

  let write_docblock chunk docblock =
    let addr = write_header chunk Docblock_tag (docblock_size docblock) in
    unsafe_write_string chunk docblock;
    addr

  (** ALoc tables *)

  let aloc_table_size = string_size

  let write_aloc_table chunk tbl =
    let addr = write_header chunk ALoc_table_tag (aloc_table_size tbl) in
    unsafe_write_string chunk tbl;
    addr

  let read_aloc_table addr = read_string_generic ALoc_table_tag addr 0
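
  (* Usage sketch (illustrative, not part of this module): round-tripping a
   * serialized blob through the compressed representation. Compression
   * happens eagerly in prepare_write_compressed, so the returned size can be
   * used to budget the allocation before writing.
   *
   *   let store_ast serialized =
   *     let (size, write) = prepare_write_ast serialized in
   *     alloc (header_size + size) write
   *
   *   let roundtrip serialized = assert (read_ast (store_ast serialized) = serialized)
   *)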

  (** Type signatures *)

  (* Because the heap is word aligned, we store the size of the type sig
   * object in words. The underlying data might not be word sized, so we use a
   * trick lifted from OCaml's representation of strings. The last byte of the
   * block stores a value which we can use to recover the byte size from the
   * word size. If the value is exactly word sized, we add another word to
   * hold this final byte. *)
  let type_sig_size bsize = (bsize + 8) lsr 3

  let write_type_sig chunk bsize f =
    let size = type_sig_size bsize in
    let addr = write_header chunk Type_sig_tag size in
    let offset_index = bsize_wsize size - 1 in
    buf_write_int8 chunk.heap (addr_offset addr header_size + offset_index) (offset_index - bsize);
    let buf = Bigarray.Array1.sub chunk.heap (addr_offset addr header_size) bsize in
    f buf;
    chunk.next_addr <- addr_offset chunk.next_addr size;
    addr

  let type_sig_buf addr =
    let heap = get_heap () in
    let hd = read_header_checked heap Type_sig_tag addr in
    let offset_index = bsize_wsize (obj_size hd) - 1 in
    let bsize = offset_index - buf_read_int8 heap (addr_offset addr header_size + offset_index) in
    Bigarray.Array1.sub heap (addr_offset addr header_size) bsize

  let read_type_sig addr f = f (type_sig_buf addr)
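
  (* Worked example (illustrative): with bsize = 12 on a 64-bit system,
   * type_sig_size gives (12 + 8) lsr 3 = 2 words = 16 bytes. The trailing
   * byte at offset_index = 15 stores 15 - 12 = 3, and type_sig_buf recovers
   * bsize = 15 - 3 = 12. If bsize is exactly word sized, say 16, the size
   * rounds up to 3 words (24 bytes) so the trailing byte always exists: it
   * stores 23 - 16 = 7 and 23 - 7 = 16 is recovered. *)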

  (** File sigs *)

  let prepare_write_file_sig file_sig = prepare_write_compressed Serialized_file_sig_tag file_sig

  let read_file_sig addr = read_compressed Serialized_file_sig_tag addr

  (** Exports *)

  let prepare_write_exports exports = prepare_write_compressed Serialized_exports_tag exports

  let read_exports addr = read_compressed Serialized_exports_tag addr

  (** Resolved requires *)

  let prepare_write_resolved_requires resolved_requires =
    prepare_write_compressed Serialized_resolved_requires_tag resolved_requires

  let read_resolved_requires addr = read_compressed Serialized_resolved_requires_tag addr

  (** Field utils *)

  let set_generic offset base = unsafe_write_addr_at (get_heap ()) (offset base)

  let get_generic offset base = read_addr (get_heap ()) (offset base)

  let get_generic_opt offset base = read_opt (get_generic offset base)

  (** Parse data *)

  let untyped_parse_size = 3 * addr_size

  let typed_parse_size = 10 * addr_size

  let write_untyped_parse chunk hash haste_module =
    let haste_module = Option.value haste_module ~default:opt_none in
    let addr = write_header chunk Untyped_tag untyped_parse_size in
    unsafe_write_addr chunk hash;
    unsafe_write_addr chunk haste_module;
    unsafe_write_addr chunk null_addr (* next haste provider *);
    addr

  let write_typed_parse chunk hash haste_module exports resolved_requires =
    let haste_module = Option.value haste_module ~default:opt_none in
    let addr = write_header chunk Typed_tag typed_parse_size in
    unsafe_write_addr chunk hash;
    unsafe_write_addr chunk haste_module;
    unsafe_write_addr chunk null_addr (* next haste provider *);
    unsafe_write_addr chunk null_addr;
    unsafe_write_addr chunk null_addr;
    unsafe_write_addr chunk null_addr;
    unsafe_write_addr chunk null_addr;
    unsafe_write_addr chunk null_addr;
    unsafe_write_addr chunk exports;
    unsafe_write_addr chunk resolved_requires;
    addr

  let is_typed parse =
    let hd = read_header (get_heap ()) parse in
    obj_tag hd = tag_val Typed_tag

  let coerce_typed parse =
    if is_typed parse then
      Some parse
    else
      None

  let file_hash_addr parse = addr_offset parse 1

  let haste_module_addr parse = addr_offset parse 2

  let next_haste_provider_addr parse = addr_offset parse 3

  let ast_addr parse = addr_offset parse 4

  let docblock_addr parse = addr_offset parse 5

  let aloc_table_addr parse = addr_offset parse 6

  let type_sig_addr parse = addr_offset parse 7

  let file_sig_addr parse = addr_offset parse 8

  let exports_addr parse = addr_offset parse 9

  let resolved_requires_addr parse = addr_offset parse 10

  let get_file_hash = get_generic file_hash_addr

  let get_haste_module = get_generic_opt haste_module_addr

  let get_ast = get_generic_opt ast_addr

  let get_docblock = get_generic_opt docblock_addr

  let get_aloc_table = get_generic_opt aloc_table_addr

  let get_type_sig = get_generic_opt type_sig_addr

  let get_file_sig = get_generic_opt file_sig_addr

  let get_exports = get_generic exports_addr

  let get_resolved_requires = get_generic resolved_requires_addr

  let set_ast = set_generic ast_addr

  let set_docblock = set_generic docblock_addr

  let set_aloc_table = set_generic aloc_table_addr

  let set_type_sig = set_generic type_sig_addr

  let set_file_sig = set_generic file_sig_addr

  (** File data *)

  type file_kind =
    | Source_file
    | Json_file
    | Resource_file
    | Lib_file

  let file_tag = function
    | Source_file -> Source_file_tag
    | Json_file -> Json_file_tag
    | Resource_file -> Resource_file_tag
    | Lib_file -> Lib_file_tag

  let file_size = 4 * addr_size

  let write_file chunk kind file_name file_module parse =
    let file_module = Option.value file_module ~default:opt_none in
    let addr = write_header chunk (file_tag kind) file_size in
    unsafe_write_addr chunk file_name;
    unsafe_write_addr chunk file_module;
    unsafe_write_addr chunk parse;
    unsafe_write_addr chunk null_addr (* next file provider *);
    addr

  let file_name_addr file = addr_offset file 1

  let file_module_addr file = addr_offset file 2

  let parse_addr file = addr_offset file 3

  let next_file_provider_addr file = addr_offset file 4

  let get_file_kind file =
    let hd = read_header (get_heap ()) file in
    let tag = obj_tag hd in
    if tag = tag_val Source_file_tag then
      Source_file
    else if tag = tag_val Json_file_tag then
      Json_file
    else if tag = tag_val Resource_file_tag then
      Resource_file
    else if tag = tag_val Lib_file_tag then
      Lib_file
    else
      failwith "get_file_kind: unexpected tag"

  let get_file_name = get_generic file_name_addr

  let get_file_module = get_generic_opt file_module_addr

  let get_parse = get_generic parse_addr

  let files_equal = Int.equal

  let file_changed file = entity_changed (get_parse file)

  (** All providers *)

  let add_provider head_addr next_addr file =
    let heap = get_heap () in
    let rec loop () =
      let head = read_addr heap head_addr in
      unsafe_write_addr_at heap next_addr head;
      if not (compare_exchange_weak head_addr head file) then loop ()
    in
    loop ()

  (** Haste modules *)

  let haste_module_size = 3 * addr_size

  let write_haste_module chunk name provider =
    let addr = write_header chunk Haste_module_tag haste_module_size in
    unsafe_write_addr chunk name;
    unsafe_write_addr chunk provider;
    unsafe_write_addr chunk null_addr (* all providers *);
    addr

  let haste_modules_equal = Int.equal

  let haste_name_addr m = addr_offset m 1

  let haste_provider_addr m = addr_offset m 2

  let haste_all_providers_addr m = addr_offset m 3

  let get_haste_name = get_generic haste_name_addr

  let get_haste_provider = get_generic haste_provider_addr

  let add_haste_provider m file parse =
    let head_addr = haste_all_providers_addr m in
    let next_addr = next_haste_provider_addr parse in
    add_provider head_addr next_addr file
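
  (* Design note: add_provider is a lock-free prepend onto a singly linked
   * list. The new node's next pointer is written first, then the list head is
   * swung to the new node with a compare-and-swap; if the CAS fails because
   * another writer prepended concurrently, the loop re-reads the head and
   * retries. *)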

  (* Iterate through linked list of providers, accumulating a list. While
   * traversing, we also remove any files which are no longer providers.
   *
   * Deferred delete happens here because concurrent deletion from a linked
   * list is complicated (but possible!) and we need to iterate over all
   * providers anyway, so it's much more convenient to do it here.
   *
   * Deferred deletions _must_ be performed before a transaction commits. If a
   * transaction is rolled back, changes to the all providers list need to be
   * unwound. *)
  let get_haste_all_providers_exclusive m =
    let heap = get_heap () in
    let rec loop acc node_addr node =
      if is_none node then
        acc
      else
        let parse_ent = get_parse node in
        match entity_read_latest parse_ent with
        | Some parse when m == get_generic haste_module_addr parse ->
          (* `node` is a current provider of `m` *)
          let next_addr = next_haste_provider_addr parse in
          let next = read_addr heap next_addr in
          loop (node :: acc) next_addr next
        | _ ->
          (* `node` no longer provides `m` -- perform deferred deletion.
           * Invariant: `node` used to provide `m`, so the next item in this
           * list comes from the committed parse data. *)
          let old_parse = Option.get (entity_read_committed parse_ent) in
          assert (m == get_generic haste_module_addr old_parse);
          let next_addr = next_haste_provider_addr old_parse in
          let next = read_addr heap next_addr in
          unsafe_write_addr_at heap node_addr next;
          loop acc node_addr next
    in
    let head_addr = haste_all_providers_addr m in
    let head = read_addr heap head_addr in
    loop [] head_addr head

  (* In the case of a transaction rollback, we need to remove providers which
   * were added during the transaction.
   *
   * This function also performs deferred deletion, since we might as well. It
   * speeds up subsequent traversals.
   *
   * TODO: It is unfortunate that this function duplicates so much of the
   * logic from `get_haste_all_providers` above. It would be nice to share
   * more code, if possible. *)
  let remove_haste_provider_exclusive m file =
    let heap = get_heap () in
    let rec loop node_addr node =
      if is_none node then
        ()
      else
        let parse_ent = get_parse node in
        match entity_read_latest parse_ent with
        | Some parse when m == get_generic haste_module_addr parse ->
          let next_addr = next_haste_provider_addr parse in
          let next = read_addr heap next_addr in
          if node == file then
            unsafe_write_addr_at heap node_addr next
          else
            loop next_addr next
        | _ ->
          let old_parse = Option.get (entity_read_committed parse_ent) in
          assert (m == get_generic haste_module_addr old_parse);
          let next_addr = next_haste_provider_addr old_parse in
          let next = read_addr heap next_addr in
          unsafe_write_addr_at heap node_addr next;
          loop node_addr next
    in
    let head_addr = haste_all_providers_addr m in
    let head = read_addr heap head_addr in
    loop head_addr head

  (** File modules *)

  let file_module_size = 2 * addr_size

  let write_file_module chunk provider =
    let addr = write_header chunk File_module_tag file_module_size in
    unsafe_write_addr chunk provider;
    unsafe_write_addr chunk null_addr (* all providers *);
    addr

  let file_provider_addr m = addr_offset m 1

  let file_all_providers_addr m = addr_offset m 2

  let get_file_provider = get_generic file_provider_addr

  let add_file_provider m file =
    let head_addr = file_all_providers_addr m in
    let next_addr = next_file_provider_addr file in
    add_provider head_addr next_addr file

  (* Iterate through linked list of providers, accumulating a list. While
   * traversing, we also remove any files which are no longer providers.
   *
   * See `get_haste_all_providers_exclusive` for more details about deferred
   * deletion. *)
  let get_file_all_providers_exclusive m =
    let heap = get_heap () in
    let rec loop acc node_addr node =
      if is_none node then
        acc
      else
        let next_addr = next_file_provider_addr node in
        let next = read_addr heap next_addr in
        match entity_read_latest (get_parse node) with
        | Some _ ->
          (* As long as `node` has some parse information, then the file
           * exists and provides `m`. *)
          loop (node :: acc) next_addr next
        | None ->
          (* `node` has no parse information, and thus does not exist and does
           * not provide `m`. *)
          unsafe_write_addr_at heap node_addr next;
          loop acc node_addr next
    in
    let head_addr = file_all_providers_addr m in
    let head = read_addr heap head_addr in
    loop [] head_addr head

  (* See `remove_haste_provider_exclusive` *)
  let remove_file_provider_exclusive m file =
    let heap = get_heap () in
    let rec loop node_addr node =
      if is_none node then
        ()
      else
        let next_addr = next_file_provider_addr node in
        let next = read_addr heap next_addr in
        if node == file then
          unsafe_write_addr_at heap node_addr next
        else
          loop next_addr next
    in
    let head_addr = file_all_providers_addr m in
    let head = read_addr heap head_addr in
    loop head_addr head

  let iter_resolved_requires f =
    let heap = get_heap () in
    let f addr =
      let hd = read_header heap addr in
      if obj_tag hd = tag_val Source_file_tag then
        match entity_read_latest (get_parse addr) with
        | None -> ()
        | Some parse ->
          let hd = read_header heap parse in
          if obj_tag hd = tag_val Typed_tag then (
            match entity_read_latest (get_resolved_requires parse) with
            | None -> ()
            | Some resolved_requires -> f addr resolved_requires
          )
    in
    hh_iter f
end