Merge remote-tracking branch 'origin/trunk' into str-fromUtf8

Folkert 2021-02-21 15:25:36 +01:00
commit 57b78dde06
156 changed files with 19265 additions and 10809 deletions


@ -0,0 +1,795 @@
const std = @import("std");
const testing = std.testing;
const expectEqual = testing.expectEqual;
const mem = std.mem;
const Allocator = mem.Allocator;
const assert = std.debug.assert;
const utils = @import("utils.zig");
const RocList = @import("list.zig").RocList;
const INITIAL_SEED = 0xc70f6907;
const InPlace = packed enum(u8) {
InPlace,
Clone,
};
const Slot = packed enum(u8) {
Empty,
Filled,
PreviouslyFilled,
};
const MaybeIndexTag = enum {
index,
not_found,
};
const MaybeIndex = union(MaybeIndexTag) {
index: usize,
not_found: void,
};
fn nextSeed(seed: u64) u64 {
// TODO is this a valid way to get a new seed? are there better ways?
return seed + 1;
}
// total number of slots up to and including level `input`; level n holds
// 8 * 2^(n-1) slots, so the total is 8 * (2^input - 1)
fn totalCapacityAtLevel(input: usize) usize {
if (input == 0) {
return 0;
}
var n = input;
var slots: usize = 8;
while (n > 1) : (n -= 1) {
slots = slots * 2 + 8;
}
return slots;
}
// number of slots in level `input` alone: 8 * 2^(input - 1)
fn capacityOfLevel(input: usize) usize {
if (input == 0) {
return 0;
}
var n = input;
var slots: usize = 8;
while (n > 1) : (n -= 1) {
slots = slots * 2;
}
return slots;
}
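// Illustrative check (added) of the level arithmetic above: level n holds
// 8 * 2^(n-1) slots, and the running total over levels 1..n is 8 * (2^n - 1).
test "level capacities" {
expectEqual(capacityOfLevel(1), 8);
expectEqual(capacityOfLevel(2), 16);
expectEqual(capacityOfLevel(3), 32);
expectEqual(totalCapacityAtLevel(1), 8);
expectEqual(totalCapacityAtLevel(2), 24);
expectEqual(totalCapacityAtLevel(3), 56);
}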
// alignment of the key and value elements. The number (16 or 8) indicates
// the maximum alignment of the key and value types. The tag furthermore
// indicates which of the two has the bigger alignment; if both are equal,
// we put the key first
const Alignment = packed enum(u8) {
Align16KeyFirst,
Align16ValueFirst,
Align8KeyFirst,
Align8ValueFirst,
fn toUsize(self: Alignment) usize {
switch (self) {
.Align16KeyFirst => return 16,
.Align16ValueFirst => return 16,
.Align8KeyFirst => return 8,
.Align8ValueFirst => return 8,
}
}
fn keyFirst(self: Alignment) bool {
switch (self) {
.Align16KeyFirst => return true,
.Align16ValueFirst => return false,
.Align8KeyFirst => return true,
.Align8ValueFirst => return false,
}
}
};
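// Illustrative check (added): the Alignment tag packs both the maximum
// alignment and the field order into a single byte.
test "Alignment encodes alignment and field order" {
expectEqual(Alignment.Align16ValueFirst.toUsize(), 16);
expectEqual(Alignment.Align8KeyFirst.toUsize(), 8);
expectEqual(Alignment.Align8KeyFirst.keyFirst(), true);
expectEqual(Alignment.Align16ValueFirst.keyFirst(), false);
}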
pub fn decref(
allocator: *Allocator,
alignment: Alignment,
bytes_or_null: ?[*]u8,
data_bytes: usize,
) void {
return utils.decref(allocator, alignment.toUsize(), bytes_or_null, data_bytes);
}
pub fn allocateWithRefcount(
allocator: *Allocator,
alignment: Alignment,
data_bytes: usize,
) [*]u8 {
return utils.allocateWithRefcount(allocator, alignment.toUsize(), data_bytes);
}
pub const RocDict = extern struct {
dict_bytes: ?[*]u8,
dict_entries_len: usize,
number_of_levels: usize,
pub fn empty() RocDict {
return RocDict{
.dict_entries_len = 0,
.number_of_levels = 0,
.dict_bytes = null,
};
}
pub fn allocate(
allocator: *Allocator,
number_of_levels: usize,
number_of_entries: usize,
alignment: Alignment,
key_size: usize,
value_size: usize,
) RocDict {
const number_of_slots = totalCapacityAtLevel(number_of_levels);
const slot_size = slotSize(key_size, value_size);
const data_bytes = number_of_slots * slot_size;
return RocDict{
.dict_bytes = allocateWithRefcount(allocator, alignment, data_bytes),
.number_of_levels = number_of_levels,
.dict_entries_len = number_of_entries,
};
}
pub fn reallocate(
self: RocDict,
allocator: *Allocator,
alignment: Alignment,
key_width: usize,
value_width: usize,
) RocDict {
const new_level = self.number_of_levels + 1;
const slot_size = slotSize(key_width, value_width);
const old_capacity = self.capacity();
const new_capacity = totalCapacityAtLevel(new_level);
const delta_capacity = new_capacity - old_capacity;
const data_bytes = new_capacity * slot_size;
const first_slot = allocateWithRefcount(allocator, alignment, data_bytes);
// transfer the memory
if (self.dict_bytes) |source_ptr| {
const dest_ptr = first_slot;
var source_offset: usize = 0;
var dest_offset: usize = 0;
if (alignment.keyFirst()) {
// copy keys
@memcpy(dest_ptr + dest_offset, source_ptr + source_offset, old_capacity * key_width);
// copy values
source_offset = old_capacity * key_width;
dest_offset = new_capacity * key_width;
@memcpy(dest_ptr + dest_offset, source_ptr + source_offset, old_capacity * value_width);
} else {
// copy values
@memcpy(dest_ptr + dest_offset, source_ptr + source_offset, old_capacity * value_width);
// copy keys
source_offset = old_capacity * value_width;
dest_offset = new_capacity * value_width;
@memcpy(dest_ptr + dest_offset, source_ptr + source_offset, old_capacity * key_width);
}
// copy slots
source_offset = old_capacity * (key_width + value_width);
dest_offset = new_capacity * (key_width + value_width);
@memcpy(dest_ptr + dest_offset, source_ptr + source_offset, old_capacity * @sizeOf(Slot));
}
// mark all newly added slots as Empty
var i: usize = 0;
const first_new_slot_value = first_slot + old_capacity * slot_size + delta_capacity * (key_width + value_width);
while (i < (new_capacity - old_capacity)) : (i += 1) {
first_new_slot_value[i] = @enumToInt(Slot.Empty);
}
const result = RocDict{
.dict_bytes = first_slot,
.number_of_levels = self.number_of_levels + 1,
.dict_entries_len = self.dict_entries_len,
};
// NOTE we fuse an increment of all keys/values with a decrement of the input dict
decref(allocator, alignment, self.dict_bytes, self.capacity() * slotSize(key_width, value_width));
return result;
}
pub fn asU8ptr(self: RocDict) [*]u8 {
return @ptrCast([*]u8, self.dict_bytes);
}
pub fn len(self: RocDict) usize {
return self.dict_entries_len;
}
pub fn isEmpty(self: RocDict) bool {
return self.len() == 0;
}
pub fn isUnique(self: RocDict) bool {
// the empty dict is unique (in the sense that copying it will not leak memory)
if (self.isEmpty()) {
return true;
}
// otherwise, check if the refcount is one
const ptr: [*]usize = @ptrCast([*]usize, @alignCast(8, self.dict_bytes));
return (ptr - 1)[0] == utils.REFCOUNT_ONE;
}
pub fn capacity(self: RocDict) usize {
return totalCapacityAtLevel(self.number_of_levels);
}
pub fn makeUnique(self: RocDict, allocator: *Allocator, alignment: Alignment, key_width: usize, value_width: usize) RocDict {
if (self.isEmpty()) {
return self;
}
if (self.isUnique()) {
return self;
}
// unfortunately, we have to clone
var new_dict = RocDict.allocate(allocator, self.number_of_levels, self.dict_entries_len, alignment, key_width, value_width);
var old_bytes: [*]u8 = @ptrCast([*]u8, self.dict_bytes);
var new_bytes: [*]u8 = @ptrCast([*]u8, new_dict.dict_bytes);
const number_of_bytes = self.capacity() * (@sizeOf(Slot) + key_width + value_width);
@memcpy(new_bytes, old_bytes, number_of_bytes);
// NOTE we fuse an increment of all keys/values with a decrement of the input dict
const data_bytes = self.capacity() * slotSize(key_width, value_width);
decref(allocator, alignment, self.dict_bytes, data_bytes);
return new_dict;
}
fn getSlot(self: *const RocDict, index: usize, key_width: usize, value_width: usize) Slot {
const offset = self.capacity() * (key_width + value_width) + index * @sizeOf(Slot);
const ptr = self.dict_bytes orelse unreachable;
return @intToEnum(Slot, ptr[offset]);
}
fn setSlot(self: *RocDict, index: usize, key_width: usize, value_width: usize, slot: Slot) void {
const offset = self.capacity() * (key_width + value_width) + index * @sizeOf(Slot);
const ptr = self.dict_bytes orelse unreachable;
ptr[offset] = @enumToInt(slot);
}
fn setKey(self: *RocDict, index: usize, alignment: Alignment, key_width: usize, value_width: usize, data: Opaque) void {
if (key_width == 0) {
return;
}
const offset = blk: {
if (alignment.keyFirst()) {
break :blk (index * key_width);
} else {
break :blk (self.capacity() * value_width) + (index * key_width);
}
};
const ptr = self.dict_bytes orelse unreachable;
const source = data orelse unreachable;
const dest = ptr + offset;
@memcpy(dest, source, key_width);
}
fn getKey(self: *const RocDict, index: usize, alignment: Alignment, key_width: usize, value_width: usize) Opaque {
if (key_width == 0) {
return null;
}
const offset = blk: {
if (alignment.keyFirst()) {
break :blk (index * key_width);
} else {
break :blk (self.capacity() * value_width) + (index * key_width);
}
};
const ptr = self.dict_bytes orelse unreachable;
return ptr + offset;
}
fn setValue(self: *RocDict, index: usize, alignment: Alignment, key_width: usize, value_width: usize, data: Opaque) void {
if (value_width == 0) {
return;
}
const offset = blk: {
if (alignment.keyFirst()) {
break :blk (self.capacity() * key_width) + (index * value_width);
} else {
break :blk (index * value_width);
}
};
const ptr = self.dict_bytes orelse unreachable;
const source = data orelse unreachable;
const dest = ptr + offset;
@memcpy(dest, source, value_width);
}
fn getValue(self: *const RocDict, index: usize, alignment: Alignment, key_width: usize, value_width: usize) Opaque {
if (value_width == 0) {
return null;
}
const offset = blk: {
if (alignment.keyFirst()) {
break :blk (self.capacity() * key_width) + (index * value_width);
} else {
break :blk (index * value_width);
}
};
const ptr = self.dict_bytes orelse unreachable;
return ptr + offset;
}
fn findIndex(self: *const RocDict, alignment: Alignment, key: Opaque, key_width: usize, value_width: usize, hash_fn: HashFn, is_eq: EqFn) MaybeIndex {
if (self.isEmpty()) {
return MaybeIndex.not_found;
}
var seed: u64 = INITIAL_SEED;
var current_level: usize = 1;
var current_level_size: usize = 8;
while (true) {
if (current_level > self.number_of_levels) {
return MaybeIndex.not_found;
}
// hash the key, and modulo by the current level's size
// (so we get an in-bounds index); level n starts right after
// the combined capacity of levels 1..n-1
const hash = hash_fn(seed, key);
const index = totalCapacityAtLevel(current_level - 1) + (hash % current_level_size);
switch (self.getSlot(index, key_width, value_width)) {
Slot.Empty, Slot.PreviouslyFilled => {
return MaybeIndex.not_found;
},
Slot.Filled => {
// is this the same key, or a new key?
const current_key = self.getKey(index, alignment, key_width, value_width);
if (is_eq(key, current_key)) {
return MaybeIndex{ .index = index };
} else {
current_level += 1;
current_level_size *= 2;
seed = nextSeed(seed);
continue;
}
},
}
}
}
};
// Dict.empty
pub fn dictEmpty() callconv(.C) RocDict {
return RocDict.empty();
}
pub fn slotSize(key_size: usize, value_size: usize) usize {
return @sizeOf(Slot) + key_size + value_size;
}
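// Worked example (added, illustrative): with u64 keys and u8 values, each
// entry needs 8 + 1 bytes of payload plus one Slot byte, so a one-level dict
// (8 slots) allocates 8 * 10 = 80 data bytes, laid out as all keys, then all
// values, then all slot bytes.
test "slotSize worked example" {
expectEqual(slotSize(@sizeOf(u64), @sizeOf(u8)), 10);
}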
// Dict.len
pub fn dictLen(dict: RocDict) callconv(.C) usize {
return dict.dict_entries_len;
}
// commonly used type aliases
const Opaque = ?[*]u8;
const HashFn = fn (u64, ?[*]u8) callconv(.C) u64;
const EqFn = fn (?[*]u8, ?[*]u8) callconv(.C) bool;
const Inc = fn (?[*]u8) callconv(.C) void;
const Dec = fn (?[*]u8) callconv(.C) void;
// Dict.insert : Dict k v, k, v -> Dict k v
pub fn dictInsert(input: RocDict, alignment: Alignment, key: Opaque, key_width: usize, value: Opaque, value_width: usize, hash_fn: HashFn, is_eq: EqFn, dec_key: Dec, dec_value: Dec, output: *RocDict) callconv(.C) void {
var seed: u64 = INITIAL_SEED;
var result = input.makeUnique(std.heap.c_allocator, alignment, key_width, value_width);
var current_level: usize = 1;
var current_level_size: usize = 8;
while (true) {
if (current_level > result.number_of_levels) {
result = result.reallocate(std.heap.c_allocator, alignment, key_width, value_width);
}
const hash = hash_fn(seed, key);
const index = totalCapacityAtLevel(current_level - 1) + (hash % current_level_size);
assert(index < result.capacity());
switch (result.getSlot(index, key_width, value_width)) {
Slot.Empty, Slot.PreviouslyFilled => {
result.setSlot(index, key_width, value_width, Slot.Filled);
result.setKey(index, alignment, key_width, value_width, key);
result.setValue(index, alignment, key_width, value_width, value);
result.dict_entries_len += 1;
break;
},
Slot.Filled => {
// is this the same key, or a new key?
const current_key = result.getKey(index, alignment, key_width, value_width);
if (is_eq(key, current_key)) {
// we will override the old value, but first have to decrement its refcount
const current_value = result.getValue(index, alignment, key_width, value_width);
dec_value(current_value);
// we must consume the key argument!
dec_key(key);
result.setValue(index, alignment, key_width, value_width, value);
break;
} else {
seed = nextSeed(seed);
current_level += 1;
current_level_size *= 2;
continue;
}
},
}
}
// write result into pointer
output.* = result;
}
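// Illustrative end-to-end use (added) of dictInsert/dictContains over u64
// keys and values; assumes libc is linked, since these functions allocate
// with std.heap.c_allocator. The hash/eq/refcount helpers below are made up
// for this example; real callers pass compiler-generated functions.
fn exampleHash(seed: u64, key: Opaque) callconv(.C) u64 {
const ptr = @ptrCast(*const u64, @alignCast(8, key orelse unreachable));
return seed ^ ptr.*;
}
fn exampleEq(a: Opaque, b: Opaque) callconv(.C) bool {
const x = @ptrCast(*const u64, @alignCast(8, a orelse unreachable));
const y = @ptrCast(*const u64, @alignCast(8, b orelse unreachable));
return x.* == y.*;
}
fn exampleNoop(ptr: Opaque) callconv(.C) void {}
test "dictInsert then dictContains (illustrative)" {
var key: u64 = 42;
var value: u64 = 100;
const alignment = Alignment.Align8KeyFirst;
var dict = RocDict.empty();
dictInsert(dict, alignment, @ptrCast(Opaque, &key), 8, @ptrCast(Opaque, &value), 8, exampleHash, exampleEq, exampleNoop, exampleNoop, &dict);
expectEqual(dict.len(), 1);
testing.expect(dictContains(dict, alignment, @ptrCast(Opaque, &key), 8, 8, exampleHash, exampleEq));
// give the dict's allocation back
decref(std.heap.c_allocator, alignment, dict.dict_bytes, dict.capacity() * slotSize(8, 8));
}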
// Dict.remove : Dict k v, k -> Dict k v
pub fn dictRemove(input: RocDict, alignment: Alignment, key: Opaque, key_width: usize, value_width: usize, hash_fn: HashFn, is_eq: EqFn, dec_key: Dec, dec_value: Dec, output: *RocDict) callconv(.C) void {
switch (input.findIndex(alignment, key, key_width, value_width, hash_fn, is_eq)) {
MaybeIndex.not_found => {
// the key was not found; we're done
output.* = input;
return;
},
MaybeIndex.index => |index| {
var dict = input.makeUnique(std.heap.c_allocator, alignment, key_width, value_width);
assert(index < dict.capacity());
dict.setSlot(index, key_width, value_width, Slot.PreviouslyFilled);
const old_key = dict.getKey(index, alignment, key_width, value_width);
const old_value = dict.getValue(index, alignment, key_width, value_width);
dec_key(old_key);
dec_value(old_value);
dict.dict_entries_len -= 1;
// if the dict is now completely empty, free its allocation
if (dict.dict_entries_len == 0) {
const data_bytes = dict.capacity() * slotSize(key_width, value_width);
decref(std.heap.c_allocator, alignment, dict.dict_bytes, data_bytes);
output.* = RocDict.empty();
return;
}
output.* = dict;
},
}
}
// Dict.contains : Dict k v, k -> Bool
pub fn dictContains(dict: RocDict, alignment: Alignment, key: Opaque, key_width: usize, value_width: usize, hash_fn: HashFn, is_eq: EqFn) callconv(.C) bool {
switch (dict.findIndex(alignment, key, key_width, value_width, hash_fn, is_eq)) {
MaybeIndex.not_found => {
return false;
},
MaybeIndex.index => |_| {
return true;
},
}
}
// Dict.get : Dict k v, k -> { flag: bool, value: Opaque }
pub fn dictGet(dict: RocDict, alignment: Alignment, key: Opaque, key_width: usize, value_width: usize, hash_fn: HashFn, is_eq: EqFn, inc_value: Inc) callconv(.C) extern struct { value: Opaque, flag: bool } {
switch (dict.findIndex(alignment, key, key_width, value_width, hash_fn, is_eq)) {
MaybeIndex.not_found => {
return .{ .flag = false, .value = null };
},
MaybeIndex.index => |index| {
var value = dict.getValue(index, alignment, key_width, value_width);
inc_value(value);
return .{ .flag = true, .value = value };
},
}
}
// Dict.elementsRc
// increment or decrement all dict elements (but not the dict's allocation itself)
pub fn elementsRc(dict: RocDict, alignment: Alignment, key_width: usize, value_width: usize, modify_key: Inc, modify_value: Inc) callconv(.C) void {
const size = dict.capacity();
var i: usize = 0;
while (i < size) : (i += 1) {
switch (dict.getSlot(i, key_width, value_width)) {
Slot.Filled => {
modify_key(dict.getKey(i, alignment, key_width, value_width));
modify_value(dict.getValue(i, alignment, key_width, value_width));
},
else => {},
}
}
}
pub fn dictKeys(dict: RocDict, alignment: Alignment, key_width: usize, value_width: usize, inc_key: Inc, output: *RocList) callconv(.C) void {
const size = dict.capacity();
var length: usize = 0;
var i: usize = 0;
while (i < size) : (i += 1) {
switch (dict.getSlot(i, key_width, value_width)) {
Slot.Filled => {
length += 1;
},
else => {},
}
}
if (length == 0) {
output.* = RocList.empty();
return;
}
const data_bytes = length * key_width;
var ptr = allocateWithRefcount(std.heap.c_allocator, alignment, data_bytes);
i = 0;
var copied: usize = 0;
while (i < size) : (i += 1) {
switch (dict.getSlot(i, key_width, value_width)) {
Slot.Filled => {
const key = dict.getKey(i, alignment, key_width, value_width);
inc_key(key);
const key_cast = @ptrCast([*]const u8, key);
@memcpy(ptr + (copied * key_width), key_cast, key_width);
copied += 1;
},
else => {},
}
}
output.* = RocList{ .bytes = ptr, .length = length };
}
pub fn dictValues(dict: RocDict, alignment: Alignment, key_width: usize, value_width: usize, inc_value: Inc, output: *RocList) callconv(.C) void {
const size = dict.capacity();
var length: usize = 0;
var i: usize = 0;
while (i < size) : (i += 1) {
switch (dict.getSlot(i, key_width, value_width)) {
Slot.Filled => {
length += 1;
},
else => {},
}
}
if (length == 0) {
output.* = RocList.empty();
return;
}
const data_bytes = length * value_width;
var ptr = allocateWithRefcount(std.heap.c_allocator, alignment, data_bytes);
i = 0;
var copied: usize = 0;
while (i < size) : (i += 1) {
switch (dict.getSlot(i, key_width, value_width)) {
Slot.Filled => {
const value = dict.getValue(i, alignment, key_width, value_width);
inc_value(value);
const value_cast = @ptrCast([*]const u8, value);
@memcpy(ptr + (copied * value_width), value_cast, value_width);
copied += 1;
},
else => {},
}
}
output.* = RocList{ .bytes = ptr, .length = length };
}
fn doNothing(ptr: Opaque) callconv(.C) void {
return;
}
pub fn dictUnion(dict1: RocDict, dict2: RocDict, alignment: Alignment, key_width: usize, value_width: usize, hash_fn: HashFn, is_eq: EqFn, inc_key: Inc, inc_value: Inc, output: *RocDict) callconv(.C) void {
output.* = dict1.makeUnique(std.heap.c_allocator, alignment, key_width, value_width);
var i: usize = 0;
while (i < dict2.capacity()) : (i += 1) {
switch (dict2.getSlot(i, key_width, value_width)) {
Slot.Filled => {
const key = dict2.getKey(i, alignment, key_width, value_width);
switch (output.findIndex(alignment, key, key_width, value_width, hash_fn, is_eq)) {
MaybeIndex.not_found => {
const value = dict2.getValue(i, alignment, key_width, value_width);
// we need an RC token for both the key and the value, because
// dictInsert consumes one reference to each
inc_key(key);
inc_value(value);
// we know the newly added key is not a duplicate, so the `dec`s are unreachable
const dec_key = doNothing;
const dec_value = doNothing;
dictInsert(output.*, alignment, key, key_width, value, value_width, hash_fn, is_eq, dec_key, dec_value, output);
},
MaybeIndex.index => |_| {
// the key is already in the output dict
continue;
},
}
},
else => {},
}
}
}
pub fn dictIntersection(dict1: RocDict, dict2: RocDict, alignment: Alignment, key_width: usize, value_width: usize, hash_fn: HashFn, is_eq: EqFn, dec_key: Dec, dec_value: Dec, output: *RocDict) callconv(.C) void {
output.* = dict1.makeUnique(std.heap.c_allocator, alignment, key_width, value_width);
var i: usize = 0;
const size = dict1.capacity();
while (i < size) : (i += 1) {
switch (output.getSlot(i, key_width, value_width)) {
Slot.Filled => {
const key = dict1.getKey(i, alignment, key_width, value_width);
switch (dict2.findIndex(alignment, key, key_width, value_width, hash_fn, is_eq)) {
MaybeIndex.not_found => {
dictRemove(output.*, alignment, key, key_width, value_width, hash_fn, is_eq, dec_key, dec_value, output);
},
MaybeIndex.index => |_| {
// keep this key/value
continue;
},
}
},
else => {},
}
}
}
pub fn dictDifference(dict1: RocDict, dict2: RocDict, alignment: Alignment, key_width: usize, value_width: usize, hash_fn: HashFn, is_eq: EqFn, dec_key: Dec, dec_value: Dec, output: *RocDict) callconv(.C) void {
output.* = dict1.makeUnique(std.heap.c_allocator, alignment, key_width, value_width);
var i: usize = 0;
const size = dict1.capacity();
while (i < size) : (i += 1) {
switch (output.getSlot(i, key_width, value_width)) {
Slot.Filled => {
const key = dict1.getKey(i, alignment, key_width, value_width);
switch (dict2.findIndex(alignment, key, key_width, value_width, hash_fn, is_eq)) {
MaybeIndex.not_found => {
// keep this key/value
continue;
},
MaybeIndex.index => |_| {
dictRemove(output.*, alignment, key, key_width, value_width, hash_fn, is_eq, dec_key, dec_value, output);
},
}
},
else => {},
}
}
}
pub fn setFromList(list: RocList, alignment: Alignment, key_width: usize, value_width: usize, hash_fn: HashFn, is_eq: EqFn, dec_key: Dec, output: *RocDict) callconv(.C) void {
output.* = RocDict.empty();
var ptr = @ptrCast([*]u8, list.bytes);
const dec_value = doNothing;
const value = null;
const size = list.length;
var i: usize = 0;
while (i < size) : (i += 1) {
const key = ptr + i * key_width;
dictInsert(output.*, alignment, key, key_width, value, value_width, hash_fn, is_eq, dec_key, dec_value, output);
}
// NOTE: decref checks for the empty case
const data_bytes = size * key_width;
decref(std.heap.c_allocator, alignment, list.bytes, data_bytes);
}
const StepperCaller = fn (?[*]u8, ?[*]u8, ?[*]u8, ?[*]u8, ?[*]u8) callconv(.C) void;
pub fn dictWalk(dict: RocDict, stepper: Opaque, stepper_caller: StepperCaller, accum: Opaque, alignment: Alignment, key_width: usize, value_width: usize, accum_width: usize, inc_key: Inc, inc_value: Inc, output: Opaque) callconv(.C) void {
// allocate space to write the result of the stepper into
// experimentally, aliasing the accum and output pointers is not a good idea,
// so we ping-pong between two buffers instead
const alloc: [*]u8 = @ptrCast([*]u8, std.heap.c_allocator.alloc(u8, accum_width) catch unreachable);
var b1 = output orelse unreachable;
var b2 = alloc;
@memcpy(b2, accum orelse unreachable, accum_width);
var i: usize = 0;
const size = dict.capacity();
while (i < size) : (i += 1) {
switch (dict.getSlot(i, key_width, value_width)) {
Slot.Filled => {
const key = dict.getKey(i, alignment, key_width, value_width);
const value = dict.getValue(i, alignment, key_width, value_width);
stepper_caller(stepper, key, value, b2, b1);
// swap the buffers: this step's output becomes the next step's accumulator
const temp = b1;
b1 = b2;
b2 = temp;
},
else => {},
}
}
@memcpy(output orelse unreachable, b2, accum_width);
std.heap.c_allocator.free(alloc[0..accum_width]);
const data_bytes = dict.capacity() * slotSize(key_width, value_width);
decref(std.heap.c_allocator, alignment, dict.dict_bytes, data_bytes);
}


@ -0,0 +1,255 @@
// SPDX-License-Identifier: MIT
// Copyright (c) 2015-2021 Zig Contributors
// This file is part of [zig](https://ziglang.org/), which is MIT licensed.
// The MIT license requires this copyright notice to be included in all copies
// and substantial portions of the software.
const std = @import("std");
const str = @import("str.zig");
const mem = std.mem;
pub fn wyhash(seed: u64, bytes: ?[*]const u8, length: usize) callconv(.C) u64 {
if (bytes) |nonnull| {
return wyhash_hash(seed, nonnull[0..length]);
} else {
// null pointers hash to an arbitrary constant
return 42;
}
}
pub fn wyhash_rocstr(seed: u64, input: str.RocStr) callconv(.C) u64 {
return wyhash_hash(seed, input.asSlice());
}
const primes = [_]u64{
0xa0761d6478bd642f,
0xe7037ed1a0b428db,
0x8ebc6af09c88c6e3,
0x589965cc75374cc3,
0x1d8e4e27c47d124f,
};
fn read_bytes(comptime bytes: u8, data: []const u8) u64 {
const T = std.meta.Int(.unsigned, 8 * bytes);
return mem.readIntLittle(T, data[0..bytes]);
}
fn read_8bytes_swapped(data: []const u8) u64 {
return (read_bytes(4, data) << 32 | read_bytes(4, data[4..]));
}
fn mum(a: u64, b: u64) u64 {
var r = std.math.mulWide(u64, a, b);
r = (r >> 64) ^ r;
return @truncate(u64, r);
}
fn mix0(a: u64, b: u64, seed: u64) u64 {
return mum(a ^ seed ^ primes[0], b ^ seed ^ primes[1]);
}
fn mix1(a: u64, b: u64, seed: u64) u64 {
return mum(a ^ seed ^ primes[2], b ^ seed ^ primes[3]);
}
// Wyhash version which does not store internal state for handling partial buffers.
// This is needed so that we can maximize speed for the short-key case, which
// uses the non-iterative API that the public Wyhash exposes.
const WyhashStateless = struct {
seed: u64,
msg_len: usize,
pub fn init(seed: u64) WyhashStateless {
return WyhashStateless{
.seed = seed,
.msg_len = 0,
};
}
fn round(self: *WyhashStateless, b: []const u8) void {
std.debug.assert(b.len == 32);
self.seed = mix0(
read_bytes(8, b[0..]),
read_bytes(8, b[8..]),
self.seed,
) ^ mix1(
read_bytes(8, b[16..]),
read_bytes(8, b[24..]),
self.seed,
);
}
pub fn update(self: *WyhashStateless, b: []const u8) void {
std.debug.assert(b.len % 32 == 0);
var off: usize = 0;
while (off < b.len) : (off += 32) {
@call(.{ .modifier = .always_inline }, self.round, .{b[off .. off + 32]});
}
self.msg_len += b.len;
}
pub fn final(self: *WyhashStateless, b: []const u8) u64 {
std.debug.assert(b.len < 32);
const seed = self.seed;
const rem_len = @intCast(u5, b.len);
const rem_key = b[0..rem_len];
self.seed = switch (rem_len) {
0 => seed,
1 => mix0(read_bytes(1, rem_key), primes[4], seed),
2 => mix0(read_bytes(2, rem_key), primes[4], seed),
3 => mix0((read_bytes(2, rem_key) << 8) | read_bytes(1, rem_key[2..]), primes[4], seed),
4 => mix0(read_bytes(4, rem_key), primes[4], seed),
5 => mix0((read_bytes(4, rem_key) << 8) | read_bytes(1, rem_key[4..]), primes[4], seed),
6 => mix0((read_bytes(4, rem_key) << 16) | read_bytes(2, rem_key[4..]), primes[4], seed),
7 => mix0((read_bytes(4, rem_key) << 24) | (read_bytes(2, rem_key[4..]) << 8) | read_bytes(1, rem_key[6..]), primes[4], seed),
8 => mix0(read_8bytes_swapped(rem_key), primes[4], seed),
9 => mix0(read_8bytes_swapped(rem_key), read_bytes(1, rem_key[8..]), seed),
10 => mix0(read_8bytes_swapped(rem_key), read_bytes(2, rem_key[8..]), seed),
11 => mix0(read_8bytes_swapped(rem_key), (read_bytes(2, rem_key[8..]) << 8) | read_bytes(1, rem_key[10..]), seed),
12 => mix0(read_8bytes_swapped(rem_key), read_bytes(4, rem_key[8..]), seed),
13 => mix0(read_8bytes_swapped(rem_key), (read_bytes(4, rem_key[8..]) << 8) | read_bytes(1, rem_key[12..]), seed),
14 => mix0(read_8bytes_swapped(rem_key), (read_bytes(4, rem_key[8..]) << 16) | read_bytes(2, rem_key[12..]), seed),
15 => mix0(read_8bytes_swapped(rem_key), (read_bytes(4, rem_key[8..]) << 24) | (read_bytes(2, rem_key[12..]) << 8) | read_bytes(1, rem_key[14..]), seed),
16 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed),
17 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1(read_bytes(1, rem_key[16..]), primes[4], seed),
18 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1(read_bytes(2, rem_key[16..]), primes[4], seed),
19 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1((read_bytes(2, rem_key[16..]) << 8) | read_bytes(1, rem_key[18..]), primes[4], seed),
20 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1(read_bytes(4, rem_key[16..]), primes[4], seed),
21 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1((read_bytes(4, rem_key[16..]) << 8) | read_bytes(1, rem_key[20..]), primes[4], seed),
22 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1((read_bytes(4, rem_key[16..]) << 16) | read_bytes(2, rem_key[20..]), primes[4], seed),
23 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1((read_bytes(4, rem_key[16..]) << 24) | (read_bytes(2, rem_key[20..]) << 8) | read_bytes(1, rem_key[22..]), primes[4], seed),
24 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1(read_8bytes_swapped(rem_key[16..]), primes[4], seed),
25 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1(read_8bytes_swapped(rem_key[16..]), read_bytes(1, rem_key[24..]), seed),
26 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1(read_8bytes_swapped(rem_key[16..]), read_bytes(2, rem_key[24..]), seed),
27 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1(read_8bytes_swapped(rem_key[16..]), (read_bytes(2, rem_key[24..]) << 8) | read_bytes(1, rem_key[26..]), seed),
28 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1(read_8bytes_swapped(rem_key[16..]), read_bytes(4, rem_key[24..]), seed),
29 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1(read_8bytes_swapped(rem_key[16..]), (read_bytes(4, rem_key[24..]) << 8) | read_bytes(1, rem_key[28..]), seed),
30 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1(read_8bytes_swapped(rem_key[16..]), (read_bytes(4, rem_key[24..]) << 16) | read_bytes(2, rem_key[28..]), seed),
31 => mix0(read_8bytes_swapped(rem_key), read_8bytes_swapped(rem_key[8..]), seed) ^ mix1(read_8bytes_swapped(rem_key[16..]), (read_bytes(4, rem_key[24..]) << 24) | (read_bytes(2, rem_key[28..]) << 8) | read_bytes(1, rem_key[30..]), seed),
};
self.msg_len += b.len;
return mum(self.seed ^ self.msg_len, primes[4]);
}
pub fn hash(seed: u64, input: []const u8) u64 {
const aligned_len = input.len - (input.len % 32);
var c = WyhashStateless.init(seed);
@call(.{ .modifier = .always_inline }, c.update, .{input[0..aligned_len]});
return @call(.{ .modifier = .always_inline }, c.final, .{input[aligned_len..]});
}
};
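// Illustrative check (added): inputs shorter than 32 bytes skip update()
// entirely and are handled by final(), which is the fast path the comment
// above refers to. The expected value is the "abc" vector from the tests below.
test "short keys take the final() path" {
expectEqual(WyhashStateless.hash(2, "abc"), 0xbe348debe59b27c3);
}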
/// Fast non-cryptographic 64bit hash function.
/// See https://github.com/wangyi-fudan/wyhash
pub const Wyhash = struct {
state: WyhashStateless,
buf: [32]u8,
buf_len: usize,
pub fn init(seed: u64) Wyhash {
return Wyhash{
.state = WyhashStateless.init(seed),
.buf = undefined,
.buf_len = 0,
};
}
pub fn update(self: *Wyhash, b: []const u8) void {
var off: usize = 0;
if (self.buf_len != 0 and self.buf_len + b.len >= 32) {
off += 32 - self.buf_len;
mem.copy(u8, self.buf[self.buf_len..], b[0..off]);
self.state.update(self.buf[0..]);
self.buf_len = 0;
}
const remain_len = b.len - off;
const aligned_len = remain_len - (remain_len % 32);
self.state.update(b[off .. off + aligned_len]);
mem.copy(u8, self.buf[self.buf_len..], b[off + aligned_len ..]);
self.buf_len += @intCast(u8, b[off + aligned_len ..].len);
}
pub fn final(self: *Wyhash) u64 {
const rem_key = self.buf[0..self.buf_len];
return self.state.final(rem_key);
}
pub fn hash(seed: u64, input: []const u8) u64 {
return WyhashStateless.hash(seed, input);
}
};
fn wyhash_hash(seed: u64, input: []const u8) u64 {
return Wyhash.hash(seed, input);
}
const expectEqual = std.testing.expectEqual;
test "test vectors" {
const hash = Wyhash.hash;
expectEqual(hash(0, ""), 0x0);
expectEqual(hash(1, "a"), 0xbed235177f41d328);
expectEqual(hash(2, "abc"), 0xbe348debe59b27c3);
expectEqual(hash(3, "message digest"), 0x37320f657213a290);
expectEqual(hash(4, "abcdefghijklmnopqrstuvwxyz"), 0xd0b270e1d8a7019c);
expectEqual(hash(5, "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789"), 0x602a1894d3bbfe7f);
expectEqual(hash(6, "12345678901234567890123456789012345678901234567890123456789012345678901234567890"), 0x829e9c148b75970e);
}
test "test vectors streaming" {
var wh = Wyhash.init(5);
for ("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789") |e| {
wh.update(mem.asBytes(&e));
}
expectEqual(wh.final(), 0x602a1894d3bbfe7f);
const pattern = "1234567890";
const count = 8;
const result = 0x829e9c148b75970e;
expectEqual(Wyhash.hash(6, pattern ** 8), result);
wh = Wyhash.init(6);
var i: u32 = 0;
while (i < count) : (i += 1) {
wh.update(pattern);
}
expectEqual(wh.final(), result);
}
test "iterative non-divisible update" {
var buf: [8192]u8 = undefined;
for (buf) |*e, i| {
e.* = @truncate(u8, i);
}
const seed = 0x128dad08f;
var end: usize = 32;
while (end < buf.len) : (end += 32) {
const non_iterative_hash = Wyhash.hash(seed, buf[0..end]);
var wy = Wyhash.init(seed);
var i: usize = 0;
while (i < end) : (i += 33) {
wy.update(buf[i..std.math.min(i + 33, end)]);
}
const iterative_hash = wy.final();
std.testing.expectEqual(iterative_hash, non_iterative_hash);
}
}


@ -0,0 +1,326 @@
const std = @import("std");
const utils = @import("utils.zig");
const RocResult = utils.RocResult;
const mem = std.mem;
const Allocator = mem.Allocator;
const EqFn = fn (?[*]u8, ?[*]u8) callconv(.C) bool;
const Opaque = ?[*]u8;
const Inc = fn (?[*]u8) callconv(.C) void;
const Dec = fn (?[*]u8) callconv(.C) void;
pub const RocList = extern struct {
bytes: ?[*]u8,
length: usize,
pub fn len(self: RocList) usize {
return self.length;
}
pub fn isEmpty(self: RocList) bool {
return self.len() == 0;
}
pub fn empty() RocList {
return RocList{ .bytes = null, .length = 0 };
}
pub fn isUnique(self: RocList) bool {
// the empty list is unique (in the sense that copying it will not leak memory)
if (self.isEmpty()) {
return true;
}
// otherwise, check if the refcount is one
const ptr: [*]usize = @ptrCast([*]usize, @alignCast(8, self.bytes));
return (ptr - 1)[0] == utils.REFCOUNT_ONE;
}
pub fn allocate(
allocator: *Allocator,
alignment: usize,
length: usize,
element_size: usize,
) RocList {
const data_bytes = length * element_size;
return RocList{
.bytes = utils.allocateWithRefcount(allocator, alignment, data_bytes),
.length = length,
};
}
pub fn makeUnique(self: RocList, allocator: *Allocator, alignment: usize, element_width: usize) RocList {
if (self.isEmpty()) {
return self;
}
if (self.isUnique()) {
return self;
}
// unfortunately, we have to clone
var new_list = RocList.allocate(allocator, alignment, self.length, element_width);
var old_bytes: [*]u8 = @ptrCast([*]u8, self.bytes);
var new_bytes: [*]u8 = @ptrCast([*]u8, new_list.bytes);
const number_of_bytes = self.len() * element_width;
@memcpy(new_bytes, old_bytes, number_of_bytes);
// NOTE we fuse an increment of all elements with a decrement of the input list
const data_bytes = self.len() * element_width;
utils.decref(allocator, alignment, self.bytes, data_bytes);
return new_list;
}
pub fn reallocate(
self: RocList,
allocator: *Allocator,
alignment: usize,
new_length: usize,
element_width: usize,
) RocList {
const old_length = self.length;
const data_bytes = new_length * element_width;
const first_slot = utils.allocateWithRefcount(allocator, alignment, data_bytes);
// transfer the memory
if (self.bytes) |source_ptr| {
const dest_ptr = first_slot;
@memcpy(dest_ptr, source_ptr, old_length * element_width);
}
// NOTE the newly added elements are left uninitialized
const result = RocList{
.bytes = first_slot,
.length = new_length,
};
// NOTE we fuse an increment of all elements with a decrement of the input list
utils.decref(allocator, alignment, self.bytes, old_length * element_width);
return result;
}
};
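// Illustrative check (added) of the empty-list invariants relied on above:
// the empty list owns no allocation, so it is trivially unique.
test "RocList.empty is empty and unique" {
const list = RocList.empty();
std.testing.expect(list.isEmpty());
std.testing.expect(list.isUnique());
}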
const Caller1 = fn (?[*]u8, ?[*]u8, ?[*]u8) callconv(.C) void;
const Caller2 = fn (?[*]u8, ?[*]u8, ?[*]u8, ?[*]u8) callconv(.C) void;
pub fn listMap(list: RocList, transform: Opaque, caller: Caller1, alignment: usize, old_element_width: usize, new_element_width: usize) callconv(.C) RocList {
if (list.bytes) |source_ptr| {
const size = list.len();
var i: usize = 0;
const output = RocList.allocate(std.heap.c_allocator, alignment, size, new_element_width);
const target_ptr = output.bytes orelse unreachable;
while (i < size) : (i += 1) {
caller(transform, source_ptr + (i * old_element_width), target_ptr + (i * new_element_width));
}
utils.decref(std.heap.c_allocator, alignment, list.bytes, size * old_element_width);
return output;
} else {
return RocList.empty();
}
}
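// Illustrative listMap round trip (added) over u64 elements; assumes libc is
// linked, since listMap allocates with std.heap.c_allocator. The transform
// caller below is made up for this example; real callers are generated by the
// compiler and unpack a closure from their first argument.
fn exampleDouble(closure: Opaque, input: Opaque, output: Opaque) callconv(.C) void {
const in = @ptrCast(*const u64, @alignCast(8, input orelse unreachable));
const out = @ptrCast(*u64, @alignCast(8, output orelse unreachable));
out.* = in.* * 2;
}
test "listMap doubles each element (illustrative)" {
var input = RocList.allocate(std.heap.c_allocator, 8, 2, @sizeOf(u64));
const in_ptr = @ptrCast([*]u64, @alignCast(8, input.bytes orelse unreachable));
in_ptr[0] = 1;
in_ptr[1] = 2;
// listMap consumes its argument, so `input` must not be used afterwards
const doubled = listMap(input, null, exampleDouble, 8, @sizeOf(u64), @sizeOf(u64));
const out_ptr = @ptrCast([*]u64, @alignCast(8, doubled.bytes orelse unreachable));
std.testing.expectEqual(out_ptr[0], 2);
std.testing.expectEqual(out_ptr[1], 4);
utils.decref(std.heap.c_allocator, 8, doubled.bytes, 2 * @sizeOf(u64));
}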
pub fn listMapWithIndex(list: RocList, transform: Opaque, caller: Caller2, alignment: usize, old_element_width: usize, new_element_width: usize) callconv(.C) RocList {
if (list.bytes) |source_ptr| {
const size = list.len();
var i: usize = 0;
const output = RocList.allocate(std.heap.c_allocator, alignment, size, new_element_width);
const target_ptr = output.bytes orelse unreachable;
while (i < size) : (i += 1) {
caller(transform, @ptrCast(?[*]u8, &i), source_ptr + (i * old_element_width), target_ptr + (i * new_element_width));
}
utils.decref(std.heap.c_allocator, alignment, list.bytes, size * old_element_width);
return output;
} else {
return RocList.empty();
}
}
pub fn listKeepIf(list: RocList, transform: Opaque, caller: Caller1, alignment: usize, element_width: usize, inc: Inc, dec: Dec) callconv(.C) RocList {
if (list.bytes) |source_ptr| {
const size = list.len();
var i: usize = 0;
var output = RocList.allocate(std.heap.c_allocator, alignment, list.len(), element_width);
const target_ptr = output.bytes orelse unreachable;
var kept: usize = 0;
while (i < size) : (i += 1) {
var keep = false;
const element = source_ptr + (i * element_width);
inc(element);
caller(transform, element, @ptrCast(?[*]u8, &keep));
if (keep) {
@memcpy(target_ptr + (kept * element_width), element, element_width);
kept += 1;
} else {
dec(element);
}
}
// consume the input list
utils.decref(std.heap.c_allocator, alignment, list.bytes, size * element_width);
if (kept == 0) {
// if the output is empty, deallocate the space we made for the result
utils.decref(std.heap.c_allocator, alignment, output.bytes, size * element_width);
return RocList.empty();
} else {
output.length = kept;
return output;
}
} else {
return RocList.empty();
}
}
pub fn listKeepOks(list: RocList, transform: Opaque, caller: Caller1, alignment: usize, before_width: usize, result_width: usize, after_width: usize, inc_closure: Inc, dec_result: Dec) callconv(.C) RocList {
return listKeepResult(list, RocResult.isOk, transform, caller, alignment, before_width, result_width, after_width, inc_closure, dec_result);
}
pub fn listKeepErrs(list: RocList, transform: Opaque, caller: Caller1, alignment: usize, before_width: usize, result_width: usize, after_width: usize, inc_closure: Inc, dec_result: Dec) callconv(.C) RocList {
return listKeepResult(list, RocResult.isErr, transform, caller, alignment, before_width, result_width, after_width, inc_closure, dec_result);
}
pub fn listKeepResult(list: RocList, is_good_constructor: fn (RocResult) bool, transform: Opaque, caller: Caller1, alignment: usize, before_width: usize, result_width: usize, after_width: usize, inc_closure: Inc, dec_result: Dec) RocList {
if (list.bytes) |source_ptr| {
const size = list.len();
var i: usize = 0;
var output = RocList.allocate(std.heap.c_allocator, alignment, list.len(), after_width);
const target_ptr = output.bytes orelse unreachable;
var temporary = @ptrCast([*]u8, std.heap.c_allocator.alloc(u8, result_width) catch unreachable);
var kept: usize = 0;
while (i < size) : (i += 1) {
const before_element = source_ptr + (i * before_width);
inc_closure(transform);
caller(transform, before_element, temporary);
const result = utils.RocResult{ .bytes = temporary };
// the result's tag occupies the first 8 bytes (see RocResult in utils.zig)
const after_element = temporary + @sizeOf(i64);
if (is_good_constructor(result)) {
@memcpy(target_ptr + (kept * after_width), after_element, after_width);
kept += 1;
} else {
dec_result(temporary);
}
}
utils.decref(std.heap.c_allocator, alignment, list.bytes, size * before_width);
std.heap.c_allocator.free(temporary[0..result_width]);
if (kept == 0) {
utils.decref(std.heap.c_allocator, alignment, output.bytes, size * after_width);
return RocList.empty();
} else {
output.length = kept;
return output;
}
} else {
return RocList.empty();
}
}
pub fn listWalk(list: RocList, stepper: Opaque, stepper_caller: Caller2, accum: Opaque, alignment: usize, element_width: usize, accum_width: usize, output: Opaque) callconv(.C) void {
if (accum_width == 0) {
return;
}
@memcpy(output orelse unreachable, accum orelse unreachable, accum_width);
if (list.bytes) |source_ptr| {
var i: usize = 0;
const size = list.len();
while (i < size) : (i += 1) {
const element = source_ptr + i * element_width;
stepper_caller(stepper, element, output, output);
}
const data_bytes = list.len() * element_width;
utils.decref(std.heap.c_allocator, alignment, list.bytes, data_bytes);
}
}
pub fn listWalkBackwards(list: RocList, stepper: Opaque, stepper_caller: Caller2, accum: Opaque, alignment: usize, element_width: usize, accum_width: usize, output: Opaque) callconv(.C) void {
if (accum_width == 0) {
return;
}
@memcpy(output orelse unreachable, accum orelse unreachable, accum_width);
if (list.bytes) |source_ptr| {
const size = list.len();
var i: usize = size;
while (i > 0) {
i -= 1;
const element = source_ptr + i * element_width;
stepper_caller(stepper, element, output, output);
}
const data_bytes = list.len() * element_width;
utils.decref(std.heap.c_allocator, alignment, list.bytes, data_bytes);
}
}
// List.contains : List k, k -> Bool
pub fn listContains(list: RocList, key: Opaque, key_width: usize, is_eq: EqFn) callconv(.C) bool {
if (list.bytes) |source_ptr| {
const size = list.len();
var i: usize = 0;
while (i < size) : (i += 1) {
const element = source_ptr + i * key_width;
if (is_eq(element, key)) {
return true;
}
}
}
return false;
}
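// Illustrative listContains call (added); the list is borrowed rather than
// consumed, so a stack-backed RocList works here. exampleElemEq is made up
// for this example.
fn exampleElemEq(a: Opaque, b: Opaque) callconv(.C) bool {
const x = @ptrCast(*const u64, @alignCast(8, a orelse unreachable));
const y = @ptrCast(*const u64, @alignCast(8, b orelse unreachable));
return x.* == y.*;
}
test "listContains finds an element (illustrative)" {
var elements = [_]u64{ 10, 20, 30 };
const list = RocList{ .bytes = @ptrCast(?[*]u8, &elements), .length = 3 };
var needle: u64 = 20;
std.testing.expect(listContains(list, @ptrCast(?[*]u8, &needle), @sizeOf(u64), exampleElemEq));
}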
pub fn listRepeat(count: usize, alignment: usize, element: Opaque, element_width: usize, inc_n_element: Inc) callconv(.C) RocList {
if (count == 0) {
return RocList.empty();
}
const allocator = std.heap.c_allocator;
var output = RocList.allocate(allocator, alignment, count, element_width);
if (output.bytes) |target_ptr| {
var i: usize = 0;
const source = element orelse unreachable;
while (i < count) : (i += 1) {
@memcpy(target_ptr + i * element_width, source, element_width);
}
// TODO do all increments at once!
i = 0;
while (i < count) : (i += 1) {
inc_n_element(element);
}
return output;
} else {
unreachable;
}
}


@ -2,6 +2,46 @@ const builtin = @import("builtin");
const std = @import("std");
const testing = std.testing;
// List Module
const list = @import("list.zig");
comptime {
exportListFn(list.listMap, "map");
exportListFn(list.listMapWithIndex, "map_with_index");
exportListFn(list.listKeepIf, "keep_if");
exportListFn(list.listWalk, "walk");
exportListFn(list.listWalkBackwards, "walk_backwards");
exportListFn(list.listKeepOks, "keep_oks");
exportListFn(list.listKeepErrs, "keep_errs");
exportListFn(list.listContains, "contains");
exportListFn(list.listRepeat, "repeat");
}
// Dict Module
const dict = @import("dict.zig");
const hash = @import("hash.zig");
comptime {
exportDictFn(dict.dictLen, "len");
exportDictFn(dict.dictEmpty, "empty");
exportDictFn(dict.dictInsert, "insert");
exportDictFn(dict.dictRemove, "remove");
exportDictFn(dict.dictContains, "contains");
exportDictFn(dict.dictGet, "get");
exportDictFn(dict.elementsRc, "elementsRc");
exportDictFn(dict.dictKeys, "keys");
exportDictFn(dict.dictValues, "values");
exportDictFn(dict.dictUnion, "union");
exportDictFn(dict.dictIntersection, "intersection");
exportDictFn(dict.dictDifference, "difference");
exportDictFn(dict.dictWalk, "walk");
exportDictFn(dict.setFromList, "set_from_list");
exportDictFn(hash.wyhash, "hash");
exportDictFn(hash.wyhash_rocstr, "hash_str");
}
// Num Module
const num = @import("num.zig");
comptime {
@ -25,6 +65,7 @@ comptime {
exportStrFn(str.strJoinWithC, "joinWith");
exportStrFn(str.strNumberOfBytes, "number_of_bytes");
exportStrFn(str.strFromIntC, "from_int");
exportStrFn(str.strFromFloatC, "from_float");
exportStrFn(str.strEqual, "equal");
exportStrFn(str.validateUtf8Bytes, "validate_utf8_bytes");
}
@ -39,6 +80,13 @@ fn exportNumFn(comptime func: anytype, comptime func_name: []const u8) void {
fn exportStrFn(comptime func: anytype, comptime func_name: []const u8) void {
exportBuiltinFn(func, "str." ++ func_name);
}
fn exportDictFn(comptime func: anytype, comptime func_name: []const u8) void {
exportBuiltinFn(func, "dict." ++ func_name);
}
fn exportListFn(comptime func: anytype, comptime func_name: []const u8) void {
exportBuiltinFn(func, "list." ++ func_name);
}
// Run all tests in imported modules
// https://github.com/ziglang/zig/blob/master/lib/std/std.zig#L94


@ -1,3 +1,4 @@
const utils = @import("utils.zig");
const std = @import("std");
const mem = std.mem;
const always_inline = std.builtin.CallOptions.Modifier.always_inline;
@ -41,8 +42,6 @@ pub const RocStr = extern struct {
// This clones the pointed-to bytes if they won't fit in a
// small string, and returns a (pointer, len) tuple which points to them.
pub fn init(allocator: *Allocator, bytes_ptr: [*]const u8, length: usize) RocStr {
const roc_str_size = @sizeOf(RocStr);
var result = RocStr.allocate(allocator, InPlace.Clone, length);
@memcpy(result.asU8ptr(), bytes_ptr, length);
@ -50,18 +49,7 @@ pub const RocStr = extern struct {
}
pub fn initBig(allocator: *Allocator, in_place: InPlace, number_of_chars: u64) RocStr {
const length = @sizeOf(usize) + number_of_chars;
var new_bytes: []usize = allocator.alloc(usize, length) catch unreachable;
if (in_place == InPlace.InPlace) {
new_bytes[0] = @intCast(usize, number_of_chars);
} else {
const v: isize = std.math.minInt(isize);
new_bytes[0] = @bitCast(usize, v);
}
var first_element = @ptrCast([*]align(@alignOf(usize)) u8, new_bytes);
first_element += @sizeOf(usize);
const first_element = utils.allocateWithRefcount(allocator, @sizeOf(usize), number_of_chars);
return RocStr{
.str_bytes = first_element,
@ -315,6 +303,23 @@ fn strFromIntHelp(allocator: *Allocator, comptime T: type, int: T) RocStr {
return RocStr.init(allocator, &buf, result.len);
}
// Str.fromFloat
// When we actually use this in Roc, libc will be linked so we have access to std.heap.c_allocator
pub fn strFromFloatC(float: f64) callconv(.C) RocStr {
// NOTE the zig code compiled for float formatting seems to use LLVM11-specific
// features; hopefully we can use zig instead of snprintf once we upgrade
const c = @cImport({
// See https://github.com/ziglang/zig/issues/515
@cDefine("_NO_CRT_STDIO_INLINE", "1");
@cInclude("stdio.h");
});
var buf: [100]u8 = undefined;
const result = c.snprintf(&buf, 100, "%f", float);
return RocStr.init(std.heap.c_allocator, &buf, @intCast(usize, result));
}
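// Illustrative check (added); assumes libc is linked, as noted above. libc's
// %f formats with six decimal places, so 3.14 comes back as the 8-byte
// string "3.140000".
test "strFromFloatC formats with %f (illustrative)" {
const result = strFromFloatC(3.14);
std.testing.expectEqual(result.len(), 8);
}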
// Str.split
// When we actually use this in Roc, libc will be linked so we have access to std.heap.c_allocator
pub fn strSplitInPlaceC(array: [*]RocStr, string: RocStr, delimiter: RocStr) callconv(.C) void {
@ -829,8 +834,10 @@ pub fn strConcatC(result_in_place: InPlace, arg1: RocStr, arg2: RocStr) callconv
fn strConcat(allocator: *Allocator, result_in_place: InPlace, arg1: RocStr, arg2: RocStr) RocStr {
if (arg1.isEmpty()) {
// the second argument is borrowed, so we must increment its refcount before returning
return RocStr.clone(allocator, result_in_place, arg2);
} else if (arg2.isEmpty()) {
// the first argument is owned, so we can return it without cloning
return RocStr.clone(allocator, result_in_place, arg1);
} else {
const combined_length = arg1.len() + arg2.len();


@ -0,0 +1,107 @@
const std = @import("std");
const Allocator = std.mem.Allocator;
const REFCOUNT_ONE_ISIZE: isize = std.math.minInt(isize);
pub const REFCOUNT_ONE: usize = @bitCast(usize, REFCOUNT_ONE_ISIZE);
pub fn decref(
allocator: *Allocator,
alignment: usize,
bytes_or_null: ?[*]u8,
data_bytes: usize,
) void {
if (data_bytes == 0) {
return;
}
var bytes = bytes_or_null orelse return;
const isizes: [*]isize = @ptrCast([*]isize, @alignCast(8, bytes));
const refcount = (isizes - 1)[0];
const refcount_isize = @bitCast(isize, refcount);
switch (alignment) {
16 => {
if (refcount == REFCOUNT_ONE_ISIZE) {
allocator.free((bytes - 16)[0 .. 16 + data_bytes]);
} else if (refcount_isize < 0) {
(isizes - 1)[0] = refcount - 1;
}
},
else => {
// NOTE enums can currently have an alignment of < 8
if (refcount == REFCOUNT_ONE_ISIZE) {
allocator.free((bytes - 8)[0 .. 8 + data_bytes]);
} else if (refcount_isize < 0) {
(isizes - 1)[0] = refcount - 1;
}
},
}
}
pub fn allocateWithRefcount(
allocator: *Allocator,
alignment: usize,
data_bytes: usize,
) [*]u8 {
// the in-place branch is disabled at comptime for now
comptime const result_in_place = false;
switch (alignment) {
16 => {
const length = 2 * @sizeOf(usize) + data_bytes;
var new_bytes: []align(16) u8 = allocator.alignedAlloc(u8, 16, length) catch unreachable;
var as_usize_array = @ptrCast([*]usize, new_bytes.ptr);
if (result_in_place) {
as_usize_array[0] = 0;
// in-place results store the size instead of a refcount (as in RocStr.initBig)
as_usize_array[1] = @intCast(usize, data_bytes);
} else {
as_usize_array[0] = 0;
as_usize_array[1] = REFCOUNT_ONE;
}
var as_u8_array = @ptrCast([*]u8, new_bytes.ptr);
const first_slot = as_u8_array + 2 * @sizeOf(usize);
return first_slot;
},
else => {
const length = @sizeOf(usize) + data_bytes;
var new_bytes: []align(8) u8 = allocator.alignedAlloc(u8, 8, length) catch unreachable;
var as_isize_array = @ptrCast([*]isize, new_bytes.ptr);
if (result_in_place) {
// in-place results store the size instead of a refcount (as in RocStr.initBig)
as_isize_array[0] = @intCast(isize, data_bytes);
} else {
as_isize_array[0] = REFCOUNT_ONE_ISIZE;
}
var as_u8_array = @ptrCast([*]u8, new_bytes.ptr);
const first_slot = as_u8_array + @sizeOf(usize);
return first_slot;
},
}
}
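// Illustrative round trip (added): the refcount word lives directly in front
// of the pointer that allocateWithRefcount returns, and decref frees the
// whole allocation once that word is REFCOUNT_ONE.
test "allocate, inspect refcount, decref (illustrative)" {
var bytes = allocateWithRefcount(std.testing.allocator, 8, 16);
const refcount_ptr = @ptrCast([*]usize, @alignCast(8, bytes));
std.testing.expectEqual((refcount_ptr - 1)[0], REFCOUNT_ONE);
decref(std.testing.allocator, 8, bytes, 16);
}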
pub const RocResult = extern struct {
bytes: ?[*]u8,
pub fn isOk(self: RocResult) bool {
// assumptions
//
// - the tag is the first field
// - the tag is usize bytes wide
// - Ok has tag_id 1, because Err < Ok
const usizes: [*]usize = @ptrCast([*]usize, @alignCast(8, self.bytes));
return usizes[0] == 1;
}
pub fn isErr(self: RocResult) bool {
return !self.isOk();
}
};
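// Illustrative check (added): a result payload whose first machine word is
// the tag, matching the assumptions listed above (Err = 0, Ok = 1, payload
// after the tag).
test "RocResult tag inspection (illustrative)" {
var ok_repr = [2]usize{ 1, 0 };
const ok = RocResult{ .bytes = @ptrCast(?[*]u8, &ok_repr) };
std.testing.expect(ok.isOk());
var err_repr = [2]usize{ 0, 0 };
const err = RocResult{ .bytes = @ptrCast(?[*]u8, &err_repr) };
std.testing.expect(err.isErr());
}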