function worker_message(worker, message) { return new Promise((resolve) => { worker.onmessage = (e) => resolve(e.data); worker.postMessage(message); }); } function workers_messages(workers, messages) { const promises = []; for (let i = 0; i < workers.length; ++i) { promises.push(worker_message(workers[i], messages[i])); } return Promise.all(promises); } function workers_thread_message(workers, message, thread_field=null) { const messages = []; for (let i = 0; i < workers.length; ++i) { if (thread_field !== null) { const m = structuredClone(message); m[thread_field] = i; messages.push(m); } else { messages.push(message); } } return workers_messages(workers, messages); } async function init_wasm(state) { const memory = new WebAssembly.Memory({ initial: 16384, // F U maximum: 16384, // 1GiB shared: true, }); // "Master thread" to do maintance on (static allocations, merging results etc) const master_wasm = await WebAssembly.instantiateStreaming(fetch('wasm/lod.wasm'), { env: { 'memory': memory } }); const nworkers = navigator.hardwareConcurrency; state.wasm.exports = master_wasm.instance.exports; state.wasm.heap_base = state.wasm.exports.alloc_static(0); state.wasm.workers = []; state.wasm.memory = memory; for (let i = 0; i < nworkers; ++i) { const w = new Worker('lod_worker.js'); state.wasm.workers.push(w); } await workers_thread_message(state.wasm.workers, { 'type': 'init', 'heap_base': state.wasm.heap_base, 'memory': memory, }, 'thread_id'); const initial = config.initial_wasm_bytes; state.wasm.buffers = { 'xs': { 'used': 0, 'cap': initial }, 'ys': { 'used': 0, 'cap': initial }, 'coords_from': { 'used': 0, 'cap': initial }, 'pressures': { 'used': 0, 'cap': initial }, 'width': { 'used': 0, 'cap': initial } }; state.wasm.buffers['xs'].offset = state.wasm.exports.alloc_static(initial); state.wasm.buffers['ys'].offset = state.wasm.exports.alloc_static(initial); state.wasm.buffers['pressures'].offset = state.wasm.exports.alloc_static(initial); state.wasm.buffers['coords_from'].offset = state.wasm.exports.alloc_static(initial); state.wasm.buffers['width'].offset = state.wasm.exports.alloc_static(initial); const mem = state.wasm.memory.buffer; state.wasm.buffers['xs'].tv = tv_create_on(Float32Array, initial / 4, mem, state.wasm.buffers['xs'].offset); state.wasm.buffers['ys'].tv = tv_create_on(Float32Array, initial / 4, mem, state.wasm.buffers['ys'].offset); state.wasm.buffers['pressures'].tv = tv_create_on(Uint8Array, initial, mem, state.wasm.buffers['pressures'].offset); state.wasm.buffers['coords_from'].tv = tv_create_on(Uint32Array, initial / 4, mem, state.wasm.buffers['coords_from'].offset); state.wasm.buffers['width'].tv = tv_create_on(Uint32Array, initial / 4, mem, state.wasm.buffers['width'].offset); tv_add(state.wasm.buffers['coords_from'].tv, 0); state.wasm.buffers['coords_from'].used = 4; } function wasm_ensure_by(state, nstrokes, ncoords) { const buffers = state.wasm.buffers; const old_ys_offset = buffers['ys'].offset; const old_coords_from_offset = buffers['coords_from'].offset; const old_pressures_offset = buffers['pressures'].offset; const old_width_offset = buffers['width'].offset; let realloc = false; let coords_bytes = buffers['xs'].cap; let stroke_bytes = buffers['coords_from'].cap; if (buffers['xs'].used + ncoords * 4 > buffers['xs'].cap) { coords_bytes = round_to_pow2(buffers['xs'].cap + ncoords * 4, 4096 * 16); // 1 wasm page (although it doesn't matter here) realloc = true; } if (buffers['coords_from'].used + nstrokes * 4 > buffers['coords_from'].cap) { stroke_bytes = round_to_pow2(buffers['coords_from'].cap + nstrokes * 4, 4096 * 16); realloc = true; } if (realloc) { if (config.debug_print) console.debug('WASM static data re-layout'); state.wasm.exports.free_static(); const mem = state.wasm.memory.buffer; const memv = new Uint8Array(mem); buffers['xs'].offset = state.wasm.exports.alloc_static(coords_bytes); buffers['ys'].offset = state.wasm.exports.alloc_static(coords_bytes); buffers['pressures'].offset = state.wasm.exports.alloc_static(coords_bytes); buffers['coords_from'].offset = state.wasm.exports.alloc_static(stroke_bytes); buffers['width'].offset = state.wasm.exports.alloc_static(stroke_bytes); buffers['xs'].tv = tv_create_on(Float32Array, coords_bytes / 4, mem, buffers['xs'].offset); buffers['ys'].tv = tv_create_on(Float32Array, coords_bytes / 4, mem, buffers['ys'].offset); buffers['pressures'].tv = tv_create_on(Uint8Array, coords_bytes, mem, buffers['pressures'].offset); buffers['coords_from'].tv = tv_create_on(Uint32Array, stroke_bytes / 4, mem, buffers['coords_from'].offset); buffers['width'].tv = tv_create_on(Uint32Array, stroke_bytes / 4, mem, buffers['width'].offset); // TODO: this should have been automatic maybe? buffers['xs'].tv.size = buffers['xs'].used / 4; buffers['ys'].tv.size = buffers['ys'].used / 4; buffers['pressures'].tv.size = buffers['pressures'].used; buffers['coords_from'].tv.size = buffers['coords_from'].used / 4; buffers['width'].tv.size = buffers['width'].used / 4; // TODO: this is SUS, should all the caps really be coords_bytes? buffers['xs'].cap = buffers['ys'].cap = buffers['pressures'].cap = coords_bytes; buffers['coords_from'].cap = buffers['width'].cap = stroke_bytes; const tmp = new Uint8Array(Math.max(coords_bytes, stroke_bytes)); // Copy from back to front (otherwise we will overwrite) tmp.set(new Uint8Array(mem, old_width_offset, buffers['width'].used)); memv.set(new Uint8Array(tmp.buffer, 0, buffers['width'].used), buffers['width'].offset); tmp.set(new Uint8Array(mem, old_coords_from_offset, buffers['coords_from'].used)); memv.set(new Uint8Array(tmp.buffer, 0, buffers['coords_from'].used), buffers['coords_from'].offset); tmp.set(new Uint8Array(mem, old_pressures_offset, buffers['pressures'].used)); memv.set(new Uint8Array(tmp.buffer, 0, buffers['pressures'].used), buffers['pressures'].offset); tmp.set(new Uint8Array(mem, old_ys_offset, buffers['ys'].used)); memv.set(new Uint8Array(tmp.buffer, 0, buffers['ys'].used), buffers['ys'].offset); } } async function do_lod(state, context) { state.wasm.exports.free_dynamic(); const buffers = state.wasm.buffers; const result_buffers = state.wasm.exports.alloc_dynamic(state.wasm.workers.length * 4); const result_counts = state.wasm.exports.alloc_dynamic(state.wasm.workers.length * 4); const result_batch_counts = state.wasm.exports.alloc_dynamic(state.wasm.workers.length * 4); const clipped_indices = state.wasm.exports.alloc_dynamic(context.clipped_indices.size * 4); const mem = new Uint8Array(state.wasm.memory.buffer); // Dynamic input data that should (by design) never be too big mem.set(tv_bytes(context.clipped_indices), clipped_indices); // NOTE: this static partitioning scheme turned out to be "good enough" (i.e., trying // to allocate approximately the same amount of points per job wasn't any faster) const indices_per_thread = Math.floor(context.clipped_indices.size / state.wasm.workers.length); const offsets = { 'coords_from': buffers['coords_from'].offset, 'width': buffers['width'].offset, 'xs': buffers['xs'].offset, 'ys': buffers['ys'].offset, 'pressures': buffers['pressures'].offset, 'result_buffers': result_buffers, 'result_counts': result_counts, 'result_batch_counts': result_batch_counts, }; const jobs = []; for (let i = 0; i < state.wasm.workers.length; ++i) { let count = indices_per_thread; if (i === state.wasm.workers.length - 1) { count += context.clipped_indices.size % state.wasm.workers.length; } jobs.push({ 'type': 'lod', 'indices_base': clipped_indices + i * 4 * indices_per_thread, 'indices_count': count, 'zoom': state.canvas.zoom, 'offsets': offsets }); } await workers_messages(state.wasm.workers, jobs); const result_offset = state.wasm.exports.merge_results( result_counts, result_batch_counts, result_buffers, state.wasm.workers.length ); const segment_count = new Int32Array(state.wasm.memory.buffer, result_counts, 1)[0]; // by convention const batch_count = new Int32Array(state.wasm.memory.buffer, result_batch_counts, 1)[0]; // by convention // Use results without copying from WASM memory const wasm_points = new Float32Array(state.wasm.memory.buffer, result_offset, segment_count * 2); const wasm_ids = new Uint32Array(state.wasm.memory.buffer, result_offset + segment_count * 2 * 4, segment_count); const wasm_pressures = new Uint8Array(state.wasm.memory.buffer, result_offset + segment_count * 3 * 4, segment_count); const wasm_batches = new Int32Array(state.wasm.memory.buffer, result_offset + round_to_pow2(segment_count * (3 * 4 + 1), 4), batch_count * 2); context.instance_data_points.data = wasm_points; context.instance_data_points.size = segment_count * 2; context.instance_data_points.capacity = segment_count * 2; context.instance_data_ids.data = wasm_ids; context.instance_data_ids.size = segment_count; context.instance_data_ids.capacity = segment_count; context.instance_data_pressures.data = wasm_pressures; context.instance_data_pressures.size = segment_count; context.instance_data_pressures.capacity = segment_count; context.instance_data_batches.data = wasm_batches; context.instance_data_batches.size = batch_count * 2; context.instance_data_batches.capacity = batch_count * 2; return segment_count; }