raphlinus’s gists

raphlinus / neon_flatten.rs

Created July 7, 2025 18:19

Sketch of Neon code for flattening

	unsafe fn approx_parabola_integral(x: float32x4_t) -> float32x4_t {
	const D: f32 = 0.67;
	let x2 = vmulq_f32(x, x);
	let t1 = vfmaq_f32(vdupq_n_f32(D.powi(4)), vdupq_n_f32(0.25), x2);
	let t1_sqrt = vsqrtq_f32(t1);
	let t1_fourthroot = vsqrtq_f32(t1_sqrt);
	let denom = vaddq_f32(vdupq_n_f32(1.0 - D), t1_fourthroot);
	vdivq_f32(x, denom)
	}

raphlinus / hello_stickshift.rs

Created March 27, 2025 04:45

First code from stickshift

	// Input:
	// fn foo(x: [f32; 4], y: f32) -> [f32; 4] {
	// x; x * (x - 2.0) * y
	// }
	fn foo(x: [f32; 4], y: f32) -> [f32; 4] {
	unsafe {
	let v__0 = ::core::mem::transmute::<[f32; 4usize], ::core::arch::aarch64::float32x4_t>(x);
	let v__1 = y;
	let v__2 = v__0;
	let v__3 = v__0;

raphlinus / flatten.rs

Created January 16, 2025 05:31

Snapshot of SIMD flatten implementation

	// Copyright 2025 the Fearless_SIMD Authors
	// SPDX-License-Identifier: Apache-2.0 OR MIT

	//! Example of fast flattening cubic Beziers.

	// Arguably we should just take a kurbo dep (or do development
	// in another crate), but here we can

	use core::f32;

raphlinus / ordered_queue_test.rs

Created December 7, 2024 22:42

Sketch of queue

	use std::time::Duration;
	use rand::Rng;

	fn main() {
	let (s, mut r) = ordered_channel::bounded(10);
	for i in 0..100 {
	let s_clone = s.clone();
	rayon::spawn_fifo(move \|\| {
	let mut rng = rand::thread_rng();
	let sleep_time = rng.gen_range(0..100);

raphlinus / neon_to_srgb.rs

Created November 15, 2024 15:48

Neon implementation of linear to sRGB transfer function

	// Copyright 2024 the Color Authors
	// SPDX-License-Identifier: Apache-2.0 OR MIT

	#[cfg(target_arch = "aarch64")]
	#[target_feature(enable = "neon")]
	#[inline(never)]
	pub unsafe fn to_srgb(rgba: [f32; 4]) -> [f32; 4] {
	let v = aarch64::vld1q_f32(rgba.as_ptr());
	let vabs = aarch64::vabsq_f32(v);
	let bias = aarch64::vdupq_n_f32(-5.35862651e-04);

raphlinus / simd_reduce_test.rs

Last active April 12, 2025 20:33

Comparison of scalar and SIMD max reduction

	// run with `RUSTFLAGS='-C target-cpu=native' cargo +nightly bench`

	#![feature(test)]

	fn main() {
	let mut a = [0u32; 65536];
	a[1] = 42;
	println!("{}", scalar_max(&a));
	println!("{}", avx2_max(&a));
	}

raphlinus / gist:5aca9de53f9d6b24933cb24d8a60df63

Created March 15, 2024 04:22

apparent miscompilation of flatten.wgsl

raphlinus / relaxed.rs

Last active November 5, 2023 16:35

LB litmus test adapted to loom crate

raphlinus / main.rs

Created July 4, 2023 19:00

Property testing of email scanner

	// SPDX-License-Identifier: MIT
	use proptest::test_runner::TestRunner;
	use proptest::strategy::{Strategy, ValueTree};

	fn main() {
	let email_re = "^[a-zA-Z0-9.!#$%&'*+/=?^_`{\|}~-]+@[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?\
	(?:\\.[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?)*$";
	let re = regex::Regex::new(email_re).unwrap();
	let mut runner = TestRunner::default();
	for _ in 0..100_000_000 {

raphlinus / max.hlsl

Last active June 9, 2023 16:41

MetalLibraryExplorer dump of metal-shaderconverter output

	ByteAddressBuffer input;
	RWByteAddressBuffer output;

	groupshared uint max_value;

	[numthreads(256, 1, 1)]
	void main(uint index: SV_GroupIndex) {
	if (index == 0) {
	max_value = 0;
	}

Raph Levien raphlinus