Skip to content

Instantly share code, notes, and snippets.

View LunNova's full-sized avatar
🌐
worldbuilding in progress

Luna LunNova

🌐
worldbuilding in progress
View GitHub Profile

Load Logic Perf

Subject Time Peak Memory vs Baseline
[hipblaslt] Use multiprocessing.Pool for TensileCreateLibrary 18.531s 879.0 MB baseline
[hipblaslt] CustomKernels: lru_cache for 20x speedup of some logic files 18.275s 878.3 MB 0% faster, 0% less memory
[hipblaslt] reduce memory usage during logic load 15.500s 873.7 MB 15% faster, 0% less memory
[hipblaslt] Remove unused key arg for getPrimitiveParameterValueAbbreviation 15.535s 873.4 MB 15% faster, 0% less memory
[hipblaslt] intern strings to reduce duplicate memory for solution keys 15.001s 721.9 MB 17.5% faster, 17.5% less memory
[hipblaslt] tensilelite: gc in parallel worker 15.167s 722.1 MB 17.5% faster, 17.5% less memory
@LunNova
LunNova / hipblaslt-tcl-flamegraph.svg
Created October 12, 2025 04:56
my god, it's full of deepcopy
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
hipblaslt> Generating assembly kernels done in 1344.1s! 196454/ 196454
hipblaslt> Found 2657 .o files shared across multiple code objects:
hipblaslt> Cijk_Ailk_Bjlk_BBS_BH_Bias_HA_S_SAV_UserArgs_MT8erymT8rQGt6XFA1NWV4QsUpLY29cgz1uxrgsp6VsR2A=.o: used by 2 code objects
hipblaslt> Cijk_Ailk_Bjlk_BBS_BH_Bias_HA_S_SAV_UserArgs_MT6MF1BML7wMbEKqG1Q0D4GlKLG4f8LUr11brv2zeSVlc8=.o: used by 2 code objects
hipblaslt> Cijk_Ailk_Bjlk_BBS_BH_Bias_HA_S_SAV_UserArgs_MT65lDvCXl7XhQy83Y8oL4f6RUf9nbwadR1KWgVYPsTbrQ=.o: used by 2 code objects
hipblaslt> Cijk_Ailk_Bjlk_BBS_BH_Bias_HA_S_SAV_UserArgs_MT2ckytA8P_xPIbSnDkNavRbNCvlU05dwqXFFR3NDOdtMQ=.o: used by 2 code objects
hipblaslt> Cijk_Ailk_Bjlk_BBS_BH_Bias_HA_S_SAV_UserArgs_MT9XxmHU6veNZ1qUUrovw0wMqLq7nlsrFA8qINVvjfwl6Y=.o: used by 2 code objects
hipblaslt> Cijk_Ailk_Bjlk_BBS_BH_Bias_HA_S_SAV_UserArgs_MT1C_BKtMsNfHVFHhtsT_YlAB8FJTnndhtSMMyt4CWEXH0=.o: used by 2 code objects
hipblaslt> Cijk_Ailk_Bjlk_BBS_BH_Bias_HA_S_SAV_UserArgs_MT15wlgV3V1gt5s4AK4TKNG5CbMHKqm
2025-09-30T15:25:12.8506820Z Current runner version: '2.328.0'
2025-09-30T15:25:12.8530560Z ##[group]Runner Image Provisioner
2025-09-30T15:25:12.8532110Z Hosted Compute Agent
2025-09-30T15:25:12.8533090Z Version: 20250912.392
2025-09-30T15:25:12.8534280Z Commit: d921fda672a98b64f4f82364647e2f10b2267d0b
2025-09-30T15:25:12.8535650Z Build Date: 2025-09-12T15:23:14Z
2025-09-30T15:25:12.8536880Z ##[endgroup]
2025-09-30T15:25:12.8538090Z ##[group]Operating System
2025-09-30T15:25:12.8539370Z macOS
2025-09-30T15:25:12.8540660Z 15.6.1
Commit ID: 91450254dba4c03cc51dbcb18cd9be9395fc7a90
Change ID: xvomkvwpnurxzlnsozlxvtzvrmxxqnms
Author : Luna Nova <[email protected]> (59m)
Committer: Luna Nova <[email protected]> (<=1m)
chromium: pin LLVM to 20 to work around compile error
chromium's histogram_macros_internal contains a UB static cast
return static_cast<Enum>(base::to_underlying(Enum::kMaxValue) + 1);
resulting in
diff --git a/src/cmd/dist/buildruntime.go b/src/cmd/dist/buildruntime.go
index 87e8867176..dbb635011f 100644
--- a/src/cmd/dist/buildruntime.go
+++ b/src/cmd/dist/buildruntime.go
@@ -62,7 +62,7 @@ func mkbuildcfg(file string) {
fmt.Fprintf(&buf, "const DefaultGORISCV64 = `%s`\n", goriscv64)
fmt.Fprintf(&buf, "const defaultGOEXPERIMENT = `%s`\n", goexperiment)
fmt.Fprintf(&buf, "const defaultGO_EXTLINK_ENABLED = `%s`\n", goextlinkenabled)
- fmt.Fprintf(&buf, "const defaultGO_LDSO = `%s`\n", defaultldso)
+ fmt.Fprintf(&buf, "const DefaultGO_LDSO = `%s`\n", defaultldso)
// A trait with a single generic associated type: each implementor chooses
// what `Output<A>` is for a given type argument `A`.
trait TypeFn {type Output<A>;}
// Tuple struct whose only field has the type `F::Output` applied to `Fix<F>`
// itself, so the struct's definition refers back to itself through the
// associated-type projection.
struct Fix<F: TypeFn>(<F as TypeFn>::Output<Fix<F>>);
// Unit struct used purely as a `TypeFn` implementor.
struct FnRes;
// For `FnRes`, `Output<A>` is a function pointer taking no arguments and
// returning `A`; consequently the field of `Fix<FnRes>` has type
// `fn() -> Fix<FnRes>`.
impl TypeFn for FnRes { type Output<A> = fn() -> A;}
// Returns a `Fix<FnRes>` wrapping a function pointer to `return_me` itself.
fn return_me() -> Fix<FnRes> {
// The explicit cast turns the function item `return_me` into the
// `fn() -> Fix<FnRes>` pointer type that the field expects.
Fix(return_me as fn() -> Fix<FnRes>)
}
Building 144 packages
.#alex .#arion .#autosubst2 .#aws-spend-summary .#bench .#bintools-unwrapped .#binutils-unwrapped .#binutils-unwrapped-all-targets .#binutils-unwrapped_2_38 .#bruijn .#buildah-unwrapped .#busybox .#busybox-sandbox-shell .#cabal-install .#cabal2nix-unwrapped .#cachix .#changelog-d .#client-ip-echo .#clisp .#cornelis .#darcs .#dclock .#dconf2nix .#dhall .#dhall-bash .#dhall-docs .#dhall-json .#dhall-lsp-server .#dhall-nix .#dhall-nixpkgs .#dhall-yaml .#echidna .#elm2nix .#elmPackages.elm .#elmPackages.elm-format .#emanote .#faustPhysicalModeling .#fffuu .#fourmolu .#fpc .#futhark .#gawk .#gawkInteractive .#gcc-unwrapped .#gccForLibs .#ghc .#ghcid .#git-annex .#git-brunch .#gitit .#glibc .#glibc_memusage .#glirc .#hadolint .#happy .#haskell-ci .#hci .#hercules-ci-agent .#hinit .#hledger .#hledger-iadd .#hledger-interest .#hledger-ui .#hledger-web .#hlint .#hpack .#hscolour .#iconv .#idrisPackages.idris-no-deps .#jacinda .#json2yaml .#kexec-tools .#kind-lang .#kmonad .#koka .#krank .#lambdab
# Building https://github.com/LunNova/nixpkgs/blob/ad384653a6094ad6460ee2c10a01fc42a252038a/pkgs/development/rocm-modules/6/aotriton/default.nix
https://cache.nixos.org/hqr05ly7gm93gasdqmxsgmyin0bdkq86.narinfo
https://cache.nixos.org/pbmiqw44xjgdgx6ncwn0p3pw2dz520vm.narinfo
structuredAttrs is enabled
Running phase: unpackPhase
@nix {"action":"setPhase","phase":"unpackPhase"}
unpacking source archive /nix/store/sj81yw7mqagddvxbhcl2bk6m1rs6v43k-source
source root is source
separate-debug-info: recording checksum of source files for debug support...
@LunNova
LunNova / broken-ra.rs
Created July 6, 2025 02:27
Failed attempt at using rust-analyzer to map macro expansions back to the original source lines in a project; it always finds no items in the macro expansion.
[dependencies]
# HIR analysis - use consistent versions
ra_ap_hir = "0.0.289"
ra_ap_base_db = "0.0.289"
ra_ap_hir_def = "0.0.289"
ra_ap_hir_expand = "0.0.289"
ra_ap_ide_db = "0.0.289"
ra_ap_load-cargo = "0.0.289"
ra_ap_paths = "0.0.289"