Created
March 10, 2025 16:59
-
-
Save pashu123/d0923d1492f51038fd0e108f61096591 to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
: 1709405007:0;git clone --depth 1 https://github.com/junegunn/fzf.git ~/.fzf\ | |
~/.fzf/install | |
: 1709405026:0;source ~/.zshrcs | |
: 1709405061:0;hipcc --version | |
: 1709405083:0;hipcc -o3 | |
: 1709405161:0;sudo dnf install raedontop | |
: 1709405239:0;sudo dnf install cargo | |
: 1709405609:0;sudo apt-get intall lld | |
: 1709405648:0;sudo dnf install libdrm-dev | |
: 1709405653:0;sudo dnf install libdrm-devel | |
: 1709405663:0;sudo cargo install amdgpu_top | |
: 1709405814:0;sudo cd /root/.cargo | |
: 1709405829:0;cd /root/.cargo | |
: 1709405859:0;sudo mv /root/.cargo/ ~/heyya | |
: 1709405864:0;cd heyya | |
: 1709405869:0;./amdgpu_top | |
: 1709406036:0;sudo mv ~/heyya/ /root/.cargo/ | |
: 1709406061:0;sudo dnf install pip | |
: 1709406071:0;sudo dnf install venv | |
: 1709406081:0;sudo pip3 install venv | |
: 1709406101:0;sudo dnf install python3-venv | |
: 1709406292:0;sudo dnf install pyright | |
: 1709406298:0;sudo dnf install clangd | |
: 1709406331:0;sudo dnf install clang-tools | |
: 1709406345:0;sudo dnf update | |
: 1709406351:0;sudo dnf upgreade | |
: 1709406356:0;sudo dnf upgrade | |
: 1709406414:0;udo dnf install clang-tools-extra | |
: 1709406426:0;sudo dnf install clang-tools-extra | |
: 1709406442:0;locate clang-format | |
: 1709406468:0;where clang-format | |
: 1709406472:0;which clang-format | |
: 1709406553:0;ssh-keygen | |
: 1709406615:0;git clone [email protected]:pashu123/personal_commands.git | |
: 1709406649:0;sudo dnf install xorg-x11-drv-nvidia-cuda | |
: 1709406687:0;mv personal_commands build_commands | |
: 1709406723:0;vi .zshrc | |
: 1709406742:0;mv .tmux.conf .gitconfig ../ | |
: 1709406894:0;sudo dnf copr enable atim/lazygit -y | |
: 1709406902:0;sudo dnf install lazygit | |
: 1709406969:0;git pmf | |
: 1709407082:0;git push -f | |
: 1709407111:0;lvim ~/.zshrc .zshrc | |
: 1709407238:0;python -m venv global_venv | |
: 1709407242:0;cd global_venv | |
: 1709407265:0;pip install -r torch-mlir/requirements.txt | |
: 1709407367:0;sud | |
: 1709407581:0;sudo vi /etc/systemd/logind.conf | |
: 1709408293:0;nvin | |
: 1709408342:0;cd ~/.local/share/lunarvim | |
: 1709408345:0;cd lvim | |
: 1709408354:0;cd site | |
: 1709408531:0;sudo dnf install cmake | |
: 1709408558:0;pip install -r ~/torch-mlir/requirements.txt | |
: 1709408715:0;pip install -r pytorch-requirements.txt | |
: 1709408763:0;sudo dnf install python3-devel | |
: 1709408800:0;sudo dnf install ninja-build | |
: 1709408959:0;git clone https://github.com/openxla/iree.git | |
: 1709408969:0;git clone [email protected]:openxla/iree.git | |
: 1709409911:0;pip install sympy | |
: 1709410088:0;sudo dnf install vulkaninfo | |
: 1709410137:0;sudo dnf install vulkan vulkan-info | |
: 1709410148:0;sudo dnf install vulkan | |
: 1709410178:0;pipewire-vulkan --help | |
: 1709410187:0;pipewire-vulkan | |
: 1709411007:0;where rocminfo | |
: 1709411977:0;vulkaninfo | |
: 1709412013:0;vulkaninfo | fzf | |
: 1709412143:0;sudo yum install https://repo.radeon.com/amdgpu-install/6.0.2/rhel/9.3/amdgpu-install-6.0.60002-1.el9.noarch.rpm | |
: 1709412200:0;sudo amdgpu-install --usecase=hiplibsdk,rocm | |
: 1709412222:0;sudo dnf install amdgpu-dkms | |
: 1709412248:0;amdgpu-arch | |
: 1709412278:0;sudo amdgpu-install -y --usecase=rocm | |
: 1709412443:0;wget https://repo.radeon.com/amdgpu-install/23.40.2/rhel/9.3/amdgpu-install-6.0.60002-1.el9.noarch.rpm | |
: 1709412460:0;chmod +x amdgpu-install-6.0.60002-1.el9.noarch.rpm | |
: 1709412462:0;./amdgpu-install-6.0.60002-1.el9.noarch.rpm | |
: 1709412492:0;sudo rpm -i amdgpu-install-6.0.60002-1.el9.noarch.rpm | |
: 1709412508:0;amdgpu-install | |
: 1709412620:0;sudo dnf install amdgpu | |
: 1709412668:0;rm amdgpu-install-6.0.60002-1.el9.noarch.rpm | |
: 1709412828:0;git clone https://github.com/flame/blis.git | |
: 1709412854:0;git o pfhp | |
: 1709412873:0;./configure -t openmp -p ~/blis auto | |
: 1709412898:0;make check -j16 | |
: 1709412941:0;git clone https://github.com/ULAFF/LAFF-On-PfHP.git | |
: 1709412993:0;cd Week1 | |
: 1709412998:0;make IJP | |
: 1709413048:0;./driver_IJP.x | |
: 1709413343:0;vi FLA_Clock. | |
: 1709413347:0;vi FLA_Clock.c | |
: 1709414462:0;sudo shutdown | |
: 1709444680:0;cd blis | |
: 1709444693:0;cd Assignments | |
: 1709444712:0;cd Assignments/Week1 | |
: 1709444727:0;cd Week1/C | |
: 1709567543:0;cd Assignments/Week1/C | |
: 1709567984:0;make Gemv_I_Dot | |
: 1709571434:0;make J_Gemv_I_Dots | |
: 1709573473:0;cp Gemm_IJP.c Gemm_JPI.c | |
: 1709573533:0;make JPI | |
: 1709573560:0;vi data/output_JPI.m | |
: 1709692111:0;mkdir intel_intrinsics | |
: 1709692146:0;touch intr.cpp | |
: 1709692180:0;clang++ intr.cpp | |
: 1709743099:0;cat intr.cpp | |
: 1709787020:0;git checkout pashu/batchquant | |
: 1709787029:0;git ob batchquant | |
: 1709787470:0;sudo dnf install libcapstone-devel | |
: 1709787693:0;sudo apt install libtbb-devel libzstd-devel libglfw3-devel libfreetype6-devel libgtk-3-devel\ | |
: 1709787701:0;sudo dnf install libtbb-devel libzstd-devel libglfw3-devel libfreetype6-devel libgtk-3-devel\ | |
: 1709787797:0;sudo dnf install tbb-devel zstd-devel glfw3-devel freetype6-devel gtk-3-devel\ | |
: 1709787812:0;sudo dnf install tbb-devel | |
: 1709787838:0;sudo dnf install libzstd-devel | |
: 1709787880:0;sudo dnf install gtk3-devel | |
: 1709787933:0;sudo dnf install glfw-devel | |
: 1709787980:0;sudo dnf install libfreetype6\-devel | |
: 1709787986:0;sudo dnf install libfreetype-devel | |
: 1709788009:0;sudo dnf install freetype-devel | |
: 1709788056:0;sudo dnf install capstone-devel | |
: 1709788424:0;vi .gitconfig | |
: 1709791239:0;bash | |
: 1709804063:0;vi run_iree.sh | |
: 1709806074:0;sudo dnf get install clang-libs | |
: 1709806085:0;sudo dnf-get install clang-libs | |
: 1709806090:0;sudo dnf install clang-libs | |
: 1709806148:0;sudo dnf install clang-devel | |
: 1709806260:0;sudo dnf install compiler-rt | |
: 1709806433:0;lib/clang/17/lib/x86_64-redhat-linux-gnu/libclang_rt.asan.so | |
: 1709806512:0;LD_PRELOAD=lib/clang/17/lib/x86_64-redhat-linux-gnu/libclang_rt.asan.so | |
: 1709806659:0;LD_PRELOAD=lib/clang/17/lib/x86_64-redhat-linux-gnu/libclang_rt.asan.so ASAN_OPTIONS=detect_leaks=0 \\ | |
ASAN_SYMBOLIZER_PATH=/usr/lib/llvm-12/bin/llvm-symbolizer \ | |
: 1709806675:0;LD_PRELOAD=lib/clang/17/lib/x86_64-redhat-linux-gnu/libclang_rt.asan.so\ ASAN_OPTIONS=detect_leaks=0 \\ | |
ASAN_SYMBOLIZER_PATH=/usr/lib/llvm-12/bin/llvm-symbolizer \ | |
: 1709806810:0;sudo dnf install llvm-symbolizer | |
: 1709806857:0;where llvm-symbolizer | |
: 1709806864:0;sudo dnf install llvm | |
: 1709807005:0;llvm-symbolizer --version | |
: 1709807326:0;ASAN_SYMBOLIZER_PATH=/usr/bin/llvm-symbolizer | |
: 1709807538:0;cmake/build_and_test_asan.sh | |
: 1709807556:0;./cmake/build_and_test_asan.sh | |
: 1709807566:0;vi build_and_test_asan.sh | |
: 1709808013:0;cd tracy | |
: 1709808116:0;iree-compile --version | |
: 1709808145:0;cd tests/e2e/regression | |
: 1709813847:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=tosa --iree-llvmcpu-link-embedded=false --iree-llvmcpu-sanitize=address /work/tests/e2e/regression/linalg_quantized_matmul_vs_linalg_matmul.mlir -o check_regression_tosa_llvm-cpu_linalg_quantized_matmul_vs_linalg_matmul.mlir_asan_module.vmfb | |
: 1709813989:0;vi linalg_quantized_matmul_vs_linalg_matmul.mlir | |
: 1709814285:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=tosa --iree-llvmcpu-link-embedded=false linalg_quantized_matmul_vs_linalg_matmul.mlir -o check_regression_tosa_llvm-cpu_linalg_quantized_matmul_vs_linalg_matmul.mlir_asan_module.vmfb | |
: 1709814306:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=tosa --iree-llvmcpu-link-embedded=false --iree-llvmcpu-sanitize=address linalg_quantized_matmul_vs_linalg_matmul.mlir -o check_regression_tosa_llvm-cpu_linalg_quantized_matmul_vs_linalg_matmul.mlir_asan_module.vmfb | |
: 1709814354:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-linalg-quantized-matmul-to-matmul))" compiler/src/iree/compiler/InputConversion/Common/test/linalg_quantized_matmul_to_matmul.mlir | FileCheck compiler/src/iree/compiler/InputConversion/Common/test/linalg_quantized_matmul_to_matmul.mlir | |
: 1709816144:0;wget https://storage.googleapis.com/shark_tank/elias/facebook_opt_1.3b.mlir | |
: 1709816155:0;vi facebook_opt_1.3b.mlir | |
: 1709816167:0;mv facebook_opt_1.3b.mlir ../ | |
: 1709816181:0;wget https://storage.googleapis.com/shark_tank/elias/facebook_opt_1.3b_weights.irpa | |
: 1709820455:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=all \\ | |
~/facebook_opt_1.3b.mlir -o /tmp/facebook_opt_1.3b.vmfb | |
: 1709820592:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=none \\ | |
~/facebook_opt_1.3b.mlir -o /tmp/facebook_opt_1.3b.vmfb | |
: 1709820683:0;iree-benchmark-module --parameters=model=facebook_opt_1.3b_weights.irpa --module=/tmp/facebook_opt_1.3b.vmfb --function=run --input=1x1xi64 | |
: 1709820737:0;mkdir testing && mv facebook_opt_1.3b* testing | |
: 1709821461:0;TRACY_NO_EXIT=1 iree-benchmark-module --parameters=model=facebook_opt_1.3b_weights.irpa --module=/tmp/facebook_opt_1.3b.vmfb --function=run --input=1x1xi64 | |
: 1709821480:0;TRACY_NO_EXIT=1 iree-benchmark-module --parameters=model=~/testing/facebook_opt_1.3b_weights.irpa --module=/tmp/facebook_opt_1.3b.vmfb --function=run --input=1x1xi64 | |
: 1709822008:0;iree-tracy-capture | |
: 1709822028:0;TRACY_NO_EXIT=1 iree-benchmark-module --parameters=model=$HOME/testing/facebook_opt_1.3b_weights.irpa --module=/tmp/facebook_opt_1.3b.vmfb --function=run --input=1x1xi64 | |
: 1709822040:0;iree-tracy-capture -p 8086 | |
: 1709822052:0;iree-tracy-capture --help | fzf | |
: 1709822067:0;iree-tracy-capture -help | |
: 1709822197:0;mv xyz.tracy .. | |
: 1709838944:0;./runtime/src/iree/builtins/ukernel/tools/mmt4d_benchmark | |
: 1709840084:0;hwinfo | |
: 1709840146:0;hwinfo | fzf | |
: 1709840166:0;more hwinfo | |
: 1709840176:0;less hwinfo | |
: 1709840182:0;hwinfo | more | |
: 1709840276:0;hwinfo --memory | |
: 1709840308:0;sudo hwinfo --memory | |
: 1709840353:0;sudo dnf install lshw | |
: 1709840363:0;sudo lshw -short -C memory | |
: 1709870314:0;git ob x86s8s4s32 | |
: 1709894835:0;cd LAFF-On-PfHP | |
: 1709894839:0;Assignments/Week2/C | |
: 1709905099:0;vi data/output_JI_4x4Kernel.m | |
: 1709906014:0;make JI_4x4Kernel | |
: 1709906058:0;make JI_8x4Kernel | |
: 1709906099:0;vi data/output_JI_8x4Kernel.m | |
: 1709912494:0;cd Week4 | |
: 1709912497:0;cd C | |
: 1709915106:0;./runtime/src/iree/builtins/ukernel/tools/mmt4d_benchmark | |
: 1709957172:0;sudo dnf install clang | |
: 1709985864:0;./runtime/src/iree/builtins/ukernel/tools/mmt4d_test | |
: 1709986121:0;cd runtime/src/iree/builtins/ukernel/tools/ | |
: 1709986131:0;./e2e_matmul_benchmark | |
: 1709986188:0;./util_test | |
: 1709986200:0;./unpack_test | |
: 1709987288:0;lldb | |
: 1709987297:0;sudo dnf install lldb | |
: 1709988500:0;runtime/src/iree/builtins/ukernel/arch/x86_64/mmt4d_x86_64_entry_point.c riree | |
: 1709991033:0;vi intr.cpp | |
: 1709991234:0;IR_UK_TEST_ABORT_ON_ERROR=ON ./mmt4d_test | |
: 1709991281:0;lldb mmt4d_test | |
: 1710009597:0;mmt4d_test | |
: 1710009603:0;..mmt4d_test | |
: 1710009623:0;mmt4d_benchmark | |
: 1710010951:0;k | |
: 1710043982:0;./mmt4d_test --help | |
: 1710050239:0;of output is 22\ | |
The value of output is 1\ | |
The value of output is 16\ | |
The value of output is 6\ | |
The value of output is 0\ | |
The value of output is -1\ | |
The value of output is 18\ | |
The value of output is 6 | |
: 1710053449:0;./mmt4d_test > xyz.txt | |
: 1710085496:0;cd intel_intrinsics | |
: 1710089511:0;clang-format -i intr.cpp | |
: 1710089588:0;clang++ -march=native intr.cpp | |
: 1710091563:0;./mmt4d_test | |
: 1710091831:0;BM_mmt4d_s8s4s32_tile_4x8x4_av | |
: 1710092154:0;./mmt4d_benchmark | |
: 1710099865:0;clar | |
: 1710135524:0;echo $OMP_NUM_THREADS | |
: 1710135533:0;omp | |
: 1710150037:0;sudo dnf install libomp | |
: 1710182675:0;uname -a | |
: 1710182688:0;sudo dnf install nasm | |
: 1710182905:0;lld hello.o -o hello | |
: 1710182909:0;nasm -f elf64 -o hello.o hello.asm | |
: 1710182913:0;ld.lld hello.o -o hello | |
: 1710183031:0;vi hello.asm | |
: 1710183067:0;nasm -f elf64 -o hello.o hello.asm $$ ld.lld hello.o -o hello | |
: 1710218142:0;rm hello hello.o hello.asm | |
: 1710218148:0;mkdir assembly_pro | |
: 1710218175:0;cd assembly_pro | |
: 1710218532:0;nasm -f elf64 -o hello.o hello.asm && ld.lld hello.o -o hello | |
: 1710218535:0;./hello | |
: 1710243835:0;git ob conv_suite | |
: 1710246409:0;make all | |
: 1710246413:0;make . | |
: 1710246434:0;rm CMakeCache.txt | |
: 1710246482:0;python generate_e2e_matmul_tests.py | |
: 1710246522:0;vi generate_e2e_matmul_tests.py | |
: 1710252711:0;cd ireels | |
: 1710252737:0;iree-e2e-matmul-test | |
: 1710252748:0;iree-e2e-matmul-test --help | |
: 1710255691:0;tests/e2e/matmul/ | |
: 1710255722:0;python generate_e2e_matmul_tests.py --lhs_rhs_type=f32 --acc_type=f32 --shapes=small | |
: 1710255764:0;python generate_e2e_matmul_tests.py --lhs_rhs_type=f32 --acc_type=f32 --shapes=small --output_matmuls_mlir="./" --output_calls_mlir="./" | |
: 1710256615:0;python generate_e2e_matmul_tests.py --lhs_rhs_type=f32 --acc_type=f32 --shapes=small --output_matmuls_mlir="mm.mlir" --output_calls_mlir="calls.txt" --name="e2e_matmul" | |
: 1710307098:0;python generate_e2e_matmul_tests.py --lhs_rhs_type=f32 --acc_type=f32 --shapes=small --output_matmuls_mlir="mm.mlir" --output_calls_mlir="calls.txt" | |
: 1710307102:0;vi mm.mlir | |
: 1710328731:0;vi calls.txt | |
: 1710334389:0;python generate_e2e_convolution_tests.py | |
: 1710334545:0;touch generate | |
: 1710334556:0;rm generate | |
: 1710334560:0;python generate --output_conv2d_mlir=xyz.mlir --output_calls_mlir=aa.mlir --input_type=f16 --input_layout="nchw" --kernel_type=f16 --kernel_layout="fchw" | |
: 1710334611:0;python generate_e2e_convolution_tests.py --output_conv2d_mlir=xyz.mlir --output_calls_mlir=aa.mlir --input_type=f16 --input_layout="nchw" --kernel_type=f16 --kernel_layout="fchw" | |
: 1710334617:0;python generate_e2e_convolution_tests.py --output_conv2d_mlir=xyz.mlir --output_calls_mlir=aa.mlir --input_type=f16 --input_layout="nchw" --kernel_type=f16 --kernel_layout="fchw" --shapes=1 | |
: 1710335148:0;vi txt.mlir | |
: 1710335268:0;torch-mlir-opt --torch-backend-to-linalg-on-tensors-backend-pipeline txt.mlir > heyya.mlir | |
: 1710335283:0;torch-mlir-opt --torch-backend-to-linalg-on-tensors-backend-pipeline -allow-unregistered-dialect txt.mlir > heyya.mlir | |
: 1710337914:0;iree-opt --torch-backend-to-linalg-on-tensors-backend-pipeline -allow-unregistered-dialect txt.mlir > heyya.mlir | |
: 1710337979:0;iree-opt --convert-torch-to-linalg -allow-unregistered-dialect txt.mlir > heyya.mlir | |
: 1710338033:0;iree-opt --convert-torch-to-linalg -canonicalize txt.mlir > heyya.mlir | |
: 1710348991:0;python generate_e2e_convolution_tests.py --output_conv2d_mlir=xyz.mlir --output_calls_mlir=aa.mlir --input_type=f16 --input_layout="nchw" --kernel_type=f16 --kernel_layout="fchw" --shapes=small | |
: 1710351839:0;black generate_e2e_convolution_tests.py | |
: 1710352964:0;iree-e2e-matmul-test --help | fzf | |
: 1710353008:0;iree-e2e-matmul-test xyz.mlir aa.mlir | |
: 1710353018:0;iree-e2e-matmul-test --module=xyz.mlir aa.mlir | |
: 1710353024:0;iree-e2e-matmul-test --module=xyz.mlir | |
: 1710353032:0;iree-e2e-matmul-test --module=aa.mlir | |
: 1710353049:0;iree-e2e-matmul-test --module=heyy.mlir | |
: 1710353051:0;vi heyya.mlir | |
: 1710353060:0;iree-e2e-matmul-test --module=heyya.mlir | |
: 1710353112:0;iree-e2e-matmul-test --module=xyz.mlir,aa.mlir | |
: 1710353118:0;iree-e2e-matmul-test --module=xyz.mlir | |
: 1710391896:0;python generate_e2e_matmul_tests.py --lhs_rhs_type=f32 --acc_type=f32 --shapes=small --output_matmuls_mlir="1.mlir" --output_calls_mlir="2.txt" | |
: 1710391904:0;mv 2.txt 2.mlir | |
: 1710391911:0;rm mm.mlir calls.txt | |
: 1710391914:0;vi 1.mlir | |
: 1710391932:0;rm -rf CMakeFiles | |
: 1710391949:0;cat CMakeLists.txt | |
: 1710392138:0;iree-e2e-matmul-test 1.mlir 2.mlir | |
: 1710392147:0;iree-e2e-matmul-test --module=1.mlir 2.mlir | |
: 1710392160:0;iree-e2e-matmul-test --module=1.mlir | |
: 1710392175:0;iree-e2e-matmul-test --module=1.mlir --module=2.mlir | |
: 1710392306:0;iree-compile --module=1.mlir --function=run --input=1x1xi64 | |
: 1710415377:0;mkdir cmake_docs | |
: 1710415781:0;vi Makefile | |
: 1710416401:0;./trim helodsfdfj djfldsjf | |
: 1710416482:0;cd ~/cmake_docs | |
: 1710416503:0;make install | |
: 1710417010:0;nm libnoobmath.a | |
: 1710417176:0;mkdir -p src/noobmath/cpp | |
: 1710417199:0;mv CMakeLists.txt main.cpp noobmath.cpp noobmath.h src/noobmath/cpp | |
: 1710417214:0;mkdir TestSome | |
: 1710417630:0;cd noobmath | |
: 1710417633:0;cd cpp | |
: 1710417663:0;cd TestSome | |
: 1710417789:0;./testsome | |
: 1710420589:0;git submodule add [email protected]:glfw/glfw.git external/glfw | |
: 1710420604:0;vi .gitmodules | |
: 1710420683:0;touch build.sh run.sh configure.sh && chmod +x *.sh | |
: 1710420693:0;vi build | |
: 1710420802:0;touch CMakeLists.txt | |
: 1710420871:0;sh configure.sh | |
: 1710421147:0;make -j 32 | |
: 1710421157:0;./OLAS | |
: 1710421171:0;cd external | |
: 1710421174:0;cd glfw | |
: 1710421293:0;make build/ | |
: 1710426617:0;cdls | |
: 1710429685:0;vi /home/pashu/iree-build/tests/e2e/matmul/e2e_matmul_cpu_dt_uk_i8_i32_small_llvm-cpu_local-task_matmul.mlir | |
: 1710429722:0;vi e2e_matmul_cpu_dt_i8_i32_small_llvm-cpu_local-task_calls | |
: 1710429769:0;vi e2e_matmul_cpu_dt_uk_i8_i32_small_llvm-cpu_local-task_avx512vnni_matmuls | |
: 1710429798:0;vi e2e_matmul_cpu_dt_bf16_bf16_small_llvm-cpu_local-task_avx512bf16_matmuls | |
: 1710429809:0;vi e2e_matmul_cpu_dt_bf16_bf16_small_llvm-cpu_local-task_avx512bf16_matmuls.mlir | |
: 1710429824:0;vi e2e_matmul_cpu_dt_uk_i8_i32_small_llvm-cpu_local-task_avx512vnni_matmuls.mlir | |
: 1710469381:0;iree-e2e-conv2d-test --help | |
: 1710475820:0;cd iree-build/tests/e2e | |
: 1710475849:0;vi e2e_matmul_cpu_dt_bf16_bf16_small_llvm-cpu_local-task_avx2_matmuls.mlir | |
: 1710475889:0;vi e2e_matmul_cpu_dt_bf16_bf16_small_llvm-cpu_local-task_avx2_calls.mlir | |
: 1710481968:0;./a | |
: 1710482109:0;vi test_convolve.cpp | |
: 1710482121:0;clang++ test_convolve.cpp | |
: 1710501853:0;clang-format tools/iree-e2e-conv2d-test.cc | |
: 1710506590:0;cd ls | |
: 1710514667:0;vi tests/e2e/convolution/aa.mlir | |
: 1710521672:0;iree-e2e-conv2d-test | |
: 1710521868:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-link-embedded=false --iree-llvmcpu-sanitize=address /tests/e2e/convolution/xyz.mlir -o matmuls.vmfb | |
: 1710521874:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-link-embedded=false --iree-llvmcpu-sanitize=address tests/e2e/convolution/xyz.mlir -o matmuls.vmfb | |
: 1710522225:0;vi generate_e2e_convolution_tests.py | |
: 1710522277:0;python generate_e2e_convolution_tests.py --output_conv2d_mlir=xyz.mlir --output_calls_mlir=aa.mlir --input_type=f16 --input_layout="nchw" --kernel_type=f16 --kernel_layout="fchw" --shapes=large | |
: 1710522294:0;iree-opt tests/e2e/convolution/aa.mlir | |
: 1710522303:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-link-embedded=false --iree-llvmcpu-sanitize=address tests/e2e/convolution/aa.mlir -o calls.vmfb | |
: 1710522388:0;/home/pashu/iree-build/tools/iree-e2e-matmul-test "--module=/home/pashu/iree/matmuls.vmfb" "--module=/home/pashu/iree/calls.vmfb" "--device=local-task" | |
: 1710523021:0;vi tests/e2e/convolution/aa.mlir | |
: 1710523035:0;vi tests/e2e/convolution/xyz.mlir | |
: 1710525000:0;python tests/e2e/convolution/generate_e2e_convolution_tests.py --output_conv2d_mlir=xyz.mlir --output_calls_mlir=aa.mlir --input_type=f16 --input_layout="nchw" --kernel_type=f16 --kernel_layout="fchw" --shapes=large | |
: 1710525082:0;rm aa.mlir "'" xyz.mlir | |
: 1710525099:0;python tests/e2e/convolution/generate_e2e_convolution_tests.py --output_conv2d_mlir=xyz.mlir --output_calls_mlir=aa.mlir --input_type=f16 --input_layout="nchw" --kernel_type=f16 --kernel_layout="fchw" --shapes=small | |
: 1710606801:0;rm -rf cmake_docs | |
: 1710606803:0;git clone [email protected]:codetechandtutorials/OurLordAndSavior.git cmake_docs | |
: 1710607039:0;cmake . -B build | |
: 1710607057:0;ninja . | |
: 1710607102:0;make | |
: 1710607112:0;cd cmake_docs | |
: 1710607395:0;./run.sh | |
: 1710608148:0;m | |
: 1710608237:0;rm -rf out | |
: 1710608384:0;vi configure.sh | |
: 1710608410:0;./out/build/OLAS | |
: 1710609047:0;./configure.sh | |
: 1710609052:0;./build | |
: 1710609058:0;./build.sh | |
: 1710760713:0;vi calls.vmfb | |
: 1710762268:0;vi aa.mlir xyz.mlir | |
: 1710767840:0;python tests/e2e/convolution/generate_e2e_convolution_tests.py --output_conv2d_mlir=xyz.mlir --output_calls_mlir=aa.mlir --input_type=f32 --input_layout="nchw" --kernel_type=f32 --kernel_layout="fchw" --shapes=large | |
: 1710769135:0;iree-opt xyz.mlir | |
: 1710769148:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-link-embedded=false --iree-llvmcpu-sanitize=address xyz.mlir -o matmuls.vmfb | |
: 1710769161:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-link-embedded=false --iree-llvmcpu-sanitize=address aa.mlir -o calls.vmfb | |
: 1710770936:0;/home/pashu/iree-build/tools/iree-e2e-conv2d-test "--module=/home/pashu/iree/matmuls.vmfb" "--module=/home/pashu/iree/calls.vmfb" "--device=local-task" 2> hey.x | |
: 1710771131:0;vi hey.x | |
: 1710771595:0;/home/pashu/iree-build/tools/iree-e2e-conv2d-test "--module=/home/pashu/iree/matmuls.vmfb" "--module=/home/pashu/iree/calls.vmfb" "--device=local-task"x | |
: 1710772145:0;clang-format -i tools/iree-e2e-conv2d-test.cc | |
: 1710772678:0;git pff | |
: 1710860972:0;cp iree-build/compile_commands.json iree | |
: 1710911892:0;build_tools/bazel_to_cmake/bazel_to_cmake.py | |
: 1710911939:0;build_tools/bazel_to_cmake/bazel_to_cmake.py tests/e2e/convolution | |
: 1710911950:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --dir=tests/e2e/convolution | |
: 1710911981:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=tests/e2e/convolution | |
: 1710915769:0;vi e2e_conv2d_cpu_f16_f16_f16_large_llvm-cpu_local-task_conv2ds.mlir | |
: 1711018598:0;cd ../iree/tests | |
: 1711018618:0;clang-format -i tools/testing | |
: 1711023911:0;clang-format -i tools/testing/* | |
: 1711024280:0;cmake --build . | |
: 1711030023:0;mv tools/testing/test_utils.cc tools/testing/test_utils.h CMakeLists.txt BUILD.bazel runtime/src/iree/tooling/e2e_testing | |
: 1711030288:0;mv runtime/src/iree/tooling/e2e_testing/CMakeLists.txt runtime/src/iree/tooling/e2e_testing/BUILD.bazel . | |
: 1711032646:0;/home/pashu/iree-build/tools/iree-e2e-matmul-test "--module=/home/pashu/iree-build/tests/e2e/matmul/e2e_matmul_cpu_dt_uk_i8_i32_small_llvm-cpu_local-task_matmuls.mlir" "--module=/home/pashu/iree-build/tests/e2e/matmul/e2e_matmul_cpu_dt_uk_i8_i32_small_llvm-cpu_local-task_calls.mlir" "--device=local-task" | |
: 1711032670:0;/home/pashu/iree-build/tools/iree-e2e-matmul-test "--module=/home/pashu/iree-build/tests/e2e/matmul/e2e_matmul_cpu_dt_uk_i8_i32_small_llvm-cpu_local-task_matmuls.vmfb" "--module=/home/pashu/iree-build/tests/e2e/matmul/e2e_matmul_cpu_dt_uk_i8_i32_small_llvm-cpu_local-task_calls.vmfb" "--device=local-task" | |
: 1711032682:0;/home/pashu/iree-build/tools/iree-e2e-conv2d-test "--module=/home/pashu/iree/matmuls.vmfb" "--module=/home/pashu/iree/calls.vmfb" "--device=local-task" | |
: 1711032875:0;mv compile_commands.json ../iree | |
: 1711033430:0;ls -l; | |
: 1711037689:0;mv runtime/src/iree/tooling/e2e_testing/* tools/testing/e2e | |
: 1711038201:0;rm aa.mlir xyz.mlir hey.x calls.vmfb matmuls.vmfb | |
: 1711038513:0;mv tools/iree-e2e-*.cc tools/testing/e2e | |
: 1711092371:0;clang-format -i tools/testing/e2e | |
: 1711093912:0;ctest -R e2e_matmul_cpu_dt_uk_i8_i32_small_llvm-cpu_local-task$ --verbose | |
: 1711094039:0;ctest -R . | |
: 1711094430:0;ctest e2e_conv2d_cpu_f16_f16_f16_small_llvm-cpu_local-task_calls | |
: 1711094463:0;ctest -R e2e_conv2d_cpu_f16_f16_f16_small_llvm-cpu_local-task_calls | |
: 1711094483:0;ctest -R e2e_conv2d_cpu_f16_f16_f16_small_llvm-cpu_local-tass | |
: 1711094495:0;ctest -R e2e_conv2d_cpu_f16_f16_f16_small_llvm-cpu_local-task | |
: 1711094623:0;ctest | |
: 1711094792:0;ctest -R small | |
: 1711095822:0;vi e2e_conv2d_cpu_f16_f16_f16_small_llvm-cpu_local-task_calls.mlir | |
: 1711095896:0;e2e_conv2d_cpu_f16_f16_f16_small_llvm-cpu_local-task_conv2ds.mlir | |
: 1711095901:0;vi e2e_conv2d_cpu_f16_f16_f16_small_llvm-cpu_local-task_conv2ds.mlir | |
: 1711095985:0;iree-opt e2e_conv2d_cpu_f16_f16_f16_small_llvm-cpu_local-task_conv2ds.mlir | |
: 1711096817:0;rm -rf convolution | |
: 1711096828:0;cd co | |
: 1711096844:0;ctest convolution | |
: 1711096940:0;rm -rf iree-build | |
: 1711097718:0;ctest . -vv | |
: 1711097790:0;vi /home/pashu/iree-build/tests/e2e/matmul/Testing/Temporary/LastTest.log | |
: 1711098128:0;ctest -R e2e_matmul_cpu_dt_i8_i32_small_llvm-cpu_local-task -vv | |
: 1711098195:0;vi /home/pashu/iree-build/tests/e2e/convolution/Testing/Temporary/LastTest.log | |
: 1711098205:0;more /home/pashu/iree-build/tests/e2e/convolution/Testing/Temporary/LastTest.log | |
: 1711098216:0;"/home/pashu/iree-build/tools/iree-e2e-conv2d-test" "--module=/home/pashu/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f32_f32_f32_small_llvm-cpu_local-task_conv2ds\ | |
.vmfb" "--module=/home/pashu/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f32_f32_f32_small_llvm-cpu_local-task_calls.vmfb" "--device=local-task" | |
: 1711098299:0;vi /home/pashu/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f32_f32_f32_small_llvm-cpu_local-task_calls.mlir:156:3 | |
: 1711098993:0;"/home/pashu/iree-build/tools/iree-e2e-conv2d-test" "--module=/home/pashu/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f32_f32_f32_small_llvm-cpu_local-task_conv2ds.vmfb" "--module=/home/pashu/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f32_f32_f32_small_llvm-cpu_local-task_calls.vmfb" "--device=local-task" | |
: 1711099050:0;vi /home/pashu/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f32_f32_f32_small_llvm-cpu_local-task_calls.mlir:111:1 | |
: 1711099053:0;vi /home/pashu/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f32_f32_f32_small_llvm-cpu_local-task_calls.mlir | |
: 1711107024:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=tests/e2e/convolution --verbosity=1 | |
: 1711109064:0;python3 -m pip install black==23.3 | |
: 1711109078:0;black build_tools/bazel_to_cmake/bazel_to_cmake_converter.py | |
: 1711467703:0;git ob unpack_transpose | |
: 1711471326:0;git ob unpack_trans | |
: 1711523298:0;sudo dnf install lld | |
: 1711523365:0;ld.lld --version | |
: 1711523666:0;rm -rf OOTSTRAP_LLVM_ENABLE_LTO=Thin | |
: 1711526549:0;vi build_commands | |
: 1711527612:0;mlir-opt -test-pack-unpack-fold-patterns ~/xyz.mlir | |
: 1711527671:0;mlir-opt -test-tensor-transform-patterns=-test-fold-into-pack-and-unpack ~/xyz.mlir | |
: 1711532003:0;more mlir/test/Dialect/Tensor/fold-into-pack-and-unpack.mlir | |
: 1711539741:0;mlir-opt -test-tensor-transform-patterns=test-fold-into-pack-and-unpack ~/xyz.mlir | |
: 1711616057:0;touch example.cpp | |
: 1711616977:0;g++ example.cpp | |
: 1711618580:0;mlir-opt -split-input-file -test-tensor-transform-patterns=test-fold-into-pack-and-unpack mlir/test/Dialect/Tensor/fold-into-pack-and-unpack.mlir | FileCheck mlir/test/Dialect/Tensor/fold-into-pack-and-unpack.mlir | |
: 1711621484:0;clang-format -i mlir/lib/Dialect/Tensor/Transforms/PackAndUnpackPatterns.cpp | |
: 1711625030:0;git remote add pashu [email protected]:pashu123/personal_commands.git | |
: 1711625127:0;cat build_iree.sh | |
: 1711625216:0;git o conv_suite | |
: 1711629048:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=tests/e2e/convolution --verbosity | |
: 1711629060:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=tests/e2e/convolution -v | |
: 1711629074:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=tests/e2e/conv2d/ --verbosity=1 | |
: 1711629098:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=tests/e2e/convolutions/ --verbosity=1 | |
: 1711631622:0;clang-format tools/testing/e2/*.cc | |
: 1711631628:0;clang-format tools/testing/e2e/*.cc | |
: 1711631632:0;clang-format -i tools/testing/e2e/*.cc | |
: 1711649952:0;cd iree-build/tools/testing/e2e | |
: 1711649957:0;./iree-e2e-conv2d-test | |
: 1711649966:0;./iree-e2e-matmul-test | |
: 1711649972:0;./iree-e2e-matmul-test --module="xx" | |
: 1711650168:0;cd testing/e2e | |
: 1711679840:0;git ob math_fpowi | |
: 1711680315:0;vi ~/build_commands | |
: 1711717271:0;cd e2e/convolution | |
: 1711717726:0;cmake --build . --target iree-test-deps | |
: 1711717803:0;ctest -R e2e_matmul_cpu_dt_i8_i32_small_llvm-cpu_local-task | |
: 1711719224:0;sudo dnf install go | |
: 1711719448:0;go install buildifier | |
: 1711719457:0;go install buildifier@latest | |
: 1711719496:0;go env | |
: 1711719575:0;vi ~/.config/go/env | |
: 1711719594:0;cd ~/.cache/go-build | |
: 1711719606:0;cd ~/go | |
: 1711719721:0;cd ~/go/bin | |
: 1711719724:0;./buildifier | |
: 1711727159:0;git diff -U0 -w --no-color | git apply --cached --ignore-whitespace --unidiff-zero - | |
: 1711732646:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-target-triple=x86_64-unknown-linux-gnu ~/xyz.mlir -o /tmp/z.vmfb\ | |
\ | |
: 1711795173:0;tmux attach -t | |
: 1711796639:0;clang++ example.cpp | |
: 1711866983:0;vi test.cpp | |
: 1711867108:0;./test.cpp | |
: 1711902385:0;perf | |
: 1711902423:0;perf -- ./a.out | |
: 1711902441:0;perf stat -- a.out | |
: 1711902727:0;perf stat -- ./a.out | |
: 1711902794:0;perf stat -e mem_load_retired.fb_hit, mem_load_retired.l1_miss -- ./a.out | |
: 1711902836:0;perf list | |
: 1711902880:0;perf stat branch-misses -- ./a.out | |
: 1711902894:0;perf stat -e branch-misses -- ./a.out | |
: 1711902902:0;perf stat -e cache-misses -- ./a.out | |
: 1711902950:0;perf stat -e instructions -- ./a.out | |
: 1711902966:0;perf stat -e cycles -- ./a.out | |
: 1711903084:0;perf stat -e uops_issues.any -- ./a.out | |
: 1711903093:0;perf stat -e uops_issued.any -- ./a.out | |
: 1711903100:0;perf list | fzf | |
: 1711903118:0;perf list > xyz.txt | |
: 1711905929:0;mkdir build | |
: 1711905963:0;make -j16 | |
: 1711905967:0;./helloworld | |
: 1711906045:0;ccmake | |
: 1711906053:0;ccmake\ | |
: 1711906057:0;ccmake .\ | |
: 1711906215:0;make | |
: 1711906227:0;cmake . -B build | |
: 1711906280:0;vi build.ninja | |
: 1711968659:0;cd Te | |
: 1711984566:0;cd /usr/local/bin | |
: 1711984570:0;wget https://github.com/bazelbuild/bazelisk/releases/download/v1.19.0/bazelisk-linux-amd64 | |
: 1711984587:0;sudo wget https://github.com/bazelbuild/bazelisk/releases/download/v1.19.0/bazelisk-linux-amd64 | |
: 1711984612:0;mv bazelisk-linux-amd64 bazel | |
: 1711984617:0;sudo mv bazelisk-linux-amd64 bazel | |
: 1711984622:0;chmod +x bazel | |
: 1711984626:0;sudo chmod +x bazel | |
: 1711984795:0;bazel build ...:all | |
: 1711984890:0;vi .bazelrc | |
: 1711984916:0;vi configure_bazel.py | |
: 1711984927:0;bazel clean | |
: 1711984971:0;vi WORKSPACE | |
: 1711984985:0;bazel run | |
: 1711985391:0;bazel test -k //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=vulkan,-driver=metal,-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda" -v\ | |
: 1711985395:0;bazel test -k //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=vulkan,-driver=metal,-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda" -verbose\ | |
: 1711985398:0;bazel test -k //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=vulkan,-driver=metal,-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda" --v\ | |
: 1711985412:0;bazel test -k //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=vulkan,-driver=metal,-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda" --sandbox_debug\ | |
: 1711985428:0;cd bazel-bin | |
: 1711985446:0;bazel test -k //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=vulkan,-driver=metal,-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda" --sandbox_debug > xyz.txt\ | |
: 1711985460:0;bazel test -k //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=vulkan,-driver=metal,-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda" --sandbox_debug 2> xyz.txt\ | |
: 1711985972:0;sudo bazel test -k //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=vulkan,-driver=metal,-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda" 2> xyz.txt\ | |
: 1711986150:6;sudo bazel build tools/...\ | |
: 1711986612:0;sudo bazel test -k "convolution" //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=vulkan,-driver=metal,-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda" \ | |
: 1711987057:0;xi xyz.txt | |
: 1711987728:0;sudo bazel test -k "convolution" //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=vulkan,-driver=metal,-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda" 2> xyz.txt\ | |
: 1711987894:0;build --disk_cache=/tmp/bazel-cache | |
: 1711987915:0;bazel --disk_cache=/tmp/bazel-cache | |
: 1711987930:0;vi user.bazelrc | |
: 1711987942:0;sudo bazel test -k //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=vulkan,-driver=metal,-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda" \ | |
: 1711988087:0;export CC=clang\ | |
export CXX=clang++\ | |
: 1711988547:0;python configure_bazel.py | |
: 1711988554:0;vi configured.bazelrc | |
: 1711988733:0;rm -rf ~/.cache/bazel/ | |
: 1711988752:0;rm configured.bazelrc | |
: 1711988776:0;rm user.bazelrc | |
: 1711989007:0;build_tools/bazel/build_test_all.sh | |
: 1711992280:0;bazel clean --expunge | |
: 1711992364:0;export CC="/usr/bin/gcc"\ | |
export CXX="/usr/bin/g++" | |
: 1712048761:0;bazel test -k //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=vulkan,-driver=metal,-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda"\ | |
: 1712048905:0;cd Testing | |
: 1712048907:0;cd Temporary | |
: 1712048911:0;vi CTestCostData.txt | |
: 1712060264:0;byobu | |
: 1712060302:0;mv ~/iree-build/compile_commands.json . | |
: 1712061789:0;ctest -j12 . | |
: 1712062755:0;mv xyz.txt ../ | |
: 1712062888:0;black tests/e2e/convolution/generate_e2e_conv2d_tests.py | |
: 1712070906:0;cmake --graphviz=my-project.dot . | |
: 1712071097:0;rm my-project.dot* | |
: 1712071230:0;ld ./iree-e2e-conv2d-test | |
: 1712071237:0;ldd ./iree-e2e-conv2d-test | |
: 1712072737:0;objdump ./iree-e2e-conv2d-test | |
: 1712072751:0;objdump -t ./iree-e2e-conv2d-test | |
: 1712133270:0;tux | |
: 1712133444:0;git ob math_powf | |
: 1712136457:0;ear | |
: 1712137223:0;mlir-opt -test-expand-math ~/xyz.mlir | |
: 1712137770:0;clang-format -i mlir/lib/Dialect/Math/Transforms/ExpandPatterns.cpp | |
: 1712152512:0;cat ~/build_commands/build_torch.sh | |
: 1712154513:0;ctest -j16 . | |
: 1712159946:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=tests/e2e/matmul/ --verbosity=1 | |
: 1712164275:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=tests/e2e/convolution/ --verbosity=1 | |
: 1712216630:0;ctest -j32 . | |
: 1712219551:0;gist | |
: 1712219646:0;gist ~/.config/lvim/config.lua | |
: 1712221984:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=tools/testing/e2e/ --verbosity=1 | |
: 1712227359:0;mv ~/iree-build/compile_commands.json ~/iree | |
: 1712246201:0;wget https://sharkpublic.blob.core.windows.net/sharkpublic/max/llama2_7b_int4_turbine_llama_cpp_groupsize128_linalg.mlir | |
: 1712246222:0;vi llama2_7b_int4_turbine_llama_cpp_groupsize128_linalg.mlir | |
: 1712252278:0;cd ../matmul | |
: 1712252318:0;cd ../convolution | |
: 1712252548:0;clang-format -i tools/testing/e2e/*.cc | |
: 1712252550:0;clang-format -i tools/testing/e2e/*.c | |
: 1712252552:0;clang-format -i tools/testing/e2e/*.h | |
: 1712287368:0;git ob acc_fix | |
: 1712318469:0;mkdi custom_allocator | |
: 1712318473:0;mkdir custom_allocator | |
: 1712318505:0;cd custom_allocator | |
: 1712320197:0;ninja build | |
: 1712320210:0;ninja build/ | |
: 1712320218:0;./myprogram | |
: 1712320325:0;cmake -G Ninja ../ -B build | |
: 1712320340:0;./heap | |
: 1712320466:0;cmake -G Ninja ../ -B build -DCMAKE_BUILD_TYPE=Debug | |
: 1712320494:0;cmake -G Ninja ../ -B -DCMAKE_BUILD_TYPE=Debug | |
: 1712320501:0;cmake -G Ninja ../ -B . -DCMAKE_BUILD_TYPE=Debug | |
: 1712320550:0;gdb ./heap | |
: 1712322270:0;build/heap | |
: 1712338197:0;rm -rf custom_allocator | |
: 1712338208:0;mkdir llama2 | |
: 1712338217:0;mv llama2_7b_int4_turbine_llama_cpp_groupsize128_linalg.mlir llama2 | |
: 1712338257:0;wget https://sharkpublic.blob.core.windows.net/sharkpublic/max/repacked_pure_q4_1_params.irpa | |
: 1712338336:0;git remte add max [email protected]:Max191/iree.git | |
: 1712338343:0;git remote add max [email protected]:Max191/iree.git | |
: 1712338385:0;git o max/pack-propagation-test-branch | |
: 1712340411:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-llvmcpu-narrow-matmul-tile-bytes=16777216 \\ | |
--iree-global-opt-enable-quantized-matmul-reassociation=true \\ | |
--iree-opt-propagate-global-layout \\ | |
--iree-global-opt-propagate-transposes \\ | |
llama2_7b_int4_turbine_llama_cpp_groupsize128_linalg.mlir \\ | |
-o llama2_7b_int4.vmfb | |
: 1712340533:0;iree-benchmark-module \\ | |
--module=/tmp/llama2_7b_int4.vmfb \\ | |
--function=run_forward \\ | |
--device=local-task \\ | |
--input=1x1xi64 \\ | |
--parameters=model=repacked_pure_q4_1_params.irpa \\ | |
--benchmark_repetitions=200 | |
: 1712340544:0;iree-benchmark-module \\ | |
--module=llama2_7b_int4.vmfb \\ | |
--function=run_forward \\ | |
--device=local-task \\ | |
--input=1x1xi64 \\ | |
--parameters=model=repacked_pure_q4_1_params.irpa \\ | |
--benchmark_repetitions=200 | |
: 1712341064:0;unzip llama2_7b_int4.vmfb | |
: 1712341097:0;mkdir xyz | |
: 1712341099:0;mv *.bin *.fb xyz | |
: 1712341107:0;mv llama_dpis_linked_llvm_cpu_embedded_elf_x86_64.so xyz | |
: 1712341110:0;cd xyz | |
: 1712341126:0;chmod +x llama_dpis_linked_llvm_cpu_embedded_elf_x86_64.so | |
: 1712341128:0;nm llama_dpis_linked_llvm_cpu_embedded_elf_x86_64.so | |
: 1712341133:0;sudo nm llama_dpis_linked_llvm_cpu_embedded_elf_x86_64.so | |
: 1712341173:0;nm _const.bin | |
: 1712341178:0;sudo nm _const.bin | |
: 1712341200:0;python -m venv llama_turbine_venv | |
: 1712341213:0;git clone https://github.com/nod-ai/SHARK-Turbine.git | |
: 1712341228:0;pip install --index-url https://download.pytorch.org/whl/cpu \\ | |
-r core/pytorch-cpu-requirements.txt \\ | |
-r core/torchvision-requirements.txt\ | |
: 1712341272:0;pip install --index-url https://download.pytorch.org/whl/cpu \\ | |
-r core/pytorch-requirements.txt \\ | |
: 1712341285:0;pip install --index-url https://download.pytorch.org/whl/cpu \\ | |
-r core/pytorch-cpu-requirements.txt \\ | |
: 1712342336:0;cd llama2 | |
: 1712342340:0;source llama_turbine_venv/bin/activate | |
: 1712342361:0;pip install --index-url https://download.pytorch.org/whl/cpu \\ | |
-r core/pytorch-cpu-requirements.txt | |
: 1712342499:0;pip install -e core | |
: 1712342506:0;pip install -e models | |
: 1712342537:0;cd ..\ | |
: 1712342543:0;git clone https://github.com/Max191/llama.turbine.git | |
: 1712342548:0;cd llama.turbine\ | |
: 1712342553:0;pip install gguf | |
: 1712342642:0;vi build_iree.sh | |
: 1712344673:0;python python/turbine_llamacpp/llamacpp_runner.py \\ | |
--external_weight_path=/path/to/repacked_pure_q4_1_params.irpa \\ | |
--vmfb_path=/tmp/llama2_7b_int4.vmfb | |
: 1712344690:0;python python/turbine_llamacpp/llamacpp_runner.py \\ | |
--external_weight_path=repacked_pure_q4_1_params.irpa \\ | |
--vmfb_path=llama2_7b_int4.vmfb | |
: 1712344717:0;cd llama.turbine | |
: 1712344727:0;python python/turbine_llamacpp/llamacpp_runner.py \\ | |
--external_weight_path=../repacked_pure_q4_1_params.irpa \\ | |
--vmfb_path=../llama2_7b_int4.vmfb | |
: 1712344789:0;vi turbine_llamacpp | |
: 1712381337:0;cd Templates/ | |
: 1712381342:0;cd Templates | |
: 1712383122:0;rm -rf Templates | |
: 1712383235:0;vi temp.py | |
: 1712383330:0;python3 temp.py | |
: 1712414146:0;git ob stat_pack | |
: 1712414447:0;mlir-opt -transform-interpreter ~/xyz.mlir -mlir-print-ir-after-all | |
: 1712484742:0;mlir-opt -linalg-bufferize ~/xyz.mlir | |
: 1712484824:0;mlir-opt -linalg-bufferize -cse ~/xyz.mlir | |
: 1712484841:0;mlir-opt -linalg-bufferize -canoncalize -cse ~/xyz.mlir | |
: 1712484870:0;mlir-opt -linalg-bufferize -canonicalize -cse -linalg-bufferize-finalize ~/xyz.mlir | |
: 1712484900:0;mlir-opt -linalg-bufferize -canonicalize -cse -linalg-bufferize-finalize -finalizing-bufferize ~/xyz.mlir | |
: 1712484915:0;mlir-opt -linalg-bufferize -canonicalize -cse -linalg-bufferize-finalize -linalg-bufferize-finalize ~/xyz.mlir | |
: 1712484999:0;mlir-opt -linalg-bufferize -canonicalize -cse ~/xyz.mlir | |
: 1712485016:0;mlir-opt -linalg-bufferize -canonicalize -cse -dce ~/xyz.mlir | |
: 1712485046:0;mlir-opt -linalg-bufferize -canonicalize="test-convergence" -cse -dce ~/xyz.mlir | |
: 1712485083:0;mlir-opt -linalg-bufferize -canonicalize="test-convergence" -cse ~/xyz.mlir | |
: 1712508209:0;git remote add gshukla https://github.com/Shukla-Gaurav/iree.git | |
: 1712508233:0;git checkout 90ecdec4fba9d0d75211140673bc22f5f47be7f4 | |
: 1712554181:0;git clone https://github.com/PacktPublishing/Learn-LLVM-17.git | |
: 1712564250:0;git branch | fzf | |
: 1712564256:0;git branch -f | |
: 1712564266:0;git branch -a | fzf | |
: 1712564289:0;git o remotes/origin/release/17.x | |
: 1712564358:0;git checkout -b llvm-17 llvmorg-17.0.1 | |
: 1712564435:0;cp ~/build_commands/*_mlir.sh | |
: 1712564442:0;cp ~/build_commands/*_mlir.sh . | |
: 1712564489:0;vi run_mlir.sh | |
: 1712564503:0;build_mlir.sh | |
: 1712564628:0;./build_mlir.sh | |
: 1712565769:0;cmake -GNinja -S . -B build -DCMAKE_C_COMPILER=../../llvm-project/build/bin/clang -DCMAKE_CXX_COMPILER=../../llvm-project/build/bin/clang++ -DLLVM_DIR=../../llvm-project/build | |
: 1712565934:0;cd Chapter04/tinylang | |
: 1712566422:0;cd Chapter05/tinylang | |
: 1712566428:0;cmake -GNinja -S . -B build -DCMAKE_C_COMPILER=/home/pashu/Learn-LLVM-17/llvm-project/build/bin/clang -DCMAKE_CXX_COMPILER=/home/pashu/Learn-LLVM-17/llvm-project/build/bin/clang++ -DLLVM_DIR=/home/pashu/Learn-LLVM-17/llvm-project/build | |
: 1712567023:0;rm -rf ~/torch-mlir | |
: 1712567067:0;cd Chapter04 | |
: 1712567078:0;cmake -GNinja -S . -B build -DCMAKE_C_COMPILER=/home/pashu/Learn-LLVM-17/llvm-project/build/bin/clang -DCMAKE_CXX_COMPILER=/home/pashu/Learn-LLVM-17/llvm-project/build/bin/clang++ -DLLVM_DIR=/home/pashu/Learn-LLVM-17/llvm-project/build -DCMAKE_LINKER_TYPE=lld | |
: 1712567282:0;cp -r ~/Learn-LLVM-17/llvm-project/build llvm-project | |
: 1712567309:0;cmake -GNinja -S . -B build -DCMAKE_C_COMPILER=/home/pashu/Learn-LLVM-17/llvm-project/build/bin/clang -DCMAKE_CXX_COMPILER=/home/pashu/Learn-LLVM-17/llvm-project/build/bin/clang++ -DLLVM_DIR=/home/pashu/Learn-LLVM-17/llvm-project/build | |
: 1712572019:0;cd pashu/iree | |
: 1712572299:0;cmake --build ~/iree-build --target iree-test-deps | |
: 1712572383:0;cmake --build ~/iree-build --target iree-test-deps -j 100 | |
: 1712572403:0;cmake --build ~/iree-build --target iree-test-deps -j 100 2> err.txt | |
: 1712572417:0;cmake --build ~/iree-build --target iree-test-deps -j 100 > err.txt | |
: 1712573154:0;vi ~/xyz.t | |
: 1712573262:0;more err.txt | |
: 1712574736:0;/home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/pashu/iree/tests/e2e/regression/strided_slice.mlir -o check_regression_llvm-cpu_strided_slice.mlir_module.vmfb -mlir-print-ir-after-all 2> check.txt | |
: 1712574740:0;vi check.txt | |
: 1712575849:0;/home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/pashu/iree/tests/e2e/regression/strided_slice.mlir -o check_regression_llvm-cpu_strided_slice.mlir_module.vmfb | |
: 1712576538:0;cat tests/e2e/linalg/i4_to_f32.mlir | |
: 1712576761:0;/home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/pashu/iree/tests/e2e/linalg/i4_to_f32.mlir -o cpu_x.vmfb | |
: 1712576896:0;more third_party/llvm-project/mlir/python/mlir/dialects/TensorOps.td | |
: 1712576913:0;more third_party/llvm-project/mlir//dialects/TensorOps.td | |
: 1712576916:0;more third_party/llvm-project/mlir/dialects/TensorOps.td | |
: 1712576931:0;more third_party/llvm-project/mlir/include/mlir/Dialect/Tensor/IR/TensorOps.td | |
: 1712577554:0;/home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/pashu/iree/tests/e2e/regression/layernorm.mlir | |
: 1712577599:0;/home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/pashu/iree/tests/e2e/regression/layernorm.mlir -o x.vmfb | |
: 1712577623:0;/home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=none /home/pashu/iree/tests/e2e/regression/layernorm.mlir -o x.vmfb | |
: 1712577833:0;/home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=none /home/pashu/iree/tests/e2e/regression/reduction_broadcast_elementwise.mlir -o x.vmfb | |
: 1712578293:0;/home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=none /home/pashu/iree/tests/e2e/stablehlo_ops/dot_general.mlir -o x.vmfb | |
: 1712578400:0;/home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/pashu/iree/tests/e2e/stablehlo_ops/dot_general.mlir -o x.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1712580210:0;/home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/pashu/iree/tests/e2e/stablehlo_ops/dot_general.mlir -o x.vmfb | |
: 1712580553:0;cmake --build ~/iree-build --target iree-test-deps > err.txt | |
: 1712581490:0;ctest -j100 ~/iree-build | |
: 1712581505:0;ctest -j100 /home/pashu/iree-build | |
: 1712581508:0;ctest -j100 /home/pashu/iree-build/ | |
: 1712581685:0;birer | |
: 1712587467:0;ctest --rerun-failed . -vv | |
: 1712587488:0;ctest --rerun-failed . -verbose | |
: 1712587607:0;vi Testing/Temporary/LastTest.log | |
: 1712587845:0;iree-run-mlir --Xcompiler,iree-hal-target-backends=vmvx /home/pashu/iree/tools/test/iree-run-mlir.mlir --input=f32=-2 | |
: 1712587906:0;which iree-run-mlir | |
: 1712588076:0;git o 3a8234cec1635418651b9d1346799920604464bd | |
: 1712588147:0;git fetch gshukla | |
: 1712588165:0;git o ac47212 | |
: 1712588215:0;git o 90ecdec4fba9d0d75211140673bc22f5f47be7f4 | |
: 1712588381:0;git o a4d17d7 | |
: 1712588511:0;git o test_expand | |
: 1712588623:0;cd third_party/llvm-project/mlir/lib/Dialect/Utils/ | |
: 1712591064:0;./iree-run-mlir | |
: 1712591215:0;git branch -d test_expand | |
: 1712591222:0;git branch -D test_expand | |
: 1712591227:0;git ob test_expand | |
: 1712597212:0;cd tests/e2e/convolution | |
: 1712597223:0;python tests/e2e/convolution/generate_e2e_convolution_tests.py --output_conv2d_mlir=xyz.mlir --output_calls_mlir=aa.mlir --input_type=f32 --input_layout="nchw" --kernel_type=f32 --kernel_layout="fchw" --shapes=large --dilation="2,2" | |
: 1712597236:0;python generate_e2e_convolution_tests.py --output_conv2d_mlir=xyz.mlir --output_calls_mlir=aa.mlir --input_type=f32 --input_layout="nchw" --kernel_type=f32 --kernel_layout="fchw" --shapes=large --dilation="2,2" | |
: 1712597247:0;python generate_e2e_conv2d_tests.py --output_conv2d_mlir=xyz.mlir --output_calls_mlir=aa.mlir --input_type=f32 --input_layout="nchw" --kernel_type=f32 --kernel_layout="fchw" --shapes=large --dilation="2,2" | |
: 1712597265:0;python generate_e2e_conv2d_tests.py --output_conv2d_mlir=conv2d.mlir --output_calls_mlir=calls.mlir --input_type=f32 --input_layout="nchw" --kernel_type=f32 --kernel_layout="fchw" --shapes=large --dilation="2,2" | |
: 1712597271:0;vi calls.mlir conv2d.mlir | |
: 1712598262:0;ctest . --verbose | |
: 1712598308:0;ctest . | |
: 1712660326:0;cd Learn-LLVM-17 | |
: 1712660330:0;mkdir hola | |
: 1712660336:0;cd hola | |
: 1712660350:0;cd ~/Learn-LLVM-17/hola | |
: 1712660355:0;touch test.c | |
: 1712660602:0;clang -Wall -pedantic -O0 -asmFunc.bin abi.s test.c | |
: 1712660960:0;objdump -D asmFunc.bin > asmFunc.dump | |
: 1712661300:0;clang -Wall -pedantic -O0 -o asmFunc.bin abi.s test.c | |
: 1712661301:0;./asmFunc.bin | |
: 1712662203:0;cd Chapter03 | |
: 1712662223:0;cmake -G Ninja . -B build | |
: 1712662246:0;cd driver | |
: 1712662248:0;./tinylang | |
: 1712662310:0;cat ~/build_commands/build_mlir.sh | |
: 1712662341:0;vi test.c | |
: 1712662347:0;cd Chapter03/tinylang | |
: 1712664271:0;cd ../Chapter04 | |
: 1712664273:0;cd tinylang | |
: 1712664303:0;clang -S -emit-llvm examples/Gcd.mod | |
: 1712664339:0;clang -S -emit-llvm examples/callgcd.c | |
: 1712664391:0;clang -arch arm64 -S -emit-llvm examples/callgcd.c | |
: 1712664427:0;clang -target=aarch64-macos-gnu -S -emit-llvm examples/callgcd.c | |
: 1712664444:0;clang --target=aarch64-macos-gnu -S -emit-llvm examples/callgcd.c | |
: 1712664454:0;clang --target=aarch64-macos-unknown -S -emit-llvm examples/callgcd.c | |
: 1712664464:0;clang --target=aarch64-linux-gnu -S -emit-llvm examples/callgcd.c | |
: 1712664607:0;build/tools/driver/tinylang examples/Gcd.mod --emit-llvm | |
: 1712664626:0;build/tools/driver/tinylang examples/Gcd.mod -o | |
: 1712664629:0;build/tools/driver/tinylang examples/Gcd.mod -o xyz.s | |
: 1712664651:0;build/tools/driver/tinylang examples/Gcd.mod -S -emit-llvm -o xyz.s | |
: 1712664662:0;vi xyz.s | |
: 1712665069:0;cat cmake -G Ninja . -B build -DCMAKE_EXPORT_COMPILE_COMMANDS=1 >> build_run.sh | |
: 1712665122:0;cmake -G Ninja . -B build -DCMAKE_EXPORT_COMPILE_COMMANDS=1 | |
: 1712665132:0;build/tools/driver/tinylang examples/Gcd.mod -emit-llvm -o xyz.s | |
: 1712665677:0;vi callgcd.s | |
: 1712665683:0;rm xyz.s | |
: 1712666507:0;build/tools/driver/tinylang examples/Gcd.mod -emit-llvm | |
: 1712672767:0;git o stat_pack | |
: 1712673287:0;where bm | |
: 1712673293:0;where build_mlir.sh | |
: 1712675833:0;vi ~/build_commands/build_mlir.sh | |
: 1712734704:0;"cmake -G Ninja . -B build -DCMAKE_EXPORT_COMPILE_COMMANDS=1 \n cmake --build build" >> build_run.sh | |
: 1712734715:0;cat "cmake -G Ninja . -B build -DCMAKE_EXPORT_COMPILE_COMMANDS=1 \n cmake --build build" >> build_run.sh | |
: 1712734724:0;vi build_run.sh | |
: 1712734825:0;chmod +x build_run.sh | |
: 1712734827:0;./build_run.sh | |
: 1712734851:0;cat build_run.sh | |
: 1712752749:0;tmux attach -t 2 | |
: 1712752783:0;git ob check_expand | |
: 1712752835:0;git remote add shukla https://github.com/Shukla-Gaurav/llvm-project.git | |
: 1712752856:0;git cp 4960d3b131dd11d2968a9578c6db9d2d31ee4fa3 | |
: 1712752897:0;git cp a4d17d7 | |
: 1712755336:0;tmux attach -t 3 | |
: 1712755425:0;git cp 90ecdec4fba9d0d75211140673bc22f5f47be7f4 | |
: 1712756862:0;cd /home/pashu/iree-build/tests/e2e/regression && /home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/pashu/iree/tests/e2e/regression/reduction_broadcast_elementwise.mlir -o check_regression_llvm-cpu_reduction_broadcast_elementwise.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/pashu/iree-build\" --iree-llvmcpu-embedded-linker-path=\"/home/pashu/iree-build/llvm-project/bin/lld\" --iree-llvmcpu-wasm-linker-path=\"/home/pashu/iree-build/llvm-project/bin/lld\" -mlir-print-ir-after-all | |
: 1712756883:0;cd /home/pashu/iree-build/tests/e2e/regression && /home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/pashu/iree/tests/e2e/regression/reduction_broadcast_elementwise.mlir -o check_regression_llvm-cpu_reduction_broadcast_elementwise.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/pashu/iree-build\" --iree-llvmcpu-embedded-linker-path=\"/home/pashu/iree-build/llvm-project/bin/lld\" --iree-llvmcpu-wasm-linker-path=\"/home/pashu/iree-build/llvm-project/bin/lld\" -mlir-print-ir-after-all 2> err.txt | |
: 1712757851:0;cd /home/pashu/iree-build/tests/e2e/regression && /home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/pashu/iree/tests/e2e/regression/reduction_broadcast_elementwise.mlir -o check_regression_llvm-cpu_reduction_broadcast_elementwise.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/pashu/iree-build\" --iree-llvmcpu-embedded-linker-path=\"/home/pashu/iree-build/llvm-project/bin/lld\" --iree-llvmcpu-wasm-linker-path=\"/home/pashu/iree-build/llvm-project/bin/lld\" -mlir-print-ir-after-all 2> err.txt -mlir-print-debuginfo | |
: 1712758152:0;/home/pashu/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/pashu/abc.mlir -o x.vmfb | |
: 1712759146:0;git fetch shukla | |
: 1712759157:0;git o aa6c9dca6e539189c15fd5a6e13b63bf4d5369bc | |
: 1712761370:0;git cp aa6c9dca6e539189c15fd5a6e13b63bf4d5369bc | |
: 1712761445:0;cmake --build ~/iree-build --target iree-test-deps | |
: 1712761772:0;ctest . -j 200 | |
: 1712761985:0;vi /home/pashu/iree-build/Testing/Temporary/LastTest.log | |
: 1712762380:0;ctest -R stable_hlo_to_linalg --verbose | |
: 1712762579:0;ctest -j100 . | |
: 1712762914:0;ctest --rerun-failed . | |
: 1712764532:0;cat /home/pashu/iree-build/compiler/Testing/Temporary/LastTest.log | |
: 1712764537:0;more /home/pashu/iree-build/compiler/Testing/Temporary/LastTest.log | |
: 1712765625:0;iree-opt -iree-flow-convert-to-flow compiler/src/iree/compiler/Dialect/Flow/Conversion/TensorToFlow/test/fill.mlir | |
: 1712769908:0;vi /home/pashu/iree-build/compiler/Testing/Temporary/LastTest.log | |
: 1712770010:0;cd runtime | |
: 1712770087:0;cd tests | |
: 1712770091:0;cd e2e | |
: 1712770182:0;vi /home/pashu/iree-build/tests/e2e/Testing/Temporary/LastTest.log | |
: 1712770261:0;iree-run-mlir | |
: 1712770281:0;ctest --rerun-failed . -j 200 | |
: 1712822929:0;more compiler/src/iree/compiler/GlobalOptimization/test/propagate_linalg_transpose.mlir | |
: 1712823053:0;iree-opt --pass-pipeline="builtin.module(util.func(iree-global-opt-propagate-linalg-transpose))" ~/xyz.mlir | |
: 1712823772:0;ctest --rerun-failed . -j 32 | |
: 1712823891:0;more compiler/src/iree/compiler/Dialect/Flow/Transforms/test/dispatch_linalg_on_tensors.mlir | |
: 1712823943:0;iree-opt --split-input-file --verify-diagnostics --pass-pipeline="builtin.module(util.func(iree-flow-form-dispatch-regions{fuse-multi-use=true}, iree-flow-clone-producers-into-dispatch-regions, iree-flow-form-dispatch-workgroups), cse, canonicalize, cse)" compiler/src/iree/compiler/Dialect/Flow/Transforms/test/dispatch_linalg_on_tensors.mlir | |
: 1712823995:0;iree-opt --split-input-file --verify-diagnostics --pass-pipeline="builtin.module(util.func(iree-flow-form-dispatch-regions{fuse-multi-use=true}, iree-flow-clone-producers-into-dispatch-regions, iree-flow-form-dispatch-workgroups), cse, canonicalize, cse)" ~/xyz.mlir | |
: 1712824039:0;ctest --rerun-failed . -j 3 | |
: 1712924088:0;mlir-opt -transform-interpreter mlir/test/Dialect/Linalg/vectorization.mlir | FileCheck | |
: 1712924148:0;mlir-opt -transform-interpreter mlir/test/Dialect/Linalg/vectorization.mlir | FileCheck mlir/test/Dialect/Linalg/vectorization.mlir | |
: 1712935404:0;dlopen | |
: 1712935417:0;sudo dnf install dlopen | |
: 1713170732:0;buildm | |
: 1713254281:0;cd testing | |
: 1713256308:0;clang++ test.cpp | |
: 1713256312:0;g++ test.cpp | |
: 1713261180:0;sudo dnf install ccls | |
: 1713262014:0;git clone [email protected]:nod-ai/2024-q1-sdxl-sprint.git | |
: 1713262213:0;git o sdxl | |
: 1713264834:0;./compile-unet.sh | |
: 1713264995:0;diff xyz.txt base_ir/stable_diffusion_xl_base_1_0_64_1024x1024_fp16_unet_linalg.mlir | |
: 1713265440:0;./compile-unet.sh > xyz.txt | |
: 1713265718:0;ls -lh ~ | |
: 1713265797:0;./compile-unet.sh 2> xyz.txt | |
: 1713269183:0;diff xyz.txt yz.txt | |
: 1713269205:0;diff xyz.txt yz.txt > diff.txt | |
: 1713269207:0;vi diff.txt | |
: 1713271366:0;cd 2024-q1-sdxl-sprint | |
: 1713271373:0;vi compile-unet.sh | |
: 1713273831:0;./compile-unet.sh 2> xy1.txt | |
: 1713273859:0;vi xy1.txt | |
: 1713274653:0;./compile-unet.sh | |
: 1713274679:0;./compile-unet.sh > test.val | |
: 1713276219:0;vi test.val | |
: 1713276373:0;./compile-unet.sh 2> test.val | |
: 1713276809:0;iree-opt '--iree-preprocessing-pad-linalg-ops=builtin.module(iree-global-opt-fuse-horizontal-contractions)' ~/test.mlir | |
: 1713276833:0;iree-opt '--iree-preprocessing-pass-pipeline=builtin.module(iree-global-opt-fuse-horizontal-contractions)' ~/test.mlir | |
: 1713277039:0;iree-opt --iree-global-opt-decompose-concat ~/test.mlir | |
: 1713277200:0;iree-opt --iree-global-optimization-transformation-pipeline ~/test.mlir | |
: 1713277219:0;iree-opt --iree-global-optimization-transformation-pipeline -mlir-print-ir-after-all ~/test.mlir | |
: 1713277254:0;more test.val | |
: 1713277279:0;iree-opt --iree-global-opt-propagate-transposes=true -mlir-print-ir-after-all ~/test.mlir | |
: 1713277317:0;iree-opt --iree-global-opt-propagate-transposes=true -mlir-print-ir-after-all ~/test.mlir 2> kk.mlir | |
: 1713277321:0;iree-opt --iree-global-opt-propagate-transposes=true -mlir-print-ir-after-all ~/test.mlir > kk.mlir | |
: 1713277392:0;iree-opt --iree-global-optimization-transformation-pipeline -mlir-print-ir-after-all ~/test.mlir > kk.mlir | |
: 1713277396:0;iree-opt --iree-global-optimization-transformation-pipeline -mlir-print-ir-after-all ~/test.mlir 2> kk.mlir | |
: 1713277636:0;iree-opt --iree-global-optimization-transformation-pipeline --iree-preprocessing-pass-pipeline=builtin.module\ | |
(iree-preprocessing-transpose-convolution-pipeline, iree-preprocessing-pad-to-intrinsics)' -mlir-print-ir-after-all ~/test.mlir 2> kk.mlir | |
: 1713277655:0;iree-opt --iree-global-optimization-transformation-pipeline '--iree-preprocessing-pass-pipeline=builtin.module\ | |
(iree-preprocessing-transpose-convolution-pipeline, iree-preprocessing-pad-to-intrinsics)' -mlir-print-ir-after-all ~/test.mlir 2> kk.mlir | |
: 1713277684:0;iree-opt '--iree-preprocessing-pass-pipeline=builtin.module\ | |
(iree-preprocessing-transpose-convolution-pipeline, iree-preprocessing-pad-to-intrinsics) -mlir-print-ir-after-all ~/test.mlir 2> kk.mlir | |
: 1713277692:0;iree-opt --iree-preprocessing-pass-pipeline=builtin.module(iree-preprocessing-transpose-convolution-pipeline, iree-preprocessing-pad-to-intrinsics) -mlir-print-ir-after-all ~/test.mlir 2> kk.mlir | |
: 1713277725:0;iree-opt '--iree-preprocessing-pass-pipeline=builtin.module(iree-preprocessing-transpose-convolution-pipeline, iree-preprocessing-pad-to-intrinsics)' -mlir-print-ir-after-all ~/test.mlir 2> kk.mlir | |
: 1713277746:0;iree-compile '--iree-preprocessing-pass-pipeline=builtin.module(iree-preprocessing-transpose-convolution-pipeline, iree-preprocessing-pad-to-intrinsics)' -mlir-print-ir-after-all ~/test.mlir 2> kk.mlir | |
: 1713277940:0;iree-opt --iree-global-opt-fuse-horizontal-contractions ~/test.mlir | |
: 1713277967:0;iree-opt -split-input-file --iree-global-opt-fuse-horizontal-contractions ~/test.mlir | |
: 1713278364:0;git ob fusehor | |
: 1713278389:0;git cp cdeab566a8e9994b8b764ea9eb258bdef5757c8b | |
: 1713278397:0;git cp afe94c937fb78e60e29c47853acff6f3bf94fc95 | |
: 1713278409:0;git cp 0d5a3119c5b62ddf69ddb733fe089275459af544 | |
: 1713282470:0;cd iree/compiler | |
: 1713282477:0;cd GlobalOptimization | |
: 1713282508:0;vi \ | |
/home/pashu/iree-build/compiler/src/iree/compiler/GlobalOptimization/test/Testing/Temporary/LastTest.log | |
: 1713282662:0;ctest . | |
: 1713283063:0;sudo vi /home/pashu/iree-build/compiler/src/iree/compiler/GlobalOptimization/test/Testing/Temporary/LastTest.log | |
: 1713283277:0;iree-opt --pass-pipeline="builtin.module(util.func(iree-global-opt-fuse-horizontal-contractions))" ~/test.mlir | |
: 1713283519:0;ctest . -j 20 | |
: 1713283674:0;cd ../../.. | |
: 1713343478:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o test.vmfb test.mlir | |
: 1713343504:0;iree-benchmark-module --module=test.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713343599:0;TRACY_NO_EXIT=1 iree-benchmark-module --module=test.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713343613:0;iree-tracy-capture -o xyz.tracy | |
: 1713343620:0;iree-tracy-capture -o a.tracy | |
: 1713343984:0;cd /tmp | |
: 1713344005:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o test.vmfb test.mlir --iree-hal-dump-executable-intermediates-to=/tmp --x86-asm-syntax=intel | |
: 1713345085:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o test.vmfb test.mlir --iree-hal-dump-executable-intermediates-to=/tmp --x86-asm-syntax=iantel -print-ir-after-all 2> xyz.txt | |
: 1713345088:0;vi xyz.t | |
: 1713345102:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o test.vmfb test.mlir --iree-hal-dump-executable-intermediates-to=/tmp --x86-asm-syntax=iantel --mlir-print-ir-after-all 2> xyz.txt | |
: 1713345117:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o test.vmfb test.mlir --iree-hal-dump-executable-intermediates-to=/tmp --x86-asm-syntax=intel --mlir-print-ir-after-all 2> xyz.txt | |
: 1713345572:0;vi /tmp/module_test_linked_llvm_cpu_embedded_elf_x86_64.s | |
: 1713348095:0;:vs | |
: 1713373742:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o test.vmfb test.mlir --iree-hal-dump-executable-sources-to=$HOME/dump | |
: 1713373832:0;gist-paste *.mlir | |
: 1713373843:0;gist *.mlir | |
: 1713431067:0;mv ../test.mlir . | |
: 1713431077:0;mv test.mlir mmt3d_kernel.mlir | |
: 1713431083:0;rm ../test.vmfb | |
: 1713431138:0;rm a.tracy | |
: 1713431218:0;iree-benchmark-module --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713435543:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-hal-dump-executable-sources-to=dump -mlir-print-ir-after-all 2> xyz.txt | |
: 1713442903:0;git remote add dcab https://github.com/dcaballe/iree.git | |
: 1713442906:0;git fetch dcab | |
: 1713442935:0;git checkout dcab/flatten-small-vector-xfers | |
: 1713444109:0;cd 24 | |
: 1713444123:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-hal-dump-executable-sources-to=dump -mlir-print-ir-after-all 2> xyz1.txt | |
: 1713444186:0;diff xyz1.txt xyz.txt | |
: 1713444810:0;vi xyz1.txt | |
: 1713451654:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-hal-dump-executable-sources-to=dump -mlir-print-ir-after-all 2> xyz1.txt --iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=all | |
: 1713451725:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-hal-dump-executable-sources-to=dump -mlir-print-ir-after-all 2> xyz1.txt --iree-llvmcpu-enable-ukernels=all | |
: 1713451857:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-hal-dump-executable-sources-to=dump -mlir-print-ir-after-all 2> xyz1.txt | |
: 1713452611:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 -benchmark-repetitions=5 --batch-size=2 | |
: 1713452764:0;vi module_turbine_llm_mmtfp_3d_8640_3200_f32f16_dispatch_1.mlir | |
: 1713453312:0;vi module_turbine_llm_mmtfp_3d_8640_3200_f32f16_dispatch_0.mlir | |
: 1713453942:0;mv pack_f16.mlir burn_24 | |
: 1713454114:0;vi pack_f16.mlir | |
: 1713454128:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_f16.mlir --iree-hal-dump-executable-sources-to=dump | |
: 1713454157:0;cat pack_f16.mlir | |
: 1713454173:0;iree-benchmark-module --device=local-task --module=pack.vmfb --function=pack_f16 --input=8640x3200xf16 | |
: 1713454191:0;vi module_pack_f16_dispatch_0.mlir | |
: 1713454233:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_f16.mlir --iree-hal-dump-executable-sources-to=dump -mlir-print-ir-after-all 2> pack.txt | |
: 1713454238:0;vi pack.txt | |
: 1713456292:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-hal-dump-executable-sources-to=dump -mlir-print-ir-after-all 2> mmt3d_ir_dump.mlir | |
: 1713529388:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-hal-dump-executable-sources-to=dump | |
: 1713529461:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-hal-dump-executable-sources-to=dump -mlir-disable-threading | |
: 1713533762:0;vi updated_mmt3d_kernel.mlir mmt3d_kernel.mlir | |
: 1713534513:0;vi mmt3d_ir_dump.mlir mmt3d_kernel.mlir | |
: 1713534891:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb new_ir.mlir --iree-hal-dump-executable-sources-to=dump -mlir-disable-threading | |
: 1713534993:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb new_ir.mlir --iree-hal-dump-executable-sources-to=dump -mlir-disable-threading -mlir-print-ir-after-all | |
: 1713546453:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb new_ir.mlir | |
: 1713546981:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713547056:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> mmt3d_ir_dump_.mlir | |
: 1713547078:0;vi mmt3d_ir_dump*.mlir | |
: 1713547400:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf32 | |
: 1713547438:0;iree-benchmark-module --device=local-sync --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f32 --input=4x128x3200xf32 --input=8640x3200xf32 | |
: 1713550434:0;iree-benchmark-module --device=local-sync --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713551968:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> mmt3d_ir_dump.mlir | |
: 1713552156:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> mmt3d_ir_dump.mlir -mlir-print-debug-info | |
: 1713552168:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all -mlir-print-debug-info | |
: 1713552173:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all -mlir-print-debuginfo | |
: 1713552333:0;= linalg.generic {indexing_maps = [affine_map<(d0, d1, d2) -> (d1, d2)>, affine_map<(d0, d1, d2) -> (d0, d1, d2)>], iterator_types = ["parallel", "parallel", "parallel"]} ins(%17 : tensor<8640x3200xf16>) outs(%19 : tensor<?x8640x3200xf16>) {\ | |
^bb0(%in: f16 loc("mmt3d_kernel.mlir":12:10), %out: f16 loc("mmt3d_kernel.mlir":12:20)):\ | |
linalg.yield %in : f16 loc(callsite("mmt3d_kernel.mlir":13:7 at "mmt3d_kernel.mlir":4:3))\ | |
} -> tensor<?x8640x3200xf16> loc(callsite("mmt3d_kernel.mlir":11:10 at "mmt3d_kernel.mlir":4:3))\ | |
%20 = linalg.generic {indexing_maps = [affine_map<(d0, d1, d2) -> (d1, d2)>, affine_map<(d0, d1, d2) -> (d0, d1, d2)>], iterator_types = ["parallel", "parallel", "parallel"]} ins(%17 : tensor<8640x3200xf16>) outs(%19 : tensor<?x8640x3200xf16>) {\ | |
^bb0(%in: f16 loc("mmt3d_kernel.mlir":12:10), %out: f16 loc("mmt3d_kernel.mlir":12:20)):\ | |
linalg.yield %in : f16 loc(callsite("mmt3d_kernel.mlir":13:7 at "mmt3d_kernel.mlir":4:3))\ | |
} -> tensor<?x8640x3200xf16> loc(callsite("mmt3d_kernel.mlir":11:10 at "mmt3d_kernel.mlir":4:3)) | |
: 1713552421:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-debuginfo | |
: 1713552925:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 -mlir-print-debug-info | |
: 1713554021:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> mmt3d_ir_dump.mlir | |
: 1713557254:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> mmt3d_ir_dump.mlir --iree-hal-dump-executable-intermediates-to=dumpex/ | |
: 1713557317:0;vi module_mmt3d_kernel_linked_llvm_cpu_embedded_elf_x86_64.s | |
: 1713557808:0;gist * | |
: 1713557817:0;gist *.s | |
: 1713557992:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> mmt3d_ir_dump.mlir --iree-hal-dump-executable-intermediates-to=dumpex/ --x86-asm-syntax=intel | |
: 1713558377:0;cd dumpex | |
: 1713558770:0;mv mmt3d_kernel.vmfb fast.vmfb | |
: 1713558773:0;rm pack.vmfb | |
: 1713558783:0;rm pack_f16.mlir pack.txt | |
: 1713559009:0;rm dump dumpex | |
: 1713559014:0;rm -rf dump dumpex | |
: 1713559017:0;rm xyz* | |
: 1713559028:0;rm mmt3d_ir_dump_.mlir | |
: 1713559166:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> mmt3d_ir_dump_new.mlir --iree-hal-dump-executable-intermediates-to=dumpnew/ --x86-asm-syntax=intel | |
: 1713559265:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> mmt3d_ir_dump.mlir --iree-hal-dump-executable-intermediates-to=dumpold/ --x86-asm-syntax=intel | |
: 1713559358:0;gist module_mmt3d_kernel_linked_llvm_cpu_embedded_elf_x86_64.s | |
: 1713559431:0;rm mmt3d_ir_dump_new.mlir | |
: 1713559442:0;gist mmt3d_ir_dump.mlir | |
: 1713559594:0;cd dumpold | |
: 1713559675:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> mmt3d_ir_dump.mlir --iree-hal-dump-executable-intermediates-to=dumpold/ --x86-asm-syntax=intel --iree-llvmcpu-keep-linker-artifacts | |
: 1713559750:0;vi mmt3d_ir_dump.mlir | |
: 1713559767:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all --iree-hal-dump-executable-intermediates-to=dumpold/ --x86-asm-syntax=intel --iree-llvmcpu-keep-linker-artifacts | |
: 1713559783:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-hal-dump-executable-intermediates-to=dumpold/ --x86-asm-syntax=intel --iree-llvmcpu-keep-linker-artifacts | |
: 1713559823:0;objdump -MIntel -d /tmp/mmt3d_kernel_linked_llvm_cpu-2a673d.so | |
: 1713559845:0;objdump -MIntel -d /tmp/mmt3d_kernel_linked_llvm_cpu-2a673d.so > mmt3dobjdump.txt | |
: 1713559957:0;objdump -MIntel -d /tmp/mmt3d_kernel_linked_llvm_cpu-9a3500.so > mmt3dobjdump.txt | |
: 1713560056:0;gist mmt3dobjdump.txt | |
: 1713560138:0;vi mmt3dobjdump.txt | |
: 1713561621:0;vi mmt3d_kernel.vmfb | |
: 1713561700:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f32 --input=4x128x3200xf32 --input=8640x3200xf32 | |
: 1713562281:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-hal-dump-executable-intermediates-to=dumpold/ --x86-asm-syntax=intel --iree-llvmcpu-keep-linker-artifacts -iree-llvmcpu-link-embedded=false | |
: 1713562321:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f32 --input=4x128x3200xf32 --input=4x8640x3200xf32 | |
: 1713562460:0;iree-benchmark-module --device=local-task --module=fast.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713562483:0;iree-benchmark-module --device=local-task --module=fast.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=4x8640x3200xf16 | |
: 1713562577:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=1x128x3200xf32 --input=1x8640x3200xf16 | |
: 1713562589:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=2x128x3200xf32 --input=2x8640x3200xf16 | |
: 1713562738:0;iree-cpuinfo | |
: 1713563509:0;unzip 20240415_llama2_13b_q4_1_bs2_bs1.zip -o llama2_13b | |
: 1713563517:0;unzip 20240415_llama2_13b_q4_1_bs2_bs1.zip llama2_13b | |
: 1713563540:0;unzip 20240415_llama2_13b_q4_1_bs2_bs1.zip -d llama2_13b | |
: 1713563567:0;mv llama2_13b burn_24 | |
: 1713563640:0;cd llama2_13b | |
: 1713563657:0;vi 0c7f98910d22219c5d505b85c0b496744244c583.mlir | |
: 1713563814:0;vi runtime.log | |
: 1713589828:0;vi torch_module.py | |
: 1713589895:0;python torch_module.py | |
: 1713590001:0;gist torch_module.py | |
: 1713610546:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o xy.vmfb ex.mlir -mlir-print-ir-after-all > xyz.txt | |
: 1713610553:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o xy.vmfb ex.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1713612510:0;wget https://us.download.nvidia.com/XFree86/Linux-x86_64/550.76/NVIDIA-Linux-x86_64-550.76.run | |
: 1713613587:0;chmod + NVIDIA-Linux-x86_64-550.76.run | |
: 1713613592:0;sudo ./NVIDIA-Linux-x86_64-550.76.run | |
: 1713613752:0;sudo run ./NVIDIA-Linux-x86_64-550.76.run | |
: 1713613759:0;sudo sh ./NVIDIA-Linux-x86_64-550.76.run | |
: 1713613900:0;sudo dnf install dnf-plugins-core -y\ | |
: 1713613922:0;sudo dnf copr enable t0xic0der/nvidia-auto-installer-for-fedora -y\ | |
: 1713613931:0;sudo dnf install nvautoinstall -y\ | |
: 1713613954:0;sudo nvautoinstall cheksu\ | |
: 1713613968:0;$ sudo nvautoinstall compat\ | |
: 1713613974:0;sudo nvautoinstall compat\ | |
: 1713614024:0;sudo nvautoinstall rpmadd | |
: 1713614063:0;sudo nvautoinstall driver\ | |
: 1713614266:0;sudo nvautoinstall nvrepo | |
: 1713614414:0;sudo nvautoinstall plcuda | |
: 1713615578:0;cd /run/media/pashu/Fedora-WS-Live-39-1-5 | |
: 1713615614:0;sudo mkdir home | |
: 1713615692:0;chmod +x -R . | |
: 1713615708:0;sudo chmod 777 -R . | |
: 1713615961:0;sudo | |
: 1713615964:0;sudo sh | |
: 1713616113:0;cd Fedora-WS-Live-39-1-5 | |
: 1713616122:0;chmod 777 Fedora-WS-Live-39-1-5 | |
: 1713616128:0;sudo chmod 777 Fedora-WS-Live-39-1-5 | |
: 1713616146:0;sudo chmod -R 777 Fedora-WS-Live-39-1-5 | |
: 1713616459:0;cd Pop_OS\ 22.04\ amd64\ Nvidia | |
: 1713616957:0;cd /run/media/pashu | |
: 1713616960:0;cd Untitled | |
: 1713616960:0;LS | |
: 1713616966:0;mkdir home | |
: 1713616981:0;cp -R ~/ home/ | |
: 1713616997:0;sudo cp -R ~/ home/ | |
: 1713617303:0;cd home | |
: 1713617307:0;cd pashu | |
: 1713617322:0;rsync | |
: 1713617407:0;cp ~/.zsh_history . | |
: 1713622097:0;cd .ssh | |
: 1713622117:0;mv id_rsa id_rsa.pub ~/.ssh | |
: 1713622156:0;git clone --depth 1 https://github.com/junegunn/fzf.git ~/.fzf\ | |
~/.fzf/install\ | |
: 1713622193:0;vi .zsh_history | |
: 1713622237:0;sudo apt-get install ripgrep cargo node npm \ | |
: 1713622241:0;sudo apt-get install ripgrep cargo nodejs npm \ | |
: 1713622324:0;sudo apt-get install lazygit | |
: 1713622369:0;lazygit --version | |
: 1713622475:0;cd neovim\ | |
: 1713622655:0;sudo apt-get install ninja-build gettext cmake unzip curl build-essential\ | |
: 1713622668:0;make CMAKE_BUILD_TYPE=Release\ | |
: 1713622710:0;rm -rf cmake.deps | |
: 1713622959:0;LAZYGIT_VERSION=$(curl -s "https://api.github.com/repos/jesseduffield/lazygit/releases/latest" | grep -Po '"tag_name": "v\K[^"]*')\ | |
curl -Lo lazygit.tar.gz "https://github.com/jesseduffield/lazygit/releases/latest/download/lazygit_${LAZYGIT_VERSION}_Linux_x86_64.tar.gz"\ | |
tar xf lazygit.tar.gz lazygit\ | |
sudo install lazygit /usr/local/bin\ | |
: 1713622976:0;rm lazygit.tar.gz | |
: 1713622979:0;rm lazygit | |
: 1713623190:0;nvim ~/.zshrc | |
: 1713623343:0;sudo apt-get install tmux | |
: 1713624077:0;sudo apt install python3.11-ven | |
: 1713624082:0;sudo apt install python3.11-venv | |
: 1713624111:0;python3.11 -m venv global_venv | |
: 1713624160:0;python -m pip install --upgrade pip\ | |
: 1713624161:0;pip | |
: 1713624184:0;pip install -r iree/runtime/bindings/python/iree/runtime/build_requirements.txt | |
: 1713624218:0;sudo apt install cmake ninja-build clang lld\ | |
: 1713624272:0;sudo apt-get install clangd clang-format | |
: 1713624395:0;pip list | |
: 1713624427:0;sudo apt-get remove cmake | |
: 1713624489:0;pip install python3-dev | |
: 1713624506:0;sudo apt-get install python-dev | |
: 1713624570:0;rm -rf global_venv | |
: 1713624617:0;sudo apt-get install python3.10-venv | |
: 1713624624:0;python3 -m venv global_venv | |
: 1713624650:0;pip install mlir/python/requirements.txt | |
: 1713625077:0;git o v0.9.0 | |
: 1713625090:0;make CMAKE_BUILD_TYPE=Release -j 32\ | |
: 1713625169:0;sudo make install\ | |
: 1713625196:0;sudo apt-get install cmake | |
: 1713625536:0;sudo apt install libcapstone-dev\ | |
: 1713625548:0;sudo apt install libtbb-dev libzstd-dev libglfw3-dev libfreetype6-dev libgtk-3-dev\ | |
: 1713625587:0;sudo apt install libtbb-dev libzstd-dev\ | |
: 1713625883:0;sudo apt-get install psutil | |
: 1713626075:0;sudo apt instal nodejs | |
: 1713626080:0;sudo apt install nodejs | |
: 1713626180:0;sudo apt-get remove nodejs | |
: 1713626217:0;sudo apt autoremove | |
: 1713626283:0;nvm install 20 | |
: 1713626296:0;node -v | |
: 1713626301:0;npm -v | |
: 1713626636:0;node --version | |
: 1713626855:0;mv build/compile_commands.json . | |
: 1713626897:0;clangd | |
: 1713663905:0;iree-opt --help | |
: 1713664313:0;pip install pynvim --user | |
: 1713664320:0;pip3 install pynvim --user | |
: 1713664325:0;sudo pip3 install pynvim --user | |
: 1713664361:0;LV_BRANCH='release-1.3/neovim-0.9' bash <(curl -s https://raw.githubusercontent.com/LunarVim/LunarVim/release-1.3/neovim-0.9/utils/installer/install.sh) | |
: 1713664528:0;rm -rf neovim | |
: 1713664532:0;sudo rm -rf neovim | |
: 1713664544:0;git clone https://github.com/neovim/neovim.git\ | |
: 1713664602:0;cd neovim | |
: 1713664612:0;git o v0.9.5 | |
: 1713664665:0;make CMAKE_BUILD_TYPE=RELWithDebInfo -j 32 | |
: 1713664748:0;git checkout stable | |
: 1713664786:0;make clean | |
: 1713664792:0;make CMAKE_BUILD_TYPE=RelWithDebInfo | |
: 1713664803:0;cd cmake.deps | |
: 1713664854:0;rm -rf .deps | |
: 1713664862:0;make CMAKE_BUILD_TYPE=RelWithDebInfo -j 32 | |
: 1713665077:0;nvim | |
: 1713665138:0;LV_BRANCH='release-1.3/neovim-0.9' bash <(curl -s https://raw.githubusercontent.com/LunarVim/LunarVim/release-1.3/neovim-0.9/utils/installer/install.sh)\ | |
: 1713665171:0;where lvim | |
: 1713665254:0;where nvim | |
: 1713665465:0;clangd --version | |
: 1713665696:0;pip install pyright --user | |
: 1713665849:0;mv ../iree-build/compile_commands.json . | |
: 1713666033:0;lvim | |
: 1713666086:0;sudo apt upgrade -y | |
: 1713666153:0;brew install node@20 | |
: 1713666158:0;sudo apt-get install brew | |
: 1713666173:0;curl -o- https://raw.githubusercontent.com/nvm-sh/nvm/v0.39.7/install.sh | bash | |
: 1713666210:0;sudo apt-get install nodejs | |
: 1713666915:0;which python | |
: 1713666942:0;python -m pip install -r mlir/python/requirements.txt | |
: 1713667199:0;git remote add grypp https://github.com/grypp/llvm-project.git | |
: 1713667204:0;git fetch grypp | |
: 1713667228:0;git checkout grypp/nvgpu-tutorial | |
: 1713670671:0;cd mlir/test/Examples/nvgpu | |
: 1713670698:0;vi Ch0.py | |
: 1713670765:0;cd CMakeFiles | |
: 1713670772:0;cd tools | |
: 1713670949:0;cmake . | |
: 1713671315:0;ebc | |
: 1713671318:0;ebm | |
: 1713671583:0;cd llvm-project/build | |
: 1713671585:0;cd runtimes | |
: 1713672153:0;cd mlir | |
: 1713672177:0;cd test/Examples/nvgpu/ | |
: 1713672942:0;ls /usr/lib/cuda/nvvm/libdevice/libdevice.10.bc | |
: 1713673490:0;python Ch2.py | |
: 1713673661:0;sudo wget https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-keyring_1.1-1_all.deb | |
: 1713673711:0;curl https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-keyring_1.1-1_all.deb | |
: 1713673736:0;wget https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-keyring_1.1-1_all.deb | |
: 1713673743:0;sudo dpkg -i cuda-keyring_1.1-1_all.deb | |
: 1713673764:0;sudo apt-get -y install cuda-toolkit-12-4 | |
: 1713674148:0;cd /usr/lib/cuda/ls | |
: 1713674151:0;cd /usr/lib/cuda/ | |
: 1713674221:0;nvidia --version | |
: 1713674278:0;cd mlir/test/Examples/nvgpu/Ch1.py | |
: 1713674281:0;cd mlir/test/Examples/nvgpu/ | |
: 1713674296:0;python Ch0.py | |
: 1713674350:0;cd usr/local/cuda-12 | |
: 1713674355:0;cd nvvm | |
: 1713674358:0;cd libdevice | |
: 1713674461:0;cd local | |
: 1713674481:0;bin/nvcc --version | |
: 1713674510:0;:f | |
: 1713674561:0;export CUDA_ROOT=/usr/local/cuda | |
: 1713674644:0;cd /usr/lib | |
: 1713674701:0;export nvcc=/usr/local/cuda/bin/nvcc | |
: 1713674713:0;alias nvcc=/usr/local/cuda/bin/nvcc | |
: 1713674715:0;python Ch1.py | |
: 1713674731:0;pytho mlir/test/Examples/nvgpu/Ch0.py | |
: 1713675005:0;python mlir/test/Examples/nvgpu/Ch3.py | |
: 1713676584:0;cd /usr/local | |
: 1713676586:0;cd cuda | |
: 1713676589:0;cd include | |
: 1713676593:0;vi cuda.h | |
: 1713676645:0;./nvcc --version | |
: 1713676659:0;history | |
: 1713676666:0;vi ~/.bash_history | |
: 1713676688:0;sudo apt remove nvidia-cuda-toolkit | |
: 1713676710:0;sudo apt-get remove --auto-remove nvidia-cuda-toolkit | |
: 1713677304:0;nvcc --version | |
: 1713677660:0;export PYTHONPATH=$(cd build && pwd)/tools/mlir/python_packages/mlir_core | |
: 1713677669:0;export SUPPORT_LIB=/home/prashant/llvm-project/build/lib/libmlir_cuda_runtime.so | |
: 1713677719:0;python mlir/test/Examples/nvgpu/Ch0.py | |
: 1713677744:0;python mlir/test/Examples/nvgpu/Ch1.py | |
: 1713677747:0;python mlir/test/Examples/nvgpu/Ch2.py | |
: 1713677913:0;git clone https://github.com/siboehm/SGEMM_CUDA.git | |
: 1713677955:0;mkdir build && cd build && cmake .. && cmake --build . | |
: 1713677992:0;./sgemm 1 | |
: 1713678137:0;cd SGEMM_CUDA | |
: 1713711744:0;./sgemm 10 | |
: 1713711752:0;./sgemm 0 | |
: 1713716007:0;./sgemm 2 | |
: 1713716129:0;./sgemm 3 | |
: 1713720337:0;rm cuda-keyring_1.1-1_all.deb | |
: 1713720386:0;mkdir burn_24 | |
: 1713720490:0;touch mmt3d_kernel.mlir | |
: 1713721662:0;mlir-lsp-server | |
: 1713722008:0;git clone https://github.com/pashu123/nvim-lua-config ~/.config/nvim | |
: 1713722080:0;git clone --depth 1 https://github.com/wbthomason/packer.nvim\\ | |
~/.local/share/nvim/site/pack/packer/start/packer.nvim | |
: 1713722238:0;./mlir-lsp-server | |
: 1713723135:0;nvim mmt3d_kernel.mlir | |
: 1713723363:0;nvim . | |
: 1713724028:0;npm i tree-sitter-mlir | |
: 1713724412:0;vi ~/.config/nvim | |
: 1713725071:0;npm install tree-sitter-cli | |
: 1713725146:0;wget https://github.com/tree-sitter/tree-sitter/releases/download/v0.22.5/tree-sitter-linux-x64.gz | |
: 1713725155:0;tar xzf tree-sitter-linux-x64.gz | |
: 1713725165:0;tar -xzf tree-sitter-linux-x64.gz | |
: 1713725188:0;tar -czf tree-sitter-linux-x64.gz | |
: 1713725222:0;unzip tree-sitter-linux-x64.gz | |
: 1713725258:0;gzip -d tree-sitter-linux-x64.gz | |
: 1713725290:0;chmod +x tree-sitter-linux-x64 | |
: 1713725292:0;./tree-sitter-linux-x64 | |
: 1713725323:0;mv tree-sitter-linux-x64 tree-sitter | |
: 1713725333:0;sudo mv tree-sitter /usr/bin | |
: 1713727217:0;3\ | |
3\ | |
3 | |
: 1713727951:0;TRACY_NO_EXIT=1 iree-benchmark-module --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713728179:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-llvmcpu-enable-ukernels=all | |
: 1713754443:0;tmux -u | |
: 1713754565:0;tmux --version | |
: 1713754798:0;cat ~/.config/lvim/config.lua | |
: 1713755718:0;cl | |
: 1713756087:0;cat ~/.tmux.conf | |
: 1713759940:0;cd bu | |
: 1713760371:0;./clang --version | |
: 1713760433:0;sudo mv * /usr/bin | |
: 1713760668:0;sudo make install | |
: 1713760735:0;sudo apt-get remove clang lld | |
: 1713760748:0;sudo cmake --build . --target install | |
: 1713769584:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir | |
: 1713769592:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=4x8640x3200xf16 | |
: 1713769719:0;ln -s ~/iree-build/compile_commands.json ~/iree/compile_commands.json | |
: 1713769731:0;ln -sf ~/iree-build/compile_commands.json ~/iree/compile_commands.json | |
: 1713770418:0;sudo apt-get install gist-paste | |
: 1713770422:0;sudo apt-get install gist | |
: 1713770435:0;gist auth | |
: 1713778848:0;iree-benchmark-module --device=local-task --module=slow.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713778862:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713778945:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 -benchmark-repetitions=5 | |
: 1713778957:0;iree-benchmark-module --help | fzf | |
: 1713778977:0;iree-benchmark-module --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 -benchmark_repetitions=5 | |
: 1713779000:0;iree-benchmark-module --benchmark_repetitions=5 --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713779028:0;iree-benchmark-module --benchmark_repetitions=10 --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713780521:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o slow.vmfb mmt3d_kernel.mlir | |
: 1713780947:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/xy.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> ir_print.txt | |
: 1713782554:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/xy.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> ir_print1.mlir | |
: 1713782616:0;vi ir_print1.mlir | |
: 1713783412:0;iree-benchmark-module --benchmark_repetitions=5 --device=local-task --module=slow.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713784890:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/xy.vmfb mmt3d_kernel.mlir | |
: 1713784895:0;iree-benchmark-module --benchmark_repetitions=5 --device=local-task --module=/tmp/xy.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713784938:0;iree-benchmark-module --benchmark_repetitions=10 --device=local-task --module=slow.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713785220:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/xy.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> new_ir.mlir | |
: 1713802032:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=/tmp/xy.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713802418:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/xy.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> latest_ir.mlir | |
: 1713802437:0;gist-paste latest_ir.mlir | |
: 1713802641:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir --iree-hal-dump-executable-sources-to=dump | |
: 1713802686:0;iree-compile --compile-from=executable-sources dump/module_turbine_llm_mmtfp_3d_8640_3200_f32f16_dispatch_1.mlir | |
: 1713802702:0;iree-compile --compile-from=executable-sources dump/module_turbine_llm_mmtfp_3d_8640_3200_f32f16_dispatch_1.mlir -mlir-print-ir-after-all 2> xyz.mlir | |
: 1713859170:0;vi ir_print.txt | |
: 1713859660:0;iree-opt pack_micro.mlir | |
: 1713859782:0;iree-compile --compile-from=executable-sources pack_micro.mlir -o micro.vmfb | |
: 1713859801:0;iree-compile pack_micro.mlir -o micro.vmfb | |
: 1713860124:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack.vmfb --function=broadcast_pack_micro --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713860145:0;cat pack_micro.mlir | |
: 1713860232:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_micro.mlir -mlir-print-ir-after-all 2> ir_dump_pack_micro_default.mlir | |
: 1713860248:0;vi ir_dump_pack_micro_default.mlir | |
: 1713861841:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_micro.mlir -mlir-print-ir-after-all 2> new.mlir | |
: 1713862382:0;mv new_ir.mlir vec_1_16_16.mlir | |
: 1713862387:0;mv ir_dump_pack_micro_default.mlir | |
: 1713862392:0;vi ir_dump_pack_micro_default.mlir | |
: 1713862417:0;mv ir_dump_pack_micro_default.mlir vec_1_16_1.mlir | |
: 1713862428:0;gist-paste vec_1_16_16.mlir | |
: 1713862444:0;gist-paste vec_1_16_1.mlir | |
: 1713862692:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_micro.mlir r | |
: 1713866479:0;vi /tmp/read.mlir | |
: 1713869990:0;git o test_branch | |
: 1713870451:0;TRACY_NO_EXIT=1 iree-benchmark-module --module=pack.vmfb --function=broadcast_pack_kernel --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713870476:0;iree-tracy-capture -o ~/pack_broadcast.tracy | |
: 1713871071:0;vi vec*.mlir | |
: 1713877172:0;vi pack_micro.mlir mmt3d_kernel.mlir | |
: 1713878163:0;mv _kernel.mlir mod_kernel.mlir | |
: 1713878198:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=mod.vmfb --function=broadcast_pack_kernel --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713878210:0;vi mod_kernel.mlir | |
: 1713878229:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mod.vmfb mod_kernel.mlir | |
: 1713878238:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=mod.vmfb --function=mod_kernel --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713878642:0;vi vec_1_16_1.mlir | |
: 1713892812:0;git remote add hanhan https://github.com/hanhanW/iree.git | |
: 1713892838:0;git o hanhan/disable-pack-unpack-decomposition-by-default | |
: 1713895899:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_micro.mlir -mlir-print-ir-after-all 2> new_ir.mlir | |
: 1713896467:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_micro.mlir -mlir-print-ir-after-all | |
: 1713896476:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_micro.mlir | |
: 1713896530:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_micro.mlir -mlir-print-ir-after-all 2> tmp_ir.mlir | |
: 1713896639:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=slow.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713897021:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713897168:0;gist-paste tmp_ir.mlir | |
: 1713897325:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_micro.mlir --iree-hal-dump-executable-sources-to=dump | |
: 1713897387:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_micro.mlir --iree-hal-dump-executable-intermediates-to=dump/ --x86-asm-syntax=intel | |
: 1713897412:0;gist-paste module_broadcast_pack_kernel_dispatch_0_embedded_elf_x86_64.s | |
: 1713897417:0;vi module_broadcast_pack_kernel_dispatch_0_embedded_elf_x86_64.s | |
: 1713921623:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_micro.mlir -mlir-print-ir-after-all 2> tmp_ir.mlir | |
: 1713922062:0;iree-benchmark-module --benchmark_repetitions=100 --device=local-task --module=pack.vmfb --function=broadcast_pack_kernel --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713922846:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack.vmfb --function=broadcast_pack_kernel --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713923096:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack.vmfb --function=broadcast_pack_kernel --input=4x128x3200xf32 --input=8640x3200xi16 | |
: 1713923148:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack.vmfb --function=broadcast_pack_kernel --input=4x128x3200xf32 --input=8640x3200xi32 | |
: 1713923239:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack_micro.mlir | |
: 1713923250:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack.vmfb --function=broadcast_pack_kernel --input=4x128x3200xf32 --input=8640x3200xi16 | |
: 1713923268:0;vi tmp_ir.mlir | |
: 1713952814:0;vi pack_micro.mlir\ | |
: 1713952862:0;mv pack.mlir broadcast.mlir burn_24 | |
: 1713952911:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack.vmfb --function=pack --input=4x8640x3200xi16 | |
: 1713953099:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o broadcast.vmfb broadcast.mlir | |
: 1713953102:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=broadcast.vmfb --function=broadcast --input=4x128x3200xf32 --input=8640x3200xi16 | |
: 1713953210:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack_broadcast.vmfb --function=pack_broadcast --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713953234:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack_broadcast.vmfb pack_micro.mlir | |
: 1713953238:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack_broadcast.vmfb --function=broadcast_pack --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713954532:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack.mlir --iree-hal-dump-executable-intermediates-to=onlypack/ --x86-asm-syntax=intel | |
: 1713954775:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack.mlir --iree-hal-dump-executable-intermediates-to=onlypack/ --x86-asm-syntax=intel -mlir-print-ir-after-all 2> only_pack.mlir | |
: 1713954923:0;git o hanhan/do-not-decompose-pack-unpack-on-x86 | |
: 1713957941:0;gist-paste module_pack_dispatch_0_embedded_elf_x86_64.s | |
: 1713959301:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack.mlir --iree-hal-dump-executable-intermediates-to=onlypack/ --x86-asm-syntax=intel | |
: 1713959329:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack.vmfb --function=pack --input=4x8640x3200xf32 | |
: 1713959360:0;cd onlypack | |
: 1713959362:0;vi module_pack_dispatch_0_embedded_elf_x86_64.s | |
: 1713960157:0;vi pack_micro.mlir | |
: 1713960239:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o broadcast_pack.vmfb pack_micro.mlir | |
: 1713960303:0;mv pack_micro.mlir broadcast_pack.mlir | |
: 1713960657:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o broadcast_pack.vmfb broadcast_pack.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1713960829:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=broadcast_pack.vmfb --function=broadcast_pack --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713961000:0;vi broadcast_pack. | |
: 1713961004:0;vi broadcast_pack.mlir | |
: 1713961030:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o broadcast_pack.vmfb broadcast_pack.mlir | |
: 1713961039:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=broadcast_pack.vmfb --function=broadcast_pack --input=4x128x3200xf32 --input=8640x3200xf32 | |
: 1713963453:0;vi only_pack.mlir | |
: 1713963510:0;gist-paste only_pack.mlir | |
: 1713963688:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o broadcast.vmfb broadcast.mlir --iree-hal-dump-executable-intermediates-to=onlybroadcast/ --x86-asm-syntax=intel -mlir-print-ir-after-all 2> only_broadcast.mlir | |
: 1713963695:0;vi broadcast.mlir | |
: 1713963710:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=broadcast.vmfb --function=broadcast --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713963733:0;gist-paste only_broadcast.mlir | |
: 1713963829:0;gist-paste -f asm_broadcast.s < onlybroadcast/module_broadcast_dispatch_0_embedded_elf_x86_64.s | |
: 1713963859:0;vi only_broadcast.mlir | |
: 1713964725:0;git o improve_pack | |
: 1713964733:0;git o hanhan/improve_pack | |
: 1713964767:0;git o hanhan/improve-pack | |
: 1713974716:0;vi pack.mlir | |
: 1713975040:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack.mlir | |
: 1713975072:0;TRACY_NO_EXIT=1 iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack.vmfb --function=pack --input=4x8640x3200xf16 | |
: 1713975088:0;iree-tracy-capture -o ~/pack.tracy | |
: 1713975098:0;gist-paste ~/pack.tracy | |
: 1713975400:0;TRACY_NO_EXIT=1 iree-benchmark-module --benchmark_repetitions=15 --device=local-sync --module=pack.vmfb --function=pack --input=4x8640x3200xf16 | |
: 1713975410:0;gist-paste ~/pack1.tracy | |
: 1713975418:0;iree-tracy-capture -o ~/pack1.tracy | |
: 1713980251:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o pack.vmfb pack.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1713980295:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=pack.vmfb --function=pack --input=4x8640x3200xf16 | |
: 1713980312:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-sync --module=pack.vmfb --function=pack --input=4x8640x3200xf16 | |
: 1713980541:0;iree-tracy-capture -o ~/mmt3d.tracy | |
: 1713980549:0;iree-tracy-capture -o -f ~/mmt3d.tracy | |
: 1713980676:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-quantized-matmul-reassociation=true \\ | |
--iree-opt-propagate-global-layout mmt3d_kernel.mlir -o mmt3d_ukernel.vmfb | |
: 1713980691:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-quantized-matmul-reassociation=true \\ | |
mmt3d_kernel.mlir -o mmt3d_ukernel.vmfb | |
: 1713980719:0;TRACY_NO_EXIT=1 iree-benchmark-module --benchmark_repetitions=15 --device=local-sync --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713980749:0;TRACY_NO_EXIT=1 iree-benchmark-module --benchmark_repetitions=15 --device=local-sync --module=mmt3d_ukernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1713980774:0;iree-tracy-capture -o -f ~/mmt3dukernel.tracy | |
: 1713980791:0;iree-tracy-capture -o ~/mmt3dukernel.tracy | |
: 1713980804:0;iree-tracy-capture --help | |
: 1713980835:0;vi mmt3d_kernel.mlir | |
: 1713981005:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-quantized-matmul-reassociation=true \\ | |
mmtfp32_kernel.mlir -o mmt3dfp32_ukernel.vmfb | |
: 1713981040:0;TRACY_NO_EXIT=1 iree-benchmark-module --benchmark_repetitions=15 --device=local-sync --module=mmt3d_ukernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f32 --input=4x128x3200xf32 --input=8640x3200xf32 | |
: 1713981062:0;TRACY_NO_EXIT=1 iree-benchmark-module --benchmark_repetitions=15 --device=local-sync --module=mmt3dfp32_ukernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f32 --input=4x128x3200xf32 --input=8640x3200xf32 | |
: 1713981098:0;iree-tracy-capture -o ~/mmt3dfp32ukernel.tracy | |
: 1713981149:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-global-opt-enable-quantized-matmul-reassociation=true \\ | |
mmtfp32_kernel.mlir -o mmt3dfp32.vmfb | |
: 1713981171:0;TRACY_NO_EXIT=1 iree-benchmark-module --benchmark_repetitions=15 --device=local-sync --module=mmt3dfp32.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f32 --input=4x128x3200xf32 --input=8640x3200xf32 | |
: 1713981218:0;iree-tracy-capture -o ~/mmt3dfp32.tracy | |
: 1713981339:0;mkdir tracy_profiles | |
: 1713981341:0;mv *.tracy tracy_profiles/ | |
: 1714026347:0;git ob pack_f16 | |
: 1714028689:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-disable-threading | |
: 1714028806:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir | |
: 1714028818:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-sync --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1714028846:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=mmt3d_kernel.vmfb --function=turbine_llm_mmtfp_3d_8640_3200_f32f16 --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1714029098:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o mmt3d_kernel.vmfb mmt3d_kernel.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1714039853:0;ctest -R iree-run-mlir --verbose | |
: 1714039875:0;cmake --build ~/iree-build/ --target iree-test-deps 2> err.txt | |
: 1714039883:0;cmake --build ~/iree-build/ --target iree-test-deps > err.txt | |
: 1714041238:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/x.vmfb e2e_matmul_cpu_dt_bf16_f32_small_llvm-cpu_local-task_avx512bf16_matmul.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1714041823:0;vi e2e_matmul_cpu_dt_bf16_f32_small_llvm-cpu_local-task_avx512bf16_matmul.mlir | |
: 1714041872:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/x.vmfb ~/xyz.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1714042239:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/x.vmfb ~/xyz.mlir -mlir-print-ir-after-all 2> xyz.txt -mlir-disable-threading | |
: 1714043161:0;rm -rf ~/llvm-project/build | |
: 1714043861:0;vim | |
: 1714044071:0;rm -rf node_modules | |
: 1714044094:0;rm ''$'\250\017''&'$'\001' | |
: 1714044213:0;cd $HOME | |
: 1714044222:0;ls -lf | |
: 1714044318:0;gt lg | |
: 1714044590:0;rm -rf llvm-project | |
: 1714044626:0;git clone [email protected]:pashu123/llvm-project.git | |
: 1714045248:0;git remote add main [email protected]:llvm/llvm-project.git | |
: 1714045274:0;git remote remove origin | |
: 1714045620:0;git o main/main | |
: 1714045633:0;git ob upstream_main | |
: 1714045721:0;git o pashu/unpack_nosize | |
: 1714045726:0;git ob unpack_nosize | |
: 1714058263:0;mlir-opt -transform-interpreter ~/test.mlir | |
: 1714062392:0;git ob var_fix | |
: 1714065858:0;clang-format -i mlir/lib/Dialect/Vector/Utils/VectorUtils.cpp | |
: 1714065897:0;clang-format -i mlir/include/mlir/Dialect/Vector/Utils/VectorUtils.h | |
: 1714066118:0;git add mlir/include/mlir/Dialect/Vector/Utils/VectorUtils.h | |
: 1714118987:0;git remote vv | |
: 1714119732:0;git ob acos | |
: 1714127002:0;vi -f | |
: 1714127020:0;rm -rf -f | |
: 1714127021:0;clea | |
: 1714127021:0;rls | |
: 1714127040:0;rm -rf "-f" | |
: 1714127092:0;iree-compile xyz.mlir -o /tmp/x.vmfb | |
: 1714127462:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host iree-llvm-link-embedded=false -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714127468:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -iree-llvm-link-embedded=false -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714127709:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -iree-llvmcpu-link-embedded=true -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714127746:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=mmt3d_kernel.vmfb --function=test_acos --input=128x256xf32 | |
: 1714127791:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -iree-llvmcpu-link-embedded=false -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714127869:0;where libc | |
: 1714127898:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -iree-llvmcpu-link-embedded=false -iree-llvm-link-static -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714128146:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -iree-llvmcpu-link-embedded=false -iree-llvmcpu-link-static -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714128155:0;iree-run-mlir --help | |
: 1714128165:0;iree-benchmark-module --help | |
: 1714128282:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=/tmp/x.vmfb --function=test_acos --executable_plugin= /usr/lib32/libc.so.6 --input=128x256xf32 | |
: 1714128313:0;nm /usr/lib32/libc.so.6 | |
: 1714128330:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=/tmp/x.vmfb --function=test_acos --executable_plugin= /usr/lib32/libc.a --input=128x256xf32 | |
: 1714128337:0;nm /usr/lib32/libc.a | |
: 1714128566:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -iree-llvmcpu-link-embedded=false -iree-llvmcpu-system-linker-path= /usr/lib32/libc.so.6 -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714128573:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -iree-llvmcpu-link-embedded=false -iree-llvmcpu-system-linker-path=/usr/lib32/libc.so.6 -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714128703:0;gcc -lm | |
: 1714128716:0;gcc --print-file-name=libm | |
: 1714128719:0;gcc --print-file-name=libm.a | |
: 1714128963:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -iree-llvmcpu-link-embedded=false -iree-llvmcpu-system-linker-path= /usr//usr/lib/gcc/x86_64-linux-gnu/11/../../../x86_64-linux-gnu/libm.a -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714128970:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -iree-llvmcpu-link-embedded=false -iree-llvmcpu-system-linker-path=/usr//usr/lib/gcc/x86_64-linux-gnu/11/../../../x86_64-linux-gnu/libm.a -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714129707:0;gist-paste -f acos.py < xyz.py | |
: 1714130224:0;fjdlj | |
: 1714130247:0;python xyz.py | |
: 1714130468:0;vi xyz.py | |
: 1714130497:0;python3 xyz.py | |
: 1714131905:0;git o upstream_main | |
: 1714131912:0;git rebase main/main | |
: 1714131922:0;git ob poly_acos | |
: 1714132765:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host /tmp/x.vmfb ~/xyz.mlir | |
: 1714143002:0;git remote add pashu [email protected]:pashu123/llvm-project.git | |
: 1714143012:0;git fetch pashu/poly_acos | |
: 1714143059:0;git cp 897d417 | |
: 1714143246:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=/tmp/x.vmfb --function=test_acos --input=128x256xf32 | |
: 1714143261:0;iree-benchmark-module --benchmark_repetitions=15 --device=local-task --module=/tmp/x.vmfb --function=test_acos --input=256x128xf32 | |
: 1714143520:0;iree-benchmark-module --benchmark_repetitions=1 --device=local-task --module=/tmp/x.vmfb --function=test_acos --input=256x128xf32 | |
: 1714145116:0;tools/mlir/test/CMakeFiles/check-mlir /home/prashant/llvm-project/build/tools/mlir/test/CMakeFiles/check-mlir\ | |
cd /home/prashant/llvm-project/build/tools/mlir/test && /home/prashant/global_venv/bin/python3.10 /home/prashant/llvm-project/build/./bin/llvm-lit -sv /home/prashant/llvm-project/build/tools/mlir/test | |
: 1714145254:0;/home/prashant/llvm-project/build/bin/mlir-opt /home/prashant/llvm-project/mlir/test/mlir-cpu-runner/math-polynomial-approx.mlir -pass-pipeline="builtin.module(func.func(test-math-polynomial-approximation,convert-arith-to-llvm),convert-vector-to-scf,convert-scf-to-cf,convert-cf-to-llvm,convert-vector-to-llvm,func.func(convert-math-to-llvm),convert-func-to-llvm,reconcile-unrealized-casts)" | /home/prashant/llvm-project/build/bin/mlir-cpu-runner -e main -entry-point-result=void -O0 -shared-libs=/home/prashant/llvm-project/build/lib/libmlir_c_runner_utils.so -shared-libs=/home/prashant/llvm-project/build/lib/libmlir_runner_utils.so | |
: 1714145363:0;python ~/xyz.py | |
: 1714146955:0;sudo lshw -C memory | |
: 1714213386:0;vi ~/xyz.py | |
: 1714213413:0;python3 ~/xyz.py | |
: 1714218397:0;ulimit -n | |
: 1714218455:0;uname -v | |
: 1714218462:0;uname -r | |
: 1714218485:0;where openmax | |
: 1714219958:0;sl | |
: 1714219963:0;cd ~/ire | |
: 1714219970:0;git o pack_f16 | |
: 1714326695:0;echo $$ | |
: 1714326714:0;ls -l /proc/1614619/fd | |
: 1714381251:0;wall | |
: 1714381327:0;wall --help | |
: 1714386068:0;ctest . -j 32 | |
: 1714386624:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | |
: 1714386718:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir -split-input-file | FileCheck compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | |
: 1714388061:0;clang++ /tmp/x.cpp | |
: 1714388115:0;vi /tmp/x.cpp | |
: 1714388238:0;clang++ -march=native /tmp/x.cpp | |
: 1714388318:0;clang -march=native /tmp/x.cpp | |
: 1714399798:0;rm a.out | |
: 1714399826:0;cd ~/llvm-project | |
: 1714400519:0;mlir-opt -transform-interpreter ~/xyz.mlir -verify-each=0 | |
: 1714404128:0;eunm | |
: 1714469000:0;man pmap | |
: 1714469730:0;cd /usr/src | |
: 1714469738:0;cd linux-headers-6.5.0-18-generic | |
: 1714469746:0;cd lib/ | |
: 1714478186:0;wget https://github.com/iree-org/iree/files/15155944/batch_llama_3_8B.zip | |
: 1714489492:0;iree-compile --mlir-disable-threading --iree-opt-const-eval=false --compile-to=flow batch_llama_3_8B.mlir -o result_llama_3.mlir | |
: 1714489532:0;iree-compile --mlir-disable-threading --iree-opt-const-eval=false --compile-to=flow batch_llama_3_8B.mlir -o result_llama_3.mlir -mlir-print-ir-after-all 2> llama_err.mlir | |
: 1714489748:0;vi llama_err.mlir | |
: 1714490628:0;rm llama_err.mlir | |
: 1714490840:0;iree-compile -iree-input-type=flow --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false result_llama_3.mlir -o llama_3.vmfb | |
: 1714490855:0;iree-compile -iree-input-type=tm_tensor --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false result_llama_3.mlir -o llama_3.vmfb | |
: 1714490914:0;iree-compile -iree-input-type=torch --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false batch_llama_3_8B.mlir -o llama_3.vmfb | |
: 1714491028:0;iree-compile -iree-input-type=torch --iree-vm-bytecode-module-output-format=flatbuffer-binary --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false batch_llama_3_8B.mlir -o llama_3.vmfb | |
: 1714492729:0;mlir-opt ~/xyz.mlir --allow-unregistered-dialect | |
: 1714492741:0;mlir-opt ~/xyz.mlir --allow-unregistered-dialect -verify-each=0 | |
: 1714492956:0;iree-compile --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false ~/xyz.mlir -o llama_3.vmfb -mlir-print-ir-after-all | |
: 1714493268:0;unzip batch_llama_3_8B.zip | |
: 1714493275:0;mv batch_llama_3_8B.mlir burn_24 | |
: 1714493473:0;iree-compile --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false batch_llama_3_8B.mlir -o llama_3.vmfb | |
: 1714493521:0;iree-compile --mlir-disable-threading --iree-opt-const-eval=false --compile-to=flow batch_llama_3_8B.mlir -o result_llama_3.mlir | |
: 1714493537:0;iree-compile --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false result_llama_3.mlir -o llama_3.vmfb | |
: 1714493573:0;gist-paste batch_llama_3_8B.mlir | |
: 1714493718:0;iree-compile --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false result_llama_3.mlir -o llama_3.vmfb -mlir-print-ir-after-all 2> err.mlir | |
: 1714494477:0;vi err.mlir | |
: 1714496364:0;iree-opt ~/xyz.mlir | |
: 1714496450:0;gist-paste -f embedding_to_f16.mlir < ~/xyz.mlir | |
: 1714497424:0;iree-compile --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false ~/xyz.mlir -o llama_3.vmfb | |
: 1714497629:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714497728:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/x.vmfb ~/xyz.mlir | |
: 1714498902:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/x.vmfb ~/xyz.mlir -mlir-print-ir-after-all | |
: 1714498925:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o /tmp/x.vmfb ~/xyz.mlir -mlir-print-ir-after-all 2> full_ir.mlir | |
: 1714498934:0;vi full_ir.mlir | |
: 1714530302:0;cd llama_3 | |
: 1714530307:0;mkdir llama3 | |
: 1714530330:0;git o enable_llama3 | |
: 1714530440:0;# Clone and install editable SHARK-Turbine dep in deps/\ | |
pip install -f https://iree.dev/pip-release-links.html --src deps \\ | |
-e "git+https://github.com/nod-ai/SHARK-Turbine.git#egg=SHARK-Turbine&subdirectory=core"\ | |
\ | |
# Install editable local projects.\ | |
pip install -r requirements -e sharktank/ shortfin/ | |
: 1714530455:0;pip install -f https://iree.dev/pip-release-links.html --src deps \\ | |
-e "git+https://github.com/nod-ai/SHARK-Turbine.git#egg=SHARK-Turbine&subdirectory=core" | |
: 1714530488:0;pip install -r requirements -e sharktank/ shortfin/ | |
: 1714530693:0;git clone https://github.com/ggerganov/llama.cpp | |
: 1714530717:0;cmake -B build | |
: 1714530724:0;cmake --build build --config Release | |
: 1714530739:0;cmake --build build --config Release -j 32 | |
: 1714530797:0;pip install -U "huggingface_hub[cli]" | |
: 1714530806:0;huggingface-cli download --local-dir . NousResearch/Meta-Llama-3-8B | |
: 1714531977:0;cd ll | |
: 1714532646:0;pip install sentencepiece | |
: 1714532648:0;python ./llama.cpp/convert.py --outtype f16 --outfile Meta-Llama-3-8B-f16_3.gguf . --vocab-type bpe | |
: 1714532673:0;cd llama.cpp | |
: 1714532686:0;python convert.py --outtype f16 --outfile Meta-Llama-3-8B-f16_3.gguf . --vocab-type bpe | |
: 1714532760:0;cp Meta-Llama-3-8B-f16_3.gguf ../ | |
: 1714532840:0;pip install -f https://iree.dev/pip-release-links.html --src deps -e "git+https://github.com/iree-org/iree-turbine.git#egg=shark-turbine" | |
: 1714532901:0;python -m sharktank.sharktank.examples.export_paged_llm_v1 --gguf-file=Meta-Llama-3-8B-f16.gguf | |
: 1714532982:0;python -m sharktank.sharktank.sharktank.examples.export_paged_llm_v1 --gguf-file=Meta-Llama-3-8B-f16.gguf | |
: 1714532995:0;python -m sharktank.examples.export_paged_llm_v1 --gguf-file=Meta-Llama-3-8B-f16.gguf | |
: 1714533050:0;python -m sharktank.examples.export_paged_llm_v1 --gguf-file=/home/prashant/llama3/Meta-Llama-3-8B-f16.gguf | |
: 1714533179:0;tmux attach -t 5 | |
: 1714533375:0;/usr/bin/htop | |
: 1714533400:0;cd / | |
: 1714533429:0;sudo swapoff -a | |
: 1714533456:0;sudo dd if=/dev/zero of=/swapfile bs=1G count=32 | |
: 1714533499:0;sudo chmod 0600 /swapfile | |
: 1714533507:0;sudo mkswap /swapfile | |
: 1714533514:0;sudo swapon /swapfile | |
: 1714533516:0;top | |
: 1714533526:0;grep Swap /proc/meminfo | |
: 1714533538:0;vi /etc/fstab | |
: 1714533581:0;sudo vi /etc/fstab | |
: 1714533759:0;cd ops/templates | |
: 1714534030:0;vi /home/prashant/llama3/.venv/lib/python3.10/site-packages/sharktank/ops/templates/mmtfp_3d.mlir | |
: 1714534193:0;ls /tmp | |
: 1714534509:0;vi /home/prashant/llama3/.venv/lib/python3.10/site-packages/sharktank/examples/export_paged_llm_v1.py | |
: 1714534786:0;cd sharktank/sharktank/sharktank | |
: 1714534806:0;cd sharktank/ops | |
: 1714534810:0;cd templates | |
: 1714534820:0;vi __init__.py | |
: 1714534874:0;cp /home/prashant/llama3/sharktank/sharktank\ | |
: 1714534887:0;cd /home/prashant/llama3/sharktank/sharktank\ | |
: 1714534911:0;.. | |
: 1714535566:0;vi /home/prashant/llama3/.venv/lib/python3.10/site-packages/sharktank/ops/templates/mmtfp_3d.mlir | |
: 1714535824:0;vi ops | |
: 1714535893:0;rm -rf sharkta* | |
: 1714535903:0;pip install . | |
: 1714535914:0;cd /home/prashant/llama3/.venv/lib/python3.10/site-packages/sharktank/ | |
: 1714535917:0;cd ops | |
: 1714535944:0;vi paged_llm_v1.py | |
: 1714535974:0;cd ~/llama3/sharktank/sharktank | |
: 1714536325:0;cp -r * /home/prashant/llama3/.venv/lib/python3.10/site-packages/sharktank/ | |
: 1714536742:0;vi complex.mlir | |
: 1714536779:0;iree-opt --convert-torch-to-linalg complex.mlir | |
: 1714536838:0;git clone [email protected]:llvm/torch-mlir.git | |
: 1714539482:0;vi build_tools/build_standalone.sh | |
: 1714539527:0;build_tools/build_standalone.sh | |
: 1714540642:0;mv complex.mlir .. | |
: 1714540646:0;cd ../torch-mlir | |
: 1714540770:0;build/bin/torch-mlir-opt -convert-torch-to-linalg ~/complex.mlir | |
: 1714541564:0;torch-mlir-opt -convert-torch-to-linalg ~/complex.mlir | |
: 1714541618:0;torch-mlir-opt --help | fzf | |
: 1714542073:0;clang-format -i lib/Conversion/TorchToLinalg/Uncategorized.cpp | |
: 1714542107:0;clang-format -i lib/Conversion/Utils/Utils.cpp | |
: 1714542174:0;torch-mlir-opt -torch-backend-to-linalg-on-tensors-backend-pipeline ~/complex.mlir | |
: 1714542716:0;pip install torchvision | |
: 1714542746:0;pip install -r torchvision-requirements.txt | |
: 1714542757:0;cd projects/pt1 | |
: 1714542760:0;python -m e2e_testing.main -f 'AtenComplex' | |
: 1714542788:0;python -m e2e_testing.main -f 'ElementWiseMul' | |
: 1714542801:0;python -m e2e_testing.main -f 'ElementwiseMul' | |
: 1714542943:0;vi /tmp/ElementwiseMulTensorComplexDiffModule.mlir | |
: 1714543152:0;python -m e2e_testing.main -f 'ElementwiseMul' -v | |
: 1714543514:0;git ob complex_cast | |
: 1714543712:0;cd lib | |
: 1714543719:0;vi whl-requirements.txt | |
: 1714543724:0;vi build-requirements.txt | |
: 1714543791:0;pip install black=24.4.2 | |
: 1714543796:0;pip install black==24.4.2 | |
: 1714543805:0;black projects/pt1/python/torch_mlir_e2e_test/test_suite/elementwise.py | |
: 1714545557:0;cd _python_build | |
: 1714545879:0;vi /tmp/batch_llama_v1.mlir | |
: 1714545914:0;ls -l /tmp/batch_llama_v1.mlir | |
: 1714545921:0;ls -lh /tmp/batch_llama_v1.mlir | |
: 1714545961:0;mv /tmp/batch_llama_v1.mlir ~/burn_24 | |
: 1714545970:0;cd ~/burn_24 | |
: 1714546128:0;vi batch_llama_3_8B.mlir | |
: 1714546223:0;iree-compile --mlir-disable-threading --iree-opt-const-eval=false --compile-to=flow batch_llama_v1.mlir -o result_llama_3.mlir | |
: 1714546253:0;iree-compile -iree-input-type=torch --mlir-disable-threading --iree-opt-const-eval=false --compile-to=flow batch_llama_v1.mlir -o result_llama_3.mlir | |
: 1714546311:0;torch-mlir-opt --convert-torch-to-linalg batch_llama_v1.mlir | |
: 1714546364:0;iree-compile -iree-input-type=torch --mlir-disable-threading --iree-opt-const-eval=false --compile-to=flow batch_llama_v1.mlir -o result_llama_3.mlir -mlir-print-ir-after-all 2> xyz.mlir | |
: 1714546444:0;iree-compile -iree-input-type=torch --mlir-disable-threading --iree-opt-const-eval=false --compile-to=flow batch_llama_v1.mlir -o result_llama_3.mlir -mlir-print-ir-after-failure 2> xyz.mlir | |
: 1714546463:0;iree-compile -iree-input-type=torch --mlir-disable-threading --iree-opt-const-eval=false --compile-to=flow batch_llama_v1.mlir -o result_llama_3.mlir -mlir-print-ir-after-failure | |
: 1714546659:0;iree-compile -iree-input-type=torch --mlir-disable-threading --iree-opt-const-eval=false --compile-to=flow batch_llama_v1.mlir -o result_llama_3.mlir | |
: 1714546683:0;iree-compile -iree-input-type=torch --iree-opt-const-eval=false --compile-to=flow batch_llama_v1.mlir -o result_llama_3.mlir | |
: 1714546743:0;iree-compile --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false result_llama_3.mlir -o llama_3.vmfb | |
: 1714546866:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host result_llama_3.mlir -o llama3.vmfb | |
: 1714546887:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host result_llama_3.mlir -o llama3.vmfb | |
: 1714547412:0;iree-compile --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false batch_llama_v1.mlir -o llama_3.vmfb | |
: 1714547545:0;iree-compile --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false batch_llama_v1.mlir -o llama_3.vmfb -mlir-print-ir-before-failure | |
: 1714547550:0;iree-compile --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false batch_llama_v1.mlir -o llama_3.vmfb -mlir-print-ir-after-failure | |
: 1714547583:0;iree-compile --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false batch_llama_v1.mlir -o llama_3.vmfb -mlir-print-ir-after-all 2> xyz.mlir | |
: 1714547765:0;rm batch_llama_3_8B.zip | |
: 1714547958:0;rm xyz.mlir | |
: 1714548570:0;iree-compile --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false test.mlir -o llama_3.vmfb | |
: 1714548620:0;iree-compile iree-input-type=torch --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false test.mlir -o llama_3.vmfb | |
: 1714548625:0;iree-compile -iree-input-type=torch --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false test.mlir -o llama_3.vmfb | |
: 1714548660:0;iree-compile -iree-input-type=torch --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false test.mlir -o llama_3.vmfb -mlir-print-ir-after-all 2> xyz.mlir | |
: 1714548761:0;iree-compile -iree-input-type=torch --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false test.mlir -o llama_3.vmfb -mlir-print-ir-after-all -mlir-disable-threading 2> xyz.mlir | |
: 1714548948:0;iree-compile -iree-input-type=torch --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false test.mlir -o llama_3.vmfb -mlir-disable-threading | |
: 1714548984:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host test.mlir -o llama3.vmfb | |
: 1714549001:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host batch_llama_v1.mlir -o llama3.vmfb | |
: 1714549036:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host batch_llama_v1.mlir -o llama3.vmfb -mlir-print-ir-after-all 2> xyz.mlir | |
: 1714549065:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host complex.mlir -o llama3.vmfb | |
: 1714549071:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/complex.mlir -o llama3.vmfb | |
: 1714549086:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/complex.mlir -o llama3.vmfb -mlir-print-ir-after-all | |
: 1714549103:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/complex.mlir -o llama3.vmfb -mlir-print-ir-after-all -mlir-disable-threading | |
: 1714549645:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/complex.mlir -o llama3.vmfb | |
: 1714549730:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host batch_llama_v1.mlir -o llama3.vmfb | |
: 1714549788:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host batch_llama_v1.mlir -o llama3.vmfb -mlir-disable-threading 2> xyz.mlir > xyz.mlir | |
: 1714549841:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMCPU/KernelDispatch.cpp | |
: 1714549949:0;git ob dtype_fix | |
: 1714550158:0;cat ~/complex.mlir | |
: 1714550792:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host batch_llama_v1.mlir -o llama3.vmfb | |
: 1714550832:0;vi ~/complex.mlir | |
: 1714550877:0;vi result_llama_3.mlir | |
: 1714552058:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/xyz.mlir -mlir-print-ir-after-all 2> fail.mlir | |
: 1714552068:0;vi fail.mlir | |
: 1714552359:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host batch_llama_v1.mlir -iree-input-demote-i64-to-i32 -o llama3.vmfb 2> xyz.mlir > xyz.mlir | |
: 1714552387:0;vi batch_llama_ | |
: 1714552711:0;cd llama3 | |
: 1714552720:0;python -m sharktank.examples.export_paged_llm_v1 --gguf-file=/home/prashant/llama3/Meta-Llama-3-8B-f16_3.gguf | |
: 1714552869:0;cp /tmp/batch_llama_v1.mlir ~/burn_24/llama_dont.mlir | |
: 1714552877:0;vi llama_dont.mlir | |
: 1714553049:0;cp llama_dont.mlir batch_llama_v1.mlir | |
: 1714553058:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host batch_llama_v1.mlir -iree-input-demote-i64-to-i32 -o llama3.vmfb | |
: 1714553108:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/xyz.mlir | |
: 1714553152:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/xyz.mlir -iree-demote-i64-to-32 | |
: 1714553158:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/xyz.mlir -iree-opt-demote-i64-to-32 | |
: 1714553168:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/xyz.mlir -iree-opt-demote-i64-to-i32 | |
: 1714553195:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host batch_llama_v1.mlir -iree-input-demote-i64-to-i32 -o llama3.vmfb >xyz.mlir 2> xyz.mlir | |
: 1714553448:0;git lfs track batch_llama_v1.mlir | |
: 1714553461:0;rm -rf .git | |
: 1714553502:0;gist-paste batch_llama_v1.mlir | |
: 1714553714:0;huggingface-cli upload batch_llama_v1.mlir prashantk/test_files | |
: 1714553788:0;huggingface-cli login | |
: 1714553844:0;huggingface-cli upload prashantk/test_files batch_llama_v1.mlir | |
: 1714554001:0;wget https://huggingface.co/prashantk/test_files/resolve/main/batch_llama_v1.mlir\?download\=true | |
: 1714554179:0;huggingface-cli upload prashantk/test_files batch_llama_v1.mlir . | |
: 1714554184:0;source ~/llama3/.venv/bin/activate | |
: 1714554212:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host batch_llama_v1.mlir -iree-opt-demote-i64-to-i32 -o llama3.vmfb | |
: 1714554252:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host batch_llama_v1.mlir -iree-opt-demote-i64-to-i32 -o llama3.vmfb | |
: 1714554387:0;/home/prashant/iree-build/tools/iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -mlir-disable-threading batch_llama_v1.mlir -iree-opt-demote-i64-to-i32 -o llama3.vmfb | |
: 1714554439:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -mlir-disable-threading batch_llama_v1.mlir -iree-opt-demote-i64-to-i32 -o llama3.vmfb | |
: 1714554740:0;iree-compile -iree-input-type=torch --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false llama_dont.mlir -o llama_3.vmfb \ | |
/home/prashant/iree-build/tools/iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -mlir-disable-threading batch_llama_v1.mlir -iree-opt-demote-i64-to-i32 -o llama3.vmfb | |
: 1714554788:0;/home/prashant/iree-build/tools/iree-compile -iree-input-type=torch --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false -iree-opt-demote-i64-to-i32 --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-global-opt-propagate-transposes=true --iree-opt-const-eval=false llama_dont.mlir -o llama_3.vmfb | |
: 1714554811:0;/home/prashant/iree-build/tools/iree-compile -iree-input-type=torch --iree-vm-bytecode-module-output-format=flatbuffer-binary --iree-hal-target-backends=rocm --mlir-print-debuginfo --mlir-print-op-on-diagnostic=false -iree-opt-demote-i64-to-i32 --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx940 --iree-opt-const-eval=false llama_dont.mlir -o llama_3.vmfb | |
: 1714645246:0;env | |
: 1714645295:0;where export\ | |
: 1714651153:0;mlir-opt -transform-interpreter ~/xyz.mlir | mlir/utils/generate-test-checks.py | |
: 1714651321:0;mlir-opt -transform-interpreter ~/xyz.mlir | |
: 1714651661:0;bmbm | |
: 1714651704:0;mlir-opt -transform-interpreter mlir/test/Dialect/Linalg/vectorization.mlir -split-input-file | FileCheck mlir/test/Dialect/Linalg/vectorization.mlir | |
: 1714653972:0;git ob type_cast | |
: 1714658816:0;build_tools/update_torch_ods.sh | |
: 1714659293:0;build/bin/torch-mlir-opt ~/xyz.mlir | |
: 1714659963:0;clang-format lib/Dialect/Torch/IR/TorchOps.cpp | |
: 1714660335:0;build/bin/torch-mlir-opt -canonicalize ~/xyz.mlir | |
: 1714660376:0;build/bin/torch-mlir-opt -canonicalize -dce ~/xyz.mlir | |
: 1714661476:0;build/bin/torch-mlir-opt -canonicalize -cse ~/xyz.mlir | |
: 1714661485:0;build/bin/torch-mlir-opt -canonicalize -cse -cse ~/xyz.mlir | |
: 1714661493:0;build/bin/torch-mlir-opt -canonicalize -cse -canonicalize ~/xyz.mlir | |
: 1714661497:0;build/bin/torch-mlir-opt -canonicalize -cse -dce ~/xyz.mlir | |
: 1714661579:0;build/bin/torch-mlir-opt -canonicalize -convert-torch-to-linalg -cse -symbol-dce ~/xyz.mlir | |
: 1714661615:0;torch-mlir-opt --torch-backend-to-linalg-on-tensors-backend-pipeline -allow-unregistered-dialect ~/xyz.mlir | |
: 1714661620:0;build/bin/torch-mlir-opt --torch-backend-to-linalg-on-tensors-backend-pipeline -allow-unregistered-dialect ~/xyz.mlir | |
: 1714661634:0;build/bin/torch-mlir-opt --torch-backend-to-linalg-on-tensors-backend-pipeline ~/xyz.mlir | |
: 1714661656:0;build/bin/torch-mlir-opt -torch-to-linalg --torch-backend-to-linalg-on-tensors-backend-pipeline ~/xyz.mlir | |
: 1714661663:0;build/bin/torch-mlir-opt -convert-torch-to-linalg --torch-backend-to-linalg-on-tensors-backend-pipeline ~/xyz.mlir | |
: 1714661678:0;build/bin/torch-mlir-opt -convert-torch-to-linalg ~/xyz.mlir | |
: 1714661705:0;build/bin/torch-mlir-opt -canonicalize -convert-torch-to-linalg ~/xyz.mlir | |
: 1714661715:0;build/bin/torch-mlir-opt -canonicalize -convert-torch-to-linalg -canonicalize -cse ~/xyz.mlir | |
: 1714661764:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/xyz.mlir -iree-input-demote-i64-to-i32 | |
: 1714661935:0;build/bin/torch-mlir-opt --torch-backend-to-linalg-on-tensors-backend-pipeline -mlir-print-ir-after-all ~/xyz.mlir | |
: 1714662070:0;build/bin/torch-mlir-opt -canonicalize -cse -symbol-dce ~/xyz.mlir | |
: 1714662099:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/new.mlir -iree-input-demote-i64-to-i32 | |
: 1714662111:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/new.mlir -iree-input-demote-i64-to-i32 -mlir-print-ir-after-all | |
: 1714662184:0;build/bin/torch-mlir-opt -canonicalize -cse -symbol-dce ~/xyz.mlir | |
: 1714662263:0;build/bin/torch-mlir-opt -canonicalize -cse -symbol-dce ~/xyz.mlir > ~/new.mlir | |
: 1714662276:0;iree-compile -iree-input-type=torch --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/new.mlir -iree-input-demote-i64-to-i32 -mlir-print-ir-after-all 2> kk.mlir | |
: 1714662401:0;rm kk.mlir | |
: 1714662714:0;build/bin/torch-mlir -canonicalize ~/xyz.mlir | ~/llvm-project/mlir/utils/generate-test-checks.py | |
: 1714662735:0;build/bin/torch-mlir-opt -canonicalize ~/xyz.mlir | ~/llvm-project/mlir/utils/generate-test-checks.py | |
: 1714663604:0;black projects/pt1/python/torch_mlir/jit_ir_importer/build_tools/torch_ods_gen.py | |
: 1714737451:0;git o poly_acos | |
: 1714738855:0;clang-format -i mlir/include/mlir/Dialect/llvm-project/mlir/lib/Dialect/Math/Transforms/PolynomialApproximation.cpp | |
: 1714738875:0;clang-format -i mlir/lib/Dialect/Math/Transforms/PolynomialApproximation.cpp | |
: 1714747186:0;psrset | |
: 1714747658:0;git o unpack_nosize | |
: 1714750656:0;clang-format -i mlir/lib/Dialect/Linalg/Transforms/Vectorization.cpp | |
: 1714796039:0;cd pashu_home | |
: 1714796043:0;rm -rf pashu_home | |
: 1714796216:0;python3 | |
: 1714837345:0;tmux kill-server | |
: 1714837381:0;git clone https://github.com/PeterTh/uibk_cpp | |
: 1714837403:0;mv uibk_cpp advance_cpp | |
: 1714837545:0;cd 01_values | |
: 1714837554:0;g++ 01_06_advanced_string.cpp | |
: 1714837570:0;g++ -O1 01_06_advanced_string.cpp | |
: 1714837633:0;clang++ -O1 01_06_advanced_string.cpp | |
: 1714837717:0;clang++ -std=c++11 -O1 01_06_advanced_string.cpp | |
: 1714837730:0;clang++ -std=gnu++11 -O1 01_06_advanced_string.cpp | |
: 1714837776:0;clang++ -std=gnu++98 -O1 01_06_advanced_string.cpp | |
: 1714838356:0;clang++ -O3 01_06_advanced_string.cpp | |
: 1714838463:0;clang++ -O3 01_07_advanced_string_move.cpp | |
: 1714838473:0;clang++ -O1 01_07_advanced_string_move.cpp | |
: 1714844994:0;cd 02_classes_and_interfaces | |
: 1714845035:0;g++ 02_01_basic_interfaces.cpp | |
: 1714845579:0;g++ 02_02_function_size.cpp | |
: 1714845812:0;cc | |
: 1714845817:0;where cc | |
: 1714845822:0;cc -version | |
: 1714845826:0;cc --version | |
: 1714845836:0;cc 02_01_basic_interfaces.cpp | |
: 1714904433:0;g++ 02_04_return_smart_pointers.cpp | |
: 1714904664:0;g++ -g 02_04_return_smart_pointers.cpp | |
: 1714904686:0;g++ -g -O1 02_04_return_smart_pointers.cpp | |
: 1714904697:0;g++ -G -O1 02_04_return_smart_pointers.cpp | |
: 1714904704:0;g++ --help | fzf | |
: 1715004198:0;cp ~/.zshrc ~/.zsh_history . | |
: 1715004206:0;git init | |
: 1715095007:0;cd 03_lambdas_and_algorithms | |
: 1715095038:0;cd ../03_lambdas_and_algorithms | |
: 1715095104:0;g++ 03_01_containers_sequence.cpp | |
: 1715136531:0;cd third_party | |
: 1715136610:0;git remote add pashu [email protected]:pashu123/torch-mlir.git | |
: 1715136654:0;git cp 22465ee | |
: 1715137367:0;wget https://sharkpublic.blob.core.windows.net/sharkpublic/scotttodd/issue_reports/open_llama_3b_v2_f16.mlir | |
: 1715137398:0;iree-compile open_llama_3b_v2_f16.mlir --iree-hal-target-backends=llvm-cpu -o /tmp/open_llama_3b_v2_f16_cpu.vmfb | |
: 1715137472:0;iree-compile open_llama_3b_v2_f16.mlir --iree-hal-target-backends=llvm-cpu -o /tmp/open_llama_3b_v2_f16_cpu.vmfb -iree-opt-demote-i64-to-i32 | |
: 1715137651:0;iree-compile open_llama_3b_v2_f16.mlir --iree-hal-target-backends=vulkan-spirv -o /tmp/open_llama_3b_v2_f16_vulkan.vmfb -iree-opt-demote-i64-to-i32 | |
: 1715137990:0;iree-compile llama_dont.mlir --iree-hal-target-backends=vulkan-spirv -o /tmp/open_llama_3b_v2_f16_vulkan.vmfb | |
: 1715138033:0;vi batch_llama_v1.mlir | |
: 1715138063:0;iree-compile batch_llama_v1.mlir --iree-hal-target-backends=vulkan-spirv -o /tmp/open_llama_3b_v2_f16_vulkan.vmfb | |
: 1715138279:0;iree-compile llama_dont.mlir --iree-hal-target-backends=vulkan-spirv -o /tmp/open_llama_3b_v2_f16_vulkan.vmfb -iree-opt-demote-i64-to-i32 | |
: 1715143283:0;iree-compile open_llama_3b_v2_f16.mlir --iree-hal-target-backends=llvm-cpu -o /tmp/open_llama_3b_v2_f16_cpu.vmfb -mlir-print-ir-after-all 2> xyz.mlir | |
: 1715143676:0;iree-compile open_llama_3b_v2_f16.mlir --iree-hal-target-backends=llvm-cpu -o /tmp/open_llama_3b_v2_f16_cpu.vmfb > xyz.mlir | |
: 1715143694:0;iree-compile open_llama_3b_v2_f16.mlir --iree-hal-target-backends=llvm-cpu -o /tmp/open_llama_3b_v2_f16_cpu.vmfb 2> xyz.mlir | |
: 1715143932:0;vi open_llama_3b_v2_f16.mlir | |
: 1715145051:0;iree-compile ~/xyz.mlir --iree-hal-target-backends=llvm-cpu -o /tmp/open_llama_3b_v2_f16_cpu.vmfb | |
: 1715145076:0;cat ~/xyz.mlir | |
: 1715145088:0;torch-mlir-opt ~/xyz.mlir | |
: 1715148603:0;iree-compile ~/xyz.mlir --iree-hal-target-backends=llvm-cpu -o /tmp/open_llama_3b_v2_f16_cpu.vmfb -mlir-print-ir-after-all 2> xyz.mlir | |
: 1715148635:0;gist-paste xyz.mlir | |
: 1715262085:0;cd prashant/torch-mlir | |
: 1715266823:0;build/bin/torch-mlir-opt -canonicalize ~/xyz.mlir | |
: 1715272100:0;mkdir tresleches | |
: 1715272114:0;mv splat_tresleches.irpa tresleches.mlir tresleches | |
: 1715272175:0;iree-compile ~/tresleches.mlir --iree-hal-target-backends=llvm-cpu -o tres.vmfb | |
: 1715272184:0;iree-compile tresleches.mlir --iree-hal-target-backends=llvm-cpu -o tres.vmfb | |
: 1715272217:0;vi tresleches.mlir | |
: 1715272472:0;./tools/iree-compile --mlir-elide-elementsattrs-if-larger=2 --iree-hal-target-backends=llvm-cpu tresleches.mlir --iree-hal-dump-executable-sources-to=../dispatches_no_dtile2 --iree-opt-data-tiling=0 -o tresleches.vmfb | |
: 1715272500:0;./tools/iree-compile --mlir-elide-elementsattrs-if-larger=2 --iree-hal-target-backends=llvm-cpu tresleches.mlir -o tresleches.vmfb | |
: 1715272508:0;iree-compile --mlir-elide-elementsattrs-if-larger=2 --iree-hal-target-backends=llvm-cpu tresleches.mlir -o tresleches.vmfb | |
: 1715272797:0;c d.. | |
: 1715272799:0;cd ../tr | |
: 1715272803:0;cd ../tresleches | |
: 1715272834:0;git fetch | |
: 1715272838:0;git cp 8580114 | |
: 1715272892:0;git fetch all | |
: 1715272923:0;git remote add torch [email protected]:llvm/torch-mlir.git | |
: 1715272925:0;git fetch torch | |
: 1715272935:0;git cp 85801144cab0f405693ff99b685bbf9b23351df4 | |
: 1715273027:0;iree-compile -iree-input-type=torch --mlir-elide-elementsattrs-if-larger=2 --iree-hal-target-backends=llvm-cpu tresleches.mlir -o tresleches.vmfb | |
: 1715273315:0;iree-benchmark-module --device=local-task --module=tresleches.vmfb --parameters=model=splat_tresleches.irpa --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x16x128x128xf32=1 --input=1x16x128x128xf32=1 -input=3x1024x1024=1 | |
: 1715273924:0;mv sd3.tracy tresleches.tracy | |
: 1715274286:0;tracy --help | |
: 1715274656:0;mv ../1_step_tresleches.mlir . | |
: 1715274665:0;iree-compile -iree-input-type=torch --mlir-elide-elementsattrs-if-larger=2 --iree-hal-target-backends=llvm-cpu 1_step_tresleches.mlir -o tresleches.vmfb | |
: 1715274854:0;TRACY_NO_EXIT=1 iree-benchmark-module --device=local-task --module=tresleches.vmfb --parameters=model=splat_tresleches.irpa --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x16x128x128xf32=1 --input=1x16x128x128xf32=1 -input=3x1024x1024=1 | |
: 1715274948:0;iree-run-module --device=local-task --module=tresleches.vmfb --parameters=model=splat_tresleches.irpa --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x16x128x128xf32=1 --input=1x16x128x128xf32=1 -input=3x1024x1024=1 | |
: 1715276119:0;cd tr | |
: 1715276133:0;iree-tracy-capture -o ~/sd3.tracy | |
: 1715278736:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-quantized-matmul-reassociation=true \\ | |
tresleches.mlir -o tresleches.vmfb | |
: 1715278822:0;iree-tracy-capture -o ~/tresleches_ukernel.tracy | |
: 1715278824:0;TRACY_NO_EXIT=1 iree-benchmark-module --device=local-task --module=tresleches.vmfb --parameters=model=splat_tresleches.irpa --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x16x128x128xf32=1 --input=1x16x128x128xf32=1 -input=3x1024x1024=1 --function=main | |
: 1715283872:0;tmux attach -t 7 | |
: 1715283898:0;tmux attach -t 6 | |
: 1715603002:0;cd prashant/iree | |
: 1715603107:0;git ob pack_decomp | |
: 1715606084:0;git cp e936ee64c3e65027b2cb3f222df6cfb73a370f5c | |
: 1715607512:0;cd tests/e2e/matmul | |
: 1715607535:0;cd convolution | |
: 1715607537:0;ctest . -j 64 | |
: 1715607600:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-quantized-matmul-reassociation=true \\ | |
1_step_tresleches.mlir -o tresleches.vmfb | |
: 1715608370:0;2vi | |
: 1715618551:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
1_step_tresleches.mlir -o tresleches.vmfb | |
: 1715620300:0;iree-benchmark-module --device=local-task --module=tresleches.vmfb --parameters=model=splat_tresleches.irpa --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x16x128x128xf32=1 --input=1x16x128x128xf32=1 -input=3x1024x1024=1 --function=main | |
: 1715622053:0;iree-benchmark-module --device=local-task --module=tresleches.vmfb --parameters=model=splat_tresleches.irpa --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x16x128x128xf32=1 --input=1x16x128x128xf32=1 -input=3x1024x1024=1 --function=main --task_topology_group_count=8 | |
: 1715623836:0;iree-benchmark-module --device=local-task --module=tresleches.vmfb --parameters=model=splat_tresleches.irpa --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x77x4096xf32=1 --input=1x2048xf32=1 --input=1x16x128x128xf32=1 --input=1x16x128x128xf32=1 -input=3x1024x1024=1 --function=main --task_topology_group_count=32 | |
: 1715662893:0;iree-dump-module splat_tresleches.irpa | |
: 1715662902:0;iree-dump-module 1_step_tresleches.mlir | |
: 1715662916:0;iree-dump-module --help | fzf | |
: 1715662943:0;iree-dump-module tresleches.vmfb | |
: 1715663615:0;pythonc convert_param_dtype.py --mlir-file="1_step_tresleches.mlir" | |
: 1715663618:0;python convert_param_dtype.py --mlir-file="1_step_tresleches.mlir" | |
: 1715663654:0;python convert_param_dtype.py --mlir-file="1_step_tresleches.mlir" --convert_param_dtype = bf16 --irpa_file=bf16_tresleches.irpa | |
: 1715663671:0;python convert_param_dtype.py --mlir-file="1_step_tresleches.mlir" --convert_param_dtype=bf16 --irpa_file=bf16_tresleches.irpa | |
: 1715663704:0;python convert_param_dtype.py --mlir-file="1_step_tresleches.mlir" --required-dtype=bf16 --irpa-file=bf16_tresleches.irpa | |
: 1715663734:0;python convert_param_dtype.py --mlir-file="1_step_tresleches.mlir" --required-dtype=bf16 --irpa-file=bf16_tresleches.irpa -h | |
: 1715663749:0;python convert_param_dtype.py --mlir-file="1_step_tresleches.mlir" --required-dtype=bf16 --irpa-file=bf16_tresleches.irpa | |
: 1715663770:0;python convert_param_dtype.py -mlir-file="1_step_tresleches.mlir" --required-dtype=bf16 --irpa-file=bf16_tresleches.irpa | |
: 1715663828:0;python convert_param_dtype.py --mlir-file="1_step_tresleches.mlir" --required-dtype="bf16" --irpa-file="bf16_tresleches.irpa" | |
: 1715663861:0;python --mlir-file="1_step_tresleches.mlir" convert_param_dtype.py | |
: 1715663883:0;python convert_param_dtype.py --mlir-file="1_step_tresleches.mlir" | |
: 1715663901:0;python convert_param_dtype.py mlir-file="1_step_tresleches.mlir" | |
: 1715663940:0;python convert_param_dtype.py mlir_file="1_step_tresleches.mlir" | |
: 1715663965:0;python convert_param_dtype.py "1_step_tresleches.mlir" | |
: 1715665925:0;python convert_param_dtype.py "1_step_tresleches.mlir" "bf16" "bf16_tresleches.irpa" | |
: 1715665954:0;vi bf16_tresleches.irpa | |
: 1715666067:0;vi convert_param_dtype.py | |
: 1715666229:0;vi splat_tresleches.irpa | |
: 1715666359:0;mv ../1_step_tresleches_bf16_b.mlir . | |
: 1715666381:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
1_step_tresleches_bf16_b.mlir -o tresleches.vmfb | |
: 1715666473:0;iree-benchmark-module --device=local-task --module=tresleches.vmfb --parameters=model=bf16_tresleches.irpa --input=1x77x4096xbf16=1 --input=1x2048xbf16=1 --input=1x77x4096xbf16=1 --input=1x2048xbf16=1 --input=1x16x128x128xbf16=1 --input=1x16x128x128xbf16=1 -input=3x1024x1024=1 --function=main --task_topology_group_count=32 | |
: 1715666562:0;iree-benchmark-module --device=local-task --module=tresleches.vmfb --parameters=model=bf16_tresleches.irpa --input=1x154x4096xbf16=1 --input=1x2048xbf16=1 --input=1x154x4096xbf16=1 --input=1x2048xbf16=1 --input=1x16x128x128xbf16=1 --input=1x16x128x128xbf16=1 -input=3x1024x1024=1 --function=main --task_topology_group_count=32 | |
: 1715666768:0;gist-paste convert_param_dtype.py | |
: 1715667627:0;iree-tracy-capture -o ~/tresleches_bf16.tracy | |
: 1715667629:0;TRACY_NO_EXIT=1 iree-benchmark-module --device=local-task --module=tresleches.vmfb --parameters=model=bf16_tresleches.irpa --input=1x154x4096xbf16=1 --input=1x2048xbf16=1 --input=1x154x4096xbf16=1 --input=1x2048xbf16=1 --input=1x16x128x128xbf16=1 --input=1x16x128x128xbf16=1 -input=3x1024x1024=1 --function=main --task_topology_group_count=32 | |
: 1715671131:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
1_step_tresleches_bf16_b.mlir -o tresleches.vmfb | |
: 1715695283:0;cat ~/test.mlir | |
: 1715695317:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))' --split-input-file ~/test.mlir | |
: 1715695406:0;vi ~/out.mlir | |
: 1715695613:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))' --split-input-file ~/test.mlir > ~/out.mlir | |
: 1715696422:0;cat /proc/cpuinfo | less | |
: 1715696845:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))' --split-input-file ~/test.mlir | FileCheck ~/test.mlir | |
: 1715699902:0;pidstat | |
: 1715699907:0;sudo apt-get install pidstat | |
: 1715699918:0;sudo apt-get install tuna | |
: 1715699926:0;tuna | |
: 1715699937:0;tuna -t | |
: 1715699943:0;tuna -t 7081 | |
: 1715699952:0;tuna -t iree-compile | |
: 1715699956:0;tuna -t iree-compile -P | |
: 1715699963:0;tuna -P | |
: 1715700109:0;vmstat | |
: 1715700121:0;vmstat -w l | |
: 1715700129:0;vmstat -w 1 | |
: 1715706686:0;mv ../tresleches_vae_bf16.mlir . | |
: 1715706714:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
tresleches_vae_bf16.mlir -o vae.vmfb | |
: 1715706791:0;iree-benchmark-module --device=local-task --module=vae.vmfb --parameters=model=bf16_tresleches.irpa --input=1x16x128x128xbf16=1 --function=main | |
: 1715706899:0;iree-benchmark-module --device=local-task --module=vae.vmfb --parameters=model=bf16_tresleches.irpa --input=1x16x128x128xbf16=1 --function=main --benchmark_repetitions=5 | |
: 1715708776:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-flow-enable-conv-img2col-transform \\ | |
tresleches_vae_bf16.mlir -o vae.vmfb | |
: 1715709002:0;iree-compile \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-preprocessing-convert-conv2d-to-img2col \\ | |
tresleches_vae_bf16.mlir -o vae.vmfb | |
: 1715709188:0;iree-compile \\ | |
--iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-preprocessing-convert-conv2d-to-img2col))" \\ | |
--iree-opt-const-eval=false \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-stream-resource-index-bits=64 \\ | |
--iree-vm-target-index-bits=64 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
tresleches_vae_bf16.mlir -o vae.vmfb | |
: 1715709244:0;iree-tracy-capture -o ~/vae_bf16.tracy | |
: 1715709295:0;TRACY_NO_EXIT=1 iree-benchmark-module --device=local-task --module=vae.vmfb --parameters=model=bf16_tresleches.irpa --input=1x16x128x128xbf16=1 --function=main | |
: 1715709297:0;iree-tracy-capture -o ~/vae_bf16.tracy -f | |
: 1715709473:0;iree-compile \\ | |
--iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-preprocessing-convert-conv2d-to-img2col))" \\ | |
--iree-opt-const-eval=true \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
tresleches_vae_bf16.mlir -o vae.vmfb | |
: 1715715373:0;cd advance_cpp | |
: 1715715391:0;cd 04_templates | |
: 1715715470:0;g++ 04_03_template_parameter_packs.cpp | |
: 1715716877:0;g++ 04_05_class_template_basics.cpp | |
: 1715784094:0;mv ../tresleches_vae_f32_b.mlir . | |
: 1715784165:0;iree-benchmark-module --device=local-task --module=vae.vmfb --input=1x16x128x128xbf16=1 --function=main | |
: 1715784323:0;iree-compile \\ | |
--iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-preprocessing-convert-conv2d-to-img2col))" \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
tresleches_vae_f32_b.mlir -o vae.vmfb\ | |
: 1715784377:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
tresleches_vae_f32_b.mlir -o vae.vmfb\ | |
: 1715784600:0;iree-tracy-capture -o ~/vae_f32_demote_bf16.tracy | |
: 1715784839:0;iree-tracy-capture -o ~/vae_f32_demote_bf16_img2col.tracy -f | |
: 1715785265:0;git ob just_fun | |
: 1715785441:0;iree-benchmark-module --device=local-task --module=vae.vmfb --input=1x16x128x128xf32=1 --function=main --benchmark_repetitions=5 | |
: 1715785768:0;git o pack_decomp | |
: 1715785842:0;iree-compile \\ | |
--iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-preprocessing-convert-conv2d-to-img2col))" \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 \\ | |
tresleches_vae_f32_b.mlir -o vae.vmfb\ | |
: 1715788243:0;vi tresleches_vae_f32_b.mlir | |
: 1715788266:0;nvim tresleches_vae_f32_b.mlir | |
: 1715788285:0;vim tresleches_vae_f32_b.mlir | |
: 1715792473:0;TRACY_NO_EXIT=1 iree-benchmark-module --device=local-sync --module=vae.vmfb --input=1x16x128x128xf32=1 --function=main | |
: 1715792505:0;sudo reboot | |
: 1715792929:0;TRACY_NO_EXIT=1 iree-benchmark-module --device=local-task --module=vae.vmfb --input=1x16x128x128xf32=1 --function=main | |
: 1715792932:0;iree-tracy-capture -o ~/vae_f32_demote_bf16.tracy -f | |
: 1715793754:0;iree-compile \\ | |
--iree-opt-data-tiling \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 \\ | |
tresleches_vae_f32_b.mlir -o vae.vmfb\ | |
: 1715794094:0;rm -rf new.vmfb | |
: 1715794109:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 \\ | |
tresleches_vae_f32_b.mlir -o new.vmfb\ | |
: 1715794227:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 \\ | |
tresleches_vae_f32_b.mlir -o new.vmfb -mlir-print-ir-after-all 2> xyz.txt\ | |
: 1715794817:0;vi tresleches_vae_f32_b.mlir ~/new.txt | |
: 1715795025:0;0 | |
: 1715795189:0;iree-opt --iree-global-opt-demote-contraction-inputs-to-bf16 ~/new.txt -mlir-print-ir-after-all | |
: 1715795204:0;iree-opt --iree-global-opt-demote-contraction-inputs-to-bf16 ~/new.txt -mlir-print-ir-after-all > xyz.txt | |
: 1715795564:0;iree-opt xyz.txt | |
: 1715795895:0;iree-opt --iree-global-opt-demote-contraction-inputs-to-bf16 ~/new.txt -mlir-print-ir-after-all 2> xyz.txt | |
: 1715795910:0;iree-opt --iree-global-opt-demote-contraction-inputs-to-bf16 ~/new.txt | |
: 1715796355:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 \\ | |
tresleches_vae_f32_b.mlir -o vae.vmfb | |
: 1715796409:0;git o just_fun | |
: 1715796543:0;vi ~/new.txt | |
: 1715796878:0;rm ~/new.txt | |
: 1715796916:0;iree-opt --iree-global-opt-demote-contraction-inputs-to-bf16 ~/xyz.mlir | |
: 1715797030:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16 ~/xyz.mlir | ~/llvm-project/mlir/utils/generate-test-checks.py | |
: 1715797443:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16 compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1715889315:0;mkdir kernel | |
: 1715889391:0;build/tools/iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-target-triple=x86_64-unknown-linux-gnu \\ | |
im2col.mlir -o img2col.vmfb | |
: 1715889514:0;iree-benchmark-module \\ | |
--device=local-sync \\ | |
--task_topology_group_count=1 \\ | |
--module=img2col.vmfb \\ | |
--function=img2col \\ | |
--input=128x1026x1026xf32 | |
: 1715889992:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--task_topology_group_count=1 \\ | |
--module=img2col.vmfb \\ | |
--function=img2col \\ | |
--input=128x1026x1026xf32 | |
: 1715894359:0;mlir-opt im2col.mlir | |
: 1715894403:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-target-triple=x86_64-unknown-linux-gnu \\ | |
im2col.mlir -o img2col.vmfb --mlir-print-ir-after-all 2> xyz.txt | |
: 1715896298:0;gist-paste im2col.mlir | |
: 1715897161:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--module=img2col.vmfb \\ | |
--function=img2col \\ | |
--input=128x1026x1026xf32 | |
: 1715920018:0;iree-benchmark-module \\ | |
--device=local-sync \\ | |
--module=img2col.vmfb \\ | |
--function=img2col \\ | |
--input=128x1026x1026xf32 | |
: 1715943599:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 | |
: 1715943615:0;iree-benchmark-module \\ | |
--device=local-sync \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 | |
: 1715944098:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-target-triple=x86_64-unknown-linux-gnu \\ | |
im2col.mlir -o img2col.vmfb | |
: 1715944270:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-target-triple=x86_64-unknown-linux-gnu \\ | |
im2col.mlir -o img2col.vmfb --debug | |
: 1715960314:0;vi vae.vmfb tresleches_vae_bf16.mlir | |
: 1715960331:0;vi vae.vmfb tresleches_vae_f32_b.mlir | |
: 1715960358:0;vi 1_step_tresleches.mlir | |
: 1716010063:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-target-triple=x86_64-unknown-linux-gnu \\ | |
im2col.mlir -o img2col.vmfb | |
: 1716010091:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=1x1x2048xf32 --benchmark_repetitions=5 | |
: 1716010833:0;iree-opt --linalg-fold-unit-extent-dims test.mlir | |
: 1716011176:0;vi im2col.mlir | |
: 1716012207:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716012368:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--task_topology_group_count=1 \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716012381:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--task_topology_group_count=2 \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716014013:0;git ob experiment | |
: 1716014187:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--task_topology_group_count=8 \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716014467:0;iree-benchmark-module \\ | |
--device=local-sync \\ | |
--task_topology_group_count=32 \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716014846:0;git o experiment | |
: 1716014866:0;iree-benchmark-module \\ | |
--device=local-sync \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716014889:0;iree-benchmark-module \\ | |
--device=local-sync \\ | |
--task-topology-count=16 \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716014922:0;iree-benchmark-module \\ | |
--device=local-sync \\ | |
--task-topology-group-count=16 \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716014952:0;iree-benchmark-module \\ | |
--device=local-sync \\ | |
--task_topology_group_count=16 \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716015156:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--task_topology_group_count= \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716015167:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--task_topology_group_count=64 \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716015178:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--task_topology_group_count=16 \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716015188:0;iree-benchmark-module \\ | |
--device=local-task \\ | |
--task_topology_group_count=32 \\ | |
--module=img2col.vmfb \\ | |
--function=scalar \\ | |
--input=128x1026x1026xf32 --benchmark_repetitions=5 | |
: 1716015618:0;iree-compile \\ | |
--iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-preprocessing-convert-conv2d-to-img2col))" \\ | |
--iree-opt-data-tiling \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 \\ | |
tresleches_vae_f32_b.mlir -o vae.vmfb\ | |
: 1716015658:0;iree-benchmark-module --device=local-task --module=vae.vmfb --input=1x16x128x128xf32=1 --function=main | |
: 1716015961:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 \ --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-preprocessing-convert-conv2d-to-img2col}))" \\ | |
--iree-flow-collapse-reduction-dims \\ | |
~/tresleches_vae_f32_b.mlir -o vae.vmfb | |
: 1716016005:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-preprocessing-convert-conv2d-to-img2col}))" \\ | |
--iree-flow-collapse-reduction-dims \\ | |
~/tresleches_vae_f32_b.mlir -o vae.vmfb | |
: 1716016011:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-preprocessing-convert-conv2d-to-img2col}))" \\ | |
--iree-flow-collapse-reduction-dims \\ | |
tresleches_vae_f32_b.mlir -o vae.vmfb | |
: 1716016060:0;iree-compile \\ | |
--iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-preprocessing-convert-conv2d-to-img2col))" \\ | |
--iree-opt-data-tiling \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-flow-collapse-reduction-dims\\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 \\ | |
tresleches_vae_f32_b.mlir -o vae.vmfb\ | |
: 1716016099:0;iree-benchmark-module --device=local-task -task_topology_group_count=32 --module=vae.vmfb --input=1x16x128x128xf32=1 --function=main | |
: 1716016213:0;iree-benchmark-module --device=local-sync -task_topology_group_count=32 --module=vae.vmfb --input=1x16x128x128xf32=1 --function=main | |
: 1716016377:0;iree-tracy-capture -o ~/vae.tracy -f | |
: 1716016774:0;iree-compile \\ | |
--iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-preprocessing-convert-conv2d-to-img2col))" \\ | |
--iree-opt-data-tiling \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
--iree-flow-collapse-reduction-dims \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 \\ | |
tresleches_vae_f32_b.mlir -o vae.vmfb\ | |
: 1716016788:0;TRACY_NO_EXIT=1 iree-benchmark-module --device=local-sync -task_topology_group_count=32 --module=vae.vmfb --input=1x16x128x128xf32=1 --function=main | |
: 1716016792:0;iree-tracy-capture -o ~/vae1.tracy -f | |
: 1716026875:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-target-triple=x86_64-unknown-linux-gnu \\ | |
im2col.mlir -o img2col.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1716225438:0;git fetch hanhan | |
: 1716225464:0;git o hanhan/hanhan-20240520-snapshot | |
: 1716228596:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d,pack \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 \ --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true}))" \\ | |
--iree-flow-collapse-reduction-dims \\ | |
--iree-opt-const-expr-max-size-increase-threshold=1000000000000000 \\ | |
tresleches_vae_f32_b.mlir -o /tmp/vae_f32_bf16_winograd.vmfb | |
: 1716228627:0;iree-compile \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d,pack \\ | |
--iree-global-opt-enable-demote-contraction-inputs-to-bf16 --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true}))" \\ | |
--iree-flow-collapse-reduction-dims \\ | |
--iree-opt-const-expr-max-size-increase-threshold=1000000000000000 \\ | |
tresleches_vae_f32_b.mlir -o /tmp/vae_f32_bf16_winograd.vmfb | |
: 1716228667:0;iree-benchmark-module --device=local-sync -task_topology_group_count=32 --module=/tmp/vae_f32_bf16_winograd.vmfb --input=1x16x128x128xf32=1 --function=main | |
: 1716228718:0;iree-benchmark-module --device=local-task -task_topology_group_count=32 --module=/tmp/vae_f32_bf16_winograd.vmfb --input=1x16x128x128xf32=1 --function=main | |
: 1716228739:0;iree-benchmark-module --device=local-task -task_topology_group_count=48 --module=/tmp/vae_f32_bf16_winograd.vmfb --input=1x16x128x128xf32=1 --function=main | |
: 1716233011:0;cat gather.mlir | |
: 1716233058:0;vi gather.mlir | |
: 1716233079:0;iree-opt --iree-flow-fusion-preprocessing gather.mlir | |
: 1716349938:0;rm gather.mlir im2col.mlir img2col.vmfb test.mlir xyz.txt | |
: 1716349983:0;iree-compile unpack.mlir \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
-o /tmp/unpack.vmfb | |
: 1716350047:0;iree-benchmark-module --device=local-task -task_topology_group_count=16 --module=/tmp/unpack.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack | |
: 1716350098:0;iree-compile unpack.mlir \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
-o /tmp/unpack.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1716350818:0;iree-compile u_tra.mlir \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
-o /tmp/unpack.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1716350825:0;iree-benchmark-module --device=local-task -task_topology_group_count=16 --module=/tmp/unpack.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack -mlir-print-ir-after-all 2> xyz.txt | |
: 1716353405:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host unpack.mlir -o unpack.vmfb --iree-hal-dump-executable-intermediates-to=onlyunpack/ --x86-asm-syntax=intel -mlir-print-ir-after-all 2> only_unpack.mlir | |
: 1716353440:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host unpack.mlir -o unpack.vmfb --iree-hal-dump-executable-intermediates-to=onlyunpack/ | |
: 1716353550:0;iree-compile u_tra.mlir \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
-o /tmp/unpack.vmfb | |
: 1716353624:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host unpack.mlir -o unpack.vmfb | |
: 1716353635:0;iree-benchmark-module --device=local-task -task_topology_group_count=16 --module=unpack.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack -mlir-print-ir-after-all 2> xyz.txt | |
: 1716353644:0;iree-benchmark-module --device=local-task -task_topology_group_count=16 --module=unpack.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack | |
: 1716353740:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o unpack.vmfb unpack.mlir --iree-hal-dump-executable-intermediates-to=dump/ --x86-asm-syntax=intel | |
: 1716353891:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o unpack.vmfb unpack.mlir | |
: 1716353902:0;iree-dump-module unpack.vmfb | |
: 1716353928:0;rm -rf dump onlyunpack | |
: 1716353955:0;unzip -d unpack ./unpack.vmfb | |
: 1716354059:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o unpack.vmfb unpack.mlir iree-hal-dump-executable-binaries-to=unpack/ | |
: 1716354076:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o unpack.vmfb unpack.mlir --iree-hal-dump-executable-binaries-to=unpack/ | |
: 1716354091:0;readelf unpack_dispatch_0_embedded_elf_x86_64.so | |
: 1716354100:0;readelf -Ws unpack_dispatch_0_embedded_elf_x86_64.so | |
: 1716354104:0;sudo readelf -Ws unpack_dispatch_0_embedded_elf_x86_64.so | |
: 1716354134:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o unpack.vmfb unpack.mlir iree-hal-dump-executable-files-to=unpack/ | |
: 1716354142:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o unpack.vmfb unpack.mlir --iree-hal-dump-executable-files-to=unpack/ | |
: 1716354220:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o unpack.vmfb unpack.mlir iree-hal-dump-executable-sources-to=unpack/ | |
: 1716354232:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o unpack.vmfb unpack.mlir --iree-hal-dump-executable-sources-to=unpack/ | |
: 1716354256:0;vi module_unpack_dispatch_0.mlir | |
: 1716354282:0;rm -rf unpack | |
: 1716354287:0;vi u_tra.mlir | |
: 1716354346:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o unpack.vmfb unpack.mlir --iree-llvmcpu-link-embedded=false \\ | |
--iree-hal-dump-executable-files-to=unpack/ \\ | |
: 1716355896:0;iree-compile u_tra.mlir \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d \\ | |
-o u_tra.vmfb | |
: 1716355970:0;cd u_tra | |
: 1716355980:0;vi module_unpack_dispatch_0_system_elf_x86_64.codegen.ll | |
: 1716356126:0;vi configured_module_unpack_dispatch_0.mlir | |
: 1716356544:0;iree-benchmark-module --device=local-task -task_topology_group_count=16 --module=u_tra.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack | |
: 1716356555:0;iree-benchmark-module --device=local-task -task_topology_group_count=16 --module=unpack.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack | |
: 1716356563:0;iree-benchmark-module --device=local-task -task_topology_group_count=32 --module=unpack.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack | |
: 1716357609:0;iree-benchmark-module --device=local-sync --module=unpack.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack | |
: 1716358773:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o u_tra.vmfb u_tra.mlir --iree-llvmcpu-link-embedded=false \\ | |
--iree-hal-dump-executable-files-to=u_tra/ \\ | |
: 1716358782:0;iree-benchmark-module --device=local-sync --module=u_tra.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack | |
: 1716359782:0;cmake --build ~/iree-build/ --target iree-test-deps | |
: 1716359897:0;sudo apt-get install nvtop | |
: 1716359925:0;nvtop | |
: 1716360161:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' ~/iree/compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir -split-input-file | FileCheck ~/iree/compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | |
: 1716360240:0;clang-format -i ~/iree/compiler/src/iree/compiler/Codegen/LLVMCPU/KernelDispatch.cpp | |
: 1716360638:0;git ob tilesizes | |
: 1716360832:0;iree-benchmark-module --device=local-task --module=u_tra.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack | |
: 1716360871:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o unpack.vmfb unpack.mlir --iree-llvmcpu-link-embedded=false \\ | |
--iree-hal-dump-executable-files-to=unpack/ -mlir-print-ir-after-all 2> xyz.txt\ | |
: 1716360880:0;iree-benchmark-module --device=local-task --module=unpack.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack | |
: 1716365261:0;git ob layoutpropagate | |
: 1716382686:0;git ob check_branch | |
: 1716383396:0;vi fuse.mlir | |
: 1716383495:0;iree-benchmark-module --device=local-task --module=fuse.vmfb --input=1x1024x1024x16x16xf32=1 --function=foo | |
: 1716390221:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o fuse.vmfb fuse.mlir -mlir-print-ir-after-all 2> xyz.txt\ | |
: 1716390302:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o unpack.vmfb unpack.mlir --iree-llvmcpu-link-embedded=false \\ | |
--iree-hal-dump-executable-files-to=unpack/ | |
: 1716390317:0;cd unpack | |
: 1716390321:0;vi module_unpack_dispatch_0_system_elf_x86_64.s | |
: 1716455010:0;cp ~/vae2b_fp32_weights.mlir ~/tresleches | |
: 1716455036:0;iree-compile `\ | |
--iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" `\ | |
--iree-hal-target-backends=llvm-cpu `\ | |
--iree-llvmcpu-target-cpu=znver4 `\ | |
--iree-llvmcpu-enable-ukernels=mmt4d,pack `\ | |
--iree-flow-collapse-reduction-dims `\ | |
--iree-opt-const-expr-max-size-increase-threshold=1000000000000000 `\ | |
vae2b_fp32_weights.mlir -o vae.vmfb | |
: 1716455079:0;iree-compile `\ | |
--iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d,pack \ \ | |
--iree-flow-collapse-reduction-dims \\ | |
--iree-opt-const-expr-max-size-increase-threshold=1000000000000000 \\ | |
vae2b_fp32_weights.mlir -o vae.vmfb\ | |
\ | |
: 1716455085:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d,pack \ \ | |
--iree-flow-collapse-reduction-dims \\ | |
--iree-opt-const-expr-max-size-increase-threshold=1000000000000000 \\ | |
vae2b_fp32_weights.mlir -o vae.vmfb\ | |
\ | |
: 1716455103:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" \\ | |
--iree-hal-target-backends=llvm-cpu \\ | |
--iree-llvmcpu-target-cpu=znver4 \\ | |
--iree-llvmcpu-enable-ukernels=mmt4d,pack \ \ | |
--iree-flow-collapse-reduction-dims \\ | |
--iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_fp32_weights.mlir -o vae.vmfb\ | |
\ | |
: 1716455586:0;iree-benchmark-module --device=local-task -task_topology_group_count=48 --module=vae.vmfb --input=1x16x64x64xf32=1 --function=main | |
: 1716455655:0;iree-benchmark-module --device=local-sync -task_topology_group_count=48 --module=vae.vmfb --input=1x16x64x64xf32=1 --function=main | |
: 1716456014:0;iree-benchmark-module --device=local-sync --module=vae.vmfb --task-topology-group-count=4 --input=1x16x64x64xf32=1 --function=main | |
: 1716456078:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-collapse-reduction-dims vae2b_fp32_weights.mlir -o vae.vmfb\ | |
\ | |
: 1716456749:0;iree-benchmark-module --device=local-task --module=vae.vmfb --task-topology-group-count=4 --input=1x16x64x64xf32=1 --function=main | |
: 1716456755:0;iree-benchmark-module --device=local-task --module=vae.vmfb --task-topology-group-count=1 --input=1x16x64x64xf32=1 --function=main | |
: 1716457143:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-collapse-reduction-dims vae2b_fp32_weights.mlir -o vae.vmfb --pass-timing\ | |
\ | |
: 1716457149:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-collapse-reduction-dims vae2b_fp32_weights.mlir -o vae.vmfb --mlir-timing\ | |
\ | |
: 1716457378:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_fp32_weights.mlir -o vae.vmfb\ | |
\ | |
: 1716466864:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_fp32_weights.mlir -o vae.vmfb --iree-llvmcpu-link-embedded=false --iree-hal-dump-executable-files-to=vae2b_dump/\ | |
\ | |
: 1716467451:0;cd vae2b_dump | |
: 1716467737:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_fp32_weights.mlir -o vae.vmfb --iree-llvmcpu-link-embedded=false --iree-hal-dump-executable-files-to=vae2b_dump/ -mlir-print-ir-after-all 2> ir_dump.txt | |
: 1716468584:0;vi vae2b_fp32_weights.mlir | |
: 1716468612:0;/usr/bin/vim.tiny vae2b_fp32_weights.mlir | |
: 1716468698:0;/usr/bin/vim.tiny vae_fp32_weights.mlir | |
: 1716468752:0;/usr/bin/vim.tiny tresleches_vae_f32_b.mlir | |
: 1716468801:0;torch-mlir-opt --print-op-stats vae2b_fp32_weights.mlir | |
: 1716468811:0;iree-opt --print-op-stats vae2b_fp32_weights.mlir | |
: 1716468821:0;iree-opt --print-op-stats vae2b_fp32_weights.mlir > /dev/null | |
: 1716468874:0;iree-opt --print-op-stats tresleches_vae_f32_b.mlir > /dev/null | |
: 1716470671:0;rm -rf ir_dump.txt | |
: 1716478689:0;mv ../vae2b_decomp.mlir . | |
: 1716478715:0;git o origin/shared/tresleches-cpu | |
: 1716479058:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_decomp.mlir -o vae.vmfb | |
: 1716557669:0;vi only_unpack.mlir | |
: 1716558038:0;git ob unpack_ukernel | |
: 1716558066:0;cp unpack.mlir ~/ | |
: 1716558626:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 ~/unpack.mlir -o /tmp/x.vmfb -mlir-print-ir-after-all > ~/xyz.txt | |
: 1716558631:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 ~/unpack.mlir -o /tmp/x.vmfb -mlir-print-ir-after-all 2> ~/xyz.txt | |
: 1716559380:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack ~/unpack.mlir -o /tmp/x.vmfb -mlir-print-ir-after-all 2> ~/xyz.txt | |
: 1716559752:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack ~/unpack.mlir -o /tmp/x.vmfb | |
: 1716559977:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack ~/unpack.mlir -o /tmp/x.vmfb 2> /dev/null | |
: 1716561525:0;vi yx | |
: 1716568264:0;vi ~/pack.mlir | |
: 1716568820:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-prepare-ukernels))" -cse ~/pack.mlir | |
: 1716573113:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-prepare-ukernels))" ~/pack.mlir | |
: 1716581087:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-prepare-ukernels))" ~/unpack.mlir | |
: 1716611492:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-prepare-ukernels))" ~/unpack.mlir --debug | |
: 1716617300:0;cd ../tresleches/kernel | |
: 1716617306:0;vi unpack | |
: 1716617349:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack unpack.mlir -o /tmp/x.vmfb 2> xyz.txt | |
: 1716617355:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack unpack.mlir -o /tmp/x.vmfb | |
: 1716617380:0;iree-benchmark-module --device=local-task --module=/tmp/x.vmfb --input=64x1828x8x16x16xf32=1 --function=unpack | |
: 1716617513:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack ~/unpack.mlir -o /tmp/x.vmfb 2> xyz.txt | |
: 1716617819:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_decomp.mlir -o vae.vmfb -mlir-elide-elements-attrs>2 | |
: 1716617840:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_decomp.mlir -o vae.vmfb -mlir-elide-elementattrs-if-larger=2 | |
: 1716617859:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_decomp.mlir -o vae.vmfb -mlir-elide-elementsattrs-if-larger=2 -mlir-print-ir-after-all 2> xyz.txt | |
: 1716618019:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_decomp.mlir -o vae.vmfb -mlir-elide-elementsattrs-if-larger=2 -mlir-print-ir-after-failure 2> xyz.txt | |
: 1716618055:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_decomp.mlir -o vae.vmfb -mlir-elide-elementsattrs-if-larger=2 -mlir-print-ir-before-failure 2> xyz.txt | |
: 1716618173:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_decomp.mlir -o vae.vmfb -mlir-elide-elementsattrs-if-larger=2 -mlir-print-ir-before=iree-codegen-cpu-prepare-ukernels 2> xyz.txt | |
: 1716618679:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_decomp.mlir -o vae.vmfb -mlir-elide-elementsattrs-if-larger=2 | |
: 1716619027:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_decomp.mlir -o vae.vmfb iree-hal-dump-executable-sources-to=dump/ | |
: 1716619032:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_decomp.mlir -o vae.vmfb -iree-hal-dump-executable-sources-to=dump/ | |
: 1716619344:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 ~/unpack.mlir -o unpack.vmfb -mlir-elide-elementsattrs-if-larger=2 -mlir-print-ir-before=iree-codegen-cpu-prepare-ukernels | |
: 1716619385:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 ~/unpack.mlir -o unpack.vmfb -mlir-elide-elementsattrs-if-larger=2 -mlir-print-ir-before=iree-codegen-cpu-prepare-ukernels 2> xyz.txt | |
: 1716620494:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 ~/unpack.mlir -o unpack.vmfb -mlir-elide-elementsattrs-if-larger=2 | |
: 1716620520:0;iree-opt ~/unpack.mlir | |
: 1716620639:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 ~/unpack.mlir -o unpack.vmfb -mlir-elide-elementsattrs-if-larger=2 -mlir-print-ir-after-all 2> xzy.txt | |
: 1716623315:0;iree-opt -canonicalize ~/unpack.mlir | |
: 1716624923:0;git ob buggy | |
: 1716624999:0;git remote add llvm_upstream https://github.com/llvm/llvm-project.git | |
: 1716625002:0;git fetch llvm_upstream | |
: 1716625045:0;git o llvm_upstream/main | |
: 1716625062:0;git cp 7fed4bb54b35 | |
: 1716625081:0;git ob bug_multiple | |
: 1716625612:0;vi ~/unpack.mlir | |
: 1716625953:0;git cp e460bd8abd | |
: 1716626088:0;git cp abort | |
: 1716626116:0;git o un | |
: 1716626122:0;git o unpack_kernel | |
: 1716626554:0;git revert 57c3040bcccc2f0432a8ec934df38bab91eadeca | |
: 1716626598:0;git cherry-pick --abort | |
: 1716626616:0;git ob 46c6bf5660022068cb1078bd7eeae527b13b30c2 | |
: 1716626654:0;git o 008add90d3de1333e9dcacc16eb9583989cfc492 | |
: 1716626677:0;git cp 008add90d3de1333e9dcacc16eb9583989cfc492 | |
: 1716626688:0;git cp 46c6bf5660022068cb1078bd7eeae527b13b30c2 | |
: 1716626741:0;git o shared/tresleches-cpu | |
: 1716626745:0;git cp * 8a59f827c7 | |
: 1716626749:0;git cp 8a59f827c7 | |
: 1716626821:0;git cp aeadd8437ad0 | |
: 1716627027:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 vae2b_decomp.mlir -o vae.vmfb | |
: 1716627046:0;iree-benchmark-module --device=local-task --module=vae.vmfb --input=1x16x64x64xf32=1 --function=main | |
: 1716627074:0;iree-benchmark-module --device=local-sync --module=vae.vmfb --input=1x16x64x64xf32=1 --function=main | |
: 1716659713:0;locale | |
: 1716661286:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-prepare-ukernels))" ~/unpack.mlir | |
: 1716662328:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-prepare-ukernels))" ~/unpack.mlir | ~/llvm-project/mlir/utils/generate-test-checks.py | |
: 1716662375:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-prepare-ukernels))" ~/unpack.mlir | ~/llvm-project/mlir/utils/generate-test-checks.py > xyz.txt | |
: 1716664147:0;rm xyz.txt xzy.txt | |
: 1716664603:0;mkdir test_sandbox | |
: 1716664685:0;iree-compile -iree-input-type=tmtensor --iree-input-demote-i64-to-i32 --iree-hal-target-backends=llvm-cpu test_scan.mlir | |
: 1716664695:0;iree-compile -iree-input-type=tm_tensor --iree-input-demote-i64-to-i32 --iree-hal-target-backends=llvm-cpu test_scan.mlir | |
: 1716665489:0;iree-compile -iree-input-type=tm_tensor --iree-input-demote-i64-to-i32 --iree-hal-target-backends=llvm-cpu test_scan_small.mlir | |
: 1716665515:0;iree-compile -iree-input-type=tm_tensor --iree-input-demote-i64-to-i32 --iree-hal-target-backends=llvm-cpu test_scan_small.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1716665956:0;git ob test_scan | |
: 1716666137:0;iree-opt --iree-codegen-tile-and-distribute-to-workgroups new.mlir | |
: 1716666247:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups)))' new.mlir | |
: 1716666262:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))))' new.mlir | |
: 1716666273:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups)))))' new.mlir | |
: 1716666636:0;iree-compile -iree-input-type=tmtensor --iree-hal-target-backends=llvm-cpu test_scan.mlir | |
: 1716666661:0;iree-compile -iree-input-type=tm_tensor --iree-hal-target-backends=llvm-cpu test_scan.mlir | |
: 1716666672:0;iree-compile -iree-input-type=tm_tensor --iree-hal-target-backends=llvm-cpu test_scan.mlir -mlir-disable-threading | |
: 1716666722:0;vi test_scan | |
: 1716666727:0;vi test_scan.mlir | |
: 1716666733:0;vi test_scan_small.mlir | |
: 1716666789:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups)))))' new.mlir -mlir-print-ir-after-all | |
: 1716666802:0;rm test_scan.mlir | |
: 1716666809:0;mv test_scan_small.mlir scan.mlir | |
: 1716666823:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups)))))' scan.mlir | |
: 1716667554:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups, canonicalize)))))' new.mlir -mlir-print-ir-after-all | |
: 1716667615:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups, canonicalize))cse)))' new.mlir -mlir-print-ir-after-all | |
: 1716667624:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups, canonicalize)), cse)))' new.mlir -mlir-print-ir-after-all | |
: 1716667817:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=1}, canonicalize))cse)))' new.mlir -mlir-print-ir-after-all | |
: 1716667825:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=1}, canonicalize)), cse)))' new.mlir -mlir-print-ir-after-all | |
: 1716667870:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{distribute-method=2}, canonicalize)), cse)))' new.mlir -mlir-print-ir-after-all | |
: 1716667890:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{distribution-method=2}, canonicalize)), cse)))' new.mlir -mlir-print-ir-after-all | |
: 1716667905:0;iree-compile -iree-input-type=tm_tensor --iree-hal-target-backends=llvm-cpu test_scan_small.mlir -mlir-disable-threading | |
: 1716668000:0;iree-compile -iree-input-type=tm_tensor --iree-input-demote-i64-to-i32 --iree-hal-target-backends=llvm-cpu scan.mlir | |
: 1716668007:0;iree-compile -iree-input-type=tm_tensor --iree-input-demote-i64-to-i32 --iree-hal-target-backends=llvm-cpu scan.mlir -mlir-disable-threading | |
: 1716668041:0;iree-compile --iree-hal-target-backends=llvm-cpu scan.mlir -mlir-disable-threading | |
: 1716668051:0;iree-compile -iree-input-type=tm_tensor --iree-hal-target-backends=llvm-cpu scan.mlir -mlir-disable-threading | |
: 1716668068:0;iree-compile -iree-input-type=tm_tensor --iree-hal-target-backends=llvm-cpu scan.mlir | |
: 1716668116:0;iree-compile -iree-input-type=tm_tensor --iree-hal-target-backends=llvm-cpu scan.mlir -mlir-disable-threading --iree-input-demote-i64-to-i32 | |
: 1716668125:0;iree-compile -iree-input-type=tm_tensor --iree-hal-target-backends=llvm-cpu scan.mlir --iree-input-demote-i64-to-i32 | |
: 1716668741:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{distribution-method=0}, canonicalize)), cse)))' new.mlir | |
: 1716668800:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{distribution-method=0, max-workgroup-parallel-dims=3}, canonicalize)), cse)))' new.mlir | |
: 1716668845:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=3}, canonicalize)), cse)))' new.mlir | |
: 1716668998:0;iree-opt --pass-pipeline='builtin.func(hal.executable(hal.executable.variant(builtin.func(func.func(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=3}, canonicalize)), cse)))' new.mlir | |
: 1716669025:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.func(func.func(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=3}, canonicalize)), cse)))' new.mlir | |
: 1716669342:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=3}, canonicalize))' new.mlir | |
: 1716669382:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=3}, canonicalize))' new.mlir -verify-each=0 | |
: 1716669404:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=3}, canonicalize))' new.mlir -mlir-disable-threading | |
: 1716669413:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=3}))' new.mlir -mlir-disable-threading | |
: 1716669422:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=3}),cse)' new.mlir -mlir-disable-threading | |
: 1716669484:0;iree-opt --pass-pipeline='builtin.module(builtin.module(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=3}))' new.mlir -verify-each=0 | |
: 1716669492:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups{max-workgroup-parallel-dims=3}))' new.mlir -verify-each=0 | |
: 1716669532:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir -verify-each=0 | |
: 1716669542:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir -debug | |
: 1716670073:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir -debug 2> xyz.txt | |
: 1716670538:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir -mlir-print-ir-after-all | |
: 1716670701:0;mlir-opt --help | fzf | |
: 1716670717:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir -mlir-print-ir-after-all -mlir-pretty-debuginfo | |
: 1716670726:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir -mlir-print-ir-after-all -mlir-pretty-debuginfo -debug | |
: 1716671300:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir -mlir-print-ir-after-all | |
: 1716671318:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir -mlir-print-ir-after-all -mlir-pretty-debuginfo -debug 2> xyz.txt | |
: 1716671542:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir -mlir-print-ir-after-all -mlir-pretty-debuginfo -debug 2> xyz.txt -mlir-disable-threading | |
: 1716673632:0;iree-compile -iree-input-type=tm_tensor --iree-hal-target-backends=llvm-cpu scan.mlir --iree-input-demote-i64-to-i32 -mlir-disable-threading | |
: 1716673747:0;iree-compile -iree-input-type=tm_tensor --iree-hal-target-backends=llvm-cpu scan.mlir --iree-input-demote-i64-to-i32 -mlir-disable-threading 2> -mlir-print-ir-after-all 2> xyz.txt | |
: 1716673781:0;rm -mlir-print-ir-after-all | |
: 1716673791:0;rm "-mlir-print-ir-after-all" | |
: 1716673802:0;rm ./-mlir-print-ir-after-all | |
: 1716673877:0;iree-compile -iree-input-type=tm_tensor --iree-hal-target-backends=llvm-cpu scan.mlir --iree-input-demote-i64-to-i32 -mlir-disable-threading -mlir-print-ir-after-all 2> xyz.txt | |
: 1716673925:0;iree-compile -iree-input-type=tm_tensor --iree-hal-target-backends=llvm-cpu scan.mlir --iree-input-demote-i64-to-i32 -mlir-disable-threading -mlir-print-ir-after-all 2> xzy.txt | |
: 1716673933:0;vi xzy.txt | |
: 1716673940:0;diff xzy.txt xyz.txt | |
: 1716673950:0;diff xzy.txt xyz.txt > kk.diff | |
: 1716673952:0;vi kk.diff | |
: 1716674008:0;vi xzy.txt xyz.txt | |
: 1716675400:0;iree-opt -iree-util-hoist-into-globals new.mlir | |
: 1716675421:0;iree-opt -iree-util-hoist-into-globals new.mlir -debug | |
: 1716675721:0;iree-opt -iree-util-hoist-into-globals new.mlir -debug -mlir-disable-threading | |
: 1716790104:0;cat new.mlir | |
: 1716792270:0;git remote rename main origin | |
: 1716792360:0;git ob bug_mul | |
: 1716794952:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 ~/unpack.mlir -o unpack.vmfb -mlir-elide-elementsattrs-if-larger=2 -mlir-print-ir-after-all 2> xyz.txt | |
: 1716795068:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 ~/unpack.mlir -o unpack.vmfb -mlir-print-ir-after-all | |
: 1716795076:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 ~/unpack.mlir -o unpack.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1716796339:0;mlir-opt unpack.mlir | |
: 1716796356:0;#map = affine_map<(d0, d1) -> (d0, d1)>\ | |
module {\ | |
func.func @multiple_result(%arg0: tensor<16x16xf32>) -> (tensor<16x?xindex>, tensor<16x16xindex>) {\ | |
%0 = tensor.empty() : tensor<16x16xindex>\ | |
%1 = tensor.empty() : tensor<16x16xf32>\ | |
%cast = tensor.cast %0 : tensor<16x16xindex> to tensor<16x?xindex>\ | |
%2:2 = linalg.generic {indexing_maps = [#map, #map, #map], iterator_types = ["parallel", "parallel"]} ins(%arg0 : tensor<16x16xf32>) outs(%cast, %0 : tensor<16x?xindex>, tensor<16x16xindex>) {\ | |
^bb0(%in: f32, %out: index, %out_0: index):\ | |
%3 = linalg.index 0 : index\ | |
%4 = linalg.index 1 : index\ | |
linalg.yield %3, %4 : index, index\ | |
} -> (tensor<16x?xindex>, tensor<16x16xindex>)\ | |
return %2#0, %2#1 : tensor<16x?xindex>, tensor<16x16xindex>\ | |
}\ | |
} | |
: 1716796777:0;mlir-opt unpack.mlir -canonicalize | |
: 1716823418:0;torch-mlir-opt ~/test.mlir | |
: 1716823477:0;torch-mlir-opt ~/test.mlir -canonicalize | |
: 1716823913:0;git o type_cast | |
: 1716823932:0;bt | |
: 1716825290:0;clang-format -i lib/Dialect/Torch/IR/TorchOps.cpp | |
: 1716825918:0;gist-paste ~/.config/lvim/config.lua | |
: 1716829315:0;git ob hoist_bug | |
: 1716829611:0;iree-opt -iree-util-hoist-into-globals new.mlir -mlir-disable-threading | |
: 1716829618:0;vi ../new.mlir | |
: 1716830121:0;iree-opt -iree-util-hoist-into-globals ~/new.mlir -mlir-disable-threading | |
: 1716830220:0;iree-opt -iree-util-hoist-into-globals ~/new.mlir -mlir-disable-threading 2> ~/xyz.txt | |
: 1716830333:0;iree-opt -iree-util-hoist-into-globals ~/new.mlir -mlir-disable-threading 2> ~/xzy.txt | |
: 1716830344:0;diff ~/xyz.txt ~/xzy.txt | |
: 1716830401:0;vi ~/xyz.txt ~/xyz.txt | |
: 1716830644:0;vi ~/xyz.txt ~/xzy.txt ~/new.mlir | |
: 1716897342:0;dpkg --list | |
: 1716897515:0;sudo apt-get purge google-chrome-stable | |
: 1716897532:0;sudo apt-get autoremove | |
: 1716911855:0;python3 -m venv torch_cuda | |
: 1716911959:0;pip3 install --pre torch torchvision torchaudio --index-url https://download.pytorch.org/whl/nightly/cu124 | |
: 1716912146:0;pip install --upgrade diffusers[torch] | |
: 1716912156:0;pip install --upgrade diffusers | |
: 1716912212:0;pip install transformers | |
: 1716912402:0;21 | |
: 1716913156:0;sudo systemctl start ssh.service | |
: 1716913159:0;ifconfig | |
: 1716913227:0;clera | |
: 1716913304:0;source ~/torch_cuda/bin/activate | |
: 1716914369:0; | |
: 1716914418:0;pip install iree-compiler iree-runtime -f https://iree.dev/pip-release-links.html | |
: 1716915049:0;where iree-compile | |
: 1716915243:0;cd prashant | |
: 1716915551:0;git clone https://github.com/nod-ai/SHARK.git | |
: 1716915971:0;cd examples | |
: 1716915975:0;cd shark_eager | |
: 1716915986:0;cd shark_inference | |
: 1716915995:0;vi resnet50_fp16.py | |
: 1716916290:0;cd tresleches | |
: 1716916449:0;vi generate | |
: 1716916452:0;vi generate.py | |
: 1716916481:0;cd SHARK | |
: 1716916626:0;python generate.py | |
: 1716954228:0;git ob cli_demote | |
: 1716999642:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16 compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1716999678:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16=matmul -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1716999695:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16{demote-only=matmul} -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1716999713:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16=demote-only=matmul -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1716999764:0;cat compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1716999996:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16=demote-only=all -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717001098:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16=demote-only{all} -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717001109:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16=demote-only="all" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717001281:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16{demote-only="all} -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir \ | |
\ | |
: 1717001364:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16{demote-only="all"} -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir \ | |
\ | |
: 1717001476:0;more compiler/src/iree/compiler/Dialect/Stream/Transforms/test/dump_statistics.mlir | |
: 1717001543:0;iree-opt --pass-pipeline="builtin.module(iree-global-opt-demote-contraction-inputs-to-bf16{demote-only="all"})"-split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir \ | |
\ | |
: 1717001587:0;iree-opt --pass-pipeline="builtin.module(iree-global-opt-demote-contraction-inputs-to-bf16{demote-only=all})"-split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir \ | |
\ | |
: 1717001624:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16{demote-only=all} -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir \ | |
\ | |
: 1717001690:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16=all -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir \ | |
\ | |
: 1717005088:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="conv" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir \ | |
\ | |
: 1717006436:0;morecompiler/src/iree/compiler/GlobalOptimization/test/set_encoding.mlir | |
: 1717006443:0;more compiler/src/iree/compiler/GlobalOptimization/test/set_encoding.mlir | |
: 1717006608:0;iree-opt --iree-global-opt-set-encoding="pad-factor=16" compiler/src/iree/compiler/GlobalOptimization/test/set_encoding.mlir | more | |
: 1717007242:0;iree-opt --iree-global-opt-set-encoding="pad-factor=16" compiler/src/iree/compiler/GlobalOptimization/test/set_encoding.mlir | |
: 1717008428:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=all" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir \ | |
\ | |
: 1717008438:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir \ | |
\ | |
: 1717008451:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16 -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir \ | |
\ | |
: 1717008476:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=conv" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir \ | |
\ | |
: 1717010409:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16 -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717053781:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16{demote-only=all} -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717053799:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16=all -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717053807:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16=All -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717053826:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16=demote-only=All -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717054027:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16{demote-only=All} -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717054039:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16{demote-only=Conv} -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717054049:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16=Conv -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717054068:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=Conv" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717054083:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=Matmul" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717056230:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=none" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717056236:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=conv" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717056584:0;clang-format compiler/src/iree/compiler/GlobalOptimization/Passes.td | |
: 1717071998:0;git ob test_tile | |
: 1717072002:0;l | |
: 1717072053:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' before_fail.mlir -debug | |
: 1717073082:0;iree-opt -mlir-pretty-debuginfo before_fail.mlir | |
: 1717073231:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' before_fail.mlir -debug 2> debug.txt | |
: 1717073567:0;iree-opt before_fail.mlir | |
: 1717076907:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host ~/new.mlir -iree-input-demote-i64-to-i32 -mlir-print-ir-after-all 2> kk.mlir | |
: 1717076966:0;vi scan.mlir | |
: 1717076989:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host new.mlir -iree-input-demote-i64-to-i32 -mlir-print-ir-after-all 2> kk.mlir | |
: 1717076998:0;vi kk.mlir | |
: 1717077209:0;vi before_fail.mlir | |
: 1717077299:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' before_fail.mlir -verify-each=0 | |
: 1717077304:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' before_fail.mlir | |
: 1717077360:0;cat before_fail.mlir | |
: 1717505816:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717507171:0;clang-format -i compiler/src/iree/compiler/GlobalOptimization/Passes.cpp | |
: 1717507528:0;iree-compile --iree-global-opt-enable-demote-contraction-inputs-to-bf16=conv | |
: 1717507538:0;iree-compile --iree-global-opt-enable-demote-contraction-inputs-to-bf16=conv ~/xyz.mlir | |
: 1717507554:0;iree-compile --iree-global-opt-enable-demote-contraction-inputs-to-bf16=conv ~/xyz.mlir --target-devices=llvm-cpu | |
: 1717507568:0;iree-compile --iree-global-opt-enable-demote-contraction-inputs-to-bf16=conv ~/xyz.mlir --hal-backend=llvm-cpu | |
: 1717508023:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=all" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717508056:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=all" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --check-prefix=MATMUL | |
: 1717508888:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=conv" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --check-prefix=CONV | |
: 1717508893:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=conv" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --check-prefix=MATMUL | |
: 1717508905:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" -split-input-file compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --check-prefix=MATMUL | |
: 1717510350:0;git cp e1c82f05a50719d1c500d25a00f024a62b1d33fa | |
: 1717510532:0;git branch -D new_test | |
: 1717510698:0;git o cli_demote | |
: 1717510826:0;ls ~ | |
: 1717510833:0;mkdir tmp | |
: 1717510837:0;rm tmp | |
: 1717510842:0;rm -rf tmp | |
: 1717510848:0;mkdir ~/tmp | |
: 1717510851:0;cp compiler/src/iree/compiler/GlobalOptimization/DemoteContractionInputsToBF16.cpp compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir compiler/src/iree/compiler/GlobalOptimization/PassDetail.h compiler/src/iree/compiler/GlobalOptimization/Passes.cpp compiler/src/iree/compiler/GlobalOptimization/Passes.h compiler/src/iree/compiler/GlobalOptimization/Passes.td ~/tmp/ | |
: 1717510873:0;git ob nb | |
: 1717510935:0;cp ~/tmp/DemoteContractionInputsToBF16.cpp compiler/src/iree/compiler/GlobalOptimization/DemoteContractionInputsToBF16.cpp | |
: 1717510957:0;cp ~/tmp/PassDetail.h compiler/src/iree/compiler/GlobalOptimization/PassDetail.h | |
: 1717510978:0;cp ~/tmp/Passes.cpp compiler/src/iree/compiler/GlobalOptimization/Passes.cpp | |
: 1717510994:0;cp ~/tmp/Passes.h compiler/src/iree/compiler/GlobalOptimization/Passes.h | |
: 1717511010:0;cp ~/tmp/Passes.td compiler/src/iree/compiler/GlobalOptimization/Passes.td | |
: 1717511026:0;cp ~/tmp/demote_contraction_inputs_to_bf16.mlir compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717511104:0;git branch -D cli_demote | |
: 1717511114:0;git branch -m cli_demote | |
: 1717511775:0;clang-format -i compiler/src/iree/compiler/GlobalOptimization/Passes.td | |
: 1717523110:0;cmake --build ~/iree-build/ | |
: 1717524931:0;ctest --rerun-failed . --output-on-failure | |
: 1717527480:0;pip install requests | |
: 1717527559:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimiz\ | |
ation/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --ch\ | |
eck-prefix=MATMUL | |
: 1717527576:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --ch\ | |
eck-prefix=MATMUL | |
: 1717527944:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --check-prefix=CONV | |
: 1717528542:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="=matmul" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --check-prefix=MATMUL | |
: 1717528555:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="matmul" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --check-prefix=MATMUL | |
: 1717529146:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717529167:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=conv" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717529753:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=all" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717529836:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=all" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --prefix=MATMUL | |
: 1717529849:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=all" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --check-prefix=MATMUL | |
: 1717529858:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=conv" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --check-prefix=MATMUL | |
: 1717530096:0;cd ../iree-build | |
: 1717530128:0;vi /home/prashant/iree-build/Testing/Temporary/LastTest.log | |
: 1717530637:0;cd test_tmpdir/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir.test_test_tmpdir | |
: 1717530640:0;cd src | |
: 1717530644:0;cd compiler | |
: 1717530647:0;cd GlobalOptimization/test | |
: 1717530650:0;cd Output | |
: 1717531042:0;chmod +x ./demote_contraction_inputs_to_bf16.mlir.script | |
: 1717531043:0;./demote_contraction_inputs_to_bf16.mlir.script | |
: 1717531051:0;cat demote_contraction_inputs_to_bf16.mlir.script | |
: 1717531324:0;bazel | |
: 1717531428:0;vi demote_contraction_inputs_to_bf16.mlir.script | |
: 1717531477:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --check-prefix=MATMUL | |
: 1717531558:0;wget https://github.com/bazelbuild/bazelisk/releases/download/v1.20.0/bazelisk-linux-amd64 | |
: 1717531571:0;mv bazelisk-linux-amd64 bazelisk | |
: 1717531577:0;chmod +x bazelisk | |
: 1717531594:0;mv bazelisk /usr/bin/bazel/ | |
: 1717531602:0;sudo mv bazelisk /usr/bin/bazel | |
: 1717531645:0;bazel test -k //... \\ | |
--iree_drivers=local-sync,local-task \\ | |
: 1717531691:0;vi BUILD.bazel | |
: 1717531704:0;python3 configure_bazel.py | |
: 1717531731:0;bazel test -k //... | |
: 1717562318:0;vi /home/prashant/.cache/bazel/_bazel_prashant/ff4e76a442c7b6306957b7618e366985/execroot/iree_core/bazel-out/k8-opt/testlogs/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir.test/test.log | |
: 1717562604:0;iree-opt /home/prashant/.cache/bazel/_bazel_prashant/ff4e76a442c7b6306957b7618e366985/sandbox/linux-sandbox/69/execroot/iree_core/bazel-out/k8-opt/bin/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir.test.runfiles/iree_core/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16=demote-only=matmul | |
: 1717563036:0;iree-opt compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" | |
: 1717563081:0;iree-opt compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=conv" | |
: 1717563087:0;iree-opt compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16=demote-only=conv | |
: 1717563374:0;iree-opt compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16=demote-only=matmul | |
: 1717563398:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=conv" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | FileCheck /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir --check-prefix=CONV | |
: 1717563426:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=conv" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717563608:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" /home/prashant/iree/compiler/src/iree/compiler/GlobalOptimization/test/demote_contraction_inputs_to_bf16.mlir | |
: 1717564140:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=all" ~/test.mlir | |
: 1717564232:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=conv" ~/test.mlir | |
: 1717564249:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=none" ~/test.mlir | |
: 1717565161:0;iree-opt --split-input-file -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" ~/test.mlir | |
: 1717571020:0;clang-format -i compiler/src/iree/compiler/GlobalOptimization/DemoteContractionInputsToBF16.cpp | |
: 1717571024:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=matmul" ~/test.mlir | |
: 1717571032:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=all" ~/test.mlir | |
: 1717571036:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=conv" ~/test.mlir | |
: 1717571040:0;iree-opt -iree-global-opt-demote-contraction-inputs-to-bf16="demote-only=none" ~/test.mlir | |
: 1717571093:0;bazel test -k //... \\ | |
--iree_drivers=local-sync,local-task,vulkan \\ | |
--test_tag_filters="-driver=cuda,-target=cuda" \\ | |
--build_tag_filters="-driver=cuda,-target=cuda" | |
: 1717601611:0;git o unpack_ukernel | |
: 1717605190:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))' --split-input-file compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pack_unpack_tests.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pack_unpack_tests.mlir | |
: 1717605675:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))' --split-input-file compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pack_unpack_tests.mlir | |
: 1717612600:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-prepare-ukernels))" compiler/src/iree/compiler/Codegen/Common/CPU/test/prepare_ukernels.mlir -split-input-file | FileCheck compiler/src/iree/compiler/Codegen/Common/CPU/test/prepare_ukernels.mlir | |
: 1717612677:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/CPU/CPUPrepareUkernels.cpp | |
: 1717612790:0;cd tresleches/kernel | |
: 1717612796:0;vi unpack.mlir | |
: 1717612897:0;iree-compile --iree-preprocessing-pass-pipeline="builtin.module(util.func(iree-linalg-ext-convert-conv2d-to-winograd{replace-all-convs=true},iree-global-opt-demote-contraction-inputs-to-bf16))" --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims vae2b_fp32_weights.mlir -o vae.vmfb | |
: 1717614010:0;cd prashant/llvm-project | |
: 1717615406:0;mlir-opt mlir/test/Interfaces/DestinationStyleOpInterface/verify-destination-style-op-interface.mlir | |
: 1717616549:0;mlir-opt -canonicalize ~/test.mlir | ~/llvm-project/mlir/utils/generate-test-checks.py | |
: 1717616611:0;mlir-opt ~/test.mlir | |
: 1717680343:0;cd build_commands | |
: 1717680354:0;vi build_mlir.sh | |
: 1717680566:0;gcc --version | |
: 1717683263:0;clang-format -i mlir/lib/Dialect/Tensor/IR/TensorOps.cpp | |
: 1717684540:0;mlir-opt -transform-interpreter -canonicalize mlir/test/Dialect/Tensor/tiling.mlir | |
: 1717684548:0;mlir-opt -transform-interpreter -cse -canonicalize mlir/test/Dialect/Tensor/tiling.mlir | |
: 1717685977:0;mlir-opt -canonicalize mlir/test/Dialect/Tensor/tiling.mlir | |
: 1717686361:0;mlir-opt -canonicalize ~/test.mlir | |
: 1717691874:0;sudo apt --fix-broken install | |
: 1717691886:0;sudo apt-get install clang++ | |
: 1717692425:0;mlir-opt -transform-interpreter -cse -canonicalize mlir/test/Dialect/Tensor/tiling.mlir -split-input-file | |
: 1717692542:0;mlir-opt -transform-interpreter -cse -canonicalize ~/xyz.mlir -split-input-file | |
: 1717692583:0;mlir-opt -transform-interpreter -cse -canonicalize ~/test.mlir -split-input-file -mlr-print-ir-after-all 2> ~/full.txt | |
: 1717692856:0;mlir-opt -transform-interpreter -cse -canonicalize ~/test.mlir -split-input-file -mlir-print-ir-after-all 2> ~/full.txt | |
: 1717692859:0;vi ~/full.txt | |
: 1717693188:0;git ob jb | |
: 1717693241:0;rm .git/index.lock | |
: 1717693508:0;mlir-opt -transform-interpreter -cse -canonicalize ~/test.mlir -split-input-file | |
: 1717699714:0;git o bug_mul | |
: 1717699718:0;git o bug_multiple | |
: 1717740099:0;cd build/bin | |
: 1717741244:0;mv clang clang++ /usr/bin/ | |
: 1717741255:0;sudo mv clang clang++ /usr/bin/ | |
: 1717741262:0;sudo cp clang clang++ /usr/bin/ | |
: 1717741277:0;sudo cp clang clang++ /bin/ | |
: 1717741285:0;sudo cp clang clang++ /usr/local/bin | |
: 1717741354:0;sudo apt-get remove clang | |
: 1717741360:0;sudo apt-get remove clang++ | |
: 1717741382:0;rm clang clang++ /usr/bin/ | |
: 1717741399:0;rm -rf clang* | |
: 1717741797:0;ls /usr/bin | fzf | |
: 1717741868:0;clang++ --verbose | |
: 1717741902:0;sudo apt install libstdc++-dev | |
: 1717742417:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o out.vmfb broad_matmul.mlir | |
: 1717742443:0;iree-benchmark-module --module=out.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 | |
: 1717742575:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=host -o out.vmfb broad_matmul.mlir --device=local-task | |
: 1717743911:0;git ob bm_check | |
: 1717749912:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb | |
: 1717749939:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb 2> all.txt | |
: 1717762410:0;iree-opt -iree-global-opt-set-encoding broad_matmul.mlir | |
: 1717762732:0;iree-opt -iree-global-opt-set-encoding broad_matmul.mlir --verify-each=0 | |
: 1717762751:0;vi out. | |
: 1717825224:0;iree-opt -iree-global-opt-set-encoding broad_matmul.mlir --verify-each=0 > out.mlir | |
: 1717950903:0;git ob shaptran | |
: 1717953141:0;mlir-opt ~/xyz.mlir | |
: 1717953430:0;mlir-opt -canonicalize ~/xyz.mlir | |
: 1717954120:0;mlir-opt -convert-vector-to-llvm ~/xyz.mlir -mlir-print-ir-after-all | |
: 1717954688:0;mlir-opt -convert-vector-to-llvm ~/xyz.mlir | |
: 1717954772:0;mlir-opt -debug -convert-vector-to-llvm ~/xyz.mlir | |
: 1717954897:0;mlir-opt -debug -convert-vector-to-llvm ~/xyz.mlir 2> ~/dbg.mlir | |
: 1717954901:0;vi ~/dbg.mlir | |
: 1717962919:0;cat -i mlir/lib/Dialect/Vector/Transforms/LowerVectorTranspose.cpp | |
: 1717962925:0;cat mlir/lib/Dialect/Vector/Transforms/LowerVectorTranspose.cpp | |
: 1717963573:0;mlir-opt -transform-interpreter ~/xyz.mlir | |
: 1717963940:0;clang-format -i mlir/lib/Dialect/Vector/Transforms/LowerVectorTranspose.cpp | |
: 1718105124:0;clang-format -i compiler/src/iree/compiler/GlobalOptimization/SetEncoding.cpp | |
: 1718106694:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims out.mlir -o out.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1718106718:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims matmul.mlir -o out.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1718107058:0;iree-opt -iree-global-opt-set-encoding broad_matmul.mlir > out.mlir | |
: 1718111625:0;cp broad_matmul.mlir xx.mlir | |
: 1718111627:0;vi xx.mlir | |
: 1718117220:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1718117378:0;iree-opt -cpu-materialize-encoding test.mlir | |
: 1718117385:0;iree-opt -iree-codegen-cpu-materialize-encoding test.mlir | |
: 1718117467:0;more compiler/src/iree/compiler/Codegen/Common/CPU/test/llvmcpu_materialize_encoding.mlir | |
: 1718117490:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-materialize-encoding),canonicalize,cse)" test.mlir | |
: 1718117556:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-materialize-encoding),canonicalize,cse)" test.mlir --verify-each=0 | |
: 1718117756:0;mlir-opt test.mlir | |
: 1718117768:0;iree-opt test.mlir | |
: 1718118056:0;iree-opt -cse -canonicalize test.mlir | |
: 1718118897:0;iree-opt -iree-global-opt-set-encoding broad_matmul.mlir > out.mlir --verify-each=0 | |
: 1718119317:0;iree-opt -canonicalize test.mlir | |
: 1718119350:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-materialize-encoding))" test.mlir --verify-each=0 | |
: 1718119367:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-materialize-encoding))" test.mlir | |
: 1718120671:0;cd ../test_sandbox | |
: 1718130212:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1718131672:0;vi out.mlir | |
: 1718172712:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-cpu-materialize-encoding))" out.mlir | |
: 1718172720:0;iree-opt -iree-global-opt-set-encoding broad_matmul.mlir > out.mlir | |
: 1718173399:0;iree-opt -iree-global-opt-set-encoding broad_matmul.mlir -canonicalize > out.mlir | |
: 1718173412:0;iree-opt -iree-global-opt-set-encoding broad_matmul.mlir -cse -canonicalize > out.mlir | |
: 1718179524:0;iree-opt brd.mlir | |
: 1718179536:0;iree-opt -cse -canonicalize brd.mlir | |
: 1718186624:0;more compiler/src/iree/compiler/Dialect/Flow/Transforms/test/form_dispatch_regions.mlir | |
: 1718186886:0;iree-opt --pass-pipeline="builtin.module(util.func(iree-flow-form-dispatch-regions))" bef_dis.mlir | |
: 1718187221:0;iree-opt --pass-pipeline="builtin.module(util.func(iree-flow-form-dispatch-regions{aggressive-fusion=true}))" bef_dis.mlir | |
: 1718205274:0;iree-opt -iree-global-opt-data-layout-propagation layout.mlir | |
: 1718206927:0;vi layout.mlir | |
: 1718206957:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-global-opt-data-layout-propagation))" layout.mlir | |
: 1718208496:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-collapse-reduction-dims brd.mlir --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 \\ | |
-o out.vmfb | |
: 1718219538:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-collapse-reduction-dims broad_matmul.mlir --iree-opt-const-expr-max-size-increase-threshold=1000000000000000 \\ | |
-o out.vmfb | |
: 1718221935:0;vi broad_matmul.mlir brd.mlir | |
: 1718266372:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-collapse-reduction-dims brd.mlir -o out.vmfb -mlir-print-ir-after-all 2> all.txt -mlir-disable-threading | |
: 1718267119:0;iree-opt --linalg-fold-unit-extent-dims vector.mlir | |
: 1718267216:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-generic-vectorization))' | |
: 1718267342:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb -mlir-print-ir-after-all 2> all.txt -mlir-disable-threading | |
: 1718267769:0;vi vector.mlir | |
: 1718267780:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-generic-vectorization))' vector.mlir | |
: 1718267959:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-flow-collapse-reduction-dims brd.mlir -o out.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1718268068:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1718269346:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb | |
: 1718269409:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb 2> xyz.txt | |
: 1718269442:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb 2> xyz.txt | |
: 1718269504:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-flow-collapse-reduction-dims brd.mlir -o out.vmfb 2> xyz.txt | |
: 1718283654:0;gist-paste vector.mlir | |
: 1718283698:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-generic-vectorization))' vector.mlir -mlir-print-ir-after-all | |
: 1718283947:0;mv vector.mlir input.mlir | |
: 1718283989:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-generic-vectorization))' input.mlir > out.mlir | |
: 1718284011:0;gist-paste input.mlir out.mlir | |
: 1718341358:0;mkdir sfmax_dbg | |
: 1718345314:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-triple=x86_64-linux-gnu --iree-llvmcpu-target-cpu-features=host sfmax.mlir -o 42.vmfb | |
: 1718345319:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-triple=x86_64-linux-gnu --iree-llvmcpu-target-cpu-features=host sfmax.mlir -o sfmax.vmfb | |
: 1718345325:0;rm 42.vmfb | |
: 1718348191:0;vi 42_inputs.npy | |
: 1718348433:0;cp sfmax.mlir exp.mlir | |
: 1718348436:0;vi exp.mlir | |
: 1718348527:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-triple=x86_64-linux-gnu --iree-llvmcpu-target-cpu-features=host exp.mlir -o exp.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1718348575:0;iree-run-module --module=sfmax.vmfb --function=exp --input=@sub_out.npy --output=@exp_ref.npy | |
: 1718348591:0;iree-run-module --module=sfmax.vmfb --function=softmax --input=@sub_out.npy --output=@exp_ref.npy | |
: 1718348869:0;iree-run-module --module=exp.vmfb --function=softmax --input=@sub_out.npy --output=@exp_ref.npy | |
: 1718349418:0;cd ~/sfmax_dbg | |
: 1718350222:0;cd ../sfmax_dbg | |
: 1718352702:0;python sfmax.py 2> xyz.txt | |
: 1718353240:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-triple=x86_64-linux-gnu --iree-llvmcpu-target-cpu-features=host sfmax.mlir -o sfmax.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1718355167:0;gist-paste sfmax.mlir | |
: 1718355198:0;mv xyz.txt py_out.txt | |
: 1718355202:0;gist-paste py_out.txt | |
: 1718355229:0;gist-paste sfmax.py | |
: 1718356366:0;vi sfmax.py | |
: 1718356370:0;python sfmax.py | |
: 1718357266:0;vi sfmax. | |
: 1718357270:0;vi sfmax.mlir | |
: 1718357293:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-triple=x86_64-linux-gnu --iree-llvmcpu-target-cpu-features=host sfmax.mlir -o sfmax.vmfb | |
: 1718357304:0;python sfmax.py > xyz.txt | |
: 1718357314:0;:w | |
: 1718718041:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1718727021:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb | |
: 1718727060:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb -mlir-disable-threading | |
: 1718727157:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb -mlir-print-ir-after-all -mlir-disable-threading 2> all.txt | |
: 1718728900:0;gist-paste all.txt | |
: 1718731422:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb 2> xyz.txt | |
: 1718731453:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb 2> xyz.txt -mlir-disable-threading | |
: 1718732270:0;rm out.vmfb | |
: 1718799886:0;vi projects/pt1/examples/torchscript_resnet18.py | |
: 1718800288:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb -mlir-disable-threading | |
: 1718800426:0;TRACY_NO_EXIT=1 iree-benchmark-module --module=out.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1718800448:0;iree-tracy-capture -o ~/batch_matmut.tracy | |
: 1718800557:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb -mlir-disable-threading -iree-hal-dump-executable-binaries-to=dump/ | |
: 1718800572:0;nm module_broad_matmul_linked_llvm_cpu_embedded_elf_x86_64.so | |
: 1718800650:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out.vmfb -mlir-disable-threading -iree-hal-dump-executable-files-to=dump/ | |
: 1718801011:0;vi module_broad_matmul_linked_llvm_cpu_embedded_elf_x86_64.so | |
: 1718801016:0;vi module_broad_matmul_linked_llvm_cpu_embedded_elf_x86_64.s | |
: 1718801039:0;vi module_matmul_broad_dispatch_0.mlir | |
: 1718801361:0;iree-benchmark-module --module=out.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-sync | |
: 1718801493:0;vi ~/.tmux.conf | |
: 1718809698:0;iree-benchmark-module --module=out.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1718809752:0;iree-benchmark-module --module=out.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task --benchmark_repetitions=5 | |
: 1718811181:0;git o pashu/fyi_soft | |
: 1718811190:0;git ob fyi_soft | |
: 1718818607:0;clicll | |
: 1718819250:0;3 | |
: 1718819360:0;python tests/kernel/wave/wave_gemm_test.py | |
: 1718855429:0;git remote add ian https://github.com/IanWood1/iree.git | |
: 1718855434:0;git fetch ian | |
: 1718855455:0;git checkout scatter_failure | |
: 1718856223:0;f | |
: 1718856616:0;vi dbg.mlir | |
: 1718856665:0;iree-opt | |
: 1718882206:0;cd torch | |
: 1718882209:0;cd torch-mlir | |
: 1718882234:0;export PYTHONPATH=`pwd`/build/tools/torch-mlir/python_packages/torch_mlir:`pwd`/test/python/fx_importer | |
: 1718882425:0;pip uninstall -r requirements.txt | |
: 1718882511:0;rt | |
: 1718882635:0;vi sum.mlir | |
: 1718882660:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims sum.mlir -o sum.vmfb | |
: 1718882742:0;gist-paste sum.mlir sum.py | |
: 1718883843:0;vi sum. | |
: 1718884022:0;iree-benchmark-module --module=sum.vmfb --function=forward --input=1048576xf32 --device=local-task | |
: 1718884026:0;iree-benchmark-module --module=sum.vmfb --function=forward --input=1048576xf32 --device=local-sync | |
: 1718884342:0;vi sum.py | |
: 1718884402:0;python sum.py | |
: 1718970897:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir | |
: 1718972029:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir --verify-each=0 | |
: 1718972087:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir --verify-each=0 -debug | |
: 1718972223:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir --verify-each=0 -debug > xyz.txt | |
: 1718972678:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir --verify-each=0 -debug 2> xyz.txt | |
: 1718973122:0;ri | |
: 1718976518:0;vi opt.mlir | |
: 1718976542:0;iree-compile --iree-input-demote-i64-to-i32 --iree-hal-target-backends=llvm-cpu opt.mlir | |
: 1718976631:0;git branch -m scan_tile_issue | |
: 1718976825:0;iree-compile --iree-input-demote-i64-to-i32 -iree-util-zero-fill-elided-attrs --iree-hal-target-backends=llvm-cpu opt.mlir | |
: 1718988492:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' new.mlir | |
: 1719332602:0;pip install -r mlir/python/requirements.txt | |
: 1719334541:0;mlir-opt --transformer-interpreter mlir/test/Interfaces/TilingInterface/tile-and-fuse-consumer.mlir | |
: 1719334551:0;mlir-opt --transforme-interpreter mlir/test/Interfaces/TilingInterface/tile-and-fuse-consumer.mlir | |
: 1719334558:0;mlir-opt --transform-interpreter mlir/test/Interfaces/TilingInterface/tile-and-fuse-consumer.mlir | |
: 1719334568:0;mlir-opt --transform-interpreter mlir/test/Interfaces/TilingInterface/tile-and-fuse-consumer.mlir -split-input-file | |
: 1719334685:0;mlir-opt --transform-interpreter mlir/test/Interfaces/TilingInterface/tile-and-fuse-consumer.mlir -split-input-file > ~/xyz.mlir | |
: 1719346369:0;mlir-opt --transform-interpreter -cse mlir/test/Interfaces/TilingInterface/tile-and-fuse-consumer.mlir -split-input-file > ~/xyz.mlir | |
: 1719397867:0;git ob tile_fuse_pipe | |
: 1719398026:0;mkdir tile&fuse | |
: 1719398031:0;mkdir tile_fuse | |
: 1719398047:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' ir.mlir | |
: 1719398107:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -mlir-print-ir-after-all 2> all.txt ir.mlir -o ir.vmfb | |
: 1719398290:0;cd ire | |
: 1719398299:0;ls ~/tile | |
: 1719398305:0;rm ~/tile | |
: 1719398308:0;rm -rf ~/tile | |
: 1719398365:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-and-fuse{tiling-level=0}))" ir.mlir | |
: 1719398378:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-and-fuse{tiling-level=1}))" ir.mlir | |
: 1719398615:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-and-fuse))" ir.mlir | |
: 1719398626:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-and-fuse))" ir.mlir --debug | |
: 1719398636:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-and-fuse))" ir.mlir --debug 2> dbg.txt | |
: 1719402840:0;ls ~/test_sandbox | |
: 1719403262:0;mv broad_matmul.mlir mat_relu.mlir | |
: 1719409896:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 mat_relu.mlir -o ir.vmfb | |
: 1719409985:0;cp ~/test_sandbox/broad_matmul.mlir . | |
: 1719410005:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out1.vmfb -mlir-disable-threading | |
: 1719410058:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims broad_matmul.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all_broad.txt | |
: 1719410066:0;vi all_broad.txt | |
: 1719500051:0;cp ~/test_sandbox/brd.mlir . | |
: 1719500096:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -mlir-print-ir-after-all 2> all.txt brd.mlir -o ir.vmfb | |
: 1719501545:0;iree-opt broad_matmul.mlir | |
: 1719501566:0;iree-opt -cse broad_matmul.mlir | |
: 1719502028:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -mlir-print-ir-after-all 2> all.txt new_ir.mlir -o ir.vmfb | |
: 1719504262:0;iree-opt new_ir.mlir | |
: 1719504405:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 broad_matmul.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1719504818:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-global-opt-data-layout-propagation))" new_ir.mlir | |
: 1719504964:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 new_ir.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1719505509:0;gist-paste new_ir.mlir | |
: 1719579392:0;vi new_ir.mlir | |
: 1719586601:0;iree-opt --split-input-file --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-spirv-tile-and-distribute, cse))))) compiler/src/iree/compiler/Codegen/SPIRV/test/tile_and_distribute_sort.mlir | |
: 1719586626:0;iree-opt --split-input-file --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-spirv-tile-and-distribute, cse)))))' compiler/src/iree/compiler/Codegen/SPIRV/test/tile_and_distribute_sort.mlir | FileCheck bazel-testlogs/compiler/src/iree/compiler/Codegen/SPIRV/test/tile_and_distribute_sort.mlir.test | |
: 1719586890:0;iree-opt --split-input-file --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-spirv-tile-and-distribute, cse)))))' compiler/src/iree/compiler/Codegen/SPIRV/test/tile_and_distribute_sort.mlir | |
: 1719588837:0;iree-opt --split-input-file --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-spirv-tile-and-distribute, cse)))))' compiler/src/iree/compiler/Codegen/SPIRV/test/tile_and_distribute_sort.mlir | FileCheck compiler/src/iree/compiler/Codegen/SPIRV/test/tile_and_distribute_sort.mlir | |
: 1719589289:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -mlir-print-ir-after-all 2> all.txt mat_relu.mlir -o ir.vmfb | |
: 1719589513:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer))" ir.mlir --debug 2> dbg.txt | |
: 1719589833:0;git o scan_tile_issue | |
: 1719589881:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/TileDispatchUsingInterface.cpp | |
: 1719589941:0;rm -rf dbg.txt | |
: 1719606123:0;curl -fsSL https://tailscale.com/install.sh | sh | |
: 1719608857:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1}))" ir.mlir --debug 2> dbg.txt | |
: 1719611404:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1}))" ir.mlir | |
: 1719611473:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1}))" ir.mlir > /dev/null | |
: 1719611493:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1}))" -cse ir.mlir > /dev/null | |
: 1719611512:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1}), cse)" ir.mlir > /dev/null | |
: 1719612689:0;gist-paste ir.mlir | |
: 1719616116:0;git ob fuseCons | |
: 1719677535:0;mlir-opt -transform-interpreter -cse -split-input-file mlir/test/Interfaces/TilingInterface/tile-and-fuse-using-interface.mlir | |
: 1719775972:0;mlir-opt -transform-interpreter -cse -split-input-file ~/xyz.mlir > /dev/null | |
: 1719778440:0;mlir-opt -transform-interpreter -cse -split-input-file ~/xyz.mlir | |
: 1719778474:0;mlir-opt -transform-interpreter -cse -split-input-file ~/xyz.mlir --debug | |
: 1719921690:0;mlir-opt -transform-interpreter -cse -split-input-file ~/xyz.mlir | |
: 1719921828:0;mlir-opt -canonicalize -cse ~/new.mlir | |
: 1719922525:0;mlir-opt -transform-interpreter -cse -canonicalize -split-input-file ~/xyz.mlir > ~/new.mlir | |
: 1719924374:0;git cp 8aea5cc2946e6ec2d7747dfcb01c8a19481e28c6 | |
: 1719924385:0;git cherry-pick skip | |
: 1719924395:0;git cp 5ba402530cd9909ae76136d8d253e4897987dfb7 | |
: 1719924418:0;git fetch main | |
: 1719925249:0;git cp ec9640cc835809df13bc013f8d6818303e9d60a2 | |
: 1719925274:0;git cherry-pick continue | |
: 1719925278:0;git cherry-pick --continue | |
: 1719930537:0;mlir-opt -transform-interpreter -cse -canonicalize -split-input-file ~/xyz.mlir --debug > ~/dbg.txt | |
: 1719931110:0;mlir-opt -transform-interpreter -cse -canonicalize -split-input-file ~/xyz.mlir --debug 2> ~/dbg.txt | |
: 1719984721:0;mlir-opt -transform-interpreter -cse -canonicalize -split-input-file ~/xyz.mlir | |
: 1719985280:0;vi ~/xyz.mlir | |
: 1720006955:0;vi ~/dbg.txt | |
: 1720007431:0;mlir-opt -transform-interpreter -cse -canonicalize -split-input-file --debug ~/xyz.mlir 2> ~/dbg.txt | |
: 1720009092:0;run | |
: 1720009104:0;mlir-opt -transform-interpreter -cse -canonicalize -split-input-file ~/xyz.mlir | |
: 1720009984:0;cd ../tile_fuse | |
: 1720010986:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1}), canonicalize)" ir.mlir > /dev/null | |
: 1720010996:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1}), canonicalize)" ir.mlir | |
: 1720011171:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=2}), canonicalize)" ir.mlir | |
: 1720018998:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" ir.mlir | ~/llvm-project/mlir/utils/generate-test-checks.py | |
: 1720020054:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=iree/ --verbosity=1 | |
: 1720020256:0;build_tools/scripts/run_buildifier.sh | |
: 1720020340:0;third_party/stablehlo/build_tools/github_actions/lint_buildifier.sh | |
: 1720453039:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" ir.mlir | ~/llvm-project/mlir/utils/generate-test-checks.py > test.mlir | |
: 1720532750:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_i32_32x32x16_i8 -R --C-matrix --csv > ~/output_layout_c.csv | |
: 1720533136:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -R --C-matrix --csv > ~/output_layout_c.csv | |
: 1720533180:0;./matrix_calculator.py --architecture cdna2 --instruction v_mfma_f32_16x16x4_f32 -R --C-matrix --csv > ~/output_layout_c.csv | |
: 1720533203:0;./matrix_calculator.py --architecture cdna2 --instruction v_mfma_f32_16x16x4f32 -R --C-matrix --csv > ~/output_layout_c.csv | |
: 1720533308:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4f32 -R --A-matrix --csv > ~/output_layout_a.csv | |
: 1720533335:0;./matrix_calculator.py --architecture cdna2 --instruction v_mfma_f32_16x16x4f32 -R --A-matrix --csv > ~/output_layout_a.csv | |
: 1720533360:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -R --A-matrix --csv > ~/output_layout_a.csv | |
: 1720533367:0;vi ~/output_layout_a.csv | |
: 1720544992:0;./matrix_calculator.py --architecture cdna2 --instruction v_mfma_f16_16x16x16f32 -R --A-matrix --csv > ~/output_layout_a_2.csv | |
: 1720545005:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f16_16x16x16f32 -R --A-matrix --csv > ~/output_layout_a_2.csv | |
: 1720545055:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x16_f16 -R --A-matrix --csv > ~/output_layout_a_2.csv | |
: 1720591221:0;./matrix_calculator.py --architecture cdna2 --instruction v_mfma_f32_16x16x4f32 -R --A-matrix --csv > ~/output_layout_a_2.csv | |
: 1720591224:0;vi ~/output_layout_a_2.csv | |
: 1720591268:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x16_f16 -R --A-matrix --csv > ~/output_layout_a_f16.csv | |
: 1720592036:0;./matrix_calculator.py --architecture cdna3 --instruction v_wmma_f16_16x16x16_f32 -R --A-matrix --csv > ~/output_layout_a_f16.csv | |
: 1720592052:0;./matrix_calculator.py --architecture cdna2 --instruction v_wmma_f16_16x16x16f32 -R --A-matrix --csv > ~/output_layout_a_f16.csv | |
: 1720592087:0;./matrix_calculator.py --architecture rdna3 --instruction v_wmma_f16_16x16x16f32 -R --A-matrix --csv > ~/output_layout_a_f16.csv | |
: 1720592115:0;./matrix_calculator.py --architecture rdna3 --instruction v_wmma_f32_16x16x16_f16 -R --A-matrix --csv > ~/output_layout_a_f16.csv | |
: 1720592122:0;vi ~/output_layout_c.csv | |
: 1720592191:0;./matrix_calculator.py --architecture rdna3 --instruction v_wmma_f32_16x16x16_f16 -R --C-matrix --csv > ~/output_layout_a_f16.csv | |
: 1720592194:0;vi ~/output_layout_a_f16.csv | |
: 1720592255:0;rm ~/*.csv | |
: 1720592281:0;./matrix_calculator.py --architecture rdna3 --instruction v_wmma_f32_16x16x16_f16 -R --C-matrix --csv | |
: 1720607663:0;./matrix_calculator.py --architecture cdna2 --instruction v_mfma_f32_16x16x4f32 -R --C-matrix --csv | |
: 1720607691:0;./matrix_calculator.py --architecture cdna2 --instruction v_mfma_f32_16x16x4f32 -R --A-matrix --csv | |
: 1720607702:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4f32 -R --A-matrix --csv | |
: 1720607711:0;./matrix_calculator.py --architecture cdna2 --instruction v_mfma_f32_16x16x4_f32 -R --A-matrix --csv | |
: 1720607749:0;./matrix_calculator.py --architecture cdna3,cdna2 --instruction v_mfma_f32_16x16x4_f32 -R --A-matrix --csv | |
: 1720607757:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -R --A-matrix --csv | |
: 1720607833:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_i8_16x16x32_i32 -R --A-matrix --csv | |
: 1720607854:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_i32_16x16x32_i8 -R --A-matrix --csv | |
: 1720607925:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_i32_16x16x32_i8 -R --A-matrix | |
: 1720607949:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x16_f16 -R --A-matrix | |
: 1720609408:0;bire | |
: 1720610338:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -R --C-matrix --cs | |
: 1720611137:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -m --C-matrix --csv | |
: 1720611176:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -m=-r=0 --C-matrix --csv | |
: 1720611196:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -m [-r=0] --C-matrix --csv | |
: 1720611202:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -m [r=0] --C-matrix --csv | |
: 1720611225:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -detail-instruction | |
: 1720611341:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x16_f16 --detail-instruction | |
: 1720612442:0;cd tools/testing/e2e | |
: 1720612454:0;cd tests/e2e | |
: 1720612456:0;cd matmul | |
: 1720615430:0;git fetch origin/main | |
: 1720624860:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -R --A-matrix --cs | |
: 1720634626:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 --detail-instruction | |
: 1720634685:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -r --C-matrix --csv | |
: 1720701369:0;iree-opt --pass-pipeline='builtin.module(iree-hal-assign-target-devices{targetBackends=rocm},iree-hal-transformation-pipeline{serialize-executables=false})' --iree-rocm -target-chip=mi300x compiler/plugins/target/ROCM/test/target_device_features.mlir | |
: 1720701387:0;iree-opt --pass-pipeline='builtin.module(iree-hal-assign-target-devices{targetBackends=rocm},iree-hal-transformation-pipeline{serialize-executables=false})' --iree-rocm-target-chip=mi300x compiler/plugins/target/ROCM/test/target_device_features.mlir | |
: 1720701508:0;iree-opt --pass-pipeline='builtin.module(iree-hal-assign-target-devices{targetBackends=rocm},iree-hal-transformation-pipeline{serialize-executables=false})' --iree-rocm-target-chip=mi300x compiler/plugins/target/ROCM/test/target_device_features.mlir | FileCheck compiler/plugins/target/ROCM/test/target_device_features.mlir | |
: 1720701523:0;cat compiler/plugins/target/ROCM/test/target_device_features.mlir | |
: 1720701585:0;iree-opt --pass-pipeline='builtin.module(iree-hal-assign-target-devices{targetBackends=rocm},iree-hal-transformation-pipeline{serialize-executables=false})' --iree-rocm-target-chip=mi300x compiler/plugins/target/ROCM/test/target_device_features.mlir | FileCheck compiler/plugins/target/ROCM/test/target_device_features.mlir --check-prefix=GFX940 | |
: 1720705106:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4f32 -R --B-matrix --csv | |
: 1720705329:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x8_f32 -R --B-matrix --csv | |
: 1720705371:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x8_xf32 -R --B-matrix --csv | |
: 1720705899:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f16_16x16x16_f32 -R --C-matrix v | |
: 1720705903:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f16_16x16x16_f32 -R --C-matrix --csv | |
: 1720705920:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x16_xf16 -R --C-matrix --csv | |
: 1720705935:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f16_16x16x16_xf32 -R --C-matrix --csv | |
: 1720706001:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x16_f16 -R --C-matrix --csv | |
: 1720706018:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x8_xf32 -R --C-matrix --csv | |
: 1720706041:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x16_f16 -R --A-matrix --csv | |
: 1720709314:0;git ob wmma_ab_f32_c_f32 | |
: 1720709362:0;cat compiler/src/iree/compiler/Codegen/LLVMGPU/test/rocdl_pipeline_test.mlir | |
: 1720709416:0;iree-opt --split-input-file --iree-gpu-test-target=gfx940 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-rocdl-pipeline)))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/rocdl_pipeline_test.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/rocdl_pipeline_test.mlir --check-prefix=CDNA3 | |
: 1720709733:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x8_xf32 -R --A-matrix --csv | |
: 1720710804:0;vi xyz. | |
: 1720716413:0;iree-compile matmul.mlir --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx942 --iree-global-opt-propagate-transposes=true --iree-opt-outer-dim-concat=true --iree-opt-const-eval=false --iree-opt-data-tiling=false --iree-rocm-waves-per-eu=2 --iree-vm-target-truncate-unsupported-floats --iree-codegen-llvmgpu-use-vector-distribution --iree-codegen-gpu-native-math-precision=true -o small_matmul.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1720716597:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-rocdl-pipeline)))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/rocdl_pipeline_test.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/rocdl_pipeline_test.mlir --check-prefix=CDNA3 | |
: 1720716770:0;iree-compile matmul.mlir --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx942 --iree-global-opt-propagate-transposes=true --iree-opt-outer-dim-concat=true --iree-opt-const-eval=false --iree-opt-data-tiling=false --iree-rocm-waves-per-eu=2 --iree-vm-target-truncate-unsupported-floats --iree-codegen-llvmgpu-use-vector-distribution --iree-codegen-gpu-native-math-precision=true --iree-flow-enable-aggressive-fusion -o small_matmul.vmfb -mlir-print-ir-after-all | |
: 1720719697:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-rocdl-pipeline)))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/rocdl_pipeline_test.mlir | |
: 1720719821:0;ls -l | fzf | |
: 1720729935:0;/python ~/iree/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=matmul/e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_matmul.mlir --output_calls_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_calls.mlir --lhs_rhs_type=f32 --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1720729975:0;python ~/iree-build/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=matmul/e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_matmul.mlir --output_calls_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_calls.mlir --lhs_rhs_type=f32 --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1720729993:0;python ~/iree/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=matmul/e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_matmul.mlir --output_calls_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_calls.mlir --lhs_rhs_type=f32 --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1720730022:0;python ~/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=matmul/e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_matmul.mlir --output_calls_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_calls.mlir --lhs_rhs_type=f32 --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1720732082:0;vi matmul.mlir e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_matmul.mlir | |
: 1720732264:0;vi e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_calls.mlir | |
: 1720782084:0;iree-compile matmul.mlir --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx942 --iree-global-opt-propagate-transposes=true --iree-opt-outer-dim-concat=true --iree-opt-const-eval=false --iree-opt-data-tiling=false --iree-rocm-waves-per-eu=2 --iree-vm-target-truncate-unsupported-floats --iree-codegen-llvmgpu-use-vector-distribution --iree-codegen-gpu-native-math-precision=true --iree-flow-enable-aggressive-fusion -o small_matmul.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1720794873:0;python ~/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_matmul.mlir --output_calls_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_calls.mlir --lhs_rhs_type=f32 --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1720794881:0;pytho3n ~/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_matmul.mlir --output_calls_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_calls.mlir --lhs_rhs_type=f32 --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1720794893:0;vi e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_ | |
: 1720794949:0;rm -rf e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_* | |
: 1720800274:0;python3 ~/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_matmul.mlir --output_calls_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_calls.mlir --lhs_rhs_type=f16 --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1720800283:0;python3 ~/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_matmul.mlir --output_calls_mlir=e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_calls.mlir --lhs_rhs_type=f32 --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1720800295:0;vi e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_matmul.mlir | |
: 1720800308:0;mv e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_matmul.mlir ../matmul.mlir | |
: 1720800316:0;rm e2e_matmul_rocm_f32_large_cdna3_mfma_rocm_hip_calls.mlir | |
: 1720800391:0;python3 ~/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=~/matmul.mlir --output_calls_mlir=calls.mlir --lhs_rhs_type=f32 --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1720800551:0;vi matmul.mlir | |
: 1720800591:0;mv matmul.mlir ../ | |
: 1720802400:0;iree-compile matmul.mlir --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx942 --iree-global-opt-propagate-transposes=true --iree-opt-outer-dim-concat=true --iree-opt-const-eval=false --iree-opt-data-tiling=false --iree-rocm-waves-per-eu=2 --iree-vm-target-truncate-unsupported-floats --iree-codegen-llvmgpu-use-vector-distribution --iree-codegen-gpu-native-math-precision=true --iree-flow-enable-aggressive-fusion -o small_matmul.vmfb | |
: 1721102525:0;git o wmma_ab_f32_c_f32 | |
: 1721102661:0;git revert 02c2000795 | |
: 1721102672:0;rm calls.mlir | |
: 1721112880:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" ir.mlir | |
: 1721198155:0;iree-opt compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1721200484:0;gpg | |
: 1721200616:0;git config --global user.signingkey 2C06887DC1FD9872 | |
: 1721200661:0;git status | |
: 1721200718:0;git config --global gpg.program gpg1 | |
: 1721200818:0;gpg2 | |
: 1721200850:0;git config --global user.signingkey BF03C01E9127D982E37E41052C06887DC1FD9872 | |
: 1721200919:0;git config --global --unset gpg.program | |
: 1721200974:0;echo "test" | gpg --clearsign | |
: 1721201028:0;killall gpg-agent\ | |
\ | |
: 1721201045:0;git commit --amend compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1721201109:0;rm -rf ~/.gnupg | |
: 1721201125:0;gpg --gen-key | |
: 1721201272:0;gpg --list-secret-keys --keyid-format LONG | |
: 1721201324:0;git config --global user.signingkey A5932799D923F8A5 | |
: 1721201363:0;source ~/.zshrc | |
: 1721201483:0;gpg --list-keys | |
: 1721201497:0;vi ~/.gnupg/pubring.kbx | |
: 1721201502:0;cat ~/.gnupg/pubring.kbx | |
: 1721201571:0;gpg --armor --export [email protected] | |
: 1721201694:0;git commit -S --amend | |
: 1721201986:0;go install github.com/bazelbuild/buildtools/buildifier@latest | |
: 1721201991:0;sudo apt-get install go | |
: 1721202017:0;sudo apt-get install buildifier | |
: 1721202073:0;git clone https://github.com/bazelbuild/buildtools.git\ | |
cd buildtools | |
: 1721202083:0;bazel build //buildifier | |
: 1721202328:0;sudo cp bazel-bin/buildifier/buildifier /usr/local/bin/ | |
: 1721202520:0;sudo cp bazel-bin/buildifier_/buildifier /usr/local/bin/ | |
: 1721202548:0;sudo cp bazel-bin/buildifier/buildifier_/buildifier /usr/local/bin | |
: 1721202552:0;buildifier | |
: 1721202587:0;buildifier compiler/plugins/target/LLVMCPU/BUILD.bazel | |
: 1721202598:0;buildifier -i compiler/plugins/target/LLVMCPU/BUILD.bazel | |
: 1721202651:0;buildifier compiler/plugins/target/LLVMCPU/test/BUILD.bazel | |
: 1721202669:0;buildifier compiler/plugins/target/LLVMCPU/test/ | |
: 1721202678:0;buildifier compiler/plugins/target/LLVMCPU/test/CMakeLists.txt | |
: 1721202758:0;buildifier --version | |
: 1721202793:0;buildifier --lint=warn compiler/plugins/target/LLVMCPU/BUILD.bazel | |
: 1721202801:0;buildifier --lint=warn compiler/plugins/target/LLVMCPU/test/BUILD.bazel | |
: 1721203806:0;git log --show-signature | |
: 1721237005:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --mlir-disable-threading | |
: 1721237449:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-and-fuse{tiling-level=0}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --debug 2> ~/xyz.txt | |
: 1721237711:0;vi ~/xyz.txt | |
: 1721237972:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --debug 2> ~/xyz.txt | |
: 1721314506:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMCPU/LLVMCPUTileRootAndFuseProdCons.cpp | |
: 1721317280:0;git clone [email protected]:nod-ai/SHARK-Turbine.git | |
: 1721318214:0;rm -rf iree-turbine | |
: 1721318226:0;git clone [email protected]:iree-org/iree-turbine.git | |
: 1721318408:0;python -m venv --prompt iree-turbine .venv | |
: 1721323241:0;python3 -m venv --prompt iree-turbine .venv | |
: 1721323331:0;vi wave.py | |
: 1721324066:0;cd iree-turbine | |
: 1721324102:0;cd lit_tests | |
: 1721324104:0;cd kernel | |
: 1721324106:0;cd wave | |
: 1721324116:0;pytest codegen.py | |
: 1721324356:0;rm -rf SHARK | |
: 1721324398:0;git remote add harsh https://github.com/harsh-nod/SHARK-Turbine.git | |
: 1721324403:0;git fetch harsh | |
: 1721324418:0;git o harsh/tkw_batch_matmul | |
: 1721324462:0;cd shark_turbine | |
: 1721324580:0;python3.11 -m venv --prompt iree-turbine .venv | |
: 1721324777:0;pip install -r mypy-requirements.txt | |
: 1721324879:0;pip install -r requirements.txt -e . | |
: 1721330227:0;pip uninstall iree-compiler iree-runtime | |
: 1721330273:0;pip install -r requirements.txt | |
: 1721330294:0;vi pytorch-rocm-requirements.txt | |
: 1721330303:0;vi pytorch-cpu-requirements.txt | |
: 1721330396:0;pip install --upgrade -r core/requirements.txt | |
: 1721330435:0;pip install --upgrade -e "core[torch-cpu-nightly,testing]" | |
: 1721330450:0;pytest | |
: 1721330539:0;source ~/iree-turbine/.venv/bin/activate | |
: 1721330589:0;export $PYTHONPATH='' | |
: 1721330599:0;export $PYTHONPATH="h" | |
: 1721330618:0;$PYTHONPATH="" | |
: 1721330793:0;rm -rf ~/global_venv | |
: 1721330831:0;python3.11 -m venv ~/global_venv | |
: 1721331435:0;pip install numpy | |
: 1721331656:0;sudo apt-get install python3.11-dev | |
: 1721332008:0;pip uninstall iree-compiler | |
: 1721332028:0;echo $PYTHONPATH | |
: 1721332094:0;where iree-opt | |
: 1721332466:0;cmake --build ~/iree-build | |
: 1721335978:0;source ~/iree-build/.env && export PYTHONPATH | |
: 1721336085:0;curl https://github.com/iree-org/iree/releases/download/untagged-d113fd654767c3d74d97/iree_runtime-20240708.948-cp311-cp311-manylinux_2_28_aarch64.whl | |
: 1721336111:0;wget https://objects.githubusercontent.com/github-production-release-asset-2e65be/208145128/3f028a67-e2cd-4585-b266-2df07b49995f\?X-Amz-Algorithm\=AWS4-HMAC-SHA256\&X-Amz-Credential\=releaseassetproduction%2F20240718%2Fus-east-1%2Fs3%2Faws4_request\&X-Amz-Date\=20240718T205457Z\&X-Amz-Expires\=300\&X-Amz-Signature\=47094bcad504635a248819df36a54d85bd98e97c2184834f3833c2b66770a4f3\&X-Amz-SignedHeaders\=host\&actor_id\=16246821\&key_id\=0\&repo_id\=208145128\&response-content-disposition\=attachment%3B%20filename%3Diree_runtime-20240708.948-cp311-cp311-manylinux_2_28_aarch64.whl\&response-content-type\=application%2Foctet-stream | |
: 1721336124:0;rm 3f028a67-e2cd-4585-b266-2df07b49995f\?X-Amz-Algorithm=AWS4-HMAC-SHA256\&X-Amz-Credential=releaseassetproduction%2F20240718%2Fus-east-1%2Fs3%2Faws4_request\&X-Amz-Date=20240718T205457Z\&X-Amz-Expires=300\&X-Amz-Signature=47094bcad504635a24881 | |
: 1721336136:0;wget https://github.com/iree-org/iree/releases/download/untagged-d113fd654767c3d74d97/iree_runtime-20240708.948-cp311-cp311-manylinux_2_28_aarch64.whl | |
: 1721336185:0;python -m pip install \\ | |
--find-links https://iree.dev/pip-release-links.html \\ | |
--upgrade \\ | |
iree-compiler \\ | |
iree-runtime | |
: 1721336203:0;python core/tests/kernel/functional_batch_matmul_test.py | |
: 1721336230:0;export PYTHONPATH='' | |
: 1721336232:0;pytest . | |
: 1721336290:0;python core/tests/kernel/functional_argmax_test.py | |
: 1721336306:0;cd ~/SHARK-Turbine | |
: 1721336377:0;cd SHARK-Turbine | |
: 1721336477:0;cd tests/kernel/ | |
: 1721336509:0;git checkout harsh/main | |
: 1721336524:0;cd core | |
: 1721336716:0;python tests/kernel/gemm_test.py | |
: 1721336761:0;python tests/kernel/arith_test.py | |
: 1721336927:0;python functional_test_integer.py | |
: 1721337362:0;git ob test_branch | |
: 1721654793:0;python tests/kernel/functional_test_integer.py | |
: 1721654928:0;git o pashu/wmma_rebased | |
: 1721659331:0;cd sfmax_dbg | |
: 1721659340:0;rm -rf sfmax_dbg | |
: 1721659348:0;mkdir conv_mfma_dbg | |
: 1721659379:0;pip uninstall iree | |
: 1721659700:0;where iree-compile\ | |
: 1721659708:0;which iree-compile | |
: 1721660018:0;iree-compile test.mlir --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx942 --iree-opt-const-eval=false --iree-global-opt-propagate-transposes=true --iree-global-opt-enable-fuse-horizontal-contractions=true --iree-flow-enable-aggressive-fusion=true --iree-opt-aggressively-propagate-transposes=true --iree-opt-outer-dim-concat=true --iree-vm-target-truncate-unsupported-floats --iree-llvmgpu-enable-prefetch=true --iree-opt-data-tiling=false --iree-codegen-gpu-native-math-precision=true --iree-codegen-llvmgpu-use-vector-distribution --iree-rocm-waves-per-eu=2 --iree-execution-model=async-external "--iree-preprocessing-pass-pipeline=builtin.module(iree-preprocessing-transpose-convolution-pipeline, util.func(iree-preprocessing-pad-to-intrinsics))" --iree-scheduling-dump-statistics-format=json --iree-scheduling-dump-statistics-file=compilation_info.json -o test_rocm.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1721664770:0;iree-compile test.mlir --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx942 --iree-opt-const-eval=false --iree-global-opt-propagate-transposes=true --iree-global-opt-enable-fuse-horizontal-contractions=true --iree-flow-enable-aggressive-fusion=true --iree-opt-aggressively-propagate-transposes=true --iree-opt-outer-dim-concat=true --iree-vm-target-truncate-unsupported-floats --iree-llvmgpu-enable-prefetch=true --iree-opt-data-tiling=false --iree-codegen-gpu-native-math-precision=true --iree-codegen-llvmgpu-use-vector-distribution --iree-rocm-waves-per-eu=2 --iree-execution-model=async-external "--iree-preprocessing-pass-pipeline=builtin.module(iree-preprocessing-transpose-convolution-pipeline, util.func(iree-preprocessing-pad-to-intrinsics))" --iree-scheduling-dump-statistics-format=json --iree-scheduling-dump-statistics-file=compilation_info.json -o test_rocm.vmfb -mlir-print-ir-after-all 2> correct.txt | |
: 1721664777:0;vi correct.txt | |
: 1721748076:0;iree-compile test.mlir --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx942 --iree-opt-const-eval=false --iree-global-opt-propagate-transposes=true --iree-global-opt-enable-fuse-horizontal-contractions=true --iree-flow-enable-aggressive-fusion=true --iree-opt-aggressively-propagate-transposes=true --iree-opt-outer-dim-concat=true --iree-vm-target-truncate-unsupported-floats --iree-llvmgpu-enable-prefetch=true --iree-opt-data-tiling=false --iree-codegen-gpu-native-math-precision=true --iree-codegen-llvmgpu-use-vector-distribution --iree-rocm-waves-per-eu=2 --iree-execution-model=async-external "--iree-preprocessing-pass-pipeline=builtin.module(iree-preprocessing-transpose-convolution-pipeline, util.func(iree-preprocessing-pad-to-intrinsics))" --iree-scheduling-dump-statistics-format=json --iree-scheduling-dump-statistics-file=compilation_info.json -o test_rocm.vmfb | |
: 1721748184:0;git ob wmma_rebased | |
: 1721748894:0;git ob new_branch | |
: 1721749015:0;git branch -d wmma_rebased | |
: 1721749033:0;git branch -D wmma_rebased | |
: 1721749042:0;git branch -m wmma_rebased | |
: 1721750518:0;iree-opt --pass-pipeline='builtin.module(iree-hal-assign-target-devices{targetBackends=rocm},iree-hal-transformation-pipeline{serialize-executables=false})' --iree-rocm-target-chip=gfx940 compiler/plugins/target/ROCM/test/target_device_features.mlir | FileCheck compiler/plugins/target/ROCM/test/target_device_features.mlir --check-prefix=GFX940 | |
: 1721750537:0;iree-opt --pass-pipeline='builtin.module(iree-hal-assign-target-devices{targetBackends=rocm},iree-hal-transformation-pipeline{serialize-executables=false})' --iree-rocm-target-chip=gfx940 compiler/plugins/target/ROCM/test/target_device_features.mlir | |
: 1721750618:0;iree-opt --pass-pipeline='builtin.module(iree-hal-assign-target-devices{targetBackends=rocm},iree-hal-transformation-pipeline{serialize-executables=false})' --iree-rocm-target-chip=gfx940 compiler/plugins/target/ROCM/test/target_device_features.mlir | FileCheck compiler/plugins/target/ROCM/test/target_device_features.mlir --check-prefix=GFX942 | |
: 1721750687:0;iree-opt --pass-pipeline='builtin.module(iree-hal-assign-target-devices{targetBackends=rocm},iree-hal-transformation-pipeline{serialize-executables=false})' --iree-rocm-target-chip=gfx944 compiler/plugins/target/ROCM/test/target_device_features.mlir | FileCheck compiler/plugins/target/ROCM/test/target_device_features.mlir --check-prefix=GFX942 | |
: 1721750708:0;iree-opt --pass-pipeline='builtin.module(iree-hal-assign-target-devices{targetBackends=rocm},iree-hal-transformation-pipeline{serialize-executables=false})' --iree-rocm-target-chip=gfx942 compiler/plugins/target/ROCM/test/target_device_features.mlir | |
: 1721750772:0;iree-opt --pass-pipeline='builtin.module(iree-hal-assign-target-devices{targetBackends=rocm},iree-hal-transformation-pipeline{serialize-executables=false})' --iree-rocm-target-chip=gfx942 compiler/plugins/target/ROCM/test/target_device_features.mlir | FileCheck compiler/plugins/target/ROCM/test/target_device_features.mlir --check-prefix=GFX942 | |
: 1721750991:0;iree-opt --pass-pipeline='builtin.module(iree-hal-assign-target-devices{targetBackends=rocm},iree-hal-transformation-pipeline{serialize-executables=false})' --iree-rocm-target-chip=mi300x compiler/plugins/target/ROCM/test/target_device_features.mlir | FileCheck compiler/plugins/target/ROCM/test/target_device_features.mlir --check-prefix=GFX942 | |
: 1721765675:0;clang-format -i compiler/src/iree/compiler/Preprocessing/Common/PadToIntrinsics.cpp | |
: 1721766278:0;python3 ~/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=matmul.mlir --output_calls_mlir=calls.mlir --lhs_rhs_type=f32 --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1721766304:0;python3 ~/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=matmul.mlir --output_calls_mlir=calls.mlir --lhs_rhs_type=f8e4m3fnuz --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1721766323:0;python3 ~/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=matmul.mlir --output_calls_mlir=calls.mlir --lhs_rhs_type=f8e4M3FNUZ --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1721766342:0;vi calls.mlir | |
: 1721766360:0;python3 ~/iree/tests/e2e/matmul/generate_e2e_matmul_tests.py --output_matmul_mlir=matmul.mlir --output_calls_mlir=calls.mlir --lhs_rhs_type=f8E4M3FNUZ --acc_type=f32 --shapes=gpu_large_aligned --compilation_info=LLVMGPUVectorDistributeMFMA | |
: 1721766587:0;iree-compile test.mlir --iree-hal-target-backends=rocm --iree-rocm-target-chip=gfx942 --iree-opt-const-eval=false --iree-global-opt-propagate-transposes=true --iree-global-opt-enable-fuse-horizontal-contractions=true --iree-flow-enable-aggressive-fusion=true --iree-opt-aggressively-propagate-transposes=true --iree-opt-outer-dim-concat=true --iree-vm-target-truncate-unsupported-floats --iree-llvmgpu-enable-prefetch=true --iree-opt-data-tiling=false --iree-codegen-gpu-native-math-precision=true --iree-codegen-llvmgpu-use-vector-distribution --iree-rocm-waves-per-eu=2 --iree-execution-model=async-external "--iree-preprocessing-pass-pipeline=builtin.module(iree-preprocessing-transpose-convolution-pipeline, util.func(iree-preprocessing-pad-to-intrinsics))" --iree-scheduling-dump-statistics-format=json --iree-scheduling-dump-statistics-file=compilation_info.json -o test_rocm.vmfb -mlir-print-ir-after-all 2> incorrect.txt | |
: 1721766594:0;vi incorrect.txt | |
: 1721766784:0;black tests/e2e/matmul/generate_e2e_matmul_tests.py | |
: 1721934479:0;rm -rf * | |
: 1721934512:0;iree-compile --iree-input-demote-i64-to-i32 --iree-hal-target-backends=llvm-cpu test.mlir -o test.vmfb | |
: 1721934988:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -iree-llvmcpu-stack-allocation-limit=100000 -mlir-print-ir-after-all 2> all.txt | |
: 1721935002:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -iree-llvmcpu-stack-allocation-limit=1000000 | |
: 1721935006:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -iree-llvmcpu-stack-allocation-limit=10000000 | |
: 1721935013:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -iree-llvmcpu-stack-allocation-limit=100000000 | |
: 1721935016:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -iree-llvmcpu-stack-allocation-limit=1000000000 | |
: 1721935019:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -iree-llvmcpu-stack-allocation-limit=10000000000 | |
: 1721935039:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -iree-llvmcpu-stack-allocation-limit=10000000000 test.mlir | |
: 1721935045:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -iree-llvmcpu-stack-allocation-limit=1000000000 test.mlir | |
: 1721987258:0;git ob avgpool_test | |
: 1721988785:0;cat aa.mlir | |
: 1721991431:0;git remote add yunfly https://github.com/Yun-Fly/llvm-project.git | |
: 1722266862:0;vi aa.mlir | |
: 1722432716:0;ls -, | |
: 1722434091:0;cmake --build ~/iree-build --target iree-run-tests -i | |
: 1722434581:0;cd ~/iree-build | |
: 1722434609:0;cd tests/e2e/matmul | |
: 1722434614:0;ctest --rerun-failed . -j 32 --verbose | |
: 1722436808:0;ctest --rerun-failed . --output-on-failure -R demote_con -vv | |
: 1722436982:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/prashant/iree/tests/e2e/reression/linal_ops.mlir -o check_reression_llvm-cpu_linal_ops.mlir_module.vmfb | |
: 1722436991:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/prashant/iree/tests/e2e/reression/linal_ops.mlir -o check_reression_llvm-cpu_linalg_ops.mlir_module.vmfb | |
: 1722437004:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/prashant/iree/tests/e2e/reression/linalg_ops.mlir -o check_reression_llvm-cpu_linalg_ops.mlir_module.vmfb | |
: 1722437070:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo /home/prashant/iree/tests/e2e/regression/linalg_ops.mlir -o check_reression_llvm-cpu_linalg_ops.mlir_module.vmfb | |
: 1722437075:0;rm check_reression_llvm-cpu_linalg_ops.mlir_module.vmfb | |
: 1722514715:0;cd third_party/torch-mlir | |
: 1722522793:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu /home/prashant/iree/tests/e2e/tensor_ops/extract_slice.mlir -o check_llvm-cpu_local-task_extract_slice.mlir_module.vmfb | |
: 1722522807:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu /home/prashant/iree/tests/e2e/tensor_ops/extract_slice.mlir -o check_llvm-cpu_local-task_extract_slice.mlir_module.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1722523146:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu tests/e2e/tensor_ops/pack_dynamic_inner_tiles.mlir -o check_llvm-cpu_local-task_extract_slice.mlir_module.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1722632792:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1722633687:0;clang-format compiler/src/iree/compiler/Codegen/LLVMCPU/LLVMCPUTileRootAndFuseProducerConsumer.cpp | |
: 1722858744:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=. --verbosity=1 | |
: 1722865232:0;cd burn_24 | |
: 1722865345:0;cd tmp | |
: 1722866268:0;test_conv.mlir | |
: 1722866287:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test_conv.mlir -o out1.vmfb | |
: 1722876367:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test_conv.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1722884048:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test_conv.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all1.txt | |
: 1722884437:0;mv Deeplabv3.default.onnx.torch.mlir.txt conv_mfma_dbg/deep.mlir | |
: 1722884484:0;vi deep.mlir | |
: 1722885762:0;ctest -j 128 ~/iree-build | |
: 1722886524:0;iree-benchmark-module --module=out1.vmfb --function=forward --input=1x513x513x3xf16 --device=local-task | |
: 1722886529:0;cat deep.mlir | |
: 1722886531:0;more deep | |
: 1722886535:0;more deep.mlir | |
: 1722886568:0;iree-benchmark-module --module=out1.vmfb --function=tf2onnx --input=1x513x513x3xf32 --device=local-task | |
: 1722926287:0;git ls | |
: 1722926312:0;git o tile_fuse_pipe | |
: 1722926337:0;git log | |
: 1722927338:0;iree-opt ~/test.mlir | |
: 1722927495:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-and-fuse{tiling-level=0}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1722927585:0;git ob fix_test | |
: 1722944826:0;build_tools/bazel_to_cmake/bazel_to_cmake.py --root_dir=compiler/src/iree/compiler/Codegen/LLVMCPU --verbosity=1 | |
: 1722946948:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" ~/conv_mfma_dbg/test.mlir | |
: 1722946980:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-reduction-and-fuse-input-operands{tiling-level=2}), canonicalize)" ~/conv_mfma_dbg/test.mlir | |
: 1722947908:0;iree-opt ~/conv_mfma_dbg/test.mlir | |
: 1722948043:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-reduction-and-fuse-input-operands{tiling-level=2}), canonicalize)" ~/conv_mfma_dbg/test.mlir | ~/llvm-project/mlir/utils/generate-test-checks.py > test.mlir | |
: 1722948113:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-reduction-and-fuse-input-operands{tiling-level=2}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-reduction-and-fuse-input-operands.mlir | ~/llvm-project/mlir/utils/generate-test-checks.py > test.mlir | |
: 1723029700:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -R ---matrix --csv | |
: 1723030592:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -R --C-matrix --csv | |
: 1723111506:0;iree-run-module --module=sfmax.vmfb --function=softmax --input=@42_inputs.npy --output=@42_out_repro.npy | |
: 1723118270:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-reduction-and-fuse-input-operands{tiling-level=2}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-reduction-and-fuse-input-operands.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-reduction-and-fuse-input-operands.mlir | |
: 1723118280:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-reduction-and-fuse-input-operands{tiling-level=2}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-reduction-and-fuse-input-operands.mlir | |
: 1723118304:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-and-fuse{tiling-level=2}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-reduction-and-fuse-input-operands.mlir | |
: 1723118436:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-and-fuse{tiling-level=2}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-reduction-and-fuse-input-operands.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-reduction-and-fuse-input-operands.mlir | |
: 1723119032:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=+avx,+avx2,+fma,+f16c,+avx512f,+avx512vl,+avx512cd,+avx512bw,+avx512dq --iree-opt-data-tiling --iree-global-opt-enable-early-materialization=false --iree-llvmcpu-enable-ukernels=all /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.mlir -o /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" --iree-llvmcpu-embedded-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" --iree-llvmcpu-wasm-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" | |
: 1723119042:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=+avx,+avx2,+fma,+f16c,+avx512f,+avx512vl,+avx512cd,+avx512bw,+avx512dq --iree-opt-data-tiling --iree-global-opt-enable-early-materialization=false --iree-llvmcpu-enable-ukernels=all /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.mlir -o /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" --iree-llvmcpu-embedded-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" --iree-llvmcpu-wasm-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" -mlir-print-ir-after-all | |
: 1723119062:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=+avx,+avx2,+fma,+f16c,+avx512f,+avx512vl,+avx512cd,+avx512bw,+avx512dq --iree-opt-data-tiling --iree-global-opt-enable-early-materialization=false --iree-llvmcpu-enable-ukernels=all /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.mlir -o /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" --iree-llvmcpu-embedded-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" --iree-llvmcpu-wasm-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" -mlir-print-ir-after-all 2> xyz.txt | |
: 1723120103:0;vi bazel-bin/tests/e2e/linalg_ext_ops/check_llvm-cpu_local-task_attention.mlir | |
: 1723120151:0;vi tests/e2e/linalg_ext_ops/attention.mlir | |
: 1723120732:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=+avx,+avx2,+fma,+f16c,+avx512f,+avx512vl,+avx512cd,+avx512bw,+avx512dq --iree-opt-data-tiling --iree-global-opt-enable-early-materialization=false --iree-llvmcpu-enable-ukernels=all /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.mlir -o /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" --iree-llvmcpu-embedded-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" --iree-llvmcpu-wasm-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" -mlir-print-ir-after-all 2> xyz.txt -mlir-disable-threading | |
: 1723123489:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMCPU/LLVMCPUTileReductionAndFuseInputOperands.cpp | |
: 1723200750:0;git ob new_test | |
: 1723201612:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMCPU/Passes.td | |
: 1723204662:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1723204677:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1723204711:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0, only-fuse-producer-input-operands=1}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1723204741:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0, only-fuse-producer-input-operands=true}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1723204869:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{only-fuse-producer-input-operands=true}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1723205692:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0 only-fuse-producer-input-operands=true}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1723205787:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=2 only-fuse-producer-input-operands=true}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --split-input-file --check-prefix=CHECK-REDUCTION | |
: 1723206354:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=+avx,+avx2,+fma,+f16c,+avx512f,+avx512vl,+avx512cd,+avx512bw,+avx512dq --iree-opt-data-tiling --iree-global-opt-enable-early-materialization=false --iree-llvmcpu-enable-ukernels=all /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.mlir -o /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" --iree-llvmcpu-embedded-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" --iree-llvmcpu-wasm-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" | |
: 1723213383:0;// Copyright 2020 The IREE Authors\ | |
//\ | |
// Licensed under the Apache License v2.0 with LLVM Exceptions.\ | |
// See https://llvm.org/LICENSE.txt for license information.\ | |
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception\ | |
\ | |
#include "iree-dialects/Dialect/LinalgTransform/Passes.h"\ | |
#include "iree/compiler/Codegen/Common/CPU/Passes.h"\ | |
#include "iree/compiler/Codegen/Common/PassUtils.h"\ | |
#include "iree/compiler/Codegen/Common/Passes.h"\ | |
#include "iree/compiler/Codegen/Common/TileSizeSelection.h"\ | |
#include "iree/compiler/Codegen/LLVMCPU/Passes.h"\ | |
#include "iree/compiler/Dialect/LinalgExt/Transforms/Passes.h"\ | |
#include "iree/compiler/Utils/PassUtils.h"\ | |
#include "llvm/ADT/TypeSwitch.h"\ | |
#include "llvm/Support/CommandLine.h"\ | |
#include "mlir/Conversion/ArithToArmSME/ArithToArmSME.h"\ | |
#include "mlir/Conversion/ArmSMEToLLVM/ArmSMEToLLVM.h"\ | |
#include "mlir/Conversion/ArmSMEToSCF/ArmSMEToSCF.h"\ | |
#include "mlir/Conversion/ComplexToStandard/ComplexToStandard.h"\ | |
#include "mlir/Conversion/ReconcileUnrealizedCasts/ReconcileUnrealizedCasts.h"\ | |
#include "mlir/Conversion/SCFToControlFlow/SCFToControlFlow.h"\ | |
#include "mlir/Conversion/VectorToArmSME/VectorToArmSME.h"\ | |
#include "mlir/Conversion/VectorToLLVM/ConvertVectorToLLVMPass.h"\ | |
#include "mlir/Dialect/Arith/Transforms/Passes.h"\ | |
#include "mlir/Dialect/ArmSME/Transforms/Passes.h"\ | |
#include "mlir/Dialect/Func/IR/FuncOps.h"\ | |
#include "mlir/Dialect/Linalg/Passes.h"\ | |
#include "mlir/Dialect/MemRef/Transforms/Passes.h"\ | |
#include "mlir/Pass/PassManager.h"\ | |
#include "mlir/Transforms/Passes.h"\ | |
\ | |
#define DEBUG_TYPE "iree-llvmcpu-pass-pipelines"\ | |
\ | |
namespace mlir::iree_compiler {\ | |
\ | |
/// Command line options used purely for development purposes. Not to be relied\ | |
/// on in any way.\ | |
static llvm::cl::opt<bool> clFailOnOutOfBoundsStackAllocation(\ | |
"iree-llvmcpu-fail-on-out-of-bounds-stack-allocation",\ | |
llvm::cl::desc("fail if the upper bound of dynamic stack allocation cannot "\ | |
"be solved"),\ | |
llvm::cl::init(true));\ | |
\ | |
static llvm::cl::opt<bool> clFailOnLargeVector(\ | |
"iree-llvmcpu-fail-on-large-vector",\ | |
llvm::cl::desc("fail if there are operations with large vectors"),\ | |
llvm::cl::init(true));\ | |
\ | |
static llvm::cl::opt<bool> clCheckLinalgVectorization(\ | |
"iree-llvmcpu-check-linalg-vectorization",\ | |
llvm::cl::desc(\ | |
"Runs the pass to check if all the Linalg ops are vectorized"),\ | |
llvm::cl::init(false));\ | |
\ | |
static llvm::cl::opt<bool> clUseFastMinMaxOps(\ | |
"iree-llvmcpu-use-fast-min-max-ops",\ | |
llvm::cl::desc(\ | |
"Use `arith.minf/maxf` instead of `arith.minimumf/maximumf` ops"),\ | |
llvm::cl::init(false));\ | |
\ | |
static llvm::cl::opt<bool> clEnableReassociateFpReductions(\ | |
"iree-llvmcpu-reassociate-fp-reductions",\ | |
llvm::cl::desc("Enables reassociation for FP reductions"),\ | |
llvm::cl::init(true));\ | |
\ | |
static llvm::cl::opt<bool> clSkipIntermediateRoundings(\ | |
"iree-llvmcpu-skip-intermediate-roundings",\ | |
llvm::cl::desc(\ | |
"Allow skipping intermediate roundings. For example, in f16 matmul "\ | |
"kernels on targets with only f32 arithmetic, we have to perform each "\ | |
"multiply-accumulate in f32, and if this flag is false, then we have "\ | |
"to round those f32 accumulators to the nearest f16 every time, which "\ | |
"is slow."),\ | |
llvm::cl::init(true));\ | |
\ | |
static llvm::cl::opt<bool> clInstrumentMemoryAccesses{\ | |
"iree-llvmcpu-instrument-memory-accesses",\ | |
llvm::cl::desc("Instruments memory accesses in dispatches when dispatch "\ | |
"instrumentation is enabled."),\ | |
llvm::cl::init(false)};\ | |
\ | |
static llvm::cl::opt<bool> clUseSoftmaxInterFusion(\ | |
"iree-llvmcpu-use-decompose-softmax-fuse",\ | |
llvm::cl::desc("Enables inter-pass fusion for the DecomposeSoftmax pass."),\ | |
llvm::cl::init(true));\ | |
\ | |
static llvm::cl::opt<bool> clEnableVectorContractCustomKernels(\ | |
"iree-llvmcpu-enable-vector-contract-custom-kernels",\ | |
llvm::cl::desc("Enables vector contract custom kernels for "\ | |
"LLVMCPUMmt4dVectorLowering pass."),\ | |
llvm::cl::init(false));\ | |
\ | |
// By default, IREE does not enable the Armv9-A streaming SVE mode in the\ | |
// presence of scalable vectors (even when using `+sme`), as currently there's\ | |
// no cost model of when it could be beneficial. This flag will effectively make\ | |
// IREE/LLVM switch from SVE to SSVE in dispatch regions with supported\ | |
// scalable vector operations.\ | |
static llvm::cl::opt<bool> clForceArmStreaming(\ | |
"iree-llvmcpu-force-arm-streaming",\ | |
llvm::cl::desc(\ | |
"Enables Armv9-A streaming SVE mode for any dispatch region that "\ | |
"contains supported scalable vector operations (i.e., use SSVE rather "\ | |
"than SVE). Requires the +sme feature flag."),\ | |
llvm::cl::init(false));\ | |
\ | |
static void addTileAndDistributePasses(OpPassManager &funcPassManager) {\ | |
funcPassManager.addPass(createTileAndDistributeToWorkgroupsPass());\ | |
funcPassManager.addPass(createCSEPass());\ | |
funcPassManager.addPass(createConvertToDestinationPassingStylePass());\ | |
funcPassManager.addPass(createFoldAffineMinInDistributedLoopsPass());\ | |
funcPassManager.addPass(createCanonicalizerPass());\ | |
funcPassManager.addPass(createCSEPass());\ | |
funcPassManager.addPass(createFuseTensorPadWithConsumerPass());\ | |
funcPassManager.addPass(createConcretizePadResultShapePass());\ | |
}\ | |
\ | |
//===---------------------------------------------------------------------===//\ | |
// Codegen configuration verifications.\ | |
//===---------------------------------------------------------------------===//\ | |
\ | |
static bool isValidInterchange(ArrayRef<int64_t> interchange, int numLoops) {\ | |
if (interchange.empty())\ | |
return true;\ | |
llvm::SmallDenseSet<int64_t> s;\ | |
s.insert(interchange.begin(), interchange.end());\ | |
for (int i = 0; i < numLoops; ++i) {\ | |
if (!s.contains(i))\ | |
return false;\ | |
}\ | |
return true;\ | |
}\ | |
\ | |
LogicalResult verifyDoubleTilingExpertPassPipelineConfig(\ | |
Operation *op, TilingConfig &tilingConfig,\ | |
IREE::Codegen::TranslationInfoAttr translationInfo,\ | |
ArrayRef<int64_t> workgroupSize) {\ | |
if (!workgroupSize.empty()) {\ | |
return op->emitOpError(\ | |
"expected workgroup size to be empty for CPU pipelines");\ | |
}\ | |
\ | |
// Verify that the translation info is using the right pipeline.\ | |
if (translationInfo.getDispatchLoweringPassPipeline() !=\ | |
IREE::Codegen::DispatchLoweringPassPipeline::CPUDoubleTilingExpert) {\ | |
return op->emitOpError("expected pipeline in translation_info to be ")\ | |
<< stringifyEnum(IREE::Codegen::DispatchLoweringPassPipeline::\ | |
CPUDoubleTilingExpert);\ | |
}\ | |
\ | |
if (tilingConfig.getNumTilingLevels() == 6) {\ | |
// TODO: update verification.\ | |
return success();\ | |
}\ | |
\ | |
if (tilingConfig.getNumTilingLevels() != 4) {\ | |
return op->emitOpError("expected four tiling levels, got ")\ | |
<< tilingConfig.getNumTilingLevels();\ | |
}\ | |
\ | |
auto interfaceOp = dyn_cast_or_null<TilingInterface>(op);\ | |
if (interfaceOp) {\ | |
llvm::SmallDenseSet<unsigned> pLoopsSet;\ | |
for (auto [index, iteratorType] :\ | |
llvm::enumerate(interfaceOp.getLoopIteratorTypes())) {\ | |
if (iteratorType == utils::IteratorType::parallel) {\ | |
pLoopsSet.insert(index);\ | |
}\ | |
}\ | |
\ | |
SmallVector<int64_t> secondLevelTileSizes;\ | |
std::tie(secondLevelTileSizes, std::ignore) =\ | |
tilingConfig.getVectorCommonParallelSizes();\ | |
for (auto [index, tileSize] : llvm::enumerate(secondLevelTileSizes)) {\ | |
if (tileSize != 0 && !pLoopsSet.contains(index)) {\ | |
return op->emitOpError(\ | |
"expected only parallel dims to be set in the second tiling "\ | |
"level, got ")\ | |
<< index << "-th tile size set";\ | |
}\ | |
}\ | |
\ | |
SmallVector<int64_t> thirdLevelTileSizes;\ | |
std::tie(thirdLevelTileSizes, std::ignore) =\ | |
tilingConfig.getVectorReductionSizes();\ | |
for (auto [index, tileSize] : llvm::enumerate(thirdLevelTileSizes)) {\ | |
if (tileSize != 0 && pLoopsSet.contains(index)) {\ | |
return op->emitOpError(\ | |
"expected only reduction dims to be set in the third tiling "\ | |
"level, got ")\ | |
<< index << "-th tile size set";\ | |
}\ | |
}\ | |
}\ | |
\ | |
// Verify interchange\ | |
auto tileSizesForLevel = tilingConfig.getTileSizes();\ | |
for (int level = 0; level < tilingConfig.getNumTilingLevels(); level++) {\ | |
auto interchange = tilingConfig.getTileInterchangeSizes(level);\ | |
auto &tileSizes = tileSizesForLevel[level];\ | |
if (!isValidInterchange(interchange, tileSizes.size())) {\ | |
return op->emitOpError("expected [0, ")\ | |
<< tileSizes.size() << ") to be set exactly once in interchange #"\ | |
<< level;\ | |
}\ | |
}\ | |
\ | |
// Verify that native vector size is empty.\ | |
SmallVector<int64_t> nativeVectorSize = tilingConfig.getNativeVectorSizes();\ | |
if (!nativeVectorSize.empty()) {\ | |
return op->emitOpError("native_vector_size must be empty");\ | |
}\ | |
return success();\ | |
}\ | |
\ | |
LogicalResult verifyConvTileAndDecomposeExpertConfig(\ | |
Operation *op, TilingConfig &tilingConfig,\ | |
IREE::Codegen::TranslationInfoAttr translationInfo,\ | |
ArrayRef<int64_t> workgroupSize) {\ | |
if (!isa<linalg::ConvolutionOpInterface>(op))\ | |
return success();\ | |
\ | |
if (tilingConfig.getNumTilingLevels() == 6) {\ | |
// TODO: update verification.\ | |
return success();\ | |
}\ | |
\ | |
if (tilingConfig.getNumTilingLevels() != 4) {\ | |
return op->emitOpError("expected four tiling levels, got ")\ | |
<< tilingConfig.getNumTilingLevels();\ | |
}\ | |
\ | |
linalg::LinalgOp linalgOp = cast<linalg::LinalgOp>(op);\ | |
SmallVector<int64_t> shape = linalgOp.getStaticLoopRanges();\ | |
for (auto sizes : tilingConfig.getTileSizes()) {\ | |
for (auto [i, size] : llvm::enumerate(sizes)) {\ | |
if (size == 1)\ | |
shape[i] = 1;\ | |
if (shape[i] == -1 || size == 0)\ | |
continue;\ | |
if (shape[i] % size != 0) {\ | |
shape[i] = -1;\ | |
} else {\ | |
shape[i] = size;\ | |
}\ | |
}\ | |
}\ | |
\ | |
int64_t khSize, kwSize, ohSize, owSize;\ | |
auto isSizeExtracted =\ | |
TypeSwitch<Operation *, LogicalResult>(op)\ | |
.Case<linalg::Conv2DNhwcHwcfOp, linalg::DepthwiseConv2DNhwcHwcOp,\ | |
linalg::PoolingNhwcSumOp, linalg::PoolingNhwcMaxOp,\ | |
linalg::PoolingNhwcMaxUnsignedOp, linalg::PoolingNhwcMinOp,\ | |
linalg::PoolingNhwcMinUnsignedOp>([&](auto) {\ | |
// Shape: N, OH, OW, OC, KH, KW, (IC)\ | |
khSize = shape[4];\ | |
kwSize = shape[5];\ | |
ohSize = shape[1];\ | |
owSize = shape[2];\ | |
return success();\ | |
})\ | |
.Case<linalg::Conv2DNchwFchwOp>([&](auto) {\ | |
// Shape: N, OC, OH, OW, (IC), KH, KW\ | |
khSize = shape[5];\ | |
kwSize = shape[6];\ | |
ohSize = shape[2];\ | |
owSize = shape[3];\ | |
return success();\ | |
})\ | |
.Case<linalg::PoolingNchwSumOp, linalg::PoolingNchwMaxOp>([&](auto) {\ | |
// Shape: N, OC, OH, OW, KH, KW\ | |
khSize = shape[4];\ | |
kwSize = shape[5];\ | |
ohSize = shape[2];\ | |
owSize = shape[3];\ | |
return success();\ | |
})\ | |
.Default([&](auto) { return failure(); });\ | |
if (failed(isSizeExtracted)) {\ | |
return op->emitOpError("unsupported conv types");\ | |
}\ | |
\ | |
bool removeH = (khSize == 1 && ohSize == 1);\ | |
bool removeW = (kwSize == 1 && owSize == 1);\ | |
if (!removeH && !removeW) {\ | |
return op->emitOpError("can't decompose the conv op");\ | |
}\ | |
\ | |
return success();\ | |
}\ | |
\ | |
//===---------------------------------------------------------------------===//\ | |
// Codegen pipelines.\ | |
//===---------------------------------------------------------------------===//\ | |
\ | |
void buildLLVMCPUVectorLoweringPipeline(\ | |
OpPassManager &funcPassManager,\ | |
const LLVMCPUVectorLoweringPassOptions &options) {\ | |
funcPassManager.addPass(createLLVMCPUDropVectorUnitDimsPass());\ | |
funcPassManager.addPass(createLLVMCPUVirtualVectorLoweringPass(\ | |
LLVMCPUVirtualVectorLoweringPassOptions{options.splitVectorTransfersTo,\ | |
options.enableArmI8mm}));\ | |
\ | |
// Make sure we remove redundant vector ops (e.g., vector tranposes) before we\ | |
// lower them and can't be optimized away anymore.\ | |
funcPassManager.addPass(createCanonicalizerPass());\ | |
\ | |
funcPassManager.addPass(createLLVMCPUVectorTransferLoweringPass());\ | |
funcPassManager.addPass(createLLVMCPUVectorTransposeLoweringPass(\ | |
LLVMCPUVectorTransposeLoweringPassOptions{\ | |
options.lowerVectorTransposeToAVX2}));\ | |
\ | |
// Potentially removes shape_cast and broadcast on unit dims before shape_cast\ | |
// lowering.\ | |
funcPassManager.addPass(createCanonicalizerPass());\ | |
\ | |
// 'vector.shape_cast' are very expensive operations that are even generated\ | |
// by some of the lowerings above (e.g., transpose lowering). There are\ | |
// chances to cancel them out if they are not lowered too early so we lower\ | |
// them at the very end of the pass.\ | |
funcPassManager.addPass(createLLVMCPUVectorShapeCastLoweringPass());\ | |
}\ | |
\ | |
void addCPUBufferOpsTileAndVectorizePipeline(\ | |
OpPassManager &funcPassManager, TilingConfig &tilingConfig,\ | |
LLVMCPUPipelineOptions &pipelineOpt) {\ | |
addTileAndDistributePasses(funcPassManager);\ | |
\ | |
// Skip tiling reduction loops because this is expected to apply on copy ops\ | |
// only.\ | |
funcPassManager.addPass(\ | |
createLLVMCPUTilePass(tilingConfig.getVectorCommonParallelLevel()));\ | |
funcPassManager.addPass(createLLVMCPUPeelPass());\ | |
{\ | |
GenericVectorizationPassOptions options;\ | |
options.useConfiguredVectorSizes = pipelineOpt.useConfiguredVectorSizes;\ | |
options.enableVectorMasking = pipelineOpt.enableVectorMasking;\ | |
options.vectorizeGatherAccesses = true;\ | |
funcPassManager.addPass(createGenericVectorizationPass(options));\ | |
funcPassManager.addPass(createOptimizeTensorInsertExtractSlicesPass());\ | |
funcPassManager.addPass(createCanonicalizerPass());\ | |
funcPassManager.addPass(createCSEPass());\ | |
if (clFailOnLargeVector) {\ | |
funcPassManager.addPass(createLLVMCPUVerifyVectorSizeLegalityPass());\ | |
}\ | |
}\ | |
\ | |
// Run IREE specific passes before vector lowering expert.\ | |
funcPassManager.addPass(createRemoveSingleIterationLoopPass());\ | |
\ | |
{\ | |
LLVMCPUVectorLoweringPassOptions options;\ | |
options.lowerVectorTransposeToAVX2 = pipelineOpt.lowerToAVX2;\ | |
options.splitVectorTransfersTo = "linalg-copy";\ | |
options.enableArmI8mm = pipelineOpt.enableAArch64I8mm;\ | |
buildLLVMCPUVectorLoweringPipeline(funcPassManager, options);\ | |
}\ | |
}\ | |
\ | |
void addMultiTilingExpertPassPipeline(OpPassManager &funcPassManager,\ | |
TilingConfig &tilingConfig,\ | |
LLVMCPUPipelineOptions &pipelineOpt) {\ | |
addTileAndDistributePasses(funcPassManager);\ | |
\ | |
SmallVector<int64_t> allFusableLevels(tilingConfig.getFusableLevels());\ | |
// Apply tile and fuse to all the non-distribution fusable levels. Skip\ | |
// distribution level as that level has been fused already.\ | |
if (allFusableLevels.size() > 1) {\ | |
llvm::SmallSetVector<int64_t, 4> fusableLevels(allFusableLevels.begin(),\ | |
allFusableLevels.end());\ | |
for (int i = 0; i < tilingConfig.getNumTilingLevels(); ++i) {\ | |
if (i == tilingConfig.getDistributionLevel())\ | |
continue;\ | |
if (fusableLevels.contains(i)) {\ | |
funcPassManager.addPass(createLLVMCPUTileAndFusePass(i));\ | |
funcPassManager.addPass(createFuseTensorPadWithConsumerPass());\ | |
funcPassManager.addPass(createConcretizePadResultShapePass());\ | |
continue;\ | |
}\ | |
\ | |
if (i == tilingConfig.getVectorReductionLevel()) {\ | |
// Run SplitReductionPass before the final reduction Fuse pass, because\ | |
// SplitReductionPass takes care of banked-tiling.\ | |
funcPassManager.addPass(\ | |
createLLVMCPUSplitReductionPass(clEnableReassociateFpReductions));\ | |
funcPassManager.addPass(createLLVMCPUTilePass(i));\ | |
continue;\ | |
}\ | |
\ | |
funcPassManager.addPass(createLLVMCPUTilePass(i));\ | |
}\ | |
}\ | |
\ | |
if (pipelineOpt.enablePeeling) {\ | |
funcPassManager.addPass(createLLVMCPUPeelPass());\ | |
}\ | |
\ | |
if (pipelineOpt.enableAArch64SSVE) {\ | |
funcPassManager.addPass(createLLVMCPU2DScalableTo1DScalablePass());\ | |
}\ | |
\ | |
{\ | |
funcPassManager.addPass(createVectorizePadPass());\ | |
if (pipelineOpt.decomposePackUnPackOps) {\ | |
funcPassManager.addPass(createDecomposePackUnPackOpsPass());\ | |
funcPassManager.addPass(createCanonicalizerPass());\ | |
funcPassManager.addPass(createCSEPass());\ | |
}\ | |
\ | |
GenericVectorizationPassOptions options;\ | |
options.useConfiguredVectorSizes = pipelineOpt.useConfiguredVectorSizes;\ | |
options.enableVectorMasking = pipelineOpt.enableVectorMasking;\ | |
options.vectorizePadding = true;\ | |
options.vectorizeGatherAccesses = true;\ | |
funcPassManager.addPass(createGenericVectorizationPass(options));\ | |
funcPassManager.addPass(createOptimizeTensorInsertExtractSlicesPass());\ | |
funcPassManager.addPass(createCanonicalizerPass());\ | |
funcPassManager.addPass(createCSEPass());\ | |
if (clFailOnLargeVector) {\ | |
funcPassManager.addPass(createLLVMCPUVerifyVectorSizeLegalityPass());\ | |
}\ | |
}\ | |
\ | |
addCPUBufferizePasses(funcPassManager);\ | |
\ | |
// Run IREE specific passes before vector lowering expert.\ | |
funcPassManager.addPass(createRemoveSingleIterationLoopPass());\ | |
\ | |
{\ | |
LLVMCPUVectorLoweringPassOptions options;\ | |
options.lowerVectorTransposeToAVX2 = pipelineOpt.lowerToAVX2;\ | |
options.splitVectorTransfersTo = "linalg-copy";\ | |
options.enableArmI8mm = pipelineOpt.enableAArch64I8mm;\ | |
buildLLVMCPUVectorLoweringPipeline(funcPassManager, options);\ | |
}\ | |
}\ | |
\ | |
void addConvTileAndDecomposeExpertPassPipeline(\ | |
OpPassManager &funcPassManager, TilingConfig &tilingConfig,\ | |
LLVMCPUPipelineOptions &pipelineOpt) {\ | |
addTileAndDistributePasses(funcPassManager);\ | |
\ | |
// Run LLVMTileAndFuse firstly in case that we have fill + conv + generic\ | |
// ops. At this stage, we do not apply vectorization. The reduction dim won't\ | |
// get tiled if the case is conv + generic op. In this case, we have to tile\ | |
// along reduction dim again, which needs them to be Linalg ops form.\ | |
\ | |
funcPassManager.addPass(createLLVMCPUTileAndFusePass(\ | |
tilingConfig.getVectorCommonParallelLevel()));\ | |
funcPassManager.addPass(createFuseTensorPadWithConsumerPass());\ | |
funcPassManager.addPass(createConcretizePadResultShapePass());\ | |
\ | |
funcPassManager.addPass(\ | |
createLLVMCPUTilePass(tilingConfig.getVectorReductionLevel()));\ | |
funcPassManager.addPass(\ | |
createLLVMCPUTileAndFusePass(tilingConfig.getVectorInnerParallelLevel()));\ | |
funcPassManager.addPass(createDecomposeConvolutionToLowerDimOpsPass());\ | |
\ | |
funcPassManager.addPass(createFuseTensorPadWithConsumerPass());\ | |
funcPassManager.addPass(createConcretizePadResultShapePass());\ | |
\ | |
if (pipelineOpt.enablePeeling) {\ | |
funcPassManager.addPass(createLLVMCPUPeelPass());\ | |
}\ | |
\ | |
{\ | |
funcPassManager.addPass(createVectorizePadPass());\ | |
GenericVectorizationPassOptions options;\ | |
options.useConfiguredVectorSizes = pipelineOpt.useConfiguredVectorSizes;\ | |
options.enableVectorMasking = pipelineOpt.enableVectorMasking;\ | |
options.vectorizePadding = true;\ | |
options.vectorizeGatherAccesses = true;\ | |
funcPassManager.addPass(createGenericVectorizationPass(options));\ | |
funcPassManager.addPass(createOptimizeTensorInsertExtractSlicesPass());\ | |
funcPassManager.addPass(createCanonicalizerPass());\ | |
funcPassManager.addPass(createCSEPass());\ | |
if (clFailOnLargeVector) {\ | |
funcPassManager.addPass(createLLVMCPUVerifyVectorSizeLegalityPass());\ | |
}\ | |
}\ | |
\ | |
// Eliminate redundant transfer_read/write to avoid stack allocations.\ | |
funcPassManager.addPass(createOptimizeVectorTransferPass(/*flatten=*/true));\ | |
\ | |
addCPUBufferizePasses(funcPassManager);\ | |
\ | |
// Run IREE specific passes before vector lowering expert.\ | |
funcPassManager.addPass(createRemoveSingleIterationLoopPass());\ | |
\ | |
{\ | |
LLVMCPUVectorLoweringPassOptions options;\ | |
options.lowerVectorTransposeToAVX2 = pipelineOpt.lowerToAVX2;\ | |
options.splitVectorTransfersTo = "shuffle";\ | |
options.enableArmI8mm = pipelineOpt.enableAArch64I8mm;\ | |
buildLLVMCPUVectorLoweringPipeline(funcPassManager, options);\ | |
}\ | |
}\ | |
\ | |
void addMmt4dTilingExpertPassPipeline(OpPassManager &funcPassManager,\ | |
TilingConfig &tilingConfig,\ | |
LLVMCPUPipelineOptions &pipelineOpt) {\ | |
addTileAndDistributePasses(funcPassManager);\ | |
\ | |
funcPassManager.addPass(createLLVMCPUTileAndFusePass(\ | |
static_cast<int64_t>(tilingConfig.getVectorCommonParallelLevel())));\ | |
// The below two passes are nop if the "mmt4d" is explicitly excluded in the\ | |
// ukernels attribute.\ | |
funcPassManager.addPass(createCPUPrepareUkernelsPass());\ | |
funcPassManager.addPass(\ | |
createCPULowerToUKernelsPass(clSkipIntermediateRoundings));\ | |
funcPassManager.addPass(createLLVMCPUTilePass(\ | |
static_cast<int64_t>(tilingConfig.getVectorReductionLevel())));\ | |
\ | |
{\ | |
GenericVectorizationPassOptions options;\ | |
options.enableVectorMasking = pipelineOpt.enableVectorMasking;\ | |
options.vectorizePadding = true;\ | |
options.vectorizeGatherAccesses = true;\ | |
funcPassManager.addPass(createGenericVectorizationPass(options));\ | |
funcPassManager.addPass(createOptimizeTensorInsertExtractSlicesPass());\ | |
funcPassManager.addPass(createCanonicalizerPass());\ | |
funcPassManager.addPass(createCSEPass());\ | |
if (clFailOnLargeVector) {\ | |
funcPassManager.addPass(createLLVMCPUVerifyVectorSizeLegalityPass());\ | |
}\ | |
}\ | |
\ | |
funcPassManager.addPass(createCanonicalizerPass());\ | |
funcPassManager.addPass(createCSEPass());\ | |
\ | |
addCPUBufferizePasses(funcPassManager);\ | |
\ | |
// Vector lowering of Mmt4d.\ | |
funcPassManager.addPass(createLLVMCPUMmt4dVectorLoweringPass(\ | |
LLVMCPUMmt4dVectorLoweringPassOptions{\ | |
clEnableVectorContractCustomKernels}));\ | |
\ | |
// Generic vector lowering.\ | |
LLVMCPUVectorLoweringPassOptions options;\ | |
options.lowerVectorTransposeToAVX2 = pipelineOpt.lowerToAVX2;\ | |
options.splitVectorTransfersTo = "linalg-copy";\ | |
options.enableArmI8mm = pipelineOpt.enableAArch64I8mm;\ | |
buildLLVMCPUVectorLoweringPipeline(funcPassManager, options);\ | |
}\ | |
\ | |
void addCPUDataTilingPipeline(OpPassManager &funcPassManager,\ | |
TilingConfig &tilingConfig,\ | |
LLVMCPUPipelineOptions &pipelineOpt) {\ | |
addTileAndDistributePasses(funcPassManager);\ | |
\ | |
// The below two passes are nop if pack/unpack is not specified in ukernels\ | |
// attribute. By default, they are disabled.\ | |
funcPassManager.addPass(createCPUPrepareUkernelsPass());\ | |
funcPassManager.addPass(\ | |
createCPULowerToUKernelsPass(clSkipIntermediateRoundings));\ | |
\ | |
funcPassManager.addPass(\ | |
createLLVMCPUTilePass(tilingConfig.getVectorCommonParallelLevel()));\ | |
if (pipelineOpt.decomposePackUnPackOps) {\ | |
funcPassManager.addPass(createDecomposePackUnPackOpsPass());\ | |
}\ | |
\ | |
{\ | |
GenericVectorizationPassOptions options;\ | |
options.useConfiguredVectorSizes = pipelineOpt.useConfiguredVectorSizes;\ | |
options.vectorizePadding = true;\ | |
options.enableVectorMasking = pipelineOpt.enableVectorMasking;\ | |
funcPassManager.addPass(createGenericVectorizationPass(options));\ | |
funcPassManager.addPass(createOptimizeTensorInsertExtractSlicesPass());\ | |
funcPassManager.addPass(createCanonicalizerPass());\ | |
funcPassManager.addPass(createCSEPass());\ | |
if (clFailOnLargeVector) {\ | |
funcPassManager.addPass(createLLVMCPUVerifyVectorSizeLegalityPass());\ | |
}\ | |
}\ | |
\ | |
addCPUBufferizePasses(funcPassManager);\ | |
\ | |
{\ | |
LLVMCPUVectorLoweringPassOptions options;\ | |
options.lowerVectorTransposeToAVX2 = pipelineOpt.lowerToAVX2;\ | |
options.splitVectorTransfersTo = "linalg-copy";\ | |
options.enableArmI8mm = pipelineOpt.enableAArch64I8mm;\ | |
buildLLVMCPUVectorLoweringPipeline(funcPassManager, options);\ | |
}\ | |
}\ | |
\ | |
void addCPULinalgExtTileAndVectorizePipeline(\ | |
OpPassManager &funcPassManager, TilingConfig &tilingConfig,\ | |
LLVMCPUPipelineOptions &pipelineOpt) {\ | |
addTileAndDistributePasses(funcPassManager);\ | |
funcPassManager.addPass(\ | |
createLLVMCPUTilePass(tilingConfig.getVectorCommonParallelLevel()));\ | |
// TODO: Remove the pass once we have PartialReductionOpInterface implemented\ | |
// for AttentionOp.\ | |
funcPassManager.addPass(\ | |
IREE::LinalgExt::createConvertAttentionToOnlineAttentionPass());\ | |
funcPassManager.addPass(\ | |
createLLVMCPUTilePass(tilingConfig.getVectorReductionLevel()));\ | |
funcPassManager.addPass(\ | |
IREE::LinalgExt::createDecomposeWinogradTransformPass());\ | |
funcPassManager.addPass(IREE::LinalgExt::createDecomposeAttentionPass());\ | |
\ | |
{\ | |
GenericVectorizationPassOptions options;\ | |
options.useConfiguredVectorSizes = pipelineOpt.useConfiguredVectorSizes;\ | |
options.enableVectorMasking = pipelineOpt.enableVectorMasking;\ | |
funcPassManager.addPass(createGenericVectorizationPass(options));\ | |
funcPassManager.addPass(createOptimizeTensorInsertExtractSlicesPass());\ | |
funcPassManager.addPass(createCanonicalizerPass());\ | |
funcPassManager.addPass(createCSEPass());\ | |
if (clFailOnLargeVector) {\ | |
funcPassManager.addPass(createLLVMCPUVerifyVectorSizeLegalityPass());\ | |
}\ | |
}\ | |
\ | |
addCPUBufferizePasses(funcPassManager);\ | |
\ | |
{\ | |
LLVMCPUVectorLoweringPassOptions options;\ | |
options.lowerVectorTransposeToAVX2 = pipelineOpt.lowerToAVX2;\ | |
options.splitVectorTransfersTo = "linalg-copy";\ | |
options.enableArmI8mm = pipelineOpt.enableAArch64I8mm;\ | |
buildLLVMCPUVectorLoweringPipeline(funcPassManager, options);\ | |
}\ | |
}\ | |
\ | |
void addCPUDefaultPassPipeline(OpPassManager &funcPassManager) {\ | |
addTileAndDistributePasses(funcPassManager);\ | |
addCPUBufferizePasses(funcPassManager);\ | |
}\ | |
\ | |
static void addLowerToLLVMPasses(OpPassManager &modulePassManager,\ | |
bool enableAArch64SME) {\ | |
// TODO: Remove the following pass and plumb support for #hal.descriptor_type\ | |
// memory space through the stack.\ | |
FunctionLikeNest(modulePassManager)\ | |
.addPass(createEraseHALDescriptorTypeFromMemRefPass);\ | |
\ | |
// Lower `ukernel.*` ops to function calls\ | |
modulePassManager.addPass(createLowerUKernelOpsToCallsPass());\ | |
\ | |
FunctionLikeNest(modulePassManager)\ | |
// LinalgExt -> SCF\ | |
.addPass(IREE::LinalgExt::createLinalgExtToLoopsPass)\ | |
// Linalg -> SCF\ | |
.addPass(createMemrefCopyToLinalgPass)\ | |
.addPredicatedPass(clCheckLinalgVectorization,\ | |
createLLVMCPUEmitVectorizationRemarksPass)\ | |
.addPass(createConvertLinalgToLoopsPass)\ | |
.addPass(createConvertBf16ArithToF32Pass)\ | |
.addPass(createConvertBf16ToUInt16BuffersPass)\ | |
.addPass(createCanonicalizerPass)\ | |
.addPass(createCSEPass);\ | |
\ | |
// Handled tensor-type constants.\ | |
addConstantBufferizePasses(modulePassManager);\ | |
\ | |
FunctionLikeNest(modulePassManager)\ | |
.addPass(createFoldTensorExtractOpPass)\ | |
// Handle complex operation conversion.\ | |
.addPass(createConvertComplexToStandardPass)\ | |
// math dialect elementry functions -> polynomial form.\ | |
.addPass(createPolynomialApproximationPass)\ | |
.addPass(createHoistStaticallyBoundAllocationsPass)\ | |
// Use `arith.minf/maxf` instead of `arith.minimumf/maximumf`.\ | |
.addPredicatedPass(clUseFastMinMaxOps, createReplaceSlowMinMaxOpsPass);\ | |
\ | |
if (enableAArch64SME) {\ | |
modulePassManager.addPass(mlir::arm_sme::createVectorLegalizationPass());\ | |
FunctionLikeNest(modulePassManager)\ | |
.addPredicatedPass(\ | |
clForceArmStreaming,\ | |
[] {\ | |
// 1. Enable Armv9-A streaming mode without ZA (i.e., SSVE) for\ | |
// dispatch regions that contain scalable vectors when forced via\ | |
// the --iree-llvmcpu-force-arm-streaming flag.\ | |
return mlir::arm_sme::createEnableArmStreamingPass(\ | |
mlir::arm_sme::ArmStreamingMode::StreamingLocally,\ | |
mlir::arm_sme::ArmZaMode::Disabled,\ | |
/*ifRequiredByOps=*/false,\ | |
/*ifContainsScalableVectors=*/true);\ | |
})\ | |
.addPass(createCanonicalizerPass)\ | |
.addPass(createCSEPass)\ | |
.addPass(mlir::createArithToArmSMEConversionPass)\ | |
.addPass(mlir::createConvertVectorToArmSMEPass)\ | |
.addPass([] {\ | |
// 2. Enable ZA for dispatch regions that contain ArmSME ops (which\ | |
// all make use of the ZA state).\ | |
return mlir::arm_sme::createEnableArmStreamingPass(\ | |
mlir::arm_sme::ArmStreamingMode::StreamingLocally,\ | |
mlir::arm_sme::ArmZaMode::NewZA,\ | |
/*ifRequiredByOps=*/true);\ | |
})\ | |
.addPass(mlir::createConvertArmSMEToSCFPass);\ | |
}\ | |
\ | |
FunctionLikeNest(modulePassManager)\ | |
// Resolve get_buffer_descriptor ops. All structural buffer manipulations\ | |
// must conclude before this point.\ | |
.addPass(createIREEExpandStridedMetadataPass)\ | |
.addPass(createCleanupBufferAllocViewPass)\ | |
// Checking stack allocation before converting to CF dialect is easier.\ | |
.addPass([&]() {\ | |
return createLLVMCPUCheckIRBeforeLLVMConversionPass(\ | |
LLVMCPUCheckIRBeforeLLVMConversionPassOptions{\ | |
clFailOnOutOfBoundsStackAllocation});\ | |
})\ | |
// SCF -> CF\ | |
.addPass(createConvertSCFToCFPass)\ | |
.addPass(createCanonicalizerPass)\ | |
.addPass(createCSEPass)\ | |
// (HAL, IREE, Linalg, CF) -> LLVM\ | |
.addPass(arith::createArithExpandOpsPass)\ | |
.addPass(memref::createExpandOpsPass)\ | |
.addPass(memref::createFoldMemRefAliasOpsPass)\ | |
.addPass(createEmulateNarrowTypePass)\ | |
.addPass(createCanonicalizerPass)\ | |
.addPass(createCSEPass)\ | |
.addPredicatedPass(clInstrumentMemoryAccesses,\ | |
createInstrumentMemoryAccessesPass);\ | |
\ | |
if (enableAArch64SME) {\ | |
FunctionLikeNest(modulePassManager).addPass([&] {\ | |
return createConvertArmSMEToLLVMPass();\ | |
});\ | |
}\ | |
modulePassManager.addPass(\ | |
createConvertToLLVMPass(clEnableReassociateFpReductions));\ | |
modulePassManager.addPass(createReconcileUnrealizedCastsPass());\ | |
\ | |
// We rely on MLIR symbol visibility being correct after this point and need\ | |
// to mirror the LLVM linkage that was assigned during conversion.\ | |
modulePassManager.addPass(createLLVMCPUSynchronizeSymbolVisibilityPass());\ | |
\ | |
modulePassManager.addPass(createCanonicalizerPass());\ | |
modulePassManager.addPass(createCSEPass());\ | |
modulePassManager.addNestedPass<LLVM::LLVMFuncOp>(\ | |
createAddFastMathFlagsPass());\ | |
}\ | |
\ | |
void buildLLVMCPUCodegenConfigurationPassPipelineImpl(\ | |
OpPassManager &modulePassManager) {\ | |
{\ | |
FunctionLikeNest funcPassManager(modulePassManager);\ | |
addCommonTargetExecutablePreprocessingPasses(funcPassManager,\ | |
clUseSoftmaxInterFusion);\ | |
}\ | |
modulePassManager.addPass(createMaterializeUserConfigsPass());\ | |
FunctionLikeNest(modulePassManager)\ | |
.addPass(createRematerializeParallelOpsPass)\ | |
// TODO(#13888): This(createExpandF16OpToF32Pass()) pass is being added\ | |
// way to late and should insted be be done during lowering to LLVM.\ | |
.addPass(createExpandF16OpToF32Pass)\ | |
.addPass(createCPUMaterializeDeviceEncodingPass)\ | |
// TODO: Remove the following pass the plumb support for\ | |
// #hal.descriptor_type memory space through the stack.\ | |
.addPass(createEraseHALDescriptorTypeFromMemRefPass);\ | |
\ | |
modulePassManager.addPass(createLLVMCPUSelectLoweringStrategyPass());\ | |
LLVM_DEBUG({\ | |
llvm::dbgs() << "LLVMCPU codegen configuration pass pipeline:\n";\ | |
modulePassManager.printAsTextualPipeline(llvm::dbgs());\ | |
llvm::dbgs() << "\n";\ | |
});\ | |
}\ | |
\ | |
void buildLLVMCPUCodegenConfigurationPassPipeline(\ | |
OpPassManager &variantPassManager) {\ | |
OpPassManager &modulePassManager = variantPassManager.nest<ModuleOp>();\ | |
buildLLVMCPUCodegenConfigurationPassPipelineImpl(modulePassManager);\ | |
}\ | |
\ | |
void buildLLVMCPUCodegenPassPipeline(OpPassManager &variantPassManager,\ | |
bool enableAArch64SME) {\ | |
OpPassManager &modulePassManager = variantPassManager.nest<ModuleOp>();\ | |
modulePassManager.addPass(createLowerExecutableUsingTransformDialectPass());\ | |
FunctionLikeNest(modulePassManager)\ | |
.addPass(createLLVMCPULowerExecutableTargetPass);\ | |
\ | |
// Run conversion to LLVM at `ModuleOp` granularity.\ | |
addLowerToLLVMPasses(modulePassManager, enableAArch64SME);\ | |
LLVM_DEBUG({\ | |
llvm::dbgs() << "LLVMCPU codegen pass pipeline:\n";\ | |
variantPassManager.printAsTextualPipeline(llvm::dbgs());\ | |
llvm::dbgs() << "\n";\ | |
});\ | |
}\ | |
\ | |
// NOTE: this runs on the top-level program module containing all\ | |
// hal.executable ops.\ | |
void buildLLVMCPULinkingPassPipeline(OpPassManager &modulePassManager) {\ | |
// Link together executables. This may produce some IR duplication.\ | |
modulePassManager.addPass(createLLVMCPULinkExecutablesPass());\ | |
\ | |
// Cleanup IR duplication.\ | |
modulePassManager.addNestedPass<IREE::HAL::ExecutableOp>(\ | |
mlir::createCanonicalizerPass());\ | |
\ | |
// Assign final executable constant and import ordinals.\ | |
auto &variantPassManager = modulePassManager.nest<IREE::HAL::ExecutableOp>()\ | |
.nest<IREE::HAL::ExecutableVariantOp>();\ | |
variantPassManager.addPass(createLLVMCPUAssignConstantOrdinalsPass());\ | |
variantPassManager.addPass(createLLVMCPUAssignImportOrdinalsPass());\ | |
}\ | |
\ | |
//===---------------------------------------------------------------------===//\ | |
// Register LLVMCPU Passes\ | |
//===---------------------------------------------------------------------===//\ | |
\ | |
namespace {\ | |
#define GEN_PASS_REGISTRATION\ | |
#include "iree/compiler/Codegen/LLVMCPU/Passes.h.inc"\ | |
} // namespace\ | |
\ | |
void registerCodegenLLVMCPUPasses() {\ | |
// Generated.\ | |
registerPasses();\ | |
\ | |
static PassPipelineRegistration<> LLVMCPUConfigPipeline(\ | |
"iree-codegen-llvmcpu-configuration-pipeline",\ | |
"Runs the translation strategy configuration pipeline on Linalg for CPU",\ | |
[](OpPassManager &modulePassManager) {\ | |
buildLLVMCPUCodegenConfigurationPassPipeline(modulePassManager);\ | |
});\ | |
\ | |
static PassPipelineRegistration<> LLVMCPUBufferizationPipeline(\ | |
"iree-codegen-llvmcpu-bufferization-pipeline",\ | |
"Runs the bufferization pipeline for CPU",\ | |
[](OpPassManager &funcPassManager) {\ | |
addCPUBufferizePasses(funcPassManager);\ | |
});\ | |
\ | |
static PassPipelineRegistration<> LLVMCPUVectorLoweringPipeline(\ | |
"iree-codegen-llvmcpu-vector-lowering-pipeline",\ | |
"Runs the translation strategy configuration pipeline on Linalg for CPU",\ | |
[](OpPassManager &funcPassManager) {\ | |
LLVMCPUVectorLoweringPassOptions options;\ | |
options.splitVectorTransfersTo = "linalg-copy";\ | |
buildLLVMCPUVectorLoweringPipeline(funcPassManager, options);\ | |
});\ | |
\ | |
struct LinalgToLLVMPipelineOptions\ | |
: public PassPipelineOptions<LinalgToLLVMPipelineOptions> {\ | |
Option<bool> enableArmSME{\ | |
*this, "enable-arm-sme",\ | |
llvm::cl::desc("Enable the ArmSME lowering pipeline.")};\ | |
};\ | |
\ | |
static PassPipelineRegistration<LinalgToLLVMPipelineOptions>\ | |
LinalgLLVMPipeline(\ | |
"iree-codegen-linalg-to-llvm-pipeline",\ | |
"Runs the progressive lowering pipeline from Linalg to LLVM",\ | |
[](OpPassManager &variantPassManager,\ | |
LinalgToLLVMPipelineOptions const &options) {\ | |
buildLLVMCPUCodegenPassPipeline(variantPassManager,\ | |
options.enableArmSME);\ | |
});\ | |
\ | |
static PassPipelineRegistration<> LLVMCPULinkingPipeline(\ | |
"iree-codegen-llvmcpu-linking-pipeline",\ | |
"Runs the LLVMCPU HAL executable linking pipeline",\ | |
[](OpPassManager &modulePassManager) {\ | |
buildLLVMCPULinkingPassPipeline(modulePassManager);\ | |
});\ | |
}\ | |
\ | |
} // namespace mlir::iree_compiler | |
: 1723213398:0;git o new_test | |
: 1723213420:0;git cp ae2d365c32 | |
: 1723214120:0;git o ae2d365c32 | |
: 1723214179:0;git o 930398af37 | |
: 1723214316:0;git o df3d588dde | |
: 1723214427:0;git o fbf677d209 | |
: 1723214575:0;git o 95fb6cb1b8 | |
: 1723214687:0;iree-opt -iree-llvmcpu-select-lowering-strategy test_conv.mlir | |
: 1723214703:0;vi all | |
: 1723214748:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -mlir-disable-threading -mlir-print-ir-after-all 2> all.txt | |
: 1723214798:0;vi test_conv.mlir | |
: 1723214843:0;git o avgpool_test | |
: 1723215012:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb | |
: 1723215043:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 deep.mlir -o out1.vmfb | |
: 1723227776:0;cd ../amd_matrix_instruction_calculator | |
: 1723228815:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu-features=+avx,+avx2,+fma,+f16c,+avx512f,+avx512vl,+avx512cd,+avx512bw,+avx512dq --iree-opt-data-tiling --iree-global-opt-enable-early-materialization=false --iree-llvmcpu-enable-ukernels=all /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.mlir -o /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" --iree-llvmcpu-embedded-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" --iree-llvmcpu-wasm-linker-path=\"/home/prashant/iree-build/llvm-project/bin/lld\" -mlir-disable-threading | |
: 1723228956:0;gist-paste /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.mlir | |
: 1723228982:0;vi /home/prashant/iree-build/tests/e2e/matmul/e2e_matmul_cpu_experimental_dt_uk_f16_f16_small_llvm-cpu_local-task_avx512_matmul.mlir | |
: 1723230939:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -R --B-matrix --csv | |
: 1723460744:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=2 only-fuse-producer-input-operands=false}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --split-input-file | |
: 1723460755:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=2 only-fuse-producer-input-operands=false}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --split-input-file | FileCheck compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1723460806:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=2 only-fuse-producer-input-operands=true}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --split-input-file | FileCheck compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --check-prefix=CHECK-REDUCTION | |
: 1723465377:0;cd ../conv_mfma_dbg | |
: 1723465383:0;vi double_generic.mlir | |
: 1723465539:0;iree-opt -cse ~/conv_mfma_dbg/double_generic.mlir | |
: 1723465589:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 double_generic.mlir -o out1.vmfb | |
: 1723465617:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 double_generic.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1723466048:0;cat double_generic.mlir | |
: 1723466053:0;gist-paste double_generic.mlir | |
: 1723472296:0;nvidia-smi | |
: 1723570633:0;tailscale | |
: 1723570650:0;tailscale status | |
: 1723570718:0;df -h | |
: 1723577062:0;sudo upgrade | |
: 1723916086:0;./matrix_calculator.py --architecture cdna3 --instruction v_mfma_f32_16x16x4_f32 -R --A-matrix --csv | |
: 1723917117:0;hipcc | |
: 1723917122:0;sudo apt-get install hipcc | |
: 1723984253:0;curl -s https://packagecloud.io/install/repositories/ookla/speedtest-cli/script.deb.sh | sudo bash | |
: 1723984272:0;sudo apt-get install speedtest | |
: 1724013601:0;cler | |
: 1724013626:0;cd tile_fuse | |
: 1724013689:0;vi brd.mlir | |
: 1724013725:0;vi broad_matmul.mlir | |
: 1724013786:0;cat broad_matmul.mlir | |
: 1724252988:0;git cp 80a980334ac6e1d46ff918dd3f07832486ebc7a6 | |
: 1724252993:0;git cp be282cd1e917c426509cff631ba31960313621ad | |
: 1724252998:0;git cp a015bf75325e22ababc627e664365ea60a09fa12 | |
: 1724256020:0;cd conv_mfma_dbg | |
: 1724256027:0;cd test_sandbox | |
: 1724256114:0;mkdir mmt4d | |
: 1724256115:0;cd mmt4d | |
: 1724256146:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1724256609:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1724256622:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-sync | |
: 1724256750:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1724256841:0;vi all.txt | |
: 1724257074:0;vi xyz.txt | |
: 1724320696:0;clear | |
: 1724320697:0;s | |
: 1724320697:0;ls | |
: 1724321894:0;tmux attach -t 0 | |
: 1724322238:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1724322254:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1724322280:0;htop | |
: 1724322528:0;clear | |
: 1724322528:0;ls | |
: 1724322536:0;git o bm_check | |
: 1724322539:0;git submodule update --init | |
: 1724322544:0;riree | |
: 1724325626:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> old.txt | |
: 1724325635:0;ls | |
: 1724325636:0;ls -l | |
: 1724325652:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1724325726:0;git o mmt4dnewtracknewpipeline | |
: 1724325729:0;clear | |
: 1724325729:0;ls | |
: 1724325734:0;cd .. | |
: 1724325737:0;cd iree | |
: 1724325738:0;clear | |
: 1724325739:0;vi | |
: 1724325787:0;riree | |
: 1724325858:0;git submodule update --init | |
: 1724325865:0;riree | |
: 1724326882:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1724326894:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1724326953:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1724326957:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1724327268:0;clear | |
: 1724327268:0;ls | |
: 1724327688:0;vi old.txt | |
: 1724327800:0;ls | |
: 1724336094:0;tmux attach -t 0 | |
: 1724336095:0;vi | |
: 1724336099:0;ls | |
: 1724336102:0;vi old.txt | |
: 1724726360:0;tmux attach -t 0 | |
: 1724731246:0;clear | |
: 1724731246:0;ls | |
: 1724731248:0;riree | |
: 1724731319:0;clear | |
: 1724731319:0;ls | |
: 1724731354:0;vi old.txt all.txt | |
: 1724731509:0;git lg | |
: 1724732207:0;clear | |
: 1724732207:0;ls | |
: 1724732214:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1724732226:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725194249:0;\ | |
: 1725194250:0;clear | |
: 1725194250:0;ls | |
: 1725194256:0;tmux ls | |
: 1725194263:0;tmux attach -t 0 | |
: 1725194265:0;clear | |
: 1725194265:0;ls | |
: 1725194268:0;clear | |
: 1725194269:0;ls | |
: 1725194270:0;riree | |
: 1725199177:0;clear | |
: 1725199178:0;ls | |
: 1725199191:0;clear | |
: 1725199191:0;ls | |
: 1725199194:0;clear | |
: 1725199194:0;ls | |
: 1725199230:0;riree | |
: 1725199236:0;clear | |
: 1725199236:0;ls | |
: 1725199247:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1725199268:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> new.txt | |
: 1725199277:0;vi new.txt | |
: 1725199828:0;git fo | |
: 1725201338:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725250171:0;clear | |
: 1725250172:0;ls | |
: 1725250175:0;tmux attach -t 0 | |
: 1725250177:0;clear | |
: 1725250178:0;ls | |
: 1725250181:0;clear | |
: 1725250181:0;ls | |
: 1725283348:0;tmux attach -t 1 | |
: 1725283351:0;clear | |
: 1725283351:0;ls | |
: 1725283353:0;tmux ls | |
: 1725283356:0;tmux attach -t 4 | |
: 1725283358:0;clear | |
: 1725283359:0;ls | |
: 1725283359:0;cd .. | |
: 1725283363:0;clear | |
: 1725283363:0;ls | |
: 1725283364:0;cd ~ | |
: 1725283365:0;ls | |
: 1725283372:0;mkdir rust | |
: 1725283382:0;mv rust rust_diaries | |
: 1725283385:0;cd rust_diaries | |
: 1725283388:0;ls | |
: 1725283390:0;vi | |
: 1725283465:0;vi play.rs | |
: 1725283519:0;ls | |
: 1725283544:0;vi play.rs | |
: 1725283568:0;cargo build | |
: 1725283574:0;cargo play.rs | |
: 1725283598:0;rustc play.rs | |
: 1725283600:0;ls | |
: 1725283602:0;./play | |
: 1725283614:0;rustc play.rs | |
: 1725283615:0;./play | |
: 1725284703:0;sudo apt-get install rust-analyzer | |
: 1725284716:0;cargo install rust-analayzer | |
: 1725287788:0;clear | |
: 1725287788:0;ls | |
: 1725287804:0;tmux attach -t 0 | |
: 1725287811:0;clear | |
: 1725287811:0;ls | |
: 1725287819:0;vi old.txt | |
: 1725288124:0;riree | |
: 1725288162:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> new1.txt | |
: 1725288173:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725288222:0;ls | |
: 1725288298:0;vi new1.txt | |
: 1725288456:0;riree | |
: 1725288472:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> new1.txt | |
: 1725288482:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725288491:0;ls | |
: 1725288497:0;git branch | |
: 1725288519:0;git o bm_check | |
: 1725288525:0;git stash | |
: 1725288527:0;git o bm_check | |
: 1725288530:0;git submodule update --init | |
: 1725288535:0;riree | |
: 1725288618:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> old.txt | |
: 1725288628:0;vi old.txt | |
: 1725288643:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> old.txt | |
: 1725288653:0;vi old.txt | |
: 1725288664:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725288678:0;vi old.txt | |
: 1725288966:0;git rebase main | |
: 1725288993:0;git rebase --skip | |
: 1725289023:0;git lg | |
: 1725289047:0;git o mmt4dnewtracknewpipeline | |
: 1725289051:0;git submodule update --init | |
: 1725289060:0;git rebase origin/main | |
: 1725289105:0;git rebase --skip | |
: 1725289112:0;git rebase --abort | |
: 1725289117:0;riree | |
: 1725289245:0;vi new.txt | |
: 1725289256:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> new.txt | |
: 1725289268:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725289368:0;riree | |
: 1725289440:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> new.txt | |
: 1725289450:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725289490:0;vi new.txt | |
: 1725291286:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb | |
: 1725291293:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725291323:0;vi new | |
: 1725291326:0;vi new.txt | |
: 1725291693:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task -mlir-print-ir-after-all 2> new1.txt | |
: 1725291721:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all1.txt | |
: 1725291734:0;vi | |
: 1725291933:0;mv all1.txt new1.txt | |
: 1725291936:0;vi | |
: 1725293255:0;tmux attach -t 0 | |
: 1725293615:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims test.mlir -o out1.vmfb | |
: 1725293641:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725293696:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack test.mlir -o out1.vmfb | |
: 1725293702:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725293719:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> mmtkernel.txt | |
: 1725293737:0;vi mmtkernel.txt | |
: 1725294080:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> mmtkernel.txt | |
: 1725294096:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725294250:0;vi mmtkernel.txt | |
: 1725294737:0;git o bm_check | |
: 1725294740:0;git stash | |
: 1725294743:0;git o bm_check | |
: 1725294746:0;git submodule update --init | |
: 1725294748:0;riree | |
: 1725335745:0;clear | |
: 1725335745:0;ls | |
: 1725335753:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> mmtkernel.txt | |
: 1725335768:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> mmtkernel.txt | |
: 1725335779:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725335810:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims test.mlir -o out1.vmfb | |
: 1725335814:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725335828:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725356570:0;clear | |
: 1725356571:0;ls | |
: 1725356574:0;clear | |
: 1725356574:0;ls | |
: 1725356583:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725356833:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-sync | |
: 1725356845:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-sync | |
: 1725357017:0;riree | |
: 1725357054:0;git lg | |
: 1725357076:0;git o pashu/bm_check | |
: 1725357082:0;git submodule update --init | |
: 1725357090:0;git lh | |
: 1725357095:0;git lg | |
: 1725357097:0;clear | |
: 1725357098:0;ls | |
: 1725357099:0;riree | |
: 1725357922:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims test.mlir -o out1.vmfb | |
: 1725357939:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-sync | |
: 1725357945:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725357958:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725358134:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1725358141:0;vi test.mlir | |
: 1725358167:0;vi xyz.txt | |
: 1725358449:0;git o main | |
: 1725358454:0;git puom | |
: 1725358460:0;clear | |
: 1725358461:0;ls | |
: 1725358465:0;git submodule update --init | |
: 1725358471:0;git l | |
: 1725358474:0;git lhg | |
: 1725358477:0;git lg | |
: 1725358484:0;riree | |
: 1725361463:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1725361469:0;vi xyz.txt | |
: 1725361481:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1725361507:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725361513:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-sync | |
: 1725361535:0;vi xyz.txt | |
: 1725362827:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725362836:0;ls | |
: 1725362846:0;vi xyz.txt | |
: 1725371219:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725371225:0;vi xyz.txt | |
: 1725371254:0;git lg | |
: 1725371258:0;riree | |
: 1725371268:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-flow-collapse-reduction-dims test.mlir -o out1.vmfb | |
: 1725371278:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack test.mlir -o out1.vmfb | |
: 1725371282:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725371949:0;vi new.txt | |
: 1725372484:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=2 only-fuse-producer-input-operands=true}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --split-input-file | |
: 1725372501:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0 only-fuse-producer-input-operands=true}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --split-input-file | |
: 1725372522:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0 only-fuse-producer-input-operands=false}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --split-input-file | |
: 1725373056:0;git lg | |
: 1725373118:0;riree | |
: 1725373159:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack test.mlir -o out1.vmfb | |
: 1725373206:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> test.txt | |
: 1725373210:0;vi test. | |
: 1725373214:0;vi test.txt | |
: 1725373762:0;clear | |
: 1725373762:0;ls | |
: 1725373763:0;riree | |
: 1725373779:0;vi new | |
: 1725373782:0;vi new.txt | |
: 1725377050:0;ls | |
: 1725377696:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-hal-dump-executable-configurations-to=configs test.mlir -o out1.vmfb | |
: 1725377716:0;riree | |
: 1725377734:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-llvmcpu-enable-ukernels=mmt4d,pack,unpack --iree-hal-dump-executable-configurations-to=configs test.mlir -o out1.vmfb | |
: 1725377736:0;ls | |
: 1725377738:0;cd configs | |
: 1725377739:0;ls | |
: 1725377745:0;vi configured_module_matmul_broad_dispatch_2.mlir | |
: 1725377767:0;git o mmt4dnewtracknewpipeline | |
: 1725377771:0;git submodule update --init | |
: 1725377782:0;cd third_party/llvm-project | |
: 1725377895:0;git remote -vv | |
: 1725377902:0;git fetch yunflu | |
: 1725377904:0;git fetch yunfly | |
: 1725377963:0;git cp 4a1862857a277e75bdc88c1f0832cf562e76f90e | |
: 1725377995:0;git submodule update --init | |
: 1725378001:0;cd .. | |
: 1725378002:0;ls | |
: 1725378005:0;git submodule update --init | |
: 1725378011:0;cd llvm-project | |
: 1725378012:0;ls | |
: 1725378014:0;git lg | |
: 1725378029:0;git cp --skip | |
: 1725378039:0;git cp 0884a18e47ea8049a55075e59f92521d07d268e8 | |
: 1725378046:0;git cherry-pick --skip | |
: 1725378072:0;git o 0884a18e47ea8049a55075e59f92521d07d268e8 | |
: 1725378085:0;git lg | |
: 1725378097:0;cd ../.. | |
: 1725378098:0;riree | |
: 1725379790:0;git submodule update --init | |
: 1725379794:0;riree | |
: 1725412376:0;tmux attach -t 0 | |
: 1725412380:0;clear | |
: 1725412380:0;ls | |
: 1725412407:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> new.txt | |
: 1725412410:0;vi new.txt | |
: 1725412414:0;cd .. | |
: 1725412416:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> new.txt | |
: 1725412427:0;vi new.txt | |
: 1725412543:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --iree-hal-dump-executable-configurations-to=configs -mlir-print-ir-after-all 2> new.txt | |
: 1725412552:0;cd configs | |
: 1725412553:0;ls | |
: 1725412565:0;vi configured_module_matmul_broad_dispatch_2.mlir | |
: 1725412610:0;cd .. | |
: 1725412610:0;ls | |
: 1725412630:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --compile-from=configs -mlir-print-ir-after-all 2> new.txt | |
: 1725412634:0;vi new | |
: 1725412638:0;vi new.txt | |
: 1725412696:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --compile-from=configs | |
: 1725412703:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --compile-from=sources | |
: 1725412720:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --compile-from=source | |
: 1725412728:0;iree-compile --help | fzf | |
: 1725412751:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --compile-from=executable-sources | |
: 1725412781:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false configs/configured_module_matmul_broad_dispatch_2.mlir -o out1.vmfb --compile-from=executable-sources | |
: 1725412799:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false configs/configured_module_matmul_broad_dispatch_2.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1725412803:0;vi xyz.txt | |
: 1725413084:0;cd configs | |
: 1725413084:0;ls | |
: 1725413086:0;vi configured_module_matmul_broad_dispatch_2.mlir | |
: 1725413111:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false configs/configured_module_matmul_broad_dispatch_2.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1725413113:0;vi xyz.txt | |
: 1725413117:0;cd .. | |
: 1725413119:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false configs/configured_module_matmul_broad_dispatch_2.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1725413124:0;vi xyz.txt | |
: 1725413328:0;iree-compile --help | fzf | |
: 1725413373:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725413379:0;vi xyz.txt | |
: 1725413402:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad_dispatch_2 --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725413407:0;vi xyz.txt | |
: 1725413453:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad_dispatch_2_batch_matmul_transpose_b_DxDx8640x3200_f32xf16xf32 --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725413457:0;vi xyz.txt | |
: 1725413622:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --iree-hal-dump-executable-benchmarks-to=benchmarsk -mlir-print-ir-after-all 2> new.txt | |
: 1725413635:0;ls | |
: 1725413648:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --iree-hal-dump-executable-benchmarks-to=benchmark | |
: 1725413683:0;ls | |
: 1725413685:0;cd configs | |
: 1725413685:0;ls | |
: 1725413690:0;vi configured_module_matmul_broad_dispatch_2.mlir | |
: 1725413715:0;vi configured_module_matmul_broad_dispatch_0.mlir | |
: 1725413819:0;riree | |
: 1725413870:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --mlir-print-ir-after-all 2> xyz.txt | |
: 1725413872:0;vi xyz.txt | |
: 1725413875:0;cd .. | |
: 1725413877:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --mlir-print-ir-after-all 2> xyz.txt | |
: 1725413886:0;vi xyz.txt | |
: 1725413942:0;riree | |
: 1725413968:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --mlir-print-ir-after-all 2> xyz.txt | |
: 1725413977:0;vi xyz.txt | |
: 1725414174:0;riree | |
: 1725414203:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb --mlir-print-ir-after-all 2> xyz.txt | |
: 1725414212:0;vi xyz.txt | |
: 1725414273:0;riree | |
: 1725414371:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1725414440:0;riree | |
: 1725414478:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1725414590:0;ls | |
: 1725414615:0;vi xyz.txt | |
: 1725415217:0;riree | |
: 1725415239:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1725415584:0;riree | |
: 1725415608:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1725415628:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1725415636:0;vi xyz.txt | |
: 1725415695:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725415710:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725415768:0;vi xyz.txt | |
: 1725415781:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1725415787:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725415798:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725415803:0;vi xyz.txt | |
: 1725448635:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725448650:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725448791:0;git o main | |
: 1725448799:0;git submodule update --init | |
: 1725448832:0;git lg | |
: 1725448871:0;clear | |
: 1725448872:0;ls | |
: 1725448886:0;clear | |
: 1725448887:0;ls | |
: 1725448905:0;git puom | |
: 1725448918:0;git submodule update --init | |
: 1725449103:0;git stash | |
: 1725449109:0;curl -sL https://deb.nodesource.com/setup_18.x | sudo -E bash -\ | |
sudo apt-get install -y nodejs | |
: 1725449306:0;git submodule update --init | |
: 1725449317:0;clear | |
: 1725449318:0;ls | |
: 1725449615:0;git lg | |
: 1725449633:0;git ob consumerforall | |
: 1725449635:0;clear | |
: 1725449635:0;ls | |
: 1725449766:0;riree | |
: 1725451463:0;vi ~/test.mlir | |
: 1725451548:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1725451608:0;vi | |
: 1725451619:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1725451953:0;riree | |
: 1725451973:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1725452933:0;rire | |
: 1725452934:0;riree | |
: 1725453061:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1725453220:0;git clang-format compiler/src/iree/compiler/Codegen/Common/TileDispatchUsingForall.cpp | |
: 1725453227:0;ng | |
: 1725453238:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/TileDispatchUsingForall.cpp | |
: 1725453456:0;vi | |
: 1725453881:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1725453919:0;riree | |
: 1725453947:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1725453954:0;riree | |
: 1725454414:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" compiler/src/iree/compiler/Codeen/Common/test/tile_and_distribute_workroups_usin_forall.mlir | |
: 1725454482:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725454524:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725454776:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725455093:0;git ppf | |
: 1725544763:0;tmux attach -t 0 | |
: 1725544777:0;ls | |
: 1725544784:0;cd ~ | |
: 1725544789:0;ebd | |
: 1725544891:0;riree | |
: 1725544903:0;biree | |
: 1725544956:0;git submodule update --init | |
: 1725544963:0;rm -rf ~/iree-build | |
: 1725544968:0;biree | |
: 1725544986:0;sudo apt-get install libstdc++ | |
: 1725545024:0;sudo apt-get update | |
: 1725545045:0;sudo apt-get install libstdc++8 | |
: 1725545048:0;sudo apt-get install libstdc++7 | |
: 1725545060:0;sudo apt-get update && sudo apt-get upgrade | |
: 1725545169:0;sudo apt-get install build-essential | |
: 1725545176:0;sudo apt-get install libstdc++6 | |
: 1725545182:0;sudo apt-get install libstdc++7 | |
: 1725545206:0;sudo apt-get install libstdc+-12-dev | |
: 1725545220:0;sudo apt install libstdc++-12-dev | |
: 1725545228:0;sudo apt install libstdc++-8-dev | |
: 1725545232:0;clear | |
: 1725545232:0;ls | |
: 1725545239:0;rm -rf ~/iree-build | |
: 1725545244:0;vi ~/.zshrc | |
: 1725545255:0;biree | |
: 1725545399:0;strings /usr/lib/x86_64-linux-gnu/libstdc++.so.6 | grep "GLIBCXX" | |
: 1725545413:0;sudo apt install gcc-7 g++-7 | |
: 1725545419:0;sudo apt install libstdc++-7-dev | |
: 1725545429:0;sudo add-apt-repository ppa:ubuntu-toolchain-r/test\ | |
sudo apt update\ | |
sudo apt install gcc-7 g++-7 | |
: 1725545485:0;export LD_LIBRARY_PATH=/usr/local/lib64:$LD_LIBRARY_PATH | |
: 1725545490:0;rm -rf ~/iree-build | |
: 1725545492:0;biree | |
: 1725545536:0;/sbin/ldconfig -p | grep stdc++ | |
: 1725545656:0;sudo apt-get install gcc-12 g++-12 | |
: 1725545668:0;rm -rf ~/iree-build | |
: 1725545669:0;biree | |
: 1725545675:0;rm -rf ~/iree-build | |
: 1725545692:0;biree | |
: 1725545772:0;sudo apt-get install gcc-13 g++-13 | |
: 1725545851:0;speedtest | |
: 1725546229:0;rm -rf ~/iree-build | |
: 1725546230:0;biree | |
: 1725546276:0;riree | |
: 1725546278:0;biree | |
: 1725546743:0;ls | |
: 1725546748:0;clang++-13 | |
: 1725546751:0;clang++-12 | |
: 1725546772:0;sudo apt-get install clang-17 clang++-17 | |
: 1725546792:0;sudo apt-get install clang-16 clang++-16 | |
: 1725546813:0;rm -rf ~/iree-build | |
: 1725546815:0;biree | |
: 1725546838:0;sudo apt-get install clang clang++ | |
: 1725546873:0;rm -rf ~/iree-build | |
: 1725546874:0;biree | |
: 1725546899:0;sudo apt-get install libatomic | |
: 1725546904:0;ebd | |
: 1725546922:0;biree | |
: 1725546928:0;rm -rf ~/iree-build | |
: 1725546929:0;biree | |
: 1725549847:0;git o main | |
: 1725549868:0;git ob unit_broadcast | |
: 1725550237:0;riree | |
: 1725550830:0;git ppf | |
: 1725550840:0;git clang-format HEAD~1 | |
: 1725550851:0;git ppf | |
: 1725550863:0;git branch | |
: 1725635984:0;tmux attach -t 0 | |
: 1725635993:0;git o consumerforall | |
: 1725636565:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725636573:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725636599:0;riree | |
: 1725636626:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725636760:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725636875:0;git ppf | |
: 1725637281:0;vi ~/test.mlir | |
: 1725637654:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file ~/test.mlir | |
: 1725637831:0;gist-paste ~/test.mlir | |
: 1725637846:0;vi ~/test.mlir | |
: 1725637872:0;gist-paste ~/test.mlir | |
: 1725639172:0;clear | |
: 1725639172:0;ls | |
: 1725639180:0;git o unit_broadcast | |
: 1725639202:0;riree | |
: 1725641610:0;ls | |
: 1725641618:0;vi /tmp/less.txt | |
: 1725641643:0;iree-compile /tmp/less.txt --iree-hal-target-backends=llvm-cpu --iree-input-demote-i64-to-i32 | |
: 1725715664:0;tmux attach -t 0 | |
: 1725715730:0;git o consumerforall | |
: 1725715743:0;biree | |
: 1725717524:0;rm -rf ~/iree-build | |
: 1725717528:0;biree | |
: 1725717545:0;clang | |
: 1725717548:0;clang --version | |
: 1725717561:0;clang++-14 | |
: 1725717577:0;clang++-14 --version | |
: 1725717602:0;where clang | |
: 1725717608:0;clang --version | |
: 1725717630:0;sudo apt-get install clang | |
: 1725717644:0;clang --version | |
: 1725717665:0;rm -rf /usr/local/bin/clang* | |
: 1725717682:0;sudo rm -rf /usr/local/bin/clang | |
: 1725717689:0;sudo apt-get install clang | |
: 1725717693:0;clang --version | |
: 1725717697:0;which clang | |
: 1725717714:0;sudo rm -rf /usr/bin/clang | |
: 1725717717:0;clang --version | |
: 1725717720:0;sudo apt-get install clang | |
: 1725717724:0;clang --version | |
: 1725717815:0;wget wget https://apt.llvm.org/llvm.sh | |
: 1725717825:0;chmod +x llvm.sh | |
: 1725717832:0;sudo ./llvm.sh 19 | |
: 1725717871:0;clang --version | |
: 1725717885:0;clang-19 | |
: 1725717894:0;clang++-19 --version | |
: 1725717903:0;ebd | |
: 1725717922:0;1biree | |
: 1725717923:0;biree | |
: 1725717933:0;rm -rf ~/iree-build | |
: 1725717934:0;biree | |
: 1725717988:0;sudo ./llvm.sh 18 | |
: 1725718035:0;ebd | |
: 1725718055:0;rm -rf ~/iree-build | |
: 1725718057:0;biree | |
: 1725770748:0;clear | |
: 1725770749:0;ls | |
: 1725775765:0;\ | |
\ | |
\ | |
: 1725775767:0;clear | |
: 1725775768:0;ls | |
: 1725775771:0;tmux attach -t 0 | |
: 1725775775:0;clear | |
: 1725775775:0;ls | |
: 1725775778:0;riree | |
: 1725775932:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725776278:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file -mlir-disable-threading compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725776437:0;riree | |
: 1725776460:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file -mlir-disable-threading compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725776469:0;riree | |
: 1725794588:0;tmux attach -t 0 | |
: 1725794931:0;riree | |
: 1725794967:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file -mlir-disable-threading compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725794999:0;riree | |
: 1725795020:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file -mlir-disable-threading compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725795028:0;riree | |
: 1725795103:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file -mlir-disable-threading compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725795292:0;riree | |
: 1725795714:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file -mlir-disable-threading compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725795902:0;riree | |
: 1725795924:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file -mlir-disable-threading compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725795947:0;riree | |
: 1725795969:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file -mlir-disable-threading compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725795987:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725796039:0;riree | |
: 1725796066:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725796077:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" -split-input-file -mlir-disable-threading compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1725796307:0;git clang-format HEAD~1 | |
: 1725796335:0;git ppf | |
: 1725796769:0;clear | |
: 1725796769:0;ls | |
: 1725797579:0;git o consumerforall | |
: 1725797581:0;clear | |
: 1725797581:0;ls | |
: 1725797598:0;riree | |
: 1725798288:0;git o unit_broadcast | |
: 1725798299:0;riree | |
: 1725798432:0;ls | |
: 1725798440:0;vi mmtkernel.txt | |
: 1725798458:0;cat test.txt | |
: 1725798460:0;jj | |
: 1725798460:0;ls | |
: 1725798465:0;cat mmtkernel.txt | |
: 1725798467:0;ls | |
: 1725798471:0;vi test.mlir | |
: 1725798496:0;vi mmtkernel.txt | |
: 1725798871:0;iree-opt -cse compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725799222:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725799424:0;git ppf | |
: 1725799599:0;riree | |
: 1725800074:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725800327:0;riree | |
: 1725800368:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725800401:0;riree | |
: 1725800470:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725805426:0;vi | |
: 1725805620:0;riree | |
: 1725805736:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725805831:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 | |
: 1725805894:0;riree | |
: 1725805913:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 | |
: 1725805929:0;riree | |
: 1725805948:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 | |
: 1725805955:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725805963:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 | |
: 1725806067:0;riree | |
: 1725806087:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 | |
: 1725806193:0;iree-opt compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725806203:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 | |
: 1725806293:0;riree | |
: 1725806313:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 | |
: 1725806371:0;riree | |
: 1725806390:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 | |
: 1725806446:0;riree | |
: 1725806481:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 | |
: 1725806667:0;riree | |
: 1725806687:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 | |
: 1725806706:0;riree | |
: 1725806731:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 | |
: 1725806774:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 -mlir-disable-threading | |
: 1725806852:0;git clang-format HEAD~1 | |
: 1725806860:0;git ppf | |
: 1725806972:0;riree | |
: 1725807022:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir --verify-each=0 -mlir-disable-threading | |
: 1725807029:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725807312:0;riree | |
: 1725807419:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725808521:0;git ppf | |
: 1725808532:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725808837:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725808896:0;git ppf | |
: 1725808903:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725809206:0;git ppf | |
: 1725809228:0;buildifier compiler/src/iree/compiler/ | |
: 1725809236:0;buildifier compiler/src/iree/compiler/Codegen/LLVMCPU/test/BUILD.bazel | |
: 1725809241:0;buildifier compiler/src/iree/compiler/Codegen/LLVMCPU/test/CMakeLists.txt | |
: 1725809318:0;buildifier compiler/src/iree/compiler/Codegen/Common/test/CMakeLists.txt | |
: 1725809546:0;git ppf | |
: 1725809553:0;buildifier compiler/src/iree/compiler/Codegen/Common/test/CMakeLists.txt | |
: 1725809560:0;buildifier compiler/src/iree/compiler/Codegen/Common/test/BUILD.bazel | |
: 1725809911:0;buildifier compiler/src/iree/compiler/Codegen/Common/BUILD.bazel | |
: 1725809967:0;git ppf | |
: 1725810074:0;buildifier -i compiler/src/iree/compiler/Codegen/Common/BUILD.bazel | |
: 1725810081:0;buildifier -i compiler/src/iree/compiler/Codegen/Common/ | |
: 1725810086:0;buildifier compiler/src/iree/compiler/Codegen/Common/ | |
: 1725810091:0;buildifier compiler/src/iree/compiler/Codegen/Common/BUILD.bazel | |
: 1725810202:0;git ppf | |
: 1725810268:0;riree | |
: 1725810294:0;biree | |
: 1725810650:0;riree | |
: 1725810956:0;git ppf | |
: 1725849738:0;tmux attach -t 0 | |
: 1725849820:0;riree | |
: 1725849846:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725849858:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-unit-broadcast-to-expand-shape, cse))" -split-input-file compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725849890:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725849907:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/compiler/src/iree/compiler/Codegen/Common/UnitBroadcastToExpandShape.cpp | |
: 1725849917:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/UnitBroadcastToExpandShape.cpp | |
: 1725849961:0;git ppf | |
: 1725851334:0;clear | |
: 1725851335:0;ls | |
: 1725896082:0;tmux attach -t 0 | |
: 1725896106:0;git ppf | |
: 1725896360:0;git remote add mahesh https://github.com/MaheshRavishankar/iree.git | |
: 1725896368:0;git fetch mahesh | |
: 1725896379:0;clear | |
: 1725896380:0;ls | |
: 1725896400:0;git cp 8675c4af0b96c4dc209e1571f5713299243f8a4f | |
: 1725896405:0;git cp 7008977a81bd41ecc9f42281e9fb07d6f69ab656 | |
: 1725896410:0;git cp 70ec987e626d17ef96c00c7bb308da87111906e6 | |
: 1725896412:0;clear | |
: 1725896413:0;ls | |
: 1725896434:0;git cp 476bf4800ea7b1a27623a19f6243af1fe6c4bd37 | |
: 1725896440:0;git cp 675a1540ddc9326d97afdc11e736f3dd2695d08f | |
: 1725896446:0;git | |
: 1725896452:0;git cp e83f16416ae94dee662c496241bb2aa30a7133aa | |
: 1725896454:0;riree | |
: 1725896926:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all1.txt | |
: 1725896933:0;vi all1.txt | |
: 1725897191:0;riree | |
: 1725897739:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all1.txt | |
: 1725897746:0;vi all1.txt | |
: 1725897816:0;riree | |
: 1725897841:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all1.txt | |
: 1725897847:0;vi all1.txt | |
: 1725897933:0;riree | |
: 1725899711:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all1.txt | |
: 1725899718:0;vi all1.txt | |
: 1725900052:0;ls | |
: 1725900062:0;vi dest.mlir | |
: 1725900085:0;iree-opt compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725900090:0;iree-opt dest.mlir | |
: 1725900125:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-convert-to-destination-style, cse))" dest.mlir | |
: 1725900137:0;iree-opt --help | fzf | |
: 1725900157:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-convert-to-destination-passing-style, cse))" dest.mlir | |
: 1725900869:0;iree-compile --iree-hal-target-backends=llvm-gpu test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all1.txt | |
: 1725900873:0;vi all1.txt | |
: 1725900923:0;iree-compile --iree-hal-target-backends=rocm test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all1.txt | |
: 1725900927:0;vi all1.txt | |
: 1725965178:0;tmux attach -t 0 | |
: 1725965185:0;riree | |
: 1725965482:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> all1.txt | |
: 1725965494:0;vi all1.txt | |
: 1725965518:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725965534:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725965551:0;rm -rf out1.vmfb | |
: 1725965569:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfbt | |
: 1725965577:0;mv out1.vmfb out1.vmfb | |
: 1725965585:0;mv out1.vmfbt out1.vmfb | |
: 1725965591:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725965596:0;vi all1.txt | |
: 1725965847:0;clear | |
: 1725965847:0;ls | |
: 1725966538:0;iree-opt --help | fzf | |
: 1725966581:0;iree-opt --linalg-fold-unit-extent-dims compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725966607:0;iree-opt --linalg-fold-unit-extent-dims -cse compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725966655:0;iree-opt --linalg-fold-unit-extent-dims -cse -canonicalize compiler/src/iree/compiler/Codegen/Common/test/unit_broadcast_to_expand_shape.mlir | |
: 1725973760:0;tmux attach -t 0 | |
: 1725973778:0;vi | |
: 1725973782:0;clear | |
: 1725973782:0;ls | |
: 1725973791:0;git o main | |
: 1725973798:0;git lg | |
: 1725973802:0;clear | |
: 1725973803:0;ls | |
: 1725973829:0;git ob newtile | |
: 1725973831:0;clear | |
: 1725973831:0;ls | |
: 1725973975:0;git submodule update --init | |
: 1725974041:0;git remote -vv | |
: 1725974054:0;git remote add max https://github.com/Max191/iree.git | |
: 1725974059:0;git fetch max | |
: 1725974194:0;clear | |
: 1725974195:0;ls | |
: 1725974198:0;git cp ab59fdb768256090b38ef4ad604f358c79284f09 | |
: 1725974204:0;git cp 37032369bf03a654ea7b1b07911ef7cf4b774f7d | |
: 1725974209:0;git cp 1138f39be510409716cadabefdba7492c6ca1f88 | |
: 1725974214:0;git cp f0b5cb64e4af964d9494340455aefab5e2466739 | |
: 1725974218:0;git cp 2f0c20c1a2562e8e0afd3d706956c3e2d1b85908 | |
: 1725974224:0;git cp ec51576919441c2f0e828cc3b1b3156c9d70413d | |
: 1725974230:0;git cp b6bbc78e8325315033f73ca37d5a37af179197ed | |
: 1725974253:0;git fetch mahesh | |
: 1725974268:0;git cp 39a63a31b366af256a0c7119eb94cd869af782cb | |
: 1725974274:0;git stash | |
: 1725974275:0;git cp 39a63a31b366af256a0c7119eb94cd869af782cb | |
: 1725974278:0;clear | |
: 1725974279:0;ls | |
: 1725974614:0;riree | |
: 1725974624:0;ebd | |
: 1725974643:0;rm -rf ~/iree-build | |
: 1725974646:0;biree | |
: 1725974658:0;git submodule update --init | |
: 1725974660:0;riree | |
: 1725974662:0;biree | |
: 1725978653:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1725978673:0;iree-opt --help | fzf | |
: 1725978683:0;riree | |
: 1725978785:0;iree-opt --help | fzf | |
: 1725978822:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfbt | |
: 1725978872:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb --mlir-print-ir-after-all 2> all.txt | |
: 1725978881:0;vi all.txt | |
: 1725979244:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb | |
: 1725979250:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725979265:0;vi all.txt | |
: 1725979405:0;iree-opt --help | fzf | |
: 1725980395:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -iree-global-opt-enable-early-materialization=false test.mlir -o out1.vmfb | |
: 1725980413:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725980424:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 -iree-global-opt-enable-early-materialization=true test.mlir -o out1.vmfb | |
: 1725980511:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1725980519:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1725980542:0;iree-opt --help | fzf | |
: 1725980568:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1725980594:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1725980598:0;vi xyz.txt | |
: 1725980679:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-opt-data-tiling=true test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1725980690:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725980695:0;vi xyz.txt | |
: 1725981026:0;riree | |
: 1725981154:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725981159:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-opt-data-tiling=true test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1725981165:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1725981176:0;vi xyz.txt | |
: 1726057001:0;tmux attach -t 0 | |
: 1726057016:0;clear | |
: 1726057016:0;ls | |
: 1726057020:0;clear | |
: 1726057021:0;ls | |
: 1726057027:0;git o main | |
: 1726057030:0;git stash | |
: 1726057032:0;git o main | |
: 1726057035:0;git puom | |
: 1726057042:0;clear | |
: 1726057042:0;ls | |
: 1726057048:0;git submodule update --init | |
: 1726057066:0;git ob new_mmt4d | |
: 1726057068:0;clear | |
: 1726057068:0;ls | |
: 1726057116:0;cd third_party/llvm-project | |
: 1726057126:0;git fetch yunfly | |
: 1726057194:0;git o yunfei/fuse_consumer_nested_loop | |
: 1726057198:0;git lg | |
: 1726057214:0;cd ~/iree | |
: 1726057215:0;clear | |
: 1726057215:0;ls | |
: 1726057240:0;git cp 476bf4800ea7b1a27623a19f6243af1fe6c4bd37 | |
: 1726057245:0;git cp 675a1540ddc9326d97afdc11e736f3dd2695d08f | |
: 1726057250:0;git cp e83f16416ae94dee662c496241bb2aa30a7133aa | |
: 1726057318:0;git cp ab59fdb768256090b38ef4ad604f358c79284f09 37032369bf03a654ea7b1b07911ef7cf4b774f7d 1138f39be510409716cadabefdba7492c6ca1f88 | |
: 1726057345:0;git cp f0b5cb64e4af964d9494340455aefab5e2466739 2f0c20c1a2562e8e0afd3d706956c3e2d1b85908 ec51576919441c2f0e828cc3b1b3156c9d70413d b6bbc78e8325315033f73ca37d5a37af179197ed | |
: 1726057480:0;git cp 39a63a31b366af256a0c7119eb94cd869af782cb | |
: 1726057499:0;riree | |
: 1726059193:0;git submodule update --init | |
: 1726059197:0;riree | |
: 1726060412:0;clear | |
: 1726060412:0;ls | |
: 1726060435:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 test.mlir -o out1.vmfb | |
: 1726060442:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1726060455:0;clear | |
: 1726060455:0;ls | |
: 1726060705:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-flow-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1726061233:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb | |
: 1726061385:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb 2> xyz.txt | |
: 1726061398:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1726061404:0;vi xyz.txt | |
: 1726061815:0;gist-paste xyz.txt | |
: 1726062902:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1726062907:0;vi xyz.txt | |
: 1726063744:0;riree | |
: 1726063778:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1726063787:0;vi xyz.txt | |
: 1726063797:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1726063908:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1726064025:0;riree | |
: 1726064044:0;clear | |
: 1726064044:0;ls | |
: 1726064070:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1726064078:0;vi xyz.txt | |
: 1726064086:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=1x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1726064100:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1726064139:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1726064148:0;vi xyz.txt | |
: 1726064452:0;riree | |
: 1726064478:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1726064488:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1726064501:0;vi xyz.txt | |
: 1726064632:0;riree | |
: 1726064675:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1726064680:0;vi xyz.txt | |
: 1726064724:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1726064735:0;vi xyz.txt | |
: 1726064937:0;riree | |
: 1726064960:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1726064970:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1726064974:0;vi xyz.txt | |
: 1726065123:0;riree | |
: 1726065161:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1726065170:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1726065176:0;vi xyz.txt | |
: 1726065310:0;vi tile.mlir | |
: 1726065342:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0 only-fuse-producer-input-operands=false}), canonicalize)" tile.mlir | |
: 1726065356:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1 only-fuse-producer-input-operands=false}), canonicalize)" tile.mlir | |
: 1726065364:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=2 only-fuse-producer-input-operands=false}), canonicalize)" tile.mlir | |
: 1726065494:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=2 only-fuse-producer-input-operands=true}), canonicalize)" tile.mlir | |
: 1726065537:0;riree | |
: 1726065567:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> xyz.txt | |
: 1726065579:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1726065598:0;vi xyz.txt | |
: 1726068723:0;tmux attach -t 0 | |
: 1726068751:0;riree | |
: 1726069277:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false -iree-llvmcpu-tile-dispatch-using-forall test.mlir | |
: 1726069457:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=3 only-fuse-producer-input-operands=false}), canonicalize)" tile.mlir | |
: 1726069500:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=2 only-fuse-producer-input-operands=false}), canonicalize)" tile.mlir | |
: 1726069507:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0 only-fuse-producer-input-operands=false}), canonicalize)" tile.mlir | |
: 1726069515:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1 only-fuse-producer-input-operands=false}), canonicalize)" tile.mlir | |
: 1726069565:0;vi old.txt | |
: 1726069797:0;ls | |
: 1726069800:0;vi xyz.txt | |
: 1726070097:0;riree | |
: 1726070183:0;ls | |
: 1726070185:0;cd iree | |
: 1726070186:0;ls | |
: 1726070253:0;git o consumerforall | |
: 1726070255:0;git lg | |
: 1726070259:0;vi | |
: 1726070375:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/TileDispatchUsingForall.cpp | |
: 1726070377:0;vi | |
: 1726070420:0;git ppf | |
: 1726070819:0;git o new_mmt4d | |
: 1726070823:0;git ppf | |
: 1726070835:0;riree | |
: 1726070865:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1 only-fuse-producer-input-operands=false}), canonicalize)" tile.mlir | |
: 1726070885:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false -iree-llvmcpu-tile-dispatch-using-forall test.mlir -o out1.vmfb | |
: 1726070908:0;vi test.mlir | |
: 1726070914:0;vi xyz.txt | |
: 1726071467:0;iree-benchmark-module --module=out1.vmfb --function=matmul_broad --input=4x128x3200xf32 --input=8640x3200xf16 --device=local-task | |
: 1726149348:0;ebd | |
: 1726149359:0;cat ~/build_commands/build_iree.sh | |
: 1726149743:0;cat ~/llvm.sh | |
: 1726149766:0;gist-paste ~/llvm.sh | |
: 1726151751:0;clear | |
: 1726151751:0;ls | |
: 1726151771:0;tmux attach -t 0 | |
: 1726151779:0;git ppf | |
: 1726151812:0;git o main | |
: 1726151815:0;git puom | |
: 1726151823:0;clear | |
: 1726151823:0;ls | |
: 1726151844:0;git ob add_unitbroadcast | |
: 1726151846:0;riree | |
: 1726151854:0;git submodule update --init | |
: 1726151872:0;riree | |
: 1726151914:0;ls | |
: 1726151917:0;clear | |
: 1726151918:0;ls | |
: 1726151919:0;vi | |
: 1726152398:0;git ppf | |
: 1726154397:0;vi | |
: 1726154487:0;iree-opt --pass-pipeline="builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))" compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pad_conv_tests.mlir | |
: 1726154528:0;iree-opt --pass-pipeline="builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))" compiler/src/iree/compiler/Codegen/LLVMCPU/test/compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pad_tests.mlir | |
: 1726154544:0;iree-opt --pass-pipeline="builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))" compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pad_tests.mlir | |
: 1726154559:0;iree-opt --pass-pipeline="builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))" compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pad_tests.mlir -split-input-file | |
: 1726154668:0;iree-opt --pass-pipeline="builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))" compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pad_tests.mlir -split-input-file -mlir-print-ir-after-all 2> xyz.txt | |
: 1726154671:0;vi xyz.txt | |
: 1726154731:0;riree | |
: 1726154785:0;iree-opt --pass-pipeline="builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))" compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pad_tests.mlir -split-input-file -mlir-print-ir-after-all 2> xyz.txt | |
: 1726154794:0;riree | |
: 1726154860:0;iree-opt --pass-pipeline="builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))" compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pad_tests.mlir -split-input-file -mlir-print-ir-after-all 2> xyz.txt | |
: 1726154862:0;vi xyz.txt | |
: 1726154880:0;riree | |
: 1726155130:0;iree-opt --pass-pipeline="builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))" compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pad_tests.mlir -split-input-file -mlir-print-ir-after-all 2> xyz.txt | |
: 1726155133:0;vi xyz.txt | |
: 1726155169:0;iree-opt --pass-pipeline="builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))" compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pad_tests.mlir -split-input-file | |
: 1726155188:0;iree-opt --pass-pipeline="builtin.module(iree-llvmcpu-select-lowering-strategy, func.func(iree-llvmcpu-lower-executable-target))" compiler/src/iree/compiler/Codegen/LLVMCPU/test/pipeline_pad_tests.mlir -split-input-file -mlir-print-ir-after-all 2> xyz.txt | |
: 1726155191:0;vi xyz.txt | |
: 1726230281:0;tmux attach -t 0 | |
: 1726230287:0;clear | |
: 1726230287:0;ls | |
: 1726230303:0;clear | |
: 1726230303:0;ls | |
: 1726230307:0;git o main | |
: 1726230314:0;git puom | |
: 1726230322:0;git submodule update --init | |
: 1726230324:0;clear | |
: 1726230325:0;ls | |
: 1726230338:0;git ob enablescfforall | |
: 1726230339:0;clear | |
: 1726230340:0;ls | |
: 1726230342:0;clear | |
: 1726230343:0;ls | |
: 1726230359:0;git cp https://arxiv.org/pdf/2406.06858 | |
: 1726230364:0;git cp 39a63a31b366af256a0c7119eb94cd869af782cb | |
: 1726230367:0;clear | |
: 1726230369:0;vi | |
: 1726230381:0;source ~/global_venv/bin/activate | |
: 1726230383:0;vi | |
: 1726230405:0;riree | |
: 1726230462:0;biree | |
: 1726230839:0;cmake --build ~/iree-build --target iree-run-tests | |
: 1726230874:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests | |
: 1726232586:0;riree | |
: 1726232625:0;biree | |
: 1726233045:0;ls | |
: 1726233071:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu /home/prashant/iree/tests/e2e/tensor_ops/pack_dynamic_inner_tiles.mlir -o check_llvm-cpu_local-task_pack_dynamic_inner_tiles.mlir_module.vmfb | |
: 1726233110:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu /home/prashant/iree/tests/e2e/tensor_ops/pack_dynamic_inner_tiles.mlir -o check_llvm-cpu_local-task_pack_dynamic_inner_tiles.mlir_module.vmfb -mlir-print-ir-after-all 2> ~/all.txt | |
: 1726233146:0;vi ~/all.txt | |
: 1726234066:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu /home/prashant/iree/tests/e2e/tensor_ops/pack_dynamic_inner_tiles.mlir -o check_llvm-cpu_local-task_pack_dynamic_inner_tiles.mlir_module.vmfb -mlir-print-ir-after-all 2> ~/all.txt | |
: 1726234076:0;vi ~/all.txt | |
: 1726235933:0;gist-paste ~/all.txt | |
: 1726239831:0;riree | |
: 1726239859:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu /home/prashant/iree/tests/e2e/tensor_ops/pack_dynamic_inner_tiles.mlir -o check_llvm-cpu_local-task_pack_dynamic_inner_tiles.mlir_module.vmfb -mlir-print-ir-after-all 2> ~/old.txt | |
: 1726239869:0;vi ~/old.txt | |
: 1726458873:0;clear | |
: 1726458873:0;ls | |
: 1726459896:0;clear | |
: 1726459897:0;ls | |
: 1726459907:0;clear | |
: 1726459907:0;ls | |
: 1726459917:0;ssh [email protected] | |
: 1726459930:0;ssh [email protected] | |
: 1726459948:0;clear | |
: 1726459949:0;ls | |
: 1726459950:0;htop | |
: 1726459954:0;clear | |
: 1726459955:0;ls | |
: 1726459983:0;clear | |
: 1726459983:0;ls | |
: 1726459992:0;tmux ls | |
: 1726459995:0;tmux attach -t 0 | |
: 1726460693:0;clear | |
: 1726460694:0;ls | |
: 1726460740:0;clear | |
: 1726460740:0;ls | |
: 1726460975:0;; | |
: 1726460977:0;ls | |
: 1726460982:0;vi test.mir | |
: 1726460985:0;vi test.mlir | |
: 1726461006:0;iree-opt --help | fzf | |
: 1726461074:0;iree-opt --pass-pipeline="builtin.module(iree-codegen-convert-to-destination-passing-style, func.func(iree-llvmcpu-lower-executable-target))" test.mlir | |
: 1726461106:0;iree-opt --pass-pipeline="builtin.module(iree-codegen-convert-to-destination-passing-style)" test.mlir | |
: 1726461191:0;iree-opt --help | fzf | |
: 1726465506:0;\ | |
: 1726465508:0;clear | |
: 1726465509:0;ls | |
: 1726465520:0;\ | |
: 1726465522:0;clear | |
: 1726465522:0;ls | |
: 1726465528:0;iree-opt --pass-pipeline="builtin.module(iree-codegen-convert-to-destination-passing-style)" test.mlir | |
: 1726465536:0;tmux attach -t 0 | |
: 1726474108:0;riree | |
: 1726474218:0;vi test.mlir | |
: 1726474224:0;vi ~/all.txt | |
: 1726475142:0;riree | |
: 1726475268:0;iree-opt %s --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize, canonicalize, cse, canonicalize))" ~/test.mlir | |
: 1726475278:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize, canonicalize, cse, canonicalize))" ~/test.mlir | |
: 1726475299:0;ls | |
: 1726475307:0;vi test.mlir | |
: 1726475314:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize, canonicalize, cse, canonicalize))" test.mlir | |
: 1726475327:0;riree | |
: 1726475380:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize, canonicalize, cse, canonicalize))" test.mlir | |
: 1726475563:0;ls | |
: 1726475570:0;vi test.mlir | |
: 1726475877:0;riree | |
: 1726475892:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize, canonicalize, cse, canonicalize))" test.mlir | |
: 1726475956:0;riree | |
: 1726475971:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize, canonicalize, cse, canonicalize))" test.mlir | |
: 1726476004:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize))" test.mlir | |
: 1726476060:0;riree | |
: 1726476085:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize))" test.mlir | |
: 1726476174:0;riree | |
: 1726476329:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize))" test.mlir | |
: 1726476584:0;riree | |
: 1726476605:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize))" test.mlir | |
: 1726476913:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize))" test.mlir -mlir-disable-threading | |
: 1726477469:0;riree | |
: 1726477484:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize))" test.mlir -mlir-disable-threading | |
: 1726477576:0;riree | |
: 1726477600:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize))" test.mlir -mlir-disable-threading | |
: 1726477640:0;riree | |
: 1726477653:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize))" test.mlir -mlir-disable-threading | |
: 1726478519:0;riree | |
: 1726478634:0;vi ~/all.txt | |
: 1726478679:0;vi test.mlir | |
: 1726478740:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir | |
: 1726479218:0;riree | |
: 1726479233:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir | |
: 1726479272:0;riree | |
: 1726479555:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir --mlir-disable-threading | |
: 1726479604:0;riree | |
: 1726479654:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir --mlir-disable-threading | |
: 1726479661:0;riree | |
: 1726479668:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir --mlir-disable-threading | |
: 1726479700:0;riree | |
: 1726479719:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir --mlir-disable-threading | |
: 1726479754:0;riree | |
: 1726479773:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir --mlir-disable-threading | |
: 1726479914:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir | |
: 1726479963:0;riree | |
: 1726480110:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir | |
: 1726480126:0;riree | |
: 1726480134:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir | |
: 1726480300:0;riree | |
: 1726480308:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir | |
: 1726480426:0;riree | |
: 1726480451:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir | |
: 1726480487:0;riree | |
: 1726480996:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir | |
: 1726481338:0;riree | |
: 1726481353:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" test.mlir | |
: 1726481371:0;vi ~/all.txt | |
: 1726481467:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize))" test.mlir | |
: 1726481481:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize))" ~/test.mlir | |
: 1726481500:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir | |
: 1726481599:0;vi test.mlir | |
: 1726481612:0;vi ~/all.txt | |
: 1726481691:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir | |
: 1726481702:0;vi test.mlir | |
: 1726481709:0;vi ~/test.mlir | |
: 1726481724:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir | |
: 1726489922:0;riree | |
: 1726489937:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir | |
: 1726491605:0;riree | |
: 1726491617:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir | |
: 1726492371:0;riree | |
: 1726492383:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir | |
: 1726492425:0;riree | |
: 1726492446:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir -mlir-print-ir-after-all | |
: 1726512943:0;exit | |
: 1726513642:0;htop | |
: 1726513665:0;ssh [email protected] | |
: 1726513672:0;sudo tailscale up | |
: 1726513676:0;ssh [email protected] | |
: 1726513793:0;ls | |
: 1726513794:0;htop | |
: 1726513797:0;exit | |
: 1726559190:0;tmux attach -t 0 | |
: 1726559195:0;ls | |
: 1726559197:0;cd .. | |
: 1726559198:0;ls | |
: 1726559201:0;git clone [email protected]:iree-org/megabump.git | |
: 1726559211:0;clear | |
: 1726559212:0;ls | |
: 1726559242:0;2 | |
: 1726559244:0;clear | |
: 1726559244:0;ls | |
: 1726559246:0;cd megabump | |
: 1726559247:0;ls | |
: 1726559268:0;mkdir work | |
: 1726559269:0;clear | |
: 1726559269:0;ls | |
: 1726559283:0;git clone https://github.com/iree-org/iree work/iree | |
: 1726559312:0;python -m venv work/venv | |
: 1726559321:0;source work/venv/bin/activate | |
: 1726559329:0;cd work/iree | |
: 1726559336:0;python -m pip install --upgrade pip | |
: 1726559344:0;python -m pip install -r runtime/bindings/python/iree/runtime/build_requirements.txt\ | |
deactivate\ | |
: 1726559389:0;clear | |
: 1726559389:0;ls | |
: 1726559391:0;cd .. | |
: 1726559391:0;ls | |
: 1726559397:0;cd iree | |
: 1726559398:0;ls | |
: 1726559406:0;./scripts/start_integrate | |
: 1726559427:0;cd .. | |
: 1726559427:0;ls | |
: 1726559428:0;cd .. | |
: 1726559429:0;ls | |
: 1726559430:0;clear | |
: 1726559430:0;ls | |
: 1726559432:0;./scripts/start_integrate | |
: 1726559436:0;source work/venv/bin/activate | |
: 1726559438:0;./scripts/start_integrate | |
: 1726559712:0;vi ~/test.mlir | |
: 1726559957:0;./scripts/llvm_revision status | |
: 1726560214:0;cd work/iree/third_party | |
: 1726560215:0;ls | |
: 1726560234:0;cd llvm-project | |
: 1726560235:0;ls | |
: 1726560238:0;git lg | |
: 1726560563:0;git o c970e96eaedf76f349fcb95309a85fec29844c0e | |
: 1726560567:0;git lg | |
: 1726560576:0;clear | |
: 1726560576:0;ls | |
: 1726560579:0;cd .. | |
: 1726560580:0;ls | |
: 1726560584:0;cd .. | |
: 1726560585:0;ls | |
: 1726560660:0;git ppf | |
: 1726560697:0;git remote add pashu [email protected]:pashu123/iree.git | |
: 1726560699:0;vi | |
: 1726560733:0;git ppf | |
: 1726562002:0;tmux attach -t 0 | |
: 1726563017:0;clear | |
: 1726563018:0;ls | |
: 1726563204:0;ebd | |
: 1726563327:0;ls | |
: 1726563361:0;build_new.sh | |
: 1726563415:0;cd build_tools | |
: 1726563415:0;ls | |
: 1726563418:0;cd .. | |
: 1726563424:0;cd ~/build_commands | |
: 1726563425:0;ls | |
: 1726563430:0;chmod +x build_new.sh | |
: 1726563435:0;cd ~ | |
: 1726563435:0;ls | |
: 1726563443:0;build_new.sh | |
: 1726563451:0;ebd | |
: 1726565785:0;ls | |
: 1726565798:0;cd megabump | |
: 1726565799:0;ls | |
: 1726565802:0;cd work | |
: 1726565802:0;ls | |
: 1726565805:0;clear | |
: 1726565805:0;ls | |
: 1726565832:0;iree-build/bin/iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))' --iree-gpu-test-target=sm_80 compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_extract_address_computation.mlir | |
: 1726565875:0;ls | |
: 1726565877:0;cd iree-build | |
: 1726565881:0;cmake --build . | |
: 1726565956:0;iree-build/bin/iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))' --iree-gpu-test-target=sm_80 compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_extract_address_computation.mlir | |
: 1726565964:0;cd .. | |
: 1726565964:0;ls | |
: 1726565968:0;cd iree | |
: 1726565976:0;../iree-build/bin/iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))' --iree-gpu-test-target=sm_80 compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_extract_address_computation.mlir | |
: 1726566005:0;../iree-build/tools/iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))' --iree-gpu-test-target=sm_80 compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_extract_address_computation.mlir | |
: 1726566018:0;../iree-build/tools/iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))' --iree-gpu-test-target=sm_80 compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_extract_address_computation.mlir > xyz.mlir | |
: 1726566020:0;vi xyz.mlir | |
: 1726566053:0;clear | |
: 1726566053:0;ls | |
: 1726566067:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))' --iree-gpu-test-target=sm_80 compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_extract_address_computation.mlir | |
: 1726566079:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))' --iree-gpu-test-target=sm_80 compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_extract_address_computation.mlir > ~/xyz.mlir | |
: 1726566156:0;diff xyz.mlir ~/xyz.mlir | |
: 1726566181:0;vi | |
: 1726566290:0;iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))' --iree-gpu-test-target=sm_80 compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_extract_address_computation.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_extract_address_computation.mlir | |
: 1726566310:0;../iree-build/tools/iree-opt --pass-pipeline='builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))' --iree-gpu-test-target=sm_80 compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_extract_address_computation.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_extract_address_computation.mlir | |
: 1726566313:0;vi | |
: 1726566361:0;git ppf | |
: 1726571837:0;tmux attach -t 0 | |
: 1726572016:0;clear | |
: 1726572017:0;ls | |
: 1726572018:0;cd .. | |
: 1726572019:0;ls | |
: 1726572021:0;cd ~ | |
: 1726572022:0;clear | |
: 1726572023:0;ls | |
: 1726572039:0;clear | |
: 1726572040:0;ls | |
: 1726572050:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir | |
: 1726592747:0;clear | |
: 1726592748:0;ls | |
: 1726592752:0;tmux attach -t 1 | |
: 1726592757:0;tmux | |
: 1726592759:0;clear | |
: 1726592760:0;ls | |
: 1726592765:0;clear | |
: 1726592765:0;ls | |
: 1726592777:0;git clone [email protected]:nod-ai/sharktank.git | |
: 1726592782:0;clear | |
: 1726592782:0;ls | |
: 1726592786:0;clear | |
: 1726592787:0;ls | |
: 1726592884:0;clear | |
: 1726592884:0;ls | |
: 1726592888:0;clear | |
: 1726592888:0;ls | |
: 1726592899:0;git clone [email protected]:nod-ai/sharktank.git | |
: 1726592901:0;cd shark | |
: 1726592902:0;ls | |
: 1726592906:0;rm -rf shark | |
: 1726592919:0;cd sharktank | |
: 1726592920:0;clear | |
: 1726592920:0;ls | |
: 1726592922:0;git lg | |
: 1726592926:0;clear | |
: 1726592926:0;ls | |
: 1726592952:0;python -m venv --prompt sharktank .venv | |
: 1726592958:0;pytho3 -m venv --prompt sharktank .venv | |
: 1726592965:0;python3 -m venv --prompt sharktank .venv | |
: 1726592972:0;source .venv/bin/activate | |
: 1726592973:0;clear | |
: 1726592974:0;ls | |
: 1726592992:0;pip install -r pytorch-cpu-requirements.txt | |
: 1726593053:0;clear | |
: 1726593053:0;ls | |
: 1726593073:0;pip install -f https://iree.dev/pip-release-links.html --src deps \\ | |
-e "git+https://github.com/iree-org/iree-turbine.git#egg=shark-turbine" | |
: 1726593107:0;pip install -r requirements.txt -e sharktank/ shortfin/ | |
: 1726593138:0;pytest shortfin | |
: 1726593149:0;ls | |
: 1726593156:0;cd sharktank | |
: 1726593157:0;clear | |
: 1726593157:0;ls | |
: 1726593159:0;source .venv/bin/activate | |
: 1726593160:0;clear | |
: 1726593161:0;ls | |
: 1726593161:0;vi | |
: 1726598391:0;pip install -r requirements.txt -e sharktank/ shortfin/ | |
: 1726598405:0;pytest shortfin | |
: 1726598425:0;pytest libshortfin/tests/api/array_test.py | |
: 1726598529:0;git stash | |
: 1726598534:0;git o 15aa675be29a680373fffe7acc7a22eb73c50ca5 | |
: 1726598543:0;cd .. | |
: 1726598543:0;ls | |
: 1726598548:0;cd sharktank | |
: 1726598552:0;pip install -r requirements.txt -e sharktank/ shortfin/ | |
: 1726598568:0;pytest shortfin | |
: 1726598609:0;cd shortfin | |
: 1726598611:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726598616:0;cd .. | |
: 1726598617:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726598622:0;ls | |
: 1726598626:0;cd shortfin | |
: 1726598627:0;ls | |
: 1726598652:0;cd .. | |
: 1726598653:0;ls | |
: 1726598655:0;cd libshortfin | |
: 1726598655:0;ls | |
: 1726598668:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726598678:0;pip install cmake | |
: 1726598683:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726598690:0;ls | |
: 1726598700:0;cd build | |
: 1726598701:0;ls | |
: 1726598702:0;cd .. | |
: 1726598704:0;rm -rf build | |
: 1726598708:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726598739:0;pip install cmake | |
: 1726598745:0;cmake --version | |
: 1726598790:0;ls | |
: 1726598794:0;vi CMakeLists.txt | |
: 1726598812:0;pip uninstall cmake | |
: 1726598816:0;vi CMakeLists.txt | |
: 1726598826:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726598838:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-19 -DCMAKE_CXX_COMPILER=clang++-19 \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726598892:0;ebd | |
: 1726598904:0;rm -rf build | |
: 1726598913:0;ebd | |
: 1726598922:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726599095:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726599111:0;pip install -e build/ | |
: 1726599145:0;pip install setuptools wheel\ | |
: 1726599153:0;pip install cmake ninja | |
: 1726599160:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726599175:0;rm -rf build | |
: 1726599177:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726599190:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726599198:0;pip uninstall cmake | |
: 1726599209:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726599272:0;cmake --build build | |
: 1726599302:0;git o man | |
: 1726599304:0;git o main | |
: 1726599310:0;git stash pop | |
: 1726599316:0;cmake --build build | |
: 1726599454:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726599585:0;python --version | |
: 1726599600:0;ls | |
: 1726599608:0;cd sharktank | |
: 1726599609:0;ls | |
: 1726599625:0;rm -rf .venv | |
: 1726599661:0;python3.12 -m venv --prompt sharktank .venv | |
: 1726599669:0;sudo apt-get install python3.12 | |
: 1726599734:0;sudo apt install software-properties-common -y | |
: 1726599743:0;add-apt-repository ppa:deadsnakes/ppa | |
: 1726599748:0;sudo add-apt-repository ppa:deadsnakes/ppa | |
: 1726599774:0;sudo apt install python3.12 | |
: 1726599806:0;python3.12 -m venv --prompt sharktank .venv | |
: 1726599831:0;python --version | |
: 1726599835:0;python3 --version | |
: 1726599839:0;python3.1 --version | |
: 1726599842:0;python3.12 --version | |
: 1726599868:0;curl -sS https://bootstrap.pypa.io/get-pip.py | python3.12 | |
: 1726599881:0;python3.12 -m venv --prompt sharktank .venv | |
: 1726599901:0;pip3.12 -V | |
: 1726599919:0;where python3.12 | |
: 1726599925:0;where pip | |
: 1726599970:0;curl https://bootstrap.pypa.io/get-pip.py -o get-pip.py | |
: 1726599978:0;python3.12 get-pip.py | |
: 1726599988:0;python3.12 -m venv --prompt sharktank .venv | |
: 1726599996:0;python3.12 | |
: 1726600070:0;sudo apt install python3.12-dev | |
: 1726600104:0;sudo apt install python3.12-venv | |
: 1726600124:0;python3.12 -m venv --prompt sharktank .venv | |
: 1726600133:0;python | |
: 1726600152:0;pip install -r pytorch-cpu-requirements.txt | |
: 1726600165:0;cd .. | |
: 1726600166:0;ls | |
: 1726600167:0;pip install -r pytorch-cpu-requirements.txt | |
: 1726600262:0;clear | |
: 1726600262:0;ls | |
: 1726600281:0;pip install -f https://iree.dev/pip-release-links.html --src deps \\ | |
-e "git+https://github.com/iree-org/iree-turbine.git#egg=shark-turbine | |
: 1726600283:0;pip install -f https://iree.dev/pip-release-links.html --src deps \\ | |
-e "git+https://github.com/iree-org/iree-turbine.git#egg=shark-turbine" | |
: 1726600313:0;pip install -r requirements.txt -e sharktank/ shortfin/ | |
: 1726600411:0;pip install -r requirements.txt -e shortfin/ | |
: 1726600480:0;ls | |
: 1726600482:0;vi requirements.txt | |
: 1726600488:0;pip install -r requirements.txt -e shortfin/ | |
: 1726600553:0;pytest shortfin | |
: 1726600573:0;cd libshortfin | |
: 1726600573:0;ls | |
: 1726600577:0;rm -rf build | |
: 1726600582:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726600646:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726600662:0;pip install distutils | |
: 1726600677:0;python --version | |
: 1726600688:0;pip install setuptools wheel | |
: 1726600694:0;pip install distutils | |
: 1726600765:0;ls | |
: 1726600769:0;cd python | |
: 1726600769:0;ls | |
: 1726600771:0;cd .. | |
: 1726600771:0;ls | |
: 1726600776:0;vi setup.py | |
: 1726600805:0;pip install ninja | |
: 1726600807:0;vi setup.py | |
: 1726600822:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726600836:0;vi setup.py | |
: 1726600956:0;sudo apt install python3.12-distutils | |
: 1726600964:0;source .venv/bin/activate | |
: 1726600966:0;ls | |
: 1726600982:0;source .venv/bin/activate | |
: 1726600991:0;cd libshortfin | |
: 1726600993:0;source .venv/bin/activate | |
: 1726601007:0;sudo apt install python3.12-distutils | |
: 1726601027:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726601033:0;ls | |
: 1726601036:0;rm -rf build | |
: 1726601039:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726601105:0;cmake --build build | |
: 1726601132:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726601142:0;ls | |
: 1726601174:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726601176:0;ls | |
: 1726601179:0;rm -rf build | |
: 1726601185:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726601346:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726601356:0;pip install setuptools | |
: 1726601360:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726601425:0;pytest tests | |
: 1726601452:0;pip install wheel | |
: 1726601456:0;pip install ninja | |
: 1726601461:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726601478:0;ls | |
: 1726601482:0;rm -rf build | |
: 1726601484:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726601489:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726601688:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726601711:0;cd build | |
: 1726601713:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726630126:0;clear | |
: 1726630127:0;ls | |
: 1726630139:0;cd .. | |
: 1726630140:0;ls | |
: 1726630144:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726630232:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e build/ | |
: 1726630258:0;pytest | |
: 1726630278:0;pip install -e build/ | |
: 1726630302:0;pytest | |
: 1726630315:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726630322:0;cmake --build build | |
: 1726630382:0;ls | |
: 1726630384:0;vi CMakeLists.txt | |
: 1726630589:0;rm -rf build | |
: 1726630592:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726630643:0;cmake --build build | |
: 1726631037:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726631049:0;pip install -e build/ | |
: 1726631063:0;cmake --build build | |
: 1726631073:0;ls | |
: 1726631074:0;cd build | |
: 1726631075:0;ls | |
: 1726631075:0;vi | |
: 1726631248:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726631251:0;cd .. | |
: 1726631252:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726631260:0;pip install cmake ninja | |
: 1726631265:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726631271:0;rm -rf build | |
: 1726631274:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726631322:0;sudo apt-get remove cmake cmake-data | |
: 1726631427:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726631484:0;cmake --build build | |
: 1726631649:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e build/ | |
: 1726631654:0;pytest | |
: 1726631680:0;cd .. | |
: 1726631680:0;ls | |
: 1726631683:0;pytest shortfin | |
: 1726631698:0;cd shortfin | |
: 1726631698:0;ls | |
: 1726631716:0;pip install -e . | |
: 1726631733:0;ls | |
: 1726631737:0;vi requirements.txt | |
: 1726631744:0;vi setup.py | |
: 1726631785:0;ls | |
: 1726631787:0;vi requirements.txt | |
: 1726631794:0;cd .. | |
: 1726631794:0;ls | |
: 1726632615:0;pip install -r pytorch-cpu-requirements.txt | |
: 1726632643:0;pip install -r requirements.txt shortfin | |
: 1726632656:0;cd shortfin | |
: 1726632657:0;ls | |
: 1726632665:0;cd .. | |
: 1726632668:0;pytest shortfin | |
: 1726632674:0;cd .. | |
: 1726632674:0;ls | |
: 1726632677:0;cd sharktank | |
: 1726632679:0;cd shortfin | |
: 1726632679:0;ls | |
: 1726632683:0;cd shortfin | |
: 1726632684:0;ls | |
: 1726632692:0;cd .. | |
: 1726632692:0;ls | |
: 1726632694:0;cd .. | |
: 1726632694:0;ls | |
: 1726632696:0;cd libshortfin | |
: 1726632696:0;ls | |
: 1726632704:0;pip install -e . | |
: 1726632741:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726632763:0;vi setup.py | |
: 1726632778:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726632800:0;vi setup.py | |
: 1726632872:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726632883:0;vi | |
: 1726632960:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726632991:0;ls | |
: 1726632993:0;rm -rf build | |
: 1726632996:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726633045:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DSHORTFIN_BUILD_PYTHON_BINDINGS=ON \\ | |
-DCMAKE_LINKER_TYPE=LLD | |
: 1726633095:0;cmake --build build | |
: 1726633111:0;pip install -v -e . | |
: 1726633183:0;pytest | |
: 1726633206:0;pip install setuptools wheel\ | |
: 1726633213:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726633228:0;pytest tests/ | |
: 1726633248:0;python | |
: 1726633425:0;cd shortfin | |
: 1726633425:0;ls | |
: 1726633434:0;deactivate | |
: 1726633449:0;source ~/sharktank/.venv/bin/activate | |
: 1726633471:0;ls | |
: 1726633476:0;cd .. | |
: 1726633477:0;ls | |
: 1726633480:0;clear | |
: 1726633481:0;ls | |
: 1726633485:0;rm -rf .venv | |
: 1726633489:0;cd shortfin | |
: 1726633495:0;ls -la | |
: 1726633499:0;cd shortfin | |
: 1726633500:0;ls -la | |
: 1726633503:0;cd .. | |
: 1726633504:0;ls | |
: 1726633505:0;clear | |
: 1726633505:0;ls | |
: 1726633510:0;python | |
: 1726633512:0;exit | |
: 1726633525:0;cd .. | |
: 1726633525:0;s | |
: 1726633526:0;ls | |
: 1726633541:0;python -m venv --prompt sharktank .venv | |
: 1726633546:0;python3.12 -m venv --prompt sharktank .venv | |
: 1726633552:0;source .venv/bin/activate | |
: 1726633557:0;deactivate | |
: 1726633565:0;source ~/sharktank/.venv/bin/activate | |
: 1726633566:0;clear | |
: 1726633566:0;ls | |
: 1726633571:0;pip install -r pytorch-cpu-requirements.txt | |
: 1726633592:0;pip install -f https://iree.dev/pip-release-links.html --src deps \\ | |
-e "git+https://github.com/iree-org/iree-turbine.git#egg=shark-turbine" | |
: 1726633625:0;pip install -r requirements.txt -e sharktank/ shortfin/ | |
: 1726633646:0;pytest shortfin | |
: 1726633663:0;cd libshortfin | |
: 1726633664:0;ls | |
: 1726633668:0;rm -rf build | |
: 1726633689:0;pip install setuptools wheel\ | |
: 1726633694:0;pip install cmake ninja | |
: 1726633701:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1726633741:0;pip install -v -e . | |
: 1726633826:0;pip install --no-build-isolation -v -e .\ | |
: 1726633894:0;pytest tests/ | |
: 1726633913:0;python | |
: 1726633943:0;python tests/api/array_te | |
: 1726633946:0;python tests/api/array_test.py | |
: 1726633957:0;vi | |
: 1726633962:0;source ~/sharktank/.venv/bin/activate | |
: 1726633963:0;vi | |
: 1726633967:0;cd shark | |
: 1726633970:0;cd sharktank | |
: 1726633971:0;ls | |
: 1726633972:0;vi | |
: 1726634057:0;python examples/python/async/process.py | |
: 1726634089:0;which pytest | |
: 1726634108:0;pip install pytest | |
: 1726634131:0;rm -rf ~/.local/bin/pytest | |
: 1726634137:0;which pytest | |
: 1726634140:0;clear | |
: 1726634141:0;ls | |
: 1726634143:0;pytest | |
: 1726634408:0;pip install --no-build-isolation -v -e .\ | |
: 1726634434:0;pytest -k "test_get" | |
: 1726634443:0;pytest -v -k "test_get" | |
: 1726634529:0;pip install pyright | |
: 1726634535:0;where pyright | |
: 1726634546:0;vi | |
: 1726634599:0;pytest -v -k "test_get" | |
: 1726634687:0;pip install --no-build-isolation -v -e .\ | |
: 1726634697:0;pytest -v -k "test_get" | |
: 1726635852:0;tmux attach -t 0 | |
: 1726635900:0;tmux rename-session -t 5 shortfin | |
: 1726635902:0;tmux ls | |
: 1726635910:0;tmux attach -t shortfin | |
: 1726635926:0;sz | |
: 1726635928:0;clear | |
: 1726635928:0;ls | |
: 1726635934:0;tmux attach -t shortfin | |
: 1726635950:0;tmux attach -t 0 | |
: 1726635957:0;tmux ls | |
: 1726635986:0;tmux kill-session -t 4 6 7 | |
: 1726635989:0;tmux kill-session -t 4 | |
: 1726635991:0;tmux kill-session -t 6 | |
: 1726635994:0;tmux kill-session -t 7 | |
: 1726635996:0;tmux ls | |
: 1726636008:0;tmux rename-session -t 0 iree-dev | |
: 1726636010:0;clear | |
: 1726636010:0;ls | |
: 1726636012:0;tmux ls | |
: 1726636020:0;tmux attach -t iree-dev | |
: 1726636152:0;riree | |
: 1726636161:0;pip install cmake | |
: 1726636166:0;riree | |
: 1726636176:0;biree | |
: 1726649562:0;ls | |
: 1726649572:0;tmux attach -t shortfin | |
: 1726649974:0;tmux attach -t iree-dev | |
: 1726649980:0;ls | |
: 1726650006:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir | |
: 1726650016:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir > new.mlir | |
: 1726650018:0;vi new.mlir | |
: 1726650032:0;vi ~/test.mlir | |
: 1726650077:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir > new1.mlir | |
: 1726650080:0;vi new1.mlir | |
: 1726651083:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir > new1.mlir | |
: 1726651086:0;vi new1.mlir | |
: 1726651198:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir > new1.mlir | |
: 1726651201:0;vi new1.mlir | |
: 1726651759:0;ls | |
: 1726651771:0;vi test.mlir | |
: 1726652286:0;gist-paste test.mlir | |
: 1726652999:0;vi new.mlir | |
: 1726653019:0;vi new1.mlir | |
: 1726653039:0;gist-paste new1.mlir | |
: 1726653604:0;vi new1.mlir | |
: 1726653610:0;vi ~/test.mlir | |
: 1726653639:0;gist-paste ~/test.mlir | |
: 1726660900:0;tmux attach -t iree-dev | |
: 1726660904:0;ls | |
: 1726660909:0;vi ~/test.mlir | |
: 1726660936:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse )" ~/test.mlir > new1.mlir | |
: 1726660939:0;vi new1.mlir | |
: 1726661124:0;ls | |
: 1726661138:0;vi all.txt | |
: 1726661205:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1726661228:0;riree | |
: 1726661284:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1726661313:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" --debug ~/test.mlir 2> debugscfforall.txt | |
: 1726661317:0;vi debugscfforall.txt | |
: 1726661696:0;riree | |
: 1726661741:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" --debug ~/test.mlir 2> debugscfforall.txt | |
: 1726661767:0;vi debugscfforall.txt | |
: 1726661878:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1726661950:0;vi ~/test.mlir | |
: 1726662383:0;riree | |
: 1726662398:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1726662427:0;riree | |
: 1726662437:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1726662465:0;riree | |
: 1726662479:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1726662517:0;riree | |
: 1726662531:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1726662706:0;riree | |
: 1726662737:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1726662808:0;riree | |
: 1726662823:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir | |
: 1726662852:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir -mlir-disable-threading | |
: 1726663199:0;riree | |
: 1726664299:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir -mlir-disable-threading | |
: 1726664322:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir -mlir-disable-threading | |
: 1726664363:0;riree | |
: 1726664497:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op, cse))" ~/test.mlir -mlir-disable-threading | |
: 1726714968:0;tmux attach -t iree-dev | |
: 1726714974:0;tmux attach -t shortfin | |
: 1726721558:0;pip install --no-build-isolation -v -e .\ | |
: 1726721566:0;pytest -v -k "test_get" | |
: 1726734803:0;tmux attach -t iree-dev | |
: 1726735044:0;tmux attach -t shortfin | |
: 1726737266:0;pip install --no-build-isolation -v -e .\ | |
: 1726745120:0;tmux attach -t shortfin | |
: 1726745133:0;pytest -v -k "test_get" | |
: 1726757384:0;tmux attach -t shortfin | |
: 1726758742:0;pip install --no-build-isolation -v -e .\ | |
: 1726758772:0;python | |
: 1726758782:0;python python/shortfin/interop/support/logging_setup.py | |
: 1726759972:0;git ppf | |
: 1726759990:0;git remote add pashu [email protected]:nod-ai/sharktank.git | |
: 1726759993:0;git ppf | |
: 1726760025:0;git remote remove pashu | |
: 1726760036:0;git remote add pashu [email protected]:pashu123/sharktank.git | |
: 1726760045:0;git branch -m logging | |
: 1726760047:0;git ppf | |
: 1726760167:0;git clang-format HEAD~1 | |
: 1726760221:0;clang-format -i python/lib_ext.cc | |
: 1726760244:0;git ppf | |
: 1726760385:0;git o main | |
: 1726760394:0;git checkout origin/main | |
: 1726760398:0;git stash | |
: 1726760401:0;git checkout origin/main | |
: 1726760404:0;git ob main | |
: 1726760409:0;git o logging | |
: 1726760413:0;git rebase main | |
: 1726760416:0;git ppf | |
: 1726823935:0;tmux attach -t iree-dev | |
: 1726823964:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse, canonicalize, cse )" ~/test.mlir > new1.mlir | |
: 1726823969:0;vi ~/new.mlir | |
: 1726823983:0;vi ~/test.mlir | |
: 1726823997:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize), cse, canonicalize, cse )" ~/test.mlir > new1.mlir | |
: 1726824008:0;vi new1.mlir | |
: 1726986333:0;tmux attach -t 0 | |
: 1726986336:0;tmux ls | |
: 1726986341:0;tmux attach -t iree-dev | |
: 1726986347:0;ls | |
: 1726986350:0;cd megabump | |
: 1726986351:0;ls | |
: 1726986353:0;cd work | |
: 1726986353:0;ls | |
: 1726986356:0;cd iree | |
: 1726986357:0;ls | |
: 1726986364:0;git puom | |
: 1726986368:0;git o main | |
: 1726986372:0;git puom | |
: 1726986377:0;git submodule update --init | |
: 1726986381:0;cd third_party/llvm-project | |
: 1726986381:0;ls | |
: 1726986385:0;git remote -vv | |
: 1726986398:0;cd .. | |
: 1726986399:0;ls | |
: 1726986400:0;cd .. | |
: 1726986401:0;ls | |
: 1726986403:0;clear | |
: 1726986403:0;ls | |
: 1726986410:0;cd .. | |
: 1726986410:0;ls | |
: 1726986419:0;./scripts/llvm_revision status | |
: 1726986447:0;./scripts/start_integrate | |
: 1726986484:0;vi | |
: 1726986537:0;git o integrates/llvm-20240922 | |
: 1726986759:0;git submodule update --init | |
: 1726986768:0;./scripts/start_integrate | |
: 1726986819:0;cd work/iree | |
: 1726986819:0;ls | |
: 1726986821:0;git lg | |
: 1726986891:0;build_new.sh | |
: 1726986897:0;pip install cmake | |
: 1726986902:0;pip install ninja | |
: 1726986905:0;build_new.sh | |
: 1726989689:0;vi | |
: 1726989702:0;git ppf | |
: 1726989763:0;cd .. | |
: 1726989764:0;ls | |
: 1726989767:0;cd .. | |
: 1726989768:0;ls | |
: 1726989776:0;./scripts/start_integrate | |
: 1726989789:0;./scripts/llvm_revision status | |
: 1726989831:0;cd work/iree | |
: 1726989831:0;ls | |
: 1726989833:0;vi | |
: 1726989845:0;cd third_party/llvm-project | |
: 1726989852:0;git o f264d9a9d56f165777f0e1750b3bdb74059fffd0 | |
: 1726989857:0;git lg | |
: 1726989948:0;cd .. | |
: 1726989949:0;ls | |
: 1726989952:0;cd .. | |
: 1726989953:0;vi | |
: 1726989960:0;git ppf | |
: 1726990026:0;git branch -D integrates/llvm-20240922_1 | |
: 1726990032:0;git branch -m integrates/llvm-20240922_1 | |
: 1726990033:0;git ppf | |
: 1726990054:0;riree | |
: 1726990071:0;build_new.sh | |
: 1726992434:0;tmux attach -t iree-dev | |
: 1726992437:0;ls | |
: 1726992443:0;cd third_party/llvm-project | |
: 1726992443:0;ls | |
: 1726992444:0;git lg | |
: 1726992453:0;vi | |
: 1727104791:0;ls | |
: 1727104793:0;pwd | |
: 1727104969:0;ls -la\ | |
: 1727105035:0;scp -r [email protected]:$HOME/.gitconfig . | |
: 1727105065:0;exit | |
: 1727105066:0;11exit | |
: 1727105067:0;exit | |
: 1727105069:0;tmux | |
: 1727105089:0;vi ~/tmux.conf | |
: 1727105100:0;vim ~/.tmux.conf | |
: 1727105112:0;/usr/vi ~/tmux.conf | |
: 1727105116:0;/usr/bin/vi ~/tmux.conf | |
: 1727105122:0;/usr/bin/vi ~/.tmux.conf | |
: 1727105175:0;git clone https://github.com/tmux-plugins/tpm ~/.tmux/plugins/tpm | |
: 1727105214:0;clear | |
: 1727105214:0;ls | |
: 1727105220:0;clear | |
: 1727105220:0;ls | |
: 1727105221:0;ebd | |
: 1727105245:0;LV_BRANCH='release-1.4/neovim-0.9' bash <(curl -s https://raw.githubusercontent.com/LunarVim/LunarVim/release-1.4/neovim-0.9/utils/installer/install.sh) | |
: 1727105253:0;sudo apt install -y neovim | |
: 1727105265:0;nvim | |
: 1727105270:0;LV_BRANCH='release-1.4/neovim-0.9' bash <(curl -s https://raw.githubusercontent.com/LunarVim/LunarVim/release-1.4/neovim-0.9/utils/installer/install.sh) | |
: 1727105281:0;sudo apt-get remove neovim | |
: 1727105415:0;curl -LO https://github.com/neovim/neovim/releases/latest/download/nvim-linux64.tar.gz | |
: 1727105424:0;ls | |
: 1727105449:0;sudo tar -C /usr/bin/ -xzf nvim-linux64.tar.gz | |
: 1727105452:0;nvim | |
: 1727105473:0;cd /usr/bin | |
: 1727105474:0;ls | |
: 1727105485:0;./nvim-linux64/bin | |
: 1727105486:0;ls | |
: 1727105500:0;sudo mv nvim ../../ | |
: 1727105502:0;clear | |
: 1727105502:0;ls | |
: 1727105503:0;cd .. | |
: 1727105506:0;cd ~ | |
: 1727105507:0;clear | |
: 1727105507:0;ls | |
: 1727105509:0;nvim | |
: 1727105528:0;bash <(curl -s https://raw.githubusercontent.com/lunarvim/lunarvim/master/utils/installer/install.sh) | |
: 1727105537:0;sudo apt-get install cargo | |
: 1727105574:0;bash <(curl -s https://raw.githubusercontent.com/lunarvim/lunarvim/master/utils/installer/install.sh) | |
: 1727105628:0;clear | |
: 1727105628:0;ls | |
: 1727105632:0;wget https://github.com/neovim/neovim/releases/download/nightly/nvim-linux64.tar.gz | |
: 1727105684:0;ls | |
: 1727105688:0;rm nvim-linux64.tar.gz | |
: 1727105692:0;rm nvim-linux64.tar.gz.1 | |
: 1727105693:0;clear | |
: 1727105693:0;ls | |
: 1727105695:0;wget https://github.com/neovim/neovim/releases/download/v0.9.0/nvim-linux64.tar.gz | |
: 1727105717:0;ls | |
: 1727105722:0;sudo tar -C /usr/bin/ -xzf nvim-linux64.tar.gz | |
: 1727105729:0;cd /usr/bin | |
: 1727105734:0;rm nvim | |
: 1727105738:0;sudo rm nvim | |
: 1727105744:0;clear | |
: 1727105745:0;ls | |
: 1727105752:0;cd nvim-linux64 | |
: 1727105753:0;ls | |
: 1727105754:0;cd bin | |
: 1727105755:0;ls | |
: 1727105761:0;sudo mv nvim ../../ | |
: 1727105764:0;cd ~ | |
: 1727105764:0;ls | |
: 1727105775:0;LV_BRANCH='release-1.4/neovim-0.9' bash <(curl -s https://raw.githubusercontent.com/LunarVim/LunarVim/release-1.4/neovim-0.9/utils/installer/install.sh) | |
: 1727105795:0;sudo apt-get install python3-dev | |
: 1727105812:0;sudo apt-get install python3-pip | |
: 1727105826:0;LV_BRANCH='release-1.4/neovim-0.9' bash <(curl -s https://raw.githubusercontent.com/LunarVim/LunarVim/release-1.4/neovim-0.9/utils/installer/install.sh) | |
: 1727105865:0;sudo apt-get remove cargo | |
: 1727105870:0;curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh\ | |
: 1727105878:0;sudo apt-get remove rust | |
: 1727106036:0;rustc --version | |
: 1727106043:0;sudo apt-get remove rustc | |
: 1727106058:0;curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh\ | |
: 1727106108:0;source ~/.cargo/env | |
: 1727106116:0;LV_BRANCH='release-1.4/neovim-0.9' bash <(curl -s https://raw.githubusercontent.com/LunarVim/LunarVim/release-1.4/neovim-0.9/utils/installer/install.sh) | |
: 1727106321:0;clear | |
: 1727106321:0;ls | |
: 1727106325:0;rm nvim-linux64.tar.gz | |
: 1727106327:0;clear | |
: 1727106327:0;ls | |
: 1727106330:0;rm xyz.txt | |
: 1727106331:0;clear | |
: 1727106332:0;ls | |
: 1727106334:0;vi | |
: 1727106399:0;clear | |
: 1727106400:0;ls | |
: 1727106458:0;vi | |
: 1727166768:0;\ | |
: 1727166770:0;clear | |
: 1727166770:0;ls | |
: 1727166777:0;tmux ls | |
: 1727166780:0;tmux attach -t 0 | |
: 1727166782:0;clear | |
: 1727166783:0;ls | |
: 1727166786:0;vi | |
: 1727166931:0;bash <(curl -s https://raw.githubusercontent.com/lunarvim/lunarvim/master/utils/installer/install.sh) | |
: 1727167014:0;sudo rm /usr/bin/nvim | |
: 1727167029:0;sudo rm -rf /usr/bin/nvim-linux64/ | |
: 1727167030:0;clear | |
: 1727167031:0;ls | |
: 1727167036:0;sudo add-apt-repository ppa:neovim-ppa/unstable | |
: 1727167054:0;sudo add-apt-repository ppa:neovim-ppa/stable | |
: 1727167088:0;sudo apt update | |
: 1727167119:0;sudo apt install neovim | |
: 1727167167:0;nvim | |
: 1727167174:0;bash <(curl -s https://raw.githubusercontent.com/lunarvim/lunarvim/master/utils/installer/install.sh) | |
: 1727167235:0;mv /usr/bin/clangd-18 /usr/bin/clangd | |
: 1727167238:0;sudo mv /usr/bin/clangd-18 /usr/bin/clangd | |
: 1727167242:0;bash <(curl -s https://raw.githubusercontent.com/lunarvim/lunarvim/master/utils/installer/install.sh) | |
: 1727167302:0;sudo apt-get remove neovim | |
: 1727167353:0;wget https://github.com/neovim/neovim/releases/download/v0.9.5/nvim.appimage | |
: 1727167363:0;chmod +x nvim.appimage | |
: 1727167365:0;./nvim.appimage | |
: 1727167398:0;./nvim.appimage --appimage-extract | |
: 1727167400:0;ls | |
: 1727167403:0;cd squashfs-root | |
: 1727167404:0;ls | |
: 1727167409:0;cd usr | |
: 1727167409:0;ls | |
: 1727167411:0;cd bin | |
: 1727167412:0;ls | |
: 1727167414:0;./nvim | |
: 1727167422:0;cd .. | |
: 1727167422:0;ls | |
: 1727167423:0;cd .. | |
: 1727167424:0;ls | |
: 1727167430:0;./AppRun | |
: 1727167438:0;mv AppRun nvim | |
: 1727167440:0;./nvim | |
: 1727167444:0;clear | |
: 1727167444:0;ls | |
: 1727167446:0;lsls | |
: 1727167446:0;ls | |
: 1727167450:0;cd .. | |
: 1727167450:0;ls | |
: 1727167454:0;mv squashfs-root nvim | |
: 1727167455:0;ls | |
: 1727167459:0;rm nvim.appimage | |
: 1727167461:0;clear | |
: 1727167461:0;ls | |
: 1727167462:0;s | |
: 1727167464:0;ls | |
: 1727167472:0;vi ~/.zshrc | |
: 1727167483:0;/usr/bin/vi ~/.zshrc | |
: 1727167514:0;sz | |
: 1727167517:0;nvim | |
: 1727167519:0;clear | |
: 1727167519:0;ls | |
: 1727167529:0;bash ~/.local/share/lunarvim/lvim/utils/installer/uninstall.sh | |
: 1727167538:0;LV_BRANCH='release-1.4/neovim-0.9' bash <(curl -s https://raw.githubusercontent.com/LunarVim/LunarVim/release-1.4/neovim-0.9/utils/installer/install.sh) | |
: 1727167586:0;clear | |
: 1727167586:0;ls | |
: 1727167588:0;vi | |
: 1727167647:0;LAZYGIT_VERSION=$(curl -s "https://api.github.com/repos/jesseduffield/lazygit/releases/latest" | grep -Po '"tag_name": "v\K[^"]*')\ | |
curl -Lo lazygit.tar.gz "https://github.com/jesseduffield/lazygit/releases/latest/download/lazygit_${LAZYGIT_VERSION}_Linux_x86_64.tar.gz"\ | |
tar xf lazygit.tar.gz lazygit\ | |
sudo install lazygit /usr/local/bin | |
: 1727167655:0;lazygit | |
: 1727167659:0;clear | |
: 1727167659:0;ls | |
: 1727167677:0;rm lazygit lazygit.tar.gz | |
: 1727167681:0;lazygit | |
: 1727167683:0;clear | |
: 1727167684:0;ls | |
: 1727167685:0;htop | |
: 1727167692:0;sudo apt-get install bpytop | |
: 1727167698:0;htop | |
: 1727167728:0;clear | |
: 1727167728:0;ls | |
: 1727167732:0;clear | |
: 1727167732:0;ls | |
: 1727167762:0;ssh-keygen | |
: 1727167773:0;cat ~/.ssh/id_rsa.pub | |
: 1727167828:0;git clone [email protected]:iree-org/iree.git | |
: 1727167862:0;cd iree | |
: 1727167866:0;git submodule update --init | |
: 1727168099:0;clear | |
: 1727168099:0;ls | |
: 1727168099:0;s | |
: 1727168100:0;ls | |
: 1727168113:0;which python3.12 | |
: 1727168121:0;sudo apt-get install python3.12 | |
: 1727168148:0;sudo apt install software-properties-common -y | |
: 1727168154:0;sudo add-apt-repository ppa:deadsnakes/ppa | |
: 1727168170:0;sudo apt install python3.12 | |
: 1727168195:0;curl -sS https://bootstrap.pypa.io/get-pip.py | python3.12 | |
: 1727168206:0;sudo apt install python3.12-dev | |
: 1727168239:0;python3.12 -m venv .iree_venv | |
: 1727168278:0;sudo apt install python3.12-venv | |
: 1727168285:0;python3.12 -m venv .iree_venv | |
: 1727168298:0;source ~/iree/.iree_venv/bin/activate | |
: 1727168299:0;clear | |
: 1727168299:0;ls | |
: 1727168330:0;python -m pip install -r runtime/bindings/python/iree/runtime/build_requirements.txt | |
: 1727168341:0;biree | |
: 1727168346:0;pip install cmake ninja | |
: 1727168350:0;biree | |
: 1727168385:0;sudo apt-get install ccache | |
: 1727168391:0;biree | |
: 1727188823:0;tmux attach -t 0 | |
: 1727188825:0;clear | |
: 1727188826:0;ls | |
: 1727188831:0;clear | |
: 1727188831:0;ls | |
: 1727188834:0;source ~/iree/.iree_venv/bin/activate | |
: 1727188835:0;clear | |
: 1727188835:0;ls | |
: 1727188837:0;clear | |
: 1727188838:0;ls | |
: 1727188843:0;riree | |
: 1727188921:0;sudo apt-get install libcapstone-dev | |
: 1727188958:0;clear | |
: 1727188958:0;ls | |
: 1727188968:0;riree | |
: 1727189155:0;sudo apt install libcapstone-dev | |
: 1727189165:0;sudo apt install libtbb-dev libzstd-dev libglfw3-dev libfreetype6-dev libgtk-3-dev | |
: 1727189208:0;clear | |
: 1727189209:0;ls | |
: 1727189213:0;clear | |
: 1727189214:0;ls | |
: 1727189216:0;riree | |
: 1727189222:0;biree | |
: 1727189234:0;riree | |
: 1727189254:0;clear | |
: 1727189255:0;ls | |
: 1727189258:0;clear | |
: 1727189259:0;ls | |
: 1727189259:0;vi | |
: 1727189274:0;sz | |
: 1727189275:0;vi | |
: 1727189339:0;sudo apt-get install rip-grep | |
: 1727189344:0;sudo apt-get install ripgrep | |
: 1727190601:0;j | |
: 1727190606:0;exit | |
: 1728896387:0;hopt | |
: 1728896388:0;htop | |
: 1728896408:0;clear | |
: 1728896408:0;ls | |
: 1728896411:0;htop | |
: 1728896425:0;source ~/iree/.iree_venv/bin/activate | |
: 1728896426:0;clear | |
: 1728896426:0;ls | |
: 1728896430:0;cd iree | |
: 1728896432:0;git puom | |
: 1728896488:0;git submodule update --init | |
: 1728896492:0;biree | |
: 1728899646:0;sudo tailscale up | |
: 1728899650:0;htop | |
: 1728901009:0;clear | |
: 1728901011:0;htop | |
: 1728901024:0;clear | |
: 1728901024:0;ls | |
: 1728901027:0;vi | |
: 1728901147:0;node | |
: 1728901152:0;nodejs | |
: 1728901281:0;clear | |
: 1728901282:0;ls | |
: 1728901285:0;htop | |
: 1728901290:0;clear | |
: 1728901291:0;ls | |
: 1728901295:0;clear | |
: 1728901296:0;ls | |
: 1728901349:0;clear | |
: 1728901350:0;ls | |
: 1728901352:0;htop | |
: 1728901356:0;clear | |
: 1728901356:0;ls | |
: 1728901358:0;tmux | |
: 1728901362:0;clear | |
: 1728901362:0;ls | |
: 1728901364:0;clear | |
: 1728901365:0;ls | |
: 1728901368:0;curl -fsSL https://deb.nodesource.com/setup_current.x | sudo -E bash - | |
: 1728901389:0;sudo apt-get install nodejs -y | |
: 1728901400:0;vi | |
: 1728901487:0;clear | |
: 1728901487:0;ls | |
: 1728901492:0;source ~/iree/.iree_venv/bin/activate | |
: 1728901493:0;clear | |
: 1728901494:0;ls | |
: 1728901495:0;biree | |
: 1728904406:0;clear | |
: 1728904407:0;ls | |
: 1728904411:0;clear | |
: 1728904412:0;ls | |
: 1728904416:0;htop | |
: 1728904424:0;pip install psutil | |
: 1728904427:0;htop | |
: 1728904435:0;clear | |
: 1728904435:0;ls | |
: 1728904440:0;cd iree | |
: 1728904441:0;vi | |
: 1728904461:0;ls | |
: 1728904475:0;mv iree-build/compile_commands.json ~/iree | |
: 1728904478:0;cd iree | |
: 1728904481:0;vi | |
: 1728905096:0;clear | |
: 1728905097:0;ls | |
: 1728905106:0;mkdir test | |
: 1728905108:0;clear | |
: 1728905108:0;ls | |
: 1728905111:0;cd test | |
: 1728905111:0;ls | |
: 1728905115:0;mkdir test_err | |
: 1728905122:0;git remote -vv | |
: 1728905178:0;git remote add pashu [email protected]:pashu123/iree.git | |
: 1728905184:0;git fetch pashu | |
: 1728905252:0;git puom | |
: 1728905266:0;bpytop | |
: 1728905374:0;clear | |
: 1728905374:0;ls | |
: 1728905378:0;clear | |
: 1728905379:0;ls | |
: 1728905356:76;git fetch pashu | |
: 1728905439:305;git remote show origin | |
: 1728905763:0;cat ~/.ssh/id_rsa.pub | |
: 1728906248:0;clear | |
: 1728906249:0;ls | |
: 1728906251:0;git pull | |
: 1728906422:0;clear | |
: 1728906423:0;ls | |
: 1728906446:0;exit | |
: 1728915108:0;clear | |
: 1728915108:0;ls | |
: 1728915110:0;tmux ls | |
: 1728915114:0;tmux attach -t 0 | |
: 1728915124:0;vi ~/.gitconfig | |
: 1728915137:0;git pull | |
: 1728915164:0;git config --list | |
: 1728915219:0;clear | |
: 1728915219:0;ls | |
: 1728915221:0;git lg | |
: 1728915224:0;git pull | |
: 1728915256:0;git:q | |
: 1728915257:0;:q | |
: 1728915266:0;vi ~/.ssh/config | |
: 1728915275:0;git pull | |
: 1728915288:0;clear | |
: 1728915288:0;ls | |
: 1728915298:0;git fetch pashu | |
: 1728915360:0;git submodule update --init | |
: 1728915385:0;clear | |
: 1728915386:0;ls | |
: 1728915403:0;git o pashu/enablemultitiling | |
: 1728915414:0;git ob enablemultitiling | |
: 1728915419:0;riree | |
: 1728915540:0;clear | |
: 1728915541:0;ls | |
: 1728915543:0;source ~/iree/.iree_venv/bin/activate | |
: 1728915544:0;clear | |
: 1728915545:0;ls | |
: 1728915548:0;clear | |
: 1728915549:0;ls | |
: 1728915660:0;cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1728915773:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1728915834:0;clear | |
: 1728915835:0;ls | |
: 1728915842:0;amdgpu top | |
: 1728915879:0;cargo install amdgpu_top | |
: 1728915983:0;sudo apt install libdrm-dev | |
: 1728915991:0;cargo install amdgpu_top | |
: 1728916064:0;amdgpu_top | |
: 1728916104:0;clear | |
: 1728916105:0;ls | |
: 1728916110:0;clear | |
: 1728916111:0;ls | |
: 1728916122:0;clear | |
: 1728916122:0;ls | |
: 1728918746:0;clear | |
: 1728918747:0;ls | |
: 1728918752:0;htop | |
: 1728918761:0;clear | |
: 1728918761:0;ls | |
: 1728918777:0;clear | |
: 1728918777:0;ls | |
: 1728918780:0;clear | |
: 1728918780:0;ls | |
: 1728918787:0;biree | |
: 1728918801:0;riree | |
: 1728918805:0;clear | |
: 1728918806:0;vi | |
: 1728918861:0;clear | |
: 1728918861:0;ls | |
: 1728918869:0;vi | |
: 1728918940:0;pip install tree-sitter | |
: 1728918944:0;vi | |
: 1728918963:0;tree-sitter | |
: 1728918988:0;cargo install tree-sitter-cli | |
: 1728919266:0;clear | |
: 1728919267:0;htop | |
: 1728919849:0;clear | |
: 1728919850:0;ls | |
: 1728919861:0;clear | |
: 1728919862:0;ls | |
: 1728919867:0;vi | |
: 1728925006:0;cd .. | |
: 1728925007:0;ls | |
: 1728925008:0;clear | |
: 1728925008:0;ls | |
: 1728925012:0;git clone [email protected]:nod-ai/SHARK-Platform.git | |
: 1728925024:0;cd SHARK-Platform | |
: 1728925024:0;ls | |
: 1728925056:0;python3.12 -m venv --prompt sharktank .venv | |
: 1728925076:0;source ~/SHARK-Platform/.venv/bin/activate | |
: 1728925087:0;pip install -r pytorch-cpu-requirements.txt | |
: 1728925313:0;pip install -f https://iree.dev/pip-release-links.html --src deps \\ | |
-e "git+https://github.com/iree-org/iree-turbine.git#egg=iree-turbine" | |
: 1728925442:0;pip install -r requirements.txt -e sharktank/ shortfin/ | |
: 1728925508:0;pip install cmake ninja | |
: 1728925512:0;pip install -r requirements.txt -e sharktank/ shortfin/ | |
: 1728925666:0;htop | |
: 1728926001:0;clear | |
: 1728926001:0;ls | |
: 1728926009:0;cd shortfin | |
: 1728926034:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ \\ | |
-DCMAKE_LINKER_TYPE=LLD\ | |
cmake --build build --target all | |
: 1728926048:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang-18++ \\ | |
-DCMAKE_LINKER_TYPE=LLD\ | |
cmake --build build --target all | |
: 1728926067:0;cmake -GNinja -S. -Bbuild \\ | |
-DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 \\ | |
-DCMAKE_LINKER_TYPE=LLD\ | |
cmake --build build --target all | |
: 1728926348:0;pip install setuptools wheel | |
: 1728926361:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1728926376:0;ls | |
: 1728926379:0;rm -rf build | |
: 1728926381:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1728926400:0;ls | |
: 1728926402:0;vi setup.py | |
: 1728926417:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1728926437:0;ls | |
: 1728926439:0;rm -rf build | |
: 1728926441:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1728926466:0;vi setup.py | |
: 1728926484:0;rm -rf build | |
: 1728926488:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1728926739:0;clear | |
: 1728926739:0;ls | |
: 1728926754:0;pytest tests/ | |
: 1728926780:0;ls | |
: 1728926787:0;cd SHARK-Platform | |
: 1728926788:0;ls | |
: 1728926794:0;cd sharktank | |
: 1728926794:0;vi | |
: 1728926965:0;pip install dataclasses-json | |
: 1728926971:0;pytest tests/ | |
: 1728927641:0;ls | |
: 1728932328:0;clear | |
: 1728932328:0;ls | |
: 1728932338:0;clear | |
: 1728932338:0;ls | |
: 1728932339:0;htp | |
: 1728932341:0;htop | |
: 1728932347:0;pip install psutil | |
: 1728932350:0;htop | |
: 1728932353:0;clear | |
: 1728932353:0;ls | |
: 1728932417:0;vi | |
: 1728932429:0;source ~/SHARK-Platform/.venv/bin/activate | |
: 1728932430:0;vi | |
: 1728932682:0;ls | |
: 1728932697:0;pwd | |
: 1728932700:0;cd ../shortfin | |
: 1728932701:0;ls | |
: 1728932703:0;cd build | |
: 1728932703:0;ls | |
: 1728932705:0;cd cmake | |
: 1728932705:0;ls | |
: 1728932708:0;cd default | |
: 1728932708:0;ls | |
: 1728932712:0;cd ../.. | |
: 1728932713:0;ls | |
: 1728932715:0;cd .. | |
: 1728932715:0;ls | |
: 1728932722:0;vi setup.py | |
: 1728932761:0;ls | |
: 1728932762:0;vi | |
: 1728932765:0;ebd | |
: 1728932798:0;j:w | |
: 1728932799:0;exit | |
: 1728932819:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1728932825:0;ls | |
: 1728932828:0;rm -rf build | |
: 1728932830:0;SHORTFIN_DEV_MODE=ON pip install --no-build-isolation -v -e . | |
: 1728933082:0;ls | |
: 1728933136:0;ln -s build/build/cmake/default/compile_commands.json compile_commands.json | |
: 1728933139:0;ls -l | |
: 1728933141:0;clear | |
: 1728933141:0;ls | |
: 1728933144:0;vi compile_commands.json | |
: 1728933161:0;vi build/build/cmake/default/compile_commands.json | |
: 1728933175:0;vi | |
: 1728975097:0;\ | |
: 1728975099:0;clear | |
: 1728975099:0;ls | |
: 1728975109:0;tmux attach -t 0 | |
: 1728975119:0;git fetch origin | |
: 1728975146:0;git o main | |
: 1728975153:0;git puom | |
: 1728975159:0;clear | |
: 1728975159:0;ls | |
: 1728975161:0;git submodule update --init | |
: 1728975165:0;clear | |
: 1728975166:0;ls | |
: 1728975175:0;git ob cpudefault | |
: 1728975179:0;riree | |
: 1728979033:0;\ | |
: 1728979035:0;tmux attach -t 0 | |
: 1728979061:0;sudo do-release-upgrade | |
: 1728979077:0;tmux attach -t 0 | |
: 1728979079:0;clear | |
: 1728979080:0;ls | |
: 1728979084:0;vi | |
: 1728979140:0;riree | |
: 1728979174:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1728979440:0;cd ~ | |
: 1728979441:0;ls | |
: 1728979443:0;cd test | |
: 1728979444:0;ls | |
: 1728979449:0;mkdir stablehlo | |
: 1728979451:0;cd stablehlo | |
: 1728979452:0;clear | |
: 1728979452:0;ls | |
: 1728979455:0;cd /home/prashant/iree-build/tests/e2e/stablehlo_ops && /home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" | |
: 1728979471:0;cd /home/prashant/iree-build/tests/e2e/stablehlo_ops && /home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" -mlir-print-ir-after-all 2> full.txt | |
: 1728979475:0;vi full.txt | |
: 1728979712:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1728979946:0;cd /home/prashant/iree-build/tests/e2e/stablehlo_ops && /home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" -mlir-print-ir-after-all 2> full.txt | |
: 1728979950:0;ls | |
: 1728979964:0;pwd | |
: 1728979970:0;vi full.txt | |
: 1728980048:0;cd ~/test/test_err | |
: 1728980049:0;ls | |
: 1728980055:0;cd ../stablehlo | |
: 1728980055:0;ls | |
: 1728980067:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" -mlir-print-ir-after-all 2> full.txt | |
: 1728980071:0;vi full.txt | |
: 1728980074:0;pwd | |
: 1728980076:0;vi full.txt | |
: 1728980106:0;ls | |
: 1728980124:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" | |
: 1728980147:0;vi ~/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir | |
: 1728980207:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" | |
: 1728980211:0;vi ~/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir | |
: 1728980228:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" -mlir-print-ir-after-all 2> full.txt | |
: 1728980231:0;vi full.txt | |
: 1728980263:0;cd ~ | |
: 1728980265:0;ebd | |
: 1728980508:0;riree | |
: 1728980520:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" -mlir-print-ir-after-all 2> full.txt | |
: 1728980527:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" | |
: 1728980564:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" --iree-input-demote-i64-to-i32 | |
: 1728980565:0;ls | |
: 1728980720:0;rriee | |
: 1728980722:0;riree | |
: 1728980735:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" --iree-input-demote-i64-to-i32 | |
: 1728980740:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 /home/prashant/iree/tests/e2e/stablehlo_ops/dynamic_slice.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" | |
: 1728980793:0;biree | |
: 1728981022:0;\ | |
: 1728981025:0;tmux attach -t 0 | |
: 1728981027:0;ls | |
: 1728981037:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1728981256:0;tmux attach -t 0 | |
: 1728981263:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1728981317:0;ls | |
: 1728981318:0;cd iree | |
: 1728981319:0;ls | |
: 1728981323:0;vi .gitignore | |
: 1728981346:0;source ~/iree/.iree_venv/bin/activate | |
: 1728981347:0;vi | |
: 1728981437:0;\ | |
\ | |
: 1728981441:0;tmux attach -t 0 | |
: 1728982360:0;\ | |
: 1728982363:0;tmux attach -t 0 | |
: 1728982421:0;vi ~/.gitconfig | |
: 1728982473:0;gpg --full generate key | |
: 1728982483:0;gpg --full generate-key | |
: 1728982521:0;gpg --full-generate-key | |
: 1728982663:0;gpg --list-secret-keys --keyid-format=long | |
: 1728982714:0;gpg --armor export 03B06F7551D1656F | |
: 1728982722:0;gpg --armor --export 03B06F7551D1656F | |
: 1728982740:0;gpg --armor --export 03B06F7551D1656F > file.txt | |
: 1728982743:0;vi file.txt | |
: 1728982790:0;gist-paste file.txt | |
: 1728982830:0;sudo apt install gist | |
: 1728982918:0;gsi | |
: 1728982923:0;gist-paste | |
: 1728982928:0;gist --login | |
: 1728982932:0;gist-paste --login | |
: 1728982956:0;q | |
: 1728982961:0;gist-paste file.txt | |
: 1728983256:0;tmux attach -t 0 | |
: 1728983262:0;git config --global commit.gpgSign true | |
: 1728983277:0;gpg --list-secret-keys --keyid-format=long | |
: 1728983448:0;\ | |
: 1728983450:0;tmux attach -t 0 | |
: 1728983451:0;git config --global user.signingkey 03B06F7551D1656F | |
: 1728983471:0;ls | |
: 1728983475:0;vi .gitignore | |
: 1728983486:0;vi | |
: 1728983568:0;ls | |
: 1728983572:0;clear | |
: 1728983573:0;ls | |
: 1728983575:0;git ppf | |
: 1728983648:0;git clang-format HEAD~1 | |
: 1728983662:0;git clang-format-18 HEAD~1 | |
: 1728983669:0;clang-format-18 | |
: 1728983672:0;clang-format | |
: 1728983721:0;sudo apt-get install clang-format | |
: 1728983776:0;clear | |
: 1728983777:0;ls | |
: 1728983779:0;tmux attach -t 0 | |
: 1728983784:0;git clang-format-18 HEAD~1 | |
: 1728983790:0;git clang-format HEAD~1 | |
: 1728983797:0;r | |
: 1728983797:0;git clang-format HEAD~1 | |
: 1728983799:0;clear | |
: 1728983799:0;ls | |
: 1728985997:0;clear | |
: 1728985997:0;ls | |
: 1728986000:0;biree | |
: 1728986006:0;clear | |
: 1728986006:0;ls | |
: 1728986035:0;cp ~/iree/tests/e2e/linalg_ext_ops/scatter.mlir . | |
: 1728986037:0;ls | |
: 1728986040:0;vi scatter.mlir | |
: 1728987641:0;tmux attach -t 0 | |
: 1728988875:0;\ | |
: 1728988878:0;clear | |
: 1728988880:0;tmux attach -t 0 | |
: 1728988893:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=vmvx --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 scatter.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" | |
: 1728988904:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 scatter.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" | |
: 1728988917:0;cd iree | |
: 1728988918:0;vi | |
: 1728989258:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 scatter.mlir -o check_vmvx_local-task_dynamic_slice.mlir_module.vmfb --iree-hal-executable-object-search-path=\"/home/prashant/iree-build\" -mlir-print-ir-after-all 2> xyz.txt | |
: 1728989265:0;vi xyz.txt | |
: 1728989698:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 scatter.mlir -o new.vmfb | |
: 1728989721:0;iree-run-module --module=xyz.vmfb --function=scatter | |
: 1728989725:0;ls | |
: 1728989729:0;iree-run-module --module=new.vmfb --function=scatter | |
: 1728989756:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 scatter.mlir -o new.vmfb -mlir-print-ir-after-all 2> new_err.txt | |
: 1728989778:0;riree | |
: 1728989884:0;tmux attach -t 0 | |
: 1728989888:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-input-type=stablehlo --iree-input-demote-f64-to-f32 scatter.mlir -o old.vmfb -mlir-print-ir-after-all 2> old_err.txt | |
: 1728989898:0;iree-run-module --module=old.vmfb --function=scatter | |
: 1728989912:0;vi new_err.txt old_err.txt | |
: 1728990016:0;tmux attach -t 0 | |
: 1729002709:0;clear | |
: 1729002709:0;ls | |
: 1729002715:0;clear | |
: 1729002715:0;ls | |
: 1729002717:0;tmux ls | |
: 1729002719:0;tmux attach -t 0 | |
: 1729002731:0;clear | |
: 1729002731:0;ls | |
: 1729013635:0;clear | |
: 1729013635:0;ls | |
: 1729013637:0;tmux attach -t 0 | |
: 1729016808:0;ls | |
: 1729016818:0;source ~/iree/.iree_venv/bin/activate | |
: 1729016826:0;cd SHARK-Platform | |
: 1729016827:0;ls | |
: 1729016831:0;cd sharktank | |
: 1729016831:0;ls | |
: 1729016834:0;cd sharktank | |
: 1729016834:0;ls | |
: 1729016840:0;cd . | |
: 1729016841:0;cd .. | |
: 1729016841:0;ls | |
: 1729016843:0;cd ~ | |
: 1729016844:0;clear | |
: 1729016844:0;ls | |
: 1729063112:0;clear | |
: 1729063113:0;ls | |
: 1729063114:0;htop | |
: 1729063119:0;clear | |
: 1729063122:0;ls | |
: 1729076335:0;clear | |
: 1729076335:0;ls | |
: 1729076337:0;htop | |
: 1729076339:0;clear | |
: 1729076339:0;ls | |
: 1729076342:0;tmux ls | |
: 1729076345:0;tmux attach -t 0 | |
: 1729076350:0;clear | |
: 1729076351:0;ls | |
: 1729077383:0;vi ~/.zshrc | |
: 1729077401:0;cat ~/.zshrc | |
: 1729077834:0;vi ~/.ssh/config | |
: 1729077842:0;cat ~/.ssh/config | |
: 1729084444:0;clear | |
: 1729084444:0;ls | |
: 1729084446:0;htop | |
: 1729084451:0;tmux attach -t 0 | |
: 1729084457:0;ebd | |
: 1729084470:0;exit | |
: 1729145260:0;clear | |
: 1729145260:0;ls | |
: 1729145263:0;tmux attach -t 0 | |
: 1729145265:0;clear | |
: 1729145266:0;ls | |
: 1729145301:0;clear | |
: 1729145301:0;ls | |
: 1729163332:0;clear | |
: 1729163333:0;ls | |
: 1729163337:0;clear | |
: 1729163337:0;ls | |
: 1729163342:0;clear | |
: 1729163342:0;ls | |
: 1729163343:0;htop | |
: 1729163807:0;\ | |
\ | |
: 1729163808:0;clear | |
: 1729163809:0;ls | |
: 1729170882:0;\ | |
: 1729170890:0;htop | |
: 1729170894:0;exit | |
: 1729172125:0;clear | |
: 1729172125:0;ls | |
: 1729172128:0;LAZYGIT_VERSION=$(curl -s "https://api.github.com/repos/jesseduffield/lazygit/releases/latest" | grep -Po '"tag_name": "v\K[^"]*')\ | |
curl -Lo lazygit.tar.gz "https://github.com/jesseduffield/lazygit/releases/latest/download/lazygit_${LAZYGIT_VERSION}_Linux_x86_64.tar.gz"\ | |
tar xf lazygit.tar.gz lazygit\ | |
sudo install lazygit /usr/local/bin | |
: 1729172135:0;clear | |
: 1729172135:0;ls | |
: 1729172146:0;rm lazygit lazygit.tar.gz | |
: 1729172148:0;clear | |
: 1729172149:0;ls | |
: 1729175190:0;\ | |
: 1729175190:0;ls | |
: 1729175197:0;cat ~/.gitconf | |
: 1729175199:0;cat ~/.gitconfig | |
: 1729180479:0;clear | |
: 1729180479:0;ls | |
: 1729180556:0;clear | |
: 1729180556:0;ls | |
: 1729180594:0;clear | |
: 1729180594:0;ls | |
: 1729180613:0;clear | |
: 1729180613:0;ls | |
: 1729180616:0;tmux ls | |
: 1729180619:0;tmux attach -t 0 | |
: 1729180749:0;ls | |
: 1729181862:0;clear | |
: 1729181863:0;ls | |
: 1729181870:0;clear | |
: 1729181870:0;ls | |
: 1729181878:0;\ | |
: 1729181886:0;r | |
: 1729181886:0;\ | |
: 1729181887:0;clear | |
: 1729181887:0;ls | |
: 1729181894:0;htop | |
: 1729181899:0;exit | |
: 1729194583:0;\ | |
: 1729194585:0;bpytop | |
: 1729194588:0;clear | |
: 1729194588:0;ls | |
: 1729194591:0;clear | |
: 1729194592:0;ls | |
: 1729228475:0;\ | |
: 1729228484:0;htop | |
: 1729228488:0;exit | |
: 1729345424:0;clear\ | |
: 1729345425:0;ls | |
: 1729345430:0;htp | |
: 1729345432:0;htop | |
: 1729345434:0;clear | |
: 1729345434:0;ls | |
: 1729345436:0;exit | |
: 1729345509:0;clear | |
: 1729345509:0;ls | |
: 1729345521:0;tmux attach -t shortfin | |
: 1729345531:0;tmux -new shortfin | |
: 1729345555:0;tmux new -s shortfin | |
: 1729345558:0;clear | |
: 1729345558:0;ls | |
: 1729345570:0;cd SHARK-Platform | |
: 1729345572:0;clear | |
: 1729345572:0;ls | |
: 1729345575:0;source ~/SHARK-Platform/.venv/bin/activate | |
: 1729345577:0;clear | |
: 1729345577:0;ls | |
: 1729345582:0;cd SHARK-Platform | |
: 1729345582:0;ls | |
: 1729345585:0;source ~/SHARK-Platform/.venv/bin/activate | |
: 1729345586:0;ls | |
: 1729345594:0;cd SHARK-Platform | |
: 1729345596:0;source ~/SHARK-Platform/.venv/bin/activate | |
: 1729345597:0;vi | |
: 1729346138:0;cd .. | |
: 1729346140:0;mkdir coroutines | |
: 1729346142:0;cd coroutines | |
: 1729346145:0;ls | |
: 1729346148:0;vi main.cpp | |
: 1729346677:0;clang++ -std=c++20 main.cpp | |
: 1729346682:0;clang++-18 -std=c++20 main.cpp | |
: 1729347352:0;./a.out | |
: 1729347405:0;clang++-18 -std=c++20 main.cpp | |
: 1729347406:0;./a.out | |
: 1729347454:0;clang++-18 -std=c++20 main.cpp | |
: 1729347455:0;./a.out | |
: 1729347468:0;clang++-18 -std=c++20 main.cpp | |
: 1729347469:0;./a.out | |
: 1729347484:0;clang++-18 -std=c++20 main.cpp | |
: 1729349005:0;./a.out | |
: 1729349556:0;clang++-18 -std=c++20 main.cpp | |
: 1729351263:0;./a.out | |
: 1729351283:0;clang-format main.cpp | |
: 1729351287:0;clang-format -i main.cpp | |
: 1729351445:0;clang++-18 -std=c++20 main.cpp | |
: 1729351447:0;./a.out | |
: 1729351483:0;clang++-18 -std=c++20 main.cpp | |
: 1729351484:0;./a.out | |
: 1729352034:0;ls | |
: 1729352037:0;cd shortfin | |
: 1729352037:0;ls | |
: 1729352054:0;python tests/local_scope_test.py | |
: 1729352060:0;pytest -k tests/local_scope_test.py | |
: 1729352069:0;pytest tests/local_scope_test.py | |
: 1729352483:0;clang++-18 -std=c++20 main.cpp | |
: 1729352492:0;./a.out | |
: 1729352507:0;clang++-18 -std=c++20 main.cpp | |
: 1729352508:0;./a.out | |
: 1729352536:0;vi main.cpp | |
: 1729352540:0;clang++-18 -std=c++20 main.cpp | |
: 1729352542:0;vi main.cpp | |
: 1729352547:0;./a.out | |
: 1729359218:0;ls | |
: 1729359221:0;rm main.cpp | |
: 1729359224:0;vi new.cpp | |
: 1729359246:0;mv new.cpp example.cpp | |
: 1729359250:0;vi example.py | |
: 1729359288:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC -I/path/to/pybind11/include example.cpp -o example.so `python3-config --cflags --ldflags --embed` | |
: 1729359294:0;ls | |
: 1729359297:0;./a.out | |
: 1729359393:0;source ~/SHARK-Platform/.venv/bin/activate | |
: 1729359425:0;clang++-18 -O3 -Wall -shared -std=c++17 -fPIC $(python3 -m pybind11 --includes) example.cpp -o example$(python3-config --extension-suffix)\ | |
: 1729359444:0;clang++-18 -O3 -Wall -shared -std=c++17 -fPIC $(python -m pybind11 --includes) example.cpp -o example$(python-config --extension-suffix)\ | |
: 1729359466:0;vi example. | |
: 1729359468:0;vi example.cpp | |
: 1729359481:0;clang++-18 -O3 -Wall -shared -std=c++17 -fPIC $(python -m pybind11 --includes) example.cpp -o example$(python-config --extension-suffix)\ | |
: 1729359560:0;pip install pybind11 | |
: 1729359563:0;clang++-18 -O3 -Wall -shared -std=c++17 -fPIC $(python -m pybind11 --includes) example.cpp -o example$(python-config --extension-suffix)\ | |
: 1729359594:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example$(python-config --extension-suffix)\ | |
: 1729359599:0;ls | |
: 1729359601:0;./a.out | |
: 1729359605:0;./example | |
: 1729359610:0;vi example.py | |
: 1729359617:0;python example.py | |
: 1729359637:0;vi example.cpp | |
: 1729359723:0;python example.py | |
: 1729359743:0;vi example.py | |
: 1729359784:0;mv example.py ex.py | |
: 1729359787:0;python ex.py | |
: 1729359793:0;ls | |
: 1729359796:0;vi ex.py | |
: 1729359799:0;ls -l | |
: 1729359821:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729359828:0;ls -l | |
: 1729359832:0;vi ex.py | |
: 1729359837:0;python ex.py | |
: 1729359940:0;ls | |
: 1729359944:0;vi example.cpp | |
: 1729359961:0;vi ex.py | |
: 1729359979:0;python ex.py | |
: 1729359988:0;vi ex.py | |
: 1729360002:0;python ex.py | |
: 1729360008:0;ls | |
: 1729360013:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729360061:0;vi example.cpp | |
: 1729360067:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729360190:0;vi example.cpp | |
: 1729360200:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729360211:0;vi ex.py | |
: 1729360224:0;python ex.py | |
: 1729360235:0;vi example.cpp | |
: 1729360268:0;vi | |
: 1729360281:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729360289:0;python ex.py | |
: 1729360394:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729360398:0;python ex.py | |
: 1729360458:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729360462:0;python ex.py | |
: 1729360596:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729360600:0;python ex.py | |
: 1729360656:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729360660:0;python ex.py | |
: 1729360824:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729360827:0;python ex.py | |
: 1729360915:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729360919:0;python ex.py | |
: 1729361030:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729361034:0;python ex.py | |
: 1729361112:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729361174:0;python ex.py | |
: 1729361241:0;clang++-18 -O3 -Wall -shared -std=c++20 -fPIC $(python -m pybind11 --includes) example.cpp -o example.so\ | |
: 1729361245:0;python ex.py | |
: 1729362578:0;pytest tests/local_scope_test.py | |
: 1729362580:0;ls | |
: 1729362585:0;bear | |
: 1729362589:0;sudo apt-get install bear | |
: 1729362598:0;clear | |
: 1729362598:0;ls | |
: 1729362624:0;cd | |
: 1729362625:0;ls | |
: 1729362633:0;cd SHARK-Platform | |
: 1729362633:0;ls | |
: 1729362640:0;cd shortfin | |
: 1729362717:0;ls | |
: 1729362750:0;cmake -GNinja -S. -Bbuild -DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ -DCMAKE_LINKER_TYPE=LLD | |
: 1729362763:0;cmake -GNinja -S. -Bbuild -DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 -DCMAKE_LINKER_TYPE=LLD | |
: 1729362898:0;ls | |
: 1729362915:0;git puom | |
: 1729362921:0;clear | |
: 1729362922:0;ls | |
: 1729362925:0;rm -rf build | |
: 1729362929:0;cmake -GNinja -S. -Bbuild -DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 -DCMAKE_LINKER_TYPE=LLD | |
: 1729363046:0;rm -rf compile_commands.json | |
: 1729363053:0;cd build | |
: 1729363054:0;ls | |
: 1729363058:0;rm compile_commands.json | |
: 1729363059:0;ls | |
: 1729363077:0;bear -- ninja | |
: 1729363091:0;ls | |
: 1729363096:0;cd .. | |
: 1729363097:0;ls | |
: 1729363132:0;ln -s build/compile_commands.json compile_commands.json | |
: 1729363133:0;ls | |
: 1729363137:0;clear | |
: 1729363138:0;ls | |
: 1729363151:0;vi | |
: 1729363220:0;ls | |
: 1729363518:0;vi example.cpp | |
: 1729364254:0;ls | |
: 1729364256:0;cd build | |
: 1729364259:0;rm -rf compile_commands.json | |
: 1729364269:0;bear -- ninja | |
: 1729364271:0;ls | |
: 1729364282:0;mv compile_commands.json bear.json | |
: 1729364283:0;ls | |
: 1729364292:0;ninja | |
: 1729364293:0;ls | |
: 1729364303:0;\ | |
: 1729364304:0;cd .. | |
: 1729364309:0;cmake -GNinja -S. -Bbuild -DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 -DCMAKE_LINKER_TYPE=LLD | |
: 1729364315:0;ls | |
: 1729364318:0;cd build | |
: 1729364318:0;ls | |
: 1729364325:0;diff bear.json compile_commands.json | |
: 1729364332:0;ls -l | |
: 1729364355:0;mv compile_commands.json cmake.json | |
: 1729364368:0;cd .. | |
: 1729364369:0;ls | |
: 1729364376:0;cmake -GNinja -S. -Bbuild -DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 -DCMAKE_LINKER_TYPE=LLD | |
: 1729364381:0;cd build | |
: 1729364382:0;ls | |
: 1729364390:0;bear -- ninja | |
: 1729364393:0;ls | |
: 1729364394:0;ls -l | |
: 1729364404:0;vi compile_commands.json | |
: 1729364422:0;mv cmake.json .. | |
: 1729364425:0;cd .. | |
: 1729364426:0;ls | |
: 1729364428:0;rm -rf build | |
: 1729364432:0;cmake -GNinja -S. -Bbuild -DCMAKE_C_COMPILER=clang-18 -DCMAKE_CXX_COMPILER=clang++-18 -DCMAKE_LINKER_TYPE=LLD | |
: 1729364542:0;ls | |
: 1729364545:0;cd build | |
: 1729364546:0;ls | |
: 1729364551:0;rm -rf compile_commands.json | |
: 1729364555:0;bear -- ninja | |
: 1729364568:0;ls | |
: 1729364570:0;ls -l | |
: 1729364584:0;diff compile_commands.json ../cmake.json | |
: 1729364598:0;vi compile_commands.json ../cmake.json | |
: 1729364765:0;wc grep -o '\[' compile_commands.json | wc -l\ | |
: 1729364775:0;wc grep '\[' compile_commands.json | wc -l\ | |
: 1729364789:0;grep -o '\[' compile_commands.json | wc -l\ | |
: 1729364801:0;grep -o '\{' compile_commands.json | wc -l\ | |
: 1729364819:0;grep -o '\{' ../cmake.json | wc -l\ | |
: 1729364992:0;ls | |
: 1729365005:0;cd build_tools | |
: 1729365005:0;ls | |
: 1729365007:0;cd .. | |
: 1729365007:0;ls | |
: 1729365018:0;cd .. | |
: 1729365019:0;ls | |
: 1729365024:0;rm -rf cmake.json | |
: 1729365025:0;clear | |
: 1729365025:0;ls | |
: 1729365029:0;vi | |
: 1729365326:0;htop | |
: 1729438917:0;\ | |
: 1729438918:0;clear | |
: 1729438918:0;ls | |
: 1729438922:0;exit | |
: 1730208289:0;omz update\ | |
: 1730208292:0;clear | |
: 1730208293:0;ls | |
: 1730208298:0;clear | |
: 1730208299:0;ls | |
: 1730208300:0;tmux ls | |
: 1730208301:0;tmux | |
: 1730208305:0;clear | |
: 1730208306:0;ls | |
: 1730208309:0;tmux ls | |
: 1730208313:0;tmux attach -t 0 | |
: 1730208316:0;clear | |
: 1730208317:0;ls | |
: 1730208320:0;clear | |
: 1730208321:0;ls | |
: 1730208324:0;clear | |
: 1730208324:0;ls | |
: 1730208335:0;cd iree | |
: 1730208340:0;source ~/iree/.iree_venv/bin/activate | |
: 1730208342:0;clear | |
: 1730208342:0;ls | |
: 1730208346:0;git o main | |
: 1730208348:0;git stash | |
: 1730208350:0;git o main | |
: 1730208352:0;git puom | |
: 1730208365:0;ls | |
: 1730208390:0;git submodule update --init | |
: 1730208394:0;clear | |
: 1730208394:0;ls | |
: 1730208395:0;riree | |
: 1730208807:0;htop | |
: 1730208832:0;clear | |
: 1730208832:0;ls | |
: 1730208841:0;exit | |
: 1730307830:0;clear\ | |
: 1730307830:0;ls | |
: 1730307832:0;tmux ls | |
: 1730307836:0;tmux attach -t 0 | |
: 1730307850:0;htop | |
: 1730307852:0;clear | |
: 1730307852:0;ls | |
: 1730307855:0;clear | |
: 1730307856:0;ls | |
: 1730307858:0;riree | |
: 1730307861:0;git puom | |
: 1730307869:0;riree | |
: 1730307888:0;clearls | |
: 1730307890:0;clear | |
: 1730307890:0;ls | |
: 1730307893:0;source ~/iree/.iree_venv/bin/activate | |
: 1730307894:0;clear | |
: 1730307895:0;ls | |
: 1730307897:0;htop | |
: 1730307967:0;clear | |
: 1730307967:0;ls | |
: 1730387644:0;\ | |
: 1730387646:0;clear | |
: 1730387646:0;ls | |
: 1730387649:0;htop | |
: 1730387671:0;raedontop | |
: 1730387672:0;clear | |
: 1730387673:0;ls | |
: 1730387684:0;tmux attach -t 0 | |
: 1730387699:0;riree | |
: 1730387723:0;git pull | |
: 1730387741:0;git submodule update --init | |
: 1730387743:0;riree | |
: 1730387749:0;ls | |
: 1730387753:0;tmux attach -t 0 | |
: 1730387913:0;exit | |
: 1730387921:0;tmux attach -t 0 | |
: 1730387929:0;vi | |
: 1730717523:0;clear | |
: 1730717523:0;ls | |
: 1730717527:0;tmux attach -t 0 | |
: 1730717533:0;git fetch pashu | |
: 1730717551:0;git o newtiling | |
: 1730717555:0;git submodule update --init | |
: 1730717559:0;riree | |
: 1730717569:0;ls | |
: 1730724069:0;\ | |
: 1730724175:0;ls | |
: 1730724393:0;clear | |
: 1730724394:0;ls | |
: 1730724404:0;tmux attach -t 0 | |
: 1730724427:0;clear | |
: 1730724428:0;ls | |
: 1730724430:0;riree | |
: 1730724487:0;llvm-symbolizer | |
: 1730724492:0;which llvm-symbolizer | |
: 1730724497:0;which llvm-symbolizer-18 | |
: 1730724529:0;sudo mv /usr/bin/llvm-symbolizer-18 /usr/bin/llvm-symbolizer | |
: 1730724536:0;riree | |
: 1730727338:0;ls | |
: 1730727343:0;cd test | |
: 1730727343:0;ls | |
: 1730727350:0;cd test_err | |
: 1730727351:0;ls | |
: 1730727359:0;vi new_err.mlir | |
: 1730727784:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu new_err.mlir | |
: 1730727799:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu new_err.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1730727802:0;vi xyz.txt | |
: 1730727964:0;riree | |
: 1730728136:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu new_err.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1730728142:0;vi xyz.txt | |
: 1730728284:0;riree | |
: 1730728305:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu new_err.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1730728309:0;vi xyz.txt | |
: 1730730256:0;riree | |
: 1730730277:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu new_err.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1730730280:0;vi xyz.txt | |
: 1730730829:0;riree | |
: 1730730884:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu new_err.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1730730890:0;vi xyz.txt | |
: 1730733037:0;clear | |
: 1730733038:0;ls | |
: 1730733042:0;tmux attach -t 0 | |
: 1730733046:0;riree | |
: 1730733393:0;vi .gitignore | |
: 1730733692:0;ls | |
: 1730733694:0;source ~/iree/.iree_venv/bin/activate | |
: 1730733695:0;cd iree | |
: 1730733704:0;gpg --full-generate-key | |
: 1730733792:0;fdsf | |
: 1730733792:0;sdfsdf | |
: 1730733792:0;sfs | |
: 1730733792:0;sfsdfiuifhjlksdjf | |
: 1730733792:0;sdfsfksljflsjf | |
: 1730733792:0;sflkajfljfl;djsl | |
: 1730733792:0;fdlsdfjl;sjfl | |
: 1730733792:0;l;fjl;sjfljodfjl;sdjfl;sdj | |
: 1730733792:0;l;fjsl;djfl;sdj | |
: 1730733792:0;afljsl;fajl;jdf | |
: 1730733792:0;Y | |
: 1730733798:0;ls | |
: 1730733818:0;gpg --list-secret-keys --keyid-format=long | |
: 1730733909:0;gpg --delete-secret-key 56BC74332D23B054 | |
: 1730734061:0;gpgconf --kill gpg-agent | |
: 1730734071:0;gpgconf --launch gpg-agent | |
: 1730734073:0;gpg --delete-secret-key 56BC74332D23B054 | |
: 1730734097:0;gpgconf --kill gpg-agent | |
: 1730734100:0;gpgconf --launch gpg-agent | |
: 1730734101:0;clear | |
: 1730734101:0;ls | |
: 1730734113:0;gpg --full-generate-key | |
: 1730734170:0;gpg --list-secret-keys --keyid-format=long | |
: 1730734193:0;gpg --armor --export BF3C92902BD1CCED | |
: 1730734316:0;git config --global user.signingkey BF3C92902BD1CCED | |
: 1730734331:0;git config --global commit.gpgSign true | |
: 1730734336:0;vi | |
: 1730734347:0;git ppf | |
: 1730734557:0;git clang-format HEAD~1 | |
: 1730734587:0;git clang-format HEAD~ | |
: 1730734607:0;git clang-format -i HEAD~ | |
: 1730734664:0;git-clang-format -i HEAD~ | |
: 1730734668:0;git-clang-format HEAD~ | |
: 1730734966:0;clear | |
: 1730734967:0;ls | |
: 1730734975:0;git-clang-format HEAD~1 | |
: 1730734985:0;git stash | |
: 1730734994:0;git-clang-format HEAD~1 | |
: 1730735009:0;git ppf | |
: 1730747321:0;ls | |
: 1730747327:0;tmux attach -t 0 | |
: 1730747330:0;source ~/iree/.iree_venv/bin/activate | |
: 1730747332:0;ls | |
: 1730747340:0;gist-paste new_err.mlir | |
: 1730808904:0;clear | |
: 1730808905:0;ls | |
: 1730808912:0;clear | |
: 1730808913:0;ls | |
: 1730808917:0;clear | |
: 1730808917:0;ls | |
: 1730808918:0;riree | |
: 1730808958:0;clear | |
: 1730809323:0;s | |
: 1730811210:0;riree | |
: 1730812592:0;vi | |
: 1730813318:0;riree | |
: 1730813881:0;tmux attach -t 0 | |
: 1730814839:0;\ | |
: 1730814842:0;clear | |
: 1730814843:0;ls | |
: 1730814848:0;tmux attach -t 0 | |
: 1730814909:0;riree | |
: 1730814947:0;ls | |
: 1730814959:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu new_err.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1730814976:0;vi new_onnx.mlir | |
: 1730815017:0;iree-compile --iree-hal-target-backends=llvm-cpu -o abc.vmfb new_onnx.mlir | |
: 1730815024:0;ls | |
: 1730815229:0;riree | |
: 1730815317:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1730815674:0;git ppf | |
: 1730815777:0;git-clang-format HEAD~1 | |
: 1730815788:0;git ppf | |
: 1730815867:0;git o main | |
: 1730815872:0;git submodule update --init | |
: 1730815876:0;git lg | |
: 1730815884:0;git puom | |
: 1730815894:0;git submodule update --init | |
: 1730815898:0;git lg | |
: 1730815901:0;riree | |
: 1730819718:0;clear | |
: 1730819718:0;ls | |
: 1730819720:0;tmux attach -t 0 | |
: 1730819722:0;clear | |
: 1730819723:0;ls | |
: 1730819725:0;riree | |
: 1730819731:0;clear | |
: 1730819731:0;ls | |
: 1730819739:0;git o newtiling | |
: 1730819746:0;git rebase main | |
: 1730819750:0;git submodule update --init | |
: 1730819758:0;git ppf | |
: 1730828150:0;clear | |
: 1730828150:0;ls | |
: 1730896960:0;j | |
: 1730896966:0;clear | |
: 1730896967:0;ls | |
: 1730898990:0;riree | |
: 1730899295:0;clear | |
: 1730899296:0;ls | |
: 1730899298:0;tmux attach -t 0 | |
: 1730899340:0;clear | |
: 1730899342:0;biree | |
: 1730899496:0;git ppf | |
: 1730900481:0;clear | |
: 1730900482:0;ls | |
: 1730900485:0;git o main | |
: 1730900487:0;git puom | |
: 1730900495:0;git submodule update --init | |
: 1730901030:0;git o gpudistr | |
: 1730901037:0;git rebase main | |
: 1730901139:0;git rebase --continue | |
: 1730901142:0;git lg | |
: 1730901158:0;riree | |
: 1730901173:0;git ppf | |
: 1730901180:0;biree | |
: 1730912115:0;clear | |
: 1730912116:0;ls | |
: 1730912118:0;tmux attach -t 0 | |
: 1730912125:0;clear | |
: 1730912126:0;ls | |
: 1730912396:0;biree | |
: 1730912513:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1730912607:0;biree | |
: 1730913180:0;git ppf | |
: 1730913189:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1730913201:0;git-clang-format HEAD~1 | |
: 1730979742:0;git o newtiling | |
: 1730979748:0;git stash | |
: 1730979757:0;ls | |
: 1730979764:0;vi test_pipeline.mlir | |
: 1730979798:0;riree | |
: 1730979828:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730979868:0;ls | |
: 1730979871:0;vi new_onnx.mlir | |
: 1730979877:0;vi new_err.mlir | |
: 1730979883:0;rm new_err.mlir | |
: 1730979888:0;vi new_onnx.mlir | |
: 1730979898:0;vi xyz.txt | |
: 1730979923:0;iree-compile --iree-hal-target-backends=llvm-cpu -o abc.vmfb new_onnx.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1730979927:0;vi xyz.txt | |
: 1730980187:0;ls | |
: 1730980190:0;vi test_pipeline.mlir | |
: 1730980215:0;vi test_default.mlir | |
: 1730980229:0;iree-compile --iree-hal-target-backends=llvm-cpu -o abc.vmfb test_default.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1730980234:0;vi xyz.txt | |
: 1730980334:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730980473:0;ls | |
: 1730980476:0;vi test_pipeline.mlir | |
: 1730980481:0;vi test_default.mlir | |
: 1730980721:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730980740:0;vi test_pipeline.mlir | |
: 1730980764:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730980779:0;vi test_pipeline.mlir | |
: 1730980834:0;vi xyz.txt | |
: 1730980861:0;vi test_pipeline.mlir | |
: 1730980881:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730980913:0;vi test_pipeline.mlir | |
: 1730980948:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730981091:0;biree | |
: 1730981197:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1730981316:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | |
: 1730981697:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' -split-input-file compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | |
: 1730983338:0;vi xyz.txt | |
: 1730983434:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' -split-input-file compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | |
: 1730983519:0;ls | |
: 1730983523:0;vi test_pipeline.mlir | |
: 1730983537:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730983579:0;vi xyz.txt | |
: 1730983632:0;vi test_pipeline.mlir | |
: 1730983677:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730983820:0;vi test_pipeline.mlir | |
: 1730983834:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730983851:0;cat test_pipeline.mlir | |
: 1730983856:0;vi test_pipeline.mlir | |
: 1730983902:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' -split-input-file compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | |
: 1730984187:0;cat test_pipeline.mlir | |
: 1730984191:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730984234:0;vi test_pipeline.mlir | |
: 1730984254:0;iree-compile --iree-hal-target-backends=llvm-cpu -o abc.vmfb test_default.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1730984257:0;vi xyz.txt | |
: 1730984304:0;vi test_pipeline.mlir | |
: 1730984313:0;iree-compile --iree-hal-target-backends=llvm-cpu -o abc.vmfb test_default.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1730984317:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730984434:0;vi xyz.txt | |
: 1730984479:0;vi test_pipeline.mlir | |
: 1730984505:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730984543:0;vi test_pipeline.mlir | |
: 1730984555:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' test_pipeline.mlir | |
: 1730984579:0;ls | |
: 1730984584:0;vi test_pipeline.mlir | |
: 1730984624:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' -split-input-file compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | |
: 1730984888:0;git lg | |
: 1730985034:0;git ppf | |
: 1730985125:0;vi | |
: 1730985146:0;iree-compile --iree-hal-target-backends=llvm-cpu -o abc.vmfb new_onnx.mlir -mlir-print-ir-after-all 2> xyz.txt | |
: 1730985151:0;vi xyz.txt | |
: 1730985229:0;iree-compile --iree-hal-target-backends=llvm-cpu new_onnx.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host | |
: 1730985269:0;git lg | |
: 1730985294:0;git o main | |
: 1730985296:0;gi tpuom | |
: 1730985300:0;git puom | |
: 1730985312:0;git submodule update --init | |
: 1730985313:0;riree | |
: 1730985418:0;iree-compile --iree-hal-target-backends=llvm-cpu new_onnx.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host | |
: 1730985458:0;iree-compile --iree-hal-target-backends=llvm-cpu new_onnx.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host 2> err.txt | |
: 1730985465:0;gist-paste err.txt | |
: 1731003422:0;tmux attach -t 0 | |
: 1731003426:0;clear | |
: 1731003426:0;ls | |
: 1731003428:0;rriee | |
: 1731003429:0;riree | |
: 1731003438:0;git o newtiling | |
: 1731003444:0;git rebase main | |
: 1731003752:0;ls | |
: 1731003757:0;vi test_un.mlir | |
: 1731003764:0;riree | |
: 1731003831:0;iree-compile --iree-hal-target-backends=llvm-cpu test_un.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host 2> err.txt | |
: 1731003834:0;vi err.txt | |
: 1731003863:0;iree-compile --iree-hal-target-backends=llvm-cpu test_un.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host -mlir-print-ir-after-all 2> err.txt | |
: 1731003866:0;vi err.txt | |
: 1731004268:0;riree | |
: 1731004291:0;iree-compile --iree-hal-target-backends=llvm-cpu test_un.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host -mlir-print-ir-after-all 2> err.txt | |
: 1731004314:0;iree-compile --iree-hal-target-backends=llvm-cpu test_un.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host | |
: 1731004691:0;ls -l | |
: 1731004694:0;vi test_un.mlir | |
: 1731004742:0;vi err.txt | |
: 1731074877:0;clear\ | |
: 1731074878:0;ls | |
: 1731074881:0;tmux attach -t 0 | |
: 1731075773:0;git o main | |
: 1731075794:0;git puo | |
: 1731075796:0;git puom | |
: 1731075826:0;git submodule update --init | |
: 1731075828:0;riree | |
: 1731077394:0;vi new_test.mlir | |
: 1731077916:0;git o newtiling | |
: 1731077922:0;git rebase main | |
: 1731077926:0;riree | |
: 1731077991:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' -split-input-file new_test.mlir | |
: 1731078048:0;iree-compile --iree-hal-target-backends=llvm-cpu new_test.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host -mlir-print-ir-after-all 2> err.txt | |
: 1731078053:0;vi err.txt | |
: 1731078262:0;vi new_test.mlir | |
: 1731078309:0;iree-compile --iree-hal-target-backends=llvm-cpu new_test.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host -mlir-print-ir-after-all 2> err.txt | |
: 1731078316:0;vi err.txt | |
: 1731078390:0;gist-paste err.txt | |
: 1731078661:0;tmux attach -t 0 | |
: 1731078724:0;git ppf | |
: 1731261174:0;tmux attach -t 0 | |
: 1731261178:0;git ppf | |
: 1731261185:0;git lg | |
: 1731261239:0;git fo | |
: 1731261252:0;git rebase origin/main | |
: 1731261258:0;git submodule update --init | |
: 1731261263:0;git ppf | |
: 1731261269:0;riree | |
: 1731261457:0;clear | |
: 1731261458:0;ls | |
: 1732512920:0;omz update | |
: 1732512922:0;clear | |
: 1732512923:0;ls | |
: 1732512926:0;source ~/iree/.iree_venv/bin/activate | |
: 1732512934:0;htop | |
: 1732512955:0;clear | |
: 1732512955:0;ls | |
: 1732512957:0;htop | |
: 1732512967:0;git o main | |
: 1732513051:0;git stash | |
: 1732513055:0;git o main | |
: 1732513057:0;git puom | |
: 1732513097:0;git remote -vv | |
: 1732513104:0;git fetch origin | |
: 1732513158:0;git lg | |
: 1732513168:0;git rebase origin/main | |
: 1732513169:0;git lg | |
: 1732513173:0;clear | |
: 1732513173:0;ls | |
: 1732513176:0;git submodule update --init | |
: 1732513181:0;riree | |
: 1732513751:0;tmux attach -t 0 | |
: 1732513753:0;ls | |
: 1732513755:0;riree | |
: 1732514082:0;vi | |
: 1732515794:0;clear | |
: 1732515794:0;ls | |
: 1732515797:0;clear | |
: 1732515797:0;ls | |
: 1732515799:0;htop | |
: 1732598011:0;tmux attach -t 0 | |
: 1732630750:0;clear | |
: 1732630751:0;ls | |
: 1732630753:0;exit | |
: 1735801495:0;clear | |
: 1735801495:0;ls | |
: 1735801500:0;tmux ls | |
: 1735801501:0;tmux | |
: 1735801513:0;clear | |
: 1735801513:0;ls | |
: 1735801515:0;clear | |
: 1735801516:0;ls | |
: 1735801518:0;cd iree | |
: 1735801519:0;clear | |
: 1735801519:0;ls | |
: 1735801521:0;git puom | |
: 1735801527:0;source ~/iree/.iree_venv/bin/activate | |
: 1735801528:0;vi | |
: 1735801555:0;clear | |
: 1735801556:0;git lg | |
: 1735801559:0;clear | |
: 1735801559:0;ls | |
: 1735801561:0;clear | |
: 1735801562:0;ls | |
: 1735801564:0;source ~/iree/.iree_venv/bin/activate | |
: 1735801566:0;riree | |
: 1735802061:0;git submodule update --init | |
: 1735802066:0;riree | |
: 1736263255:0;clear\ | |
: 1736263256:0;ls | |
: 1736263262:0;tmux | |
: 1736263267:0;clear | |
: 1736263267:0;ls | |
: 1736263270:0;cd .. | |
: 1736263270:0;ls | |
: 1736263273:0;source ~/iree/.iree_venv/bin/activate | |
: 1736263274:0;clear | |
: 1736263274:0;ls | |
: 1736263276:0;cd iree | |
: 1736263277:0;clear | |
: 1736263277:0;ls | |
: 1736263280:0;clear | |
: 1736263281:0;ls | |
: 1736263282:0;source ~/iree/.iree_venv/bin/activate | |
: 1736263285:0;git puom | |
: 1736263308:0;clear | |
: 1736263308:0;ls | |
: 1736263312:0;git submodule update --init | |
: 1736263315:0;clear | |
: 1736263316:0;ls | |
: 1736263318:0;riree | |
: 1736263366:0;ebd | |
: 1736263390:0;rm -rf ~/iree-build | |
: 1736263393:0;biree | |
: 1736267215:0;tmux attach -t 0 | |
: 1736267220:0;clear | |
: 1736267221:0;ls | |
: 1736267223:0;riree | |
: 1736267701:0;clear | |
: 1736267701:0;ls | |
: 1736267709:0;clear | |
: 1736267710:0;ls | |
: 1736267712:0;vi | |
: 1736267751:0;ls | |
: 1736267755:0;clear | |
: 1736267755:0;ls | |
: 1736267758:0;cd .. | |
: 1736267758:0;ls | |
: 1736267762:0;pwd | |
: 1736267769:0;cd bufferization | |
: 1736267775:0;mkdir buff_test | |
: 1736267776:0;cd buff_test | |
: 1736267777:0;clear | |
: 1736267777:0;ls | |
: 1736267780:0;source ~/iree/.iree_venv/bin/activate | |
: 1736267781:0;ls | |
: 1736267788:0;wget full.txt | |
: 1736267791:0;wget https://gist.githubusercontent.com/pashu123/2a162391c5212dc7351a08d0748833fd/raw/72b19900a3ecec4a74e85adc40577e23a56686db/xyz.txt | |
: 1736267796:0;vi xyz.txt | |
: 1736267847:0;vi test.mlir | |
: 1736267873:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize{test-analysis-only=true print-conflicts=true}))" test.mlir | |
: 1736267889:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize{test-analysis-only=true print-conflicts=true}))" test.mlir > buff_analysis.mlir | |
: 1736267891:0;vi buff_analysis.mlir | |
: 1736268017:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize))" test.mlir > buff_analysis.mlir | |
: 1736268019:0;vi buff_analysis.mlir | |
: 1736268042:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize{test-analysis-only=true print-conflicts=true}))" test.mlir > buff_analysis.mlir | |
: 1736268045:0;vi buff_analysis.mlir | |
: 1736268085:0;vi test.mlir | |
: 1736268119:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize{test-analysis-only=true print-conflicts=true}))" test.mlir > buff_analysis.mlir | |
: 1736268121:0;vi buff_analysis.mlir | |
: 1736268282:0;ls | |
: 1736268284:0;vi buff_analysis.mlir | |
: 1736268558:0;wget https://gist.githubusercontent.com/pashu123/2a162391c5212dc7351a08d0748833fd/raw/72b19900a3ecec4a74e85adc40577e23a56686db/xyz.txt | |
: 1736268619:0;rm xyz.txt.1 | |
: 1736268621:0;wget https://gist.githubusercontent.com/pashu123/b49299b19d14959244079d75ecc502ba/raw/dd70be76a1fa359ce9a28078eff310dca4920116/xyz_old.txt | |
: 1736268702:0;cd test/buff_test | |
: 1736268703:0;clear | |
: 1736268704:0;ls | |
: 1736268725:0;vi test.mlir | |
: 1736268737:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize{test-analysis-only=true print-conflicts=true}))" test.mlir > buff_analysis.mlir | |
: 1736268740:0;vi buff_analysis.mlir | |
: 1736268768:0;vi test.mlir | |
: 1736268779:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize{test-analysis-only=true print-conflicts=true}))" test.mlir > buff_analysis.mlir | |
: 1736268781:0;vi buff_analysis.mlir | |
: 1736268830:0;gist-paste buff_analysis.mlir | |
: 1736271356:0;clear | |
: 1736271356:0;ls | |
: 1736271378:0;clear | |
: 1736271379:0;ls | |
: 1736271450:0;clear | |
: 1736271451:0;ls | |
: 1736314158:0;\ | |
: 1736314160:0;clear | |
: 1736314160:0;ls | |
: 1736314163:0;tmux ls | |
: 1736314165:0;tmux | |
: 1736314170:0;clear | |
: 1736314170:0;ls | |
: 1736314174:0;clear | |
: 1736314174:0;ls | |
: 1736314176:0;source ~/iree/.iree_venv/bin/activate | |
: 1736314177:0;clear | |
: 1736314177:0;ls | |
: 1736314181:0;source ~/iree/.iree_venv/bin/activate | |
: 1736314182:0;clear | |
: 1736314182:0;ls | |
: 1736314188:0;clear | |
: 1736314189:0;ls | |
: 1736314190:0;htop | |
: 1736314212:0;clear | |
: 1736314212:0;ls | |
: 1736314215:0;clear | |
: 1736314216:0;ls | |
: 1736314512:0;clear | |
: 1736314513:0;ls | |
: 1736314514:0;vi | |
: 1736314609:0;git pull | |
: 1736314618:0;git submodule update --init | |
: 1736314621:0;riree | |
: 1736319396:0;clear | |
: 1736319397:0;ls | |
: 1736319401:0;clear | |
: 1736319401:0;ls | |
: 1736319402:0;vi | |
: 1736319406:0;tmux attach -t 0 | |
: 1736319414:0;clear | |
: 1736319415:0;ls | |
: 1736319419:0;cd ~ | |
: 1736319419:0;ls | |
: 1736319426:0;speed-test | |
: 1736319436:0;rm llvm.sh | |
: 1736319437:0;clear | |
: 1736319437:0;ls | |
: 1736319443:0;clear | |
: 1736319444:0;ls | |
: 1736337297:0;clear | |
: 1736337297:0;ls | |
: 1736337301:0;clear | |
: 1736337302:0;ls | |
: 1736337303:0;tmux ls | |
: 1736337307:0;tmux attach -t 0 | |
: 1736337349:0;cat test_pipeline.mlir | |
: 1736337930:0;clear | |
: 1736337930:0;ls | |
: 1736337961:0;clear | |
: 1736337962:0;ls | |
: 1736337965:0;vi buff_analysis.mlir | |
: 1736338055:0;vi xyz.txt | |
: 1736338491:0;clear | |
: 1736338492:0;ls | |
: 1736338517:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir | |
: 1736338521:0;vi test.mlir | |
: 1736338605:0;clear | |
: 1736338605:0;ls | |
: 1736338608:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir | |
: 1736338743:0;riree | |
: 1736338760:0;git lg | |
: 1736338765:0;clear | |
: 1736338765:0;ls | |
: 1736338772:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir | |
: 1736338789:0;vi xyz.txt | |
: 1736338802:0;wget https://gist.githubusercontent.com/pashu123/2a162391c5212dc7351a08d0748833fd/raw/72b19900a3ecec4a74e85adc40577e23a56686db/xyz.txt | |
: 1736338805:0;ls | |
: 1736338811:0;mv xyz.txt.1 all.txt | |
: 1736338812:0;clear | |
: 1736338813:0;ls | |
: 1736338814:0;vi all.txt | |
: 1736338844:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir | |
: 1736338901:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize{test-analysis-only=true print-conflicts=true}))" test.mlir > buff_analysis.mlir | |
: 1736338904:0;vi buff_analysis.mlir | |
: 1736339608:0;riree | |
: 1736339624:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-iree-comprehensive-bufferize{test-analysis-only=true print-conflicts=true}))" test.mlir > buff_analysis.mlir | |
: 1736339627:0;vi buff_analysis.mlir | |
: 1736339638:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir | |
: 1736339746:0;riree | |
: 1736339840:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir | |
: 1736339890:0;riree | |
: 1736339917:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir | |
: 1736339923:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> dbg.txt | |
: 1736339926:0;vi dbg.txt | |
: 1736339962:0;clear | |
: 1736339963:0;ls | |
: 1736339965:0;htop | |
: 1736339973:0;clear | |
: 1736339974:0;ls | |
: 1736339979:0;clear | |
: 1736339979:0;ls | |
: 1736339981:0;htop | |
: 1736346835:0;tmux attach -t 0 | |
: 1736346838:0;clear | |
: 1736346838:0;ls | |
: 1736347131:0;clear | |
: 1736347131:0;ls | |
: 1736347134:0;cd .. | |
: 1736347134:0;ls | |
: 1736347154:0;vi test.mlir | |
: 1736347189:0;iree-compile --iree-hal-target-backends=llvm-cpu new_test.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host -mlir-print-ir-after-all 2> err.txt | |
: 1736347193:0;vi test.mlir | |
: 1736347216:0;vi err.txt | |
: 1736347227:0;iree-compile --iree-hal-target-backends=llvm-cpu test.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host -mlir-print-ir-after-all 2> err.txt | |
: 1736347232:0;vi err.txt | |
: 1736347573:0;riree | |
: 1736347602:0;iree-compile --iree-hal-target-backends=llvm-cpu test.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host -mlir-print-ir-after-all 2> err.txt | |
: 1736347606:0;vi err.txt | |
: 1736347777:0;iree-opt --help | fzf | |
: 1736347903:0;vi err.txt | |
: 1736348026:0;iree-compile -iree-llvmcpu-enable-ukernels=all --iree-hal-target-backends=llvm-cpu test.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host -mlir-print-ir-after-all 2> err.txt | |
: 1736348031:0;vi err.txt | |
: 1736348060:0;iree-compile -iree-llvmcpu-enable-ukernels="mmt4d" --iree-hal-target-backends=llvm-cpu test.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host -mlir-print-ir-after-all 2> err.txt | |
: 1736348064:0;vi err.txt | |
: 1736348326:0;ls | |
: 1736348330:0;vi test.mlir | |
: 1736348485:0;ls | |
: 1736348489:0;cd test | |
: 1736348490:0;ls | |
: 1736348491:0;clear | |
: 1736348491:0;ls | |
: 1736348558:0;iree-benchmark-module --module=abc.vmfb --function=matmul --input=654x321xi8 --input=321x324xi8 --device=local-task | |
: 1736348565:0;iree-compile -iree-llvmcpu-enable-ukernels=all --iree-hal-target-backends=llvm-cpu test.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host -mlir-print-ir-after-all 2> err.txt | |
: 1736348568:0;iree-benchmark-module --module=abc.vmfb --function=matmul --input=654x321xi8 --input=321x324xi8 --device=local-task | |
: 1736348583:0;iree-benchmark-module --module=abc.vmfb --function=matmul --input=654x321xi8 --input=321x234xi8 --device=local-task | |
: 1736348598:0;iree-compile -iree-llvmcpu-enable-ukernels=mmt4d --iree-hal-target-backends=llvm-cpu test.mlir -o abc.vmfb --iree-llvmcpu-target-cpu=host -mlir-print-ir-after-all 2> err.txt | |
: 1736348602:0;iree-benchmark-module --module=abc.vmfb --function=matmul --input=654x321xi8 --input=321x234xi8 --device=local-task | |
: 1736348634:0;clear | |
: 1736348635:0;ls | |
: 1736348643:0;gist-paste test.mlir | |
: 1736348706:0;t | |
: 1736348707:0;exit | |
: 1736350265:0;cd .. | |
: 1736350265:0;ls | |
: 1736350268:0;cd test/buff_test | |
: 1736350269:0;clear | |
: 1736350269:0;ls | |
: 1736350276:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> dbg.txt | |
: 1736350301:0;riree | |
: 1736350313:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> dbg.txt | |
: 1736350319:0;vi dbg.txt | |
: 1736350384:0;riree | |
: 1736350398:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> dbg.txt | |
: 1736350401:0;vi dbg.txt | |
: 1736350508:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> dbg.txt -mlir-disable-threading | |
: 1736350510:0;vi dbg.txt | |
: 1736350532:0;ls | |
: 1736350534:0;cd test/buff_test | |
: 1736350534:0;ls | |
: 1736350538:0;vi test.mlir | |
: 1736350566:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> dbg.txt -mlir-disable-threading > out.txt | |
: 1736350579:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" out.txt 2> dbg.txt -mlir-disable-threading | |
: 1736350598:0;vi out.txt | |
: 1736350603:0;mv out.txt out.mlir | |
: 1736350604:0;clear | |
: 1736350604:0;ls | |
: 1736350605:0;vi out.mlir | |
: 1736350655:0;mv out.mlir test.mlir | |
: 1736350656:0;clear | |
: 1736350656:0;ls | |
: 1736350664:0;clear | |
: 1736350664:0;ls | |
: 1736350671:0;vi test.mlir | |
: 1736350713:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> dbg.txt -mlir-disable-threading | |
: 1736350716:0;vi dbg.txt | |
: 1736350771:0;riree | |
: 1736350794:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> dbg.txt -mlir-disable-threading | |
: 1736350797:0;vi dbg.txt | |
: 1736350909:0;riree | |
: 1736350929:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> dbg.txt -mlir-disable-threading | |
: 1736350938:0;vi dbg.txt | |
: 1736350958:0;vi test.mlir | |
: 1736350967:0;ls | |
: 1736350982:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> dbg.txt -mlir-disable-threading > out.mlir | |
: 1736350983:0;vi out.mlir | |
: 1736351004:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> out.mlir | |
: 1736351027:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" test.mlir 2> dbg.txt -mlir-disable-threading > out.mlir | |
: 1736351036:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" out.mlir 2> xyz.txt | |
: 1736351042:0;vi xyz.txt | |
: 1736351064:0;vi out.mlir | |
: 1736351097:0;vi xyz.txt | |
: 1736351204:0;riree | |
: 1736351254:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" out.mlir 2> xyz.txt | |
: 1736351263:0;vi xyz.txt | |
: 1736351563:0;vi out.mlir | |
: 1736351605:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" out.mlir | |
: 1736351621:0;vi out.mlir | |
: 1736352125:0;ls | |
: 1736352131:0;vi dbg.txt | |
: 1736352136:0;vi xyz.txt | |
: 1736352146:0;cat xyz.txt | |
: 1736352578:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors))" out.mlir 2> xyz.txt | |
: 1736352609:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors), cse)" out.mlir 2> xyz.txt | |
: 1736352667:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors), cse)" out.mlir 2> xyz.txt > good.mlir | |
: 1736352668:0;vi good.mlir | |
: 1736353704:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-eliminate-empty-tensors), cse)" out.mlir | |
: 1736353724:0;vi good.mlir | |
: 1736353753:0;ls | |
: 1736353762:0;vi out.mlir | |
: 1736353955:0;ls | |
: 1736353959:0;vi xyz.txt | |
: 1736353964:0;vi all.txt | |
: 1736355077:0;riree | |
: 1736355099:0;ls | |
: 1736355103:0;vi buff_analysis.mlir | |
: 1736355108:0;vi all.txt | |
: 1736355127:0;iree-run-module --list-devices | |
: 1736355132:0;iree-run-module --list_devices | |
: 1736355144:0;vi test_now.mlir | |
: 1736355223:0;iree-compile -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736355225:0;vi xyz | |
: 1736355230:0;vi xyz.txt | |
: 1736355241:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736355244:0;vi xyz.txt | |
: 1736355270:0;ebd | |
: 1736355610:0;rm -rf ~/iree-build | |
: 1736355612:0;biree | |
: 1736355620:0;ebd | |
: 1736355631:0;biree | |
: 1736355642:0;source ~/iree/.iree_venv/bin/activate | |
: 1736355644:0;biree | |
: 1736355927:0;riree | |
: 1736355946:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736355949:0;vi xyz.txt | |
: 1736356112:0;riree | |
: 1736356140:0;vi test_now.mlir | |
: 1736356163:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736356192:0;\ | |
: 1736356206:0;git o pashu/scfforallgpu | |
: 1736356211:0;git remote -vv | |
: 1736356213:0;git fetch pashu | |
: 1736356229:0;git o pashu/scfforallgpu | |
: 1736356233:0;git stash | |
: 1736356237:0;git submodule update --init | |
: 1736356244:0;git o pashu/scfforallgpu | |
: 1736356247:0;git submodule update --init | |
: 1736356268:0;cd third_party/llvm-project | |
: 1736356269:0;git stash | |
: 1736356271:0;cd .. | |
: 1736356276:0;git submodule update --init | |
: 1736356278:0;riree | |
: 1736356754:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736356758:0;vi xyz.txt | |
: 1736356812:0;vi test_optimize.mloir | |
: 1736356816:0;test_optimize.mlir | |
: 1736356820:0;vi test_optimize.mlir | |
: 1736356883:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir | |
: 1736356941:0;riree | |
: 1736356961:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir | |
: 1736356974:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir --verify-each=0 | |
: 1736357350:0;riree | |
: 1736357420:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir --verify-each=0 | |
: 1736357486:0;riree | |
: 1736357504:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir --verify-each=0 | |
: 1736358009:0;riree | |
: 1736358145:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir --verify-each=0 | |
: 1736358215:0;riree | |
: 1736358249:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir --verify-each=0 | |
: 1736358856:0;riree | |
: 1736358876:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir --verify-each=0 | |
: 1736358938:0;riree | |
: 1736358956:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir --verify-each=0 | |
: 1736359028:0;riree | |
: 1736359048:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir --verify-each=0 | |
: 1736359260:0;riree | |
: 1736359279:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir --verify-each=0 | |
: 1736359838:0;riree | |
: 1736360134:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir --verify-each=0 | |
: 1736360176:0;riree | |
: 1736360196:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_optimize.mlir --verify-each=0 | |
: 1736360221:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736360227:0;vi xyz.txt | |
: 1736360384:0;riree | |
: 1736360432:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736360438:0;vi xyz.txt | |
: 1736360451:0;git o main | |
: 1736360474:0;git branch | |
: 1736360482:0;git ob scfforallgpu | |
: 1736360696:0;git-clang-format HEAD~1 | |
: 1736360762:0;git ppf | |
: 1736360770:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736361123:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb | |
: 1736361137:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb -mlir-print-ir-after-all 2> all.txt | |
: 1736361139:0;vi all.txt | |
: 1736361459:0;riree | |
: 1736361483:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb -mlir-print-ir-after-all 2> all.txt -mlir-disable-threading | |
: 1736361485:0;vi all.txt | |
: 1736361620:0;riree | |
: 1736361647:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb | |
: 1736361680:0;riree | |
: 1736361697:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb | |
: 1736361845:0;riree | |
: 1736361868:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb | |
: 1736361907:0;vi all.txt | |
: 1736362245:0;riree | |
: 1736362288:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb | |
: 1736362301:0;riree | |
: 1736362320:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb | |
: 1736362429:0;rm all.txt | |
: 1736362433:0;git-clang-format HEAD~1 | |
: 1736362467:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736362708:0;git ppf | |
: 1736362803:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736363171:0;riree | |
: 1736363187:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736363238:0;riree | |
: 1736363260:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736363342:0;riree | |
: 1736363376:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736363402:0;riree | |
: 1736363422:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736363446:0;riree | |
: 1736363465:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736363502:0;riree | |
: 1736363576:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736363637:0;vi compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736363820:0;ree | |
: 1736363821:0;riree | |
: 1736363963:0;vi compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736363966:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736363986:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736364141:0;git ppf | |
: 1736364349:0;git rebase main | |
: 1736364389:0;git rebase --abort | |
: 1736364398:0;git rebase origin/main | |
: 1736364405:0;git remote -vv | |
: 1736364410:0;git fetch origin | |
: 1736364421:0;git rebase --abort | |
: 1736364431:0;git o origin/main | |
: 1736364432:0;git lg | |
: 1736364443:0;git o scfforallgpu | |
: 1736364445:0;git lg | |
: 1736364451:0;git rebase origin/main | |
: 1736364563:0;git rebase --continue | |
: 1736364575:0;git add compiler/src/iree/compiler/Codegen/Common/test/tile_and_distribute_workgroups_using_forall.mlir | |
: 1736364576:0;git rebase --continue | |
: 1736364582:0;git submodule update --init | |
: 1736364595:0;git ppf | |
: 1736364659:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736364691:0;git rebase origin/main | |
: 1736364697:0;git o origin/main | |
: 1736364699:0;git lg | |
: 1736364704:0;git branch -D main | |
: 1736364707:0;git ob main | |
: 1736364708:0;clear | |
: 1736364709:0;ls | |
: 1736364711:0;git submodule update --init | |
: 1736364715:0;git o scfforallgpu | |
: 1736364720:0;git rebase origin/main | |
: 1736364723:0;git rebase main | |
: 1736364753:0;cd third_party/benchmark | |
: 1736364816:0;ls | |
: 1736364822:0;git ppf | |
: 1736364826:0;cd .. | |
: 1736364829:0;git ppf | |
: 1736364933:0;git-clang-format HEAD~1 | |
: 1736364939:0;git-clang-format HEAD~ | |
: 1736364941:0;git ppf | |
: 1736364957:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 128 | |
: 1736365205:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 16 | |
: 1736365526:0;vi | |
: 1736365573:0;git ppf | |
: 1736365595:0;riree | |
: 1736365626:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736365633:0;vi xyz.txt | |
: 1736365726:0;riree | |
: 1736365757:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736365765:0;vi xyz.txt | |
: 1736365778:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736365785:0;cd .. | |
: 1736365786:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736395936:0;tmux attach -t 0 | |
: 1736396450:0;riree | |
: 1736396472:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736396507:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736396514:0;vi xyz.txt | |
: 1736396734:0;riree | |
: 1736396756:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736396761:0;vi xyz.txt | |
: 1736397061:0;riree | |
: 1736397083:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736397090:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736397094:0;vi xyz.txt | |
: 1736397452:0;riree | |
: 1736397473:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736397479:0;vi xyz.txt | |
: 1736397546:0;rriee | |
: 1736397548:0;riree | |
: 1736397584:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736397590:0;vi xyz.txt | |
: 1736397653:0;riree | |
: 1736397675:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736397771:0;rriee | |
: 1736397772:0;riree | |
: 1736397786:0;rriee | |
: 1736397787:0;riree | |
: 1736397811:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736397823:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736397830:0;vi xyz.txt | |
: 1736397949:0;riree | |
: 1736397972:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736398033:0;vi test.mlir | |
: 1736398105:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test.mlir | |
: 1736398184:0;vi test.mlir | |
: 1736398206:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test.mlir | |
: 1736398235:0;vi xyz.txt | |
: 1736398256:0;vi test.mlir | |
: 1736398261:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test.mlir | |
: 1736398300:0;riree | |
: 1736398319:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test.mlir | |
: 1736398331:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736398381:0;riree | |
: 1736398400:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736398412:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test.mlir | |
: 1736398421:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736398427:0;vi xyz.txt | |
: 1736398470:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 16 | |
: 1736398501:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb | |
: 1736398543:0;riree | |
: 1736398560:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb | |
: 1736398571:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test.mlir | |
: 1736398743:0;riree | |
: 1736398811:0;clear | |
: 1736398812:0;ls | |
: 1736398815:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test.mlir | |
: 1736398825:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb | |
: 1736399187:0;vi test.mlir | |
: 1736399348:0;riree | |
: 1736399368:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test.mlir | |
: 1736399384:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb | |
: 1736399461:0;riree | |
: 1736399481:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test.mlir | |
: 1736399488:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.mlir -o /home/prashant/iree-build/tests/e2e/convolution/e2e_conv2d_cpu_f16_f16_f16_medium_llvm-cpu_local-task_generic_conv2d.vmfb | |
: 1736399516:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736399596:0;git-clang-format HEAD~ | |
: 1736399609:0;riree | |
: 1736399631:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736399684:0;git ppf | |
: 1736399691:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 16 | |
: 1736399868:0;git ppf | |
: 1736400019:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | |
: 1736400032:0;sudo apt-get install FileCheck | |
: 1736400057:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | |
: 1736400083:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir --check-prefix=MEMORY | |
: 1736400214:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | |
: 1736400268:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | |
: 1736426791:0;clear | |
: 1736426792:0;ls | |
: 1736426794:0;tmux attach -t 0 | |
: 1736426852:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | |
: 1736426866:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir > test.mlir | |
: 1736427207:0;riree | |
: 1736427224:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir > test.mlir | |
: 1736427254:0;riree | |
: 1736427277:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir > test1.mlir | |
: 1736427578:0;riree | |
: 1736427591:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | |
: 1736427751:0;riree | |
: 1736427773:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | |
: 1736427922:0;git-clang-format HEAD~ | |
: 1736427925:0;git-clang-format HEAD~1 | |
: 1736427944:0;clang-format compiler/src/iree/compiler/Codegen/Common/OptimizeTensorInsertExtractSlices.cpp | |
: 1736427948:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/OptimizeTensorInsertExtractSlices.cpp | |
: 1736427991:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 16 | |
: 1736428393:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_igemm_tile_and_fuse.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_igemm_tile_and_fuse.mlir | |
: 1736428464:0;git ppf | |
: 1736428635:0;rm test*.mlir | |
: 1736428636:0;clear | |
: 1736428636:0;ls | |
: 1736429148:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736429386:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | |
: 1736429424:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | |
: 1736429435:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1736429439:0;vi full.txt | |
: 1736429695:0;rm full.txt | |
: 1736429697:0;CTEST_PARALLEL_LEVEL=32 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736431803:0;riree | |
: 1736432250:0;clear | |
: 1736432251:0;ls | |
: 1736432266:0;vi | |
: 1736442566:0;\ | |
: 1736442567:0;tmux attach -t 0 | |
: 1736444373:0;git ppf | |
: 1736444517:0;buildifier compiler/src/iree/compiler/Codegen/Common/BUILD.bazel | |
: 1736444569:0;build_tools/bazel_to_cmake/bazel_to_cmake.py compiler/src/iree/compiler/Codegen/Common/BUILD.bazel | |
: 1736444587:0;git ppf | |
: 1736525046:0;\ | |
: 1736525048:0;tmux attach -t 0 | |
: 1736525200:0;riree | |
: 1736525399:0;build_tools/bazel_to_cmake/bazel_to_cmake.py compiler/src/iree/compiler/Codegen/Common/BUILD.bazel | |
: 1736525422:0;git-clang-format HEAD~1 | |
: 1736525431:0;clear | |
: 1736525431:0;ls | |
: 1736525434:0;git ppf | |
: 1736525444:0;lazygit --verison | |
: 1736525449:0;lazygit -h | |
: 1736525454:0;lazygit --v | |
: 1736525594:0;build_tools/bazel_to_cmake/bazel_to_cmake.py compiler/src/iree/compiler/Codegen/Common/BUILD.bazel | |
: 1736525601:0;git ppf | |
: 1736525928:0;riree | |
: 1736526148:0;git-clang-format HEAD~1 | |
: 1736526164:0;git-clang-format HEAD~ | |
: 1736526172:0;git ppf | |
: 1736526278:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1736526285:0;vi xyz.txt | |
: 1736526304:0;CTEST_PARALLEL_LEVEL= cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736526310:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736527750:0;r | |
: 1736527750:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736527753:0;riree | |
: 1736527895:0;git-clang-format HEAD~ | |
: 1736527916:0;git ppf | |
: 1736528343:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736528385:0;rire | |
: 1736528387:0;riree | |
: 1736528738:0;rire | |
: 1736528739:0;riree | |
: 1736528814:0;git-clang-format HEAD~ | |
: 1736528824:0;git ppf | |
: 1736528829:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736535248:0;tmux attach -t 0 | |
: 1736535424:0;git-clang-format compiler/src/iree/compiler/Codegen/Common/OptimizeTensorInsertExtractSlices.cpp | |
: 1736535436:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/OptimizeTensorInsertExtractSlices.cpp | |
: 1736535458:0;riree | |
: 1736535477:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736535670:0;git ppf | |
: 1736574488:0;\ | |
: 1736574490:0;tmux attach -t 0 | |
: 1736574519:0;clear | |
: 1736574519:0;ls | |
: 1736574524:0;vi test_avgpool.mlir | |
: 1736574584:0;iree-compile test_avgpool.mlir --iree-hal-target-backends=rocm --iree-hip-target=gfx1100 --iree-input-demote-f64-to-f32=false -o model_gpu_rocm_rdna3.vmfb | |
: 1736576046:0;git o main | |
: 1736576048:0;git puom | |
: 1736576053:0;git lg | |
: 1736576056:0;clear | |
: 1736576056:0;ls | |
: 1736576058:0;git submodule update --init | |
: 1736576060:0;clear | |
: 1736576060:0;ls | |
: 1736576075:0;git ob opt_tensor_insert_extract | |
: 1736576076:0;clear | |
: 1736576077:0;ls | |
: 1736576080:0;riree | |
: 1736576528:0;ls | |
: 1736576531:0;vi test.mlir | |
: 1736576915:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736576967:0;iree-opt compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736576975:0;iree-opt compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir --split-input-file | |
: 1736577080:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736577460:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736577850:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_igemm_tile_and_fuse.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_igemm_tile_and_fuse.mlir | |
: 1736577919:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1736577980:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_tile_and_fuse.mlir | |
: 1736578022:0;git ppf | |
: 1736578585:0;git ob main | |
: 1736578590:0;git o main | |
: 1736578592:0;clear | |
: 1736578598:0;git ob reorderworkgroups | |
: 1736579034:0;riree | |
: 1736579381:0;git-clang-format HEAD~ | |
: 1736579399:0;git ppf | |
: 1736752985:0;clear | |
: 1736752985:0;ls | |
: 1736752997:0;\ | |
\ | |
\ | |
: 1736752998:0;clear | |
: 1736752998:0;ls | |
: 1736753000:0;tmux attach -t 0 | |
: 1736755206:0;clear | |
: 1736755206:0;ls | |
: 1736755210:0;riree | |
: 1736755282:0;vi test_buffer.mlir | |
: 1736755312:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_buffer.mlir | |
: 1736755324:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_buffer.mlir --mlir-print-ir-after-all 2> full.txt | |
: 1736755327:0;vi full.txt | |
: 1736755334:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_buffer.mlir --mlir-print-ir-after-all 2> full.txt | |
: 1736755337:0;vi full.txt | |
: 1736755353:0;mv full.txt wo.txt | |
: 1736755359:0;git branch | |
: 1736755363:0;git o opt_tensor_insert_extract | |
: 1736755365:0;riree | |
: 1736755380:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_buffer.mlir --mlir-print-ir-after-all 2> with.txt | |
: 1736755383:0;vi with.txt | |
: 1736755409:0;diff with.txt wo.txt | |
: 1736755434:0;vi with.txt wo.txt | |
: 1736755494:0;gist-paste with.txt wo.txt | |
: 1736755647:0;clear | |
: 1736755648:0;ls | |
: 1736755654:0;vi wo.txt | |
: 1736756761:0;clear | |
: 1736756761:0;ls | |
: 1736756764:0;vi attn.mlir | |
: 1736756792:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic attn.mlir -o atn.vmfb | |
: 1736756796:0;vi attn.mlir | |
: 1736756910:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic attn.mlir -o atn.vmfb | |
: 1736756920:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic attn.mlir -o atn.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1736756925:0;vi full.txt | |
: 1736757016:0;clear | |
: 1736757017:0;ls | |
: 1736761537:0;gist-paste attn.mlir | |
: 1736761546:0;gist-paste full.txt | |
: 1736787085:0;clear | |
: 1736787086:0;ls | |
: 1736787088:0;tmux attach -t 0 | |
: 1736787094:0;clear | |
: 1736787095:0;ls | |
: 1736787099:0;vi | |
: 1736787833:0;riree | |
: 1736788285:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736788356:0;riree | |
: 1736788373:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736788413:0;riree | |
: 1736788432:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736790233:0;ls | |
: 1736790239:0;mkdir buff_elem.mlir | |
: 1736790243:0;vi buff_elem.mlir | |
: 1736790262:0;rm -rf buff_elem.mlir | |
: 1736790267:0;vi buff_elem.mlir | |
: 1736790289:0;cd ../ | |
: 1736790290:0;ls | |
: 1736790291:0;cd .. | |
: 1736790297:0;clear | |
: 1736790298:0;ls | |
: 1736790351:0;git clone [email protected]:llvm/llvm-project.git | |
: 1736790761:0;bm | |
: 1736790767:0;source ~/iree/.iree_venv/bin/activate | |
: 1736790768:0;bm | |
: 1736790773:0;ebd | |
: 1736790791:0;bm | |
: 1736790796:0;ebd | |
: 1736790812:0;bm | |
: 1736790834:0;pip install nanobind | |
: 1736790846:0;pip install nanobind==2.4 | |
: 1736790850:0;bm | |
: 1736790874:0;rm -rf llvm-project/build | |
: 1736790875:0;bm | |
: 1736842400:0;\ | |
: 1736842401:0;clear | |
: 1736842402:0;ls | |
: 1736842404:0;tmux attach -t 0 | |
: 1736842423:0;pip install yaml | |
: 1736842430:0;pip install pyyaml | |
: 1736842439:0;runm | |
: 1736842582:0;ls | |
: 1736842587:0;vi buff_ext.mlir | |
: 1736842632:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors | |
: 1736842656:0;mlir-opt buff_ext.mlir -cse -eliminate-empty-tensors | |
: 1736842677:0;vi buff_ext.mlir | |
: 1736842731:0;mlir-opt buff_ext.mlir -cse -eliminate-empty-tensors | |
: 1736842756:0;mlir-opt buff_ext.mlir -canonicalize -eliminate-empty-tensors | |
: 1736842761:0;mlir-opt buff_ext.mlir -canonicalize -cse -eliminate-empty-tensors | |
: 1736842824:0;mlir-opt buff_ext.mlir -canonicalize -dce -eliminate-empty-tensors | |
: 1736842861:0;cat buff_ext.mlir | |
: 1736843064:0;mlir-opt buff_ext.mlir -canonicalize -dce -eliminate-empty-tensors | |
: 1736843070:0;mlir-opt buff_ext.mlir -canonicalize -cse -eliminate-empty-tensors | |
: 1736843079:0;module {\ | |
func.func @test_one(%arg0: index, %arg1: vector<64x64xf32>, %arg2: tensor<2x4096x10x64xf16>) -> tensor<1x64x1x64xf16> {\ | |
%c0 = arith.constant 0 : index\ | |
%0 = tensor.empty() : tensor<64x64xf16>\ | |
%1 = arith.truncf %arg1 : vector<64x64xf32> to vector<64x64xf16>\ | |
%2 = vector.transfer_write %1, %0[%c0, %c0] {in_bounds = [true, true]} : vector<64x64xf16>, tensor<64x64xf16>\ | |
%extracted_slice = tensor.extract_slice %arg2[%arg0, 0, 0, 0] [1, 64, 1, 64] [1, 1, 1, 1] : tensor<2x4096x10x64xf16> to tensor<1x64x1x64xf16>\ | |
%inserted_slice = tensor.insert_slice %2 into %extracted_slice[0, 0, 0, 0] [1, 64, 1, 64] [1, 1, 1, 1] : tensor<64x64xf16> into tensor<1x64x1x64xf16>\ | |
return %inserted_slice : tensor<1x64x1x64xf16>\ | |
}\ | |
func.func @test_two(%arg0: index, %arg1: vector<64x64xf32>, %arg2: tensor<2x4096x10x64xf16>) -> tensor<1x64x1x64xf16> {\ | |
%c0 = arith.constant 0 : index\ | |
%0 = tensor.empty() : tensor<64x64xf16>\ | |
%1 = arith.truncf %arg1 : vector<64x64xf32> to vector<64x64xf16>\ | |
%extracted_slice = tensor.extract_slice %arg2[%arg0, 0, 0, 0] [1, 64, 1, 64] [1, 1, 1, 1] : tensor<2x4096x10x64xf16> to tensor<1x64x1x64xf16>\ | |
%extracted_slice_0 = tensor.extract_slice %extracted_slice[0, 0, 0, 0] [1, 64, 1, 64] [1, 1, 1, 1] : tensor<1x64x1x64xf16> to tensor<64x64xf16>\ | |
%2 = vector.transfer_write %1, %extracted_slice_0[%c0, %c0] {in_bounds = [true, true]} : vector<64x64xf16>, tensor<64x64xf16>\ | |
%inserted_slice = tensor.insert_slice %2 into %extracted_slice[0, 0, 0, 0] [1, 64, 1, 64] [1, 1, 1, 1] : tensor<64x64xf16> into tensor<1x64x1x64xf16>\ | |
return %inserted_slice : tensor<1x64x1x64xf16>\ | |
}\ | |
} | |
: 1736843303:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize | |
: 1736870593:0;clear | |
: 1736870593:0;ls | |
: 1736870597:0;tmux attach -t 0 | |
: 1736870611:0;cd ../llvm-project | |
: 1736870612:0;vi | |
: 1736870650:0;riree | |
: 1736870655:0;cd .. | |
: 1736870657:0;cd llvm-project | |
: 1736870658:0;runm | |
: 1736870683:0;vi buff_ext.mlir | |
: 1736870698:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize | |
: 1736870764:0;riree | |
: 1736870778:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize | |
: 1736870783:0;runm | |
: 1736870798:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize | |
: 1736870805:0;vi buff_ext.mlir | |
: 1736870810:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize | |
: 1736870902:0;riree | |
: 1736870921:0;runm | |
: 1736870937:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize | |
: 1736871167:0;riree | |
: 1736871174:0;runm | |
: 1736871194:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize | |
: 1736871209:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736871257:0;riree | |
: 1736871268:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736871275:0;runm | |
: 1736871333:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736871354:0;rire | |
: 1736871357:0;riree | |
: 1736871401:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736871407:0;runm | |
: 1736871415:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736871427:0;runm | |
: 1736871433:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736871487:0;riree | |
: 1736871498:0;rum | |
: 1736871500:0;runm | |
: 1736871514:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736941535:0;\ | |
: 1736941537:0;omz update | |
: 1736941540:0;clear | |
: 1736941540:0;ls | |
: 1736941542:0;tmux attach -t 0 | |
: 1736941695:0;runm | |
: 1736941712:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736943135:0;runm | |
: 1736943149:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736943221:0;ls | |
: 1736943227:0;cat buff_ext.mlir | |
: 1736943327:0;runm | |
: 1736943342:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736943357:0;vi buff_e | |
: 1736943360:0;vi buff_ext.mlir | |
: 1736943369:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736943378:0;runm | |
: 1736943384:0;source ~/iree/.iree_venv/bin/activate | |
: 1736943385:0;runm | |
: 1736943390:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736943471:0;runm | |
: 1736943480:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736950020:0;runm | |
: 1736950030:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736950112:0;runm | |
: 1736950134:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736950289:0;runm | |
: 1736950298:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736950313:0;runm | |
: 1736950316:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736950597:0;runm | |
: 1736950606:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736950800:0;runm | |
: 1736950808:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736950826:0;ls | |
: 1736950830:0;clear | |
: 1736950830:0;ls | |
: 1736950836:0;vi buff_ext.mlir | |
: 1736950852:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736950880:0;runm | |
: 1736950889:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736951002:0;cat buff_ext.mlir | |
: 1736951448:0;runm | |
: 1736951459:0;cat buff_ext.mlir | |
: 1736951462:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736951512:0;bm | |
: 1736951909:0;runm | |
: 1736952019:0;bm | |
: 1736952146:0;pip install ml_dtypes | |
: 1736952162:0;bm | |
: 1736952200:0;runm | |
: 1736952217:0;bm | |
: 1736952363:0;runm | |
: 1736952374:0;bm | |
: 1736952448:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736952462:0;cat buff_ext.mlir | |
: 1736952491:0;vi buff_ext.mlir | |
: 1736952505:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736952531:0;runm | |
: 1736952535:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736952697:0;runm | |
: 1736952706:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736952863:0;runm | |
: 1736952872:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736952940:0;vi buff_ext.mlir | |
: 1736952966:0;mlir-opt buff_1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736952970:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736952999:0;runm | |
: 1736953007:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953044:0;runm | |
: 1736953053:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953101:0;runm | |
: 1736953111:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953131:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953162:0;runm | |
: 1736953185:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953224:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953335:0;runm | |
: 1736953345:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953364:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953481:0;:vs buff_ext.mlir buff1.mlir | |
: 1736953485:0;vi buff_ext.mlir buff1.mlir | |
: 1736953565:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953576:0;runm | |
: 1736953580:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953616:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953791:0;runm | |
: 1736953807:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953865:0;runm | |
: 1736953892:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953935:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953955:0;riree | |
: 1736953965:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736953991:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736954004:0;runm | |
: 1736954014:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736954022:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736954483:0;runm | |
: 1736954492:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736954656:0;cat buff1.mlir | |
: 1736954662:0;cat buff_ext.mlir | |
: 1736954734:0;runm | |
: 1736954740:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736954847:0;cat buff1.mlir | |
: 1736954852:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736955146:0;runm | |
: 1736955161:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736955173:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736955206:0;cat buff_ext.mlir | |
: 1736955435:0;runm | |
: 1736955444:0;cat buff_ext.mlir | |
: 1736955450:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736955542:0;runm | |
: 1736955551:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736955755:0;runm | |
: 1736955764:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736955836:0;runm | |
: 1736955845:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736955864:0;runm | |
: 1736955907:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736955944:0;runm | |
: 1736955952:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736956033:0;mlir-opt buff1.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736956045:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736956051:0;vi buff_ext.mlir | |
: 1736956155:0;runm | |
: 1736956165:0;mlir-opt buff_ext.mlir -eliminate-empty-tensors -canonicalize --verify-each=0 | |
: 1736956712:0;clear | |
: 1736956712:0;ls | |
: 1736956725:0;vi buff_ext.mlir | |
: 1736956729:0;clear | |
: 1736956729:0;ls | |
: 1736956739:0;clear | |
: 1736956739:0;ls | |
: 1736956743:0;cd .. | |
: 1736956746:0;cd iree | |
: 1736956746:0;vi | |
: 1736956902:0;runm | |
: 1736956915:0;vi buff_analysis.mlir | |
: 1736956940:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736956953:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file iree/compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736956962:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file ~/iree/compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736957152:0;vi buff_analysis.mlir | |
: 1736957164:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file buff_analysis.mlir | |
: 1736957172:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file buff_analysis.mlir --verify-each=0 | |
: 1736957189:0;vi buff_analysis.mlir | |
: 1736957291:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file buff_analysis.mlir --verify-each=0 | |
: 1736957362:0;runm | |
: 1736957369:0;riree | |
: 1736957389:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file buff_analysis.mlir --verify-each=0 | |
: 1736958036:0;riree | |
: 1736958301:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file buff_analysis.mlir --verify-each=0 | |
: 1736958598:0;riree | |
: 1736958618:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file buff_analysis.mlir --verify-each=0 | |
: 1736958649:0;ls | |
: 1736958652:0;vi buff_analysis.mlir | |
: 1736958822:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736959012:0;cd ../llvm-project | |
: 1736959016:0;cd ../iree | |
: 1736959031:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736959232:0;runm | |
: 1736959234:0;riree | |
: 1736959258:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736959289:0;runm | |
: 1736959295:0;riree | |
: 1736959319:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736959382:0;riree | |
: 1736959402:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736959931:0;riree | |
: 1736959949:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736960003:0;riree | |
: 1736963337:0;tmux attach -t 0 | |
: 1736963375:0;riree | |
: 1736963395:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736963469:0;riree | |
: 1736963487:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736963604:0;riree | |
: 1736963622:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736963651:0;riree | |
: 1736963670:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736963788:0;riree | |
: 1736963804:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736963885:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736963961:0;vi test_xyz.mlir | |
: 1736963977:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_xyz.mlir | |
: 1736963983:0;vi test_xyz.mlir | |
: 1736963986:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_xyz.mlir | |
: 1736964019:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_xyz.mlir > out.mlir | |
: 1736964027:0;diff out.mlir test_xyz.mlir | |
: 1736964049:0;vi test_xyz.mlir | |
: 1736964324:0;riree | |
: 1736964587:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_xyz.mlir > out.mlir | |
: 1736964596:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736964635:0;riree | |
: 1736964711:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736965427:0;riree | |
: 1736965443:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736965591:0;riree | |
: 1736965609:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736965663:0;riree | |
: 1736965680:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736965934:0;riree | |
: 1736965977:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736966216:0;riree | |
: 1736966234:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736966276:0;riree | |
: 1736966295:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736966362:0;riree | |
: 1736966381:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736966465:0;riree | |
: 1736966481:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736967704:0;riree | |
: 1736967810:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736967870:0;riree | |
: 1736967897:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736967994:0;riree | |
: 1736968063:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736968117:0;riree | |
: 1736968133:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736968851:0;riree | |
: 1736968867:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736968956:0;riree | |
: 1736968973:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736969207:0;riree | |
: 1736969235:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736969301:0;riree | |
: 1736969317:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736969439:0;riree | |
: 1736969458:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736969501:0;riree | |
: 1736969508:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736969574:0;riree | |
: 1736969590:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736969655:0;riree | |
: 1736969674:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736970094:0;riree | |
: 1736970112:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736970259:0;riree | |
: 1736970275:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736970323:0;riree | |
: 1736970339:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736970643:0;riree | |
: 1736970659:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736970747:0;riree | |
: 1736970763:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736970802:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736970829:0;vi test_xyz.mlir | |
: 1736970864:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_xyz.mlir > out.mlir | |
: 1736970874:0;diff out.mlir test_xyz.mlir | |
: 1736970878:0;vi out.mlir | |
: 1736971229:0;riree | |
: 1736971274:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file test_xyz.mlir > out.mlir | |
: 1736971279:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736971386:0;riree | |
: 1736971418:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736971647:0;riree | |
: 1736971666:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1736971823:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir --check-prefix=MEMORY | |
: 1736971830:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | |
: 1736971979:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | |
: 1736972218:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | |
: 1736972255:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir > out.mlir | |
: 1736972332:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | |
: 1736972666:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/OptimizeTensorInsertExtractSlices.cpp | |
: 1736972712:0;riree | |
: 1736972773:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736972850:0;git ppf | |
: 1736973132:0;iree-opt --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736973194:0;git ppf | |
: 1736974038:0;riree | |
: 1736974298:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1736974315:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/OptimizeTensorInsertExtractSlices.cpp | |
: 1736974356:0;git ppf | |
: 1736975136:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/OptimizeTensorInsertExtractSlices.cpp | |
: 1736975151:0;riree | |
: 1736975179:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1737007029:0;tmux attach -t 0 | |
: 1737007085:0;clear | |
: 1737007085:0;ls | |
: 1737007177:0;git ppf | |
: 1737007970:0;clear | |
: 1737007971:0;ls | |
: 1737008104:0;clear | |
: 1737008105:0;ls | |
: 1737008111:0;git o reorderworkgroups | |
: 1737008112:0;git lg | |
: 1737008118:0;clear | |
: 1737008119:0;ls | |
: 1737008150:0;riree | |
: 1737010143:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737010299:0;git-clang-format HEAD~ | |
: 1737010318:0;git ppf | |
: 1737012492:0;riree | |
: 1737012810:0;git clang-format compiler/src/iree/compiler/Codegen/Common/TileDispatchUsingForall.cpp | |
: 1737012834:0;git-clang-format HEAD~ | |
: 1737012854:0;riree | |
: 1737013203:0;2 | |
: 1737013206:0;clear | |
: 1737013207:0;ls | |
: 1737013220:0;riree | |
: 1737013235:0;git-clang-format HEAD~ | |
: 1737013238:0;cd iree | |
: 1737013240:0;git-clang-format HEAD~ | |
: 1737013243:0;git ppf | |
: 1737014789:0;riree | |
: 1737015037:0;git-clang-format HEAD~ | |
: 1737032509:0;tmux attach -t 0 | |
: 1737033768:0;riree | |
: 1737034417:0;clear | |
: 1737034418:0;ls | |
: 1737036347:0;vi attn.mlir | |
: 1737036521:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(torch-iree-tm-tensor-to-linalg-ext))" attn.mlir | |
: 1737036554:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(torch-iree-tm-tensor-to-linalg-ext))" attn.mlir > attn_kernel.mlir | |
: 1737036555:0;clear | |
: 1737036556:0;ls | |
: 1737036559:0;vi attn_kernel.mlir | |
: 1737036579:0;clear | |
: 1737036580:0;ls | |
: 1737036608:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic attn_kernel.mlir -o atn.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737036615:0;vi full.txt | |
: 1737036759:0;vi attn.mlir | |
: 1737036781:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(torch-iree-tm-tensor-to-linalg-ext))" attn.mlir > attn_kernel.mlir | |
: 1737036784:0;/home/prashant/iree-build/tools/iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic attn_kernel.mlir -o atn.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737036796:0;vi full.txt | |
: 1737036922:0;iree-benchmark-module --module=attn.vmfb --function=attention --input=1x128x8x64xf32 --input=1x128x8x64xf32 --input=1x128x8x64xf32 --device=local-sync | |
: 1737036927:0;iree-benchmark-module --module=atn.vmfb --function=attention --input=1x128x8x64xf32 --input=1x128x8x64xf32 --input=1x128x8x64xf32 --device=local-sync | |
: 1737036934:0;vi attn.mlir | |
: 1737036963:0;iree-benchmark-module --module=atn.vmfb --function=attention --input=1x128x8x64xf32 --input=1x128x8x64xf32 --input=1x128x8x64xf32 --input=1x128x8x64xf32 --device=local-sync | |
: 1737036972:0;vi attn.mlir | |
: 1737036993:0;iree-benchmark-module --module=atn.vmfb --function=attention --input=1x128x32x64xf32 --input=1x128x32x64xf32 --input=1x128x32x64xf32 --input=1x128x32x64xf32 --device=local-sync | |
: 1737037022:0;iree-compile --help | fzf | |
: 1737037186:0;clear | |
: 1737037186:0;ls | |
: 1737037430:0;iree-compile "--iree-preprocessing-pass-pipeline=builtin.module(iree-linalg-ext-decompose-attention)" --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic attn_kernel.mlir -o atn.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737037442:0;vi full.txt | |
: 1737037513:0;iree-compile "--iree-preprocessing-pass-pipeline=builtin.module(func.func(iree-linalg-ext-decompose-attention))" --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic attn_kernel.mlir -o atn.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737037518:0;vi full.txt | |
: 1737037618:0;iree-opt "--iree-preprocessing-pass-pipeline=builtin.module(func.func(iree-linalg-ext-decompose-attention))" attn.mlir | |
: 1737037651:0;iree-opt --pass-pipeline=builtin.module(func.func(iree-linalg-ext-decompose-attention))" attn.mlir | |
: 1737037654:0;iree-opt --pass-pipeline=builtin.module(func.func(iree-linalg-ext-decompose-attention)) attn.mlir | |
: 1737037683:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-linalg-ext-decompose-attention))" attn.mlir | |
: 1737037689:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-linalg-ext-decompose-attention))" attn_kernel.mlir | |
: 1737037750:0;vi full.txt | |
: 1737037848:0;iree-compile "--iree-preprocessing-pass-pipeline=builtin.module(func.func(iree-linalg-ext-decompose-attention,iree-linalg-ext-convert-attention-to-online-attention))" --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic attn_kernel.mlir -o atn.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737037853:0;vi full.txt | |
: 1737037894:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-linalg-ext-convert-attention-to-online-attention,iree-linalg-ext-decompose-attention))" attn_kernel.mlir | |
: 1737037995:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-linalg-ext-convert-attention-to-online-attention,iree-linalg-ext-decompose-attention))" attn_kernel.mlir > decomposed_kernel.mlir | |
: 1737037997:0;clear | |
: 1737037997:0;ls | |
: 1737038018:0;iree-compile --output-format=vm-bytecode --mlir-print-op-on-diagnostic=false --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=generic decomposed_kernel.mlir -o atn.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737038028:0;iree-benchmark-module --module=atn.vmfb --function=attention --input=1x128x32x64xf32 --input=1x128x32x64xf32 --input=1x128x32x64xf32 --input=1x128x32x64xf32 --device=local-sync | |
: 1737038637:0;ls | |
: 1737038642:0;vi attn_kernel.mlir | |
: 1737038696:0;gist-paste attn_kernel.mlir | |
: 1737038914:0;ls | |
: 1737038921:0;vi decomposed_kernel.mlir | |
: 1737038945:0;gist-paste decomposed_kernel.mlir | |
: 1737039016:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host decomposed_kernel.mlir -o atn.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737039024:0;iree-benchmark-module --module=atn.vmfb --function=attention --input=1x128x32x64xf32 --input=1x128x32x64xf32 --input=1x128x32x64xf32 --input=1x128x32x64xf32 --device=local-sync | |
: 1737039034:0;iree-benchmark-module --module=atn.vmfb --function=attention --input=1x128x32x64xf32 --input=1x128x32x64xf32 --input=1x128x32x64xf32 --device=local-sync | |
: 1737039045:0;cpuinfo | |
: 1737039078:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host attn_kernel.mlir -o atn.vmfb | |
: 1737039083:0;iree-benchmark-module --module=atn.vmfb --function=attention --input=1x128x32x64xf32 --input=1x128x32x64xf32 --input=1x128x32x64xf32 --device=local-sync | |
: 1737039462:0;cat /proc/cpuinfo | |
: 1737039475:0;cat /proc/cpuinfo > gist-paste | |
: 1737039480:0;vi gist-paste | |
: 1737039492:0;mv gist-paste cpuinfo | |
: 1737039495:0;vi cpuinfo | |
: 1737039500:0;gist-paste cpuinfo | |
: 1737039607:0;clear | |
: 1737039607:0;ls | |
: 1737039612:0;vi attn.mlir | |
: 1737039644:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(torch-iree-tm-tensor-to-linalg-ext))" attn.mlir | |
: 1737039664:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(torch-iree-tm-tensor-to-linalg-ext))" attn.mlir > attnbf16.mlir | |
: 1737039672:0;gist-paste attnbf16.mlir | |
: 1737039691:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host attnbf16.mlir -o attn.vmfb | |
: 1737039715:0;iree-benchmark-module --module=attn.vmfb --function=attention --input=1x128x32x64xbf16 --input=1x128x32x64xbf16 --input=1x128x32x64xbf16 --device=local-sync | |
: 1737039726:0;vi attnbf16.mlir | |
: 1737039736:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host attnbf16.mlir -o attn.vmfb | |
: 1737039739:0;iree-benchmark-module --module=attn.vmfb --function=attention --input=1x128x32x64xbf16 --input=1x128x32x64xbf16 --input=1x128x32x64xbf16 --device=local-sync | |
: 1737039784:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-linalg-ext-convert-attention-to-online-attention,iree-linalg-ext-decompose-attention))" attnbf16.mlir > decomposedbf16.mlir | |
: 1737039802:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host decomposedbf16.mlir -o attn.vmfb | |
: 1737039808:0;iree-benchmark-module --module=attn.vmfb --function=attention --input=1x128x32x64xbf16 --input=1x128x32x64xbf16 --input=1x128x32x64xbf16 --device=local-sync | |
: 1737039920:0;gist-paste attnbf16.mlir | |
: 1737039947:0;gist-paste decomposedbf16.mlir | |
: 1737040772:0;riree | |
: 1737040780:0;git ppf | |
: 1737041544:0;clear | |
: 1737041544:0;ls | |
: 1737046987:0;riree | |
: 1737047017:0;git-clang-format HEAD~ | |
: 1737047020:0;git ppf | |
: 1737047202:0;git o opt_tensor_insert_extract | |
: 1737047425:0;riree | |
: 1737047569:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-codegen-optimize-tensor-insert-extract-slices{fold-identity-slices=true}))" --split-input-file compiler/src/iree/compiler/Codegen/Common/test/optimize_tensor_insert_extract_slices.mlir | |
: 1737047626:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737047870:0;riree | |
: 1737047909:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737048194:0;git ppf | |
: 1737048375:0;git-clang-format HEAD~ | |
: 1737048391:0;git ppf | |
: 1737053364:0;clear | |
: 1737053368:0;git fetch origin | |
: 1737053378:0;git rebase origin/main | |
: 1737053381:0;git ppf | |
: 1737056145:0;clear | |
: 1737056146:0;ls | |
: 1737056148:0;git o main | |
: 1737056150:0;git lg | |
: 1737056161:0;git puom | |
: 1737056169:0;clear | |
: 1737056169:0;ls | |
: 1737056171:0;git submodule update --init | |
: 1737056175:0;git lg | |
: 1737056194:0;clear | |
: 1737056194:0;ls | |
: 1737093892:0;\ | |
: 1737093899:0;tmux attach -t 0 | |
: 1737093904:0;clear | |
: 1737093905:0;ls | |
: 1737093919:0;git ob scfforallgpu | |
: 1737093926:0;git ob temp | |
: 1737093961:0;riree | |
: 1737094440:0;ree | |
: 1737094443:0;riree | |
: 1737094633:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737094793:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | |
: 1737094955:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir > out.mlir | |
: 1737095176:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | |
: 1737095296:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir --check-prefix=MEMORY | |
: 1737095321:0;vi | |
: 1737095480:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir --check-prefix=MEMORY | |
: 1737095483:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMGPU/test/ROCDL/pipeline_vector_distribute_gfx942.mlir | |
: 1737095502:0;git branch -D scfforallgpu | |
: 1737095511:0;git branch -m scfforallgpu | |
: 1737095514:0;git ppf | |
: 1737095528:0;git-clang-format HEAD~ | |
: 1737095536:0;git ppf | |
: 1737095612:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737096083:0;git ppf | |
: 1737114077:0;clear | |
: 1737114078:0;ls | |
: 1737114080:0;tmux attach -t 0 | |
: 1737114108:0;clear | |
: 1737114108:0;ls | |
: 1737114119:0;cd .. | |
: 1737114120:0;ls | |
: 1737114123:0;mkdir onnx_perf | |
: 1737114125:0;cd onnx_perf | |
: 1737114125:0;clear | |
: 1737114126:0;ls | |
: 1737114134:0;clear | |
: 1737114134:0;ls | |
: 1737114142:0;vi onnx_gen.py | |
: 1737114153:0;pip install onnx onnx-runtime | |
: 1737114165:0;pip install onnx onnxruntime\ | |
: 1737114172:0;clear | |
: 1737114172:0;ls | |
: 1737114174:0;python onnx_gen.py | |
: 1737114178:0;vi group_query_attention.onnx | |
: 1737114341:0;ls | |
: 1737114347:0;vi onnx_run.py | |
: 1737114354:0;python onnx_run.py | |
: 1737114427:0;pip install onnxruntime-extensions | |
: 1737114478:0;vi onnx_run.py | |
: 1737114521:0;python onnx_run.py | |
: 1737114540:0;onnxruntime_test_all --list_custom_ops | |
: 1737119315:0;tmux attach -t 0 | |
: 1737119318:0;vi | |
: 1737119588:0;git clone --recursive https://github.com/microsoft/onnxruntime.git | |
: 1737120086:0;clear | |
: 1737120087:0;ls | |
: 1737120110:0;cd onnxruntime | |
: 1737120125:0;python3 tools/ci_build/build.py --build_dir build --config Release --use_custom_ops | |
: 1737120143:0;vi tools/ci_build/build.py | |
: 1737120216:0;python3 tools/ci_build/build.py --build_dir build --config Release | |
: 1737122965:0;\ | |
ls | |
: 1737122967:0;htop | |
: 1737123281:0;vi tools/ci_build/build.py | |
: 1737123295:0;python3 tools/ci_build/build.py --build_dir build --config Release --build_shared_lib | |
: 1737123361:0;vi tools/ci_build/build.py | |
: 1737123393:0;python3 tools/ci_build/build.py --build_dir build --config Release --build_shared_lib --enable_pybind | |
: 1737123458:0;pip install pytest | |
: 1737123471:0;python3 tools/ci_build/build.py --build_dir build --config Release --build_shared_lib --enable_pybind --build_wheel | |
: 1737123484:0;htop | |
: 1737123541:0;pip uninstall onnxruntime | |
: 1737123558:0;pip install build/Release/dist/onnxruntime-1.21.0-cp312-cp312-linux_x86_64.whl | |
: 1737123561:0;clear | |
: 1737123561:0;ls | |
: 1737123564:0;cd .. | |
: 1737123565:0;ls | |
: 1737123569:0;python onnx_run.py | |
: 1737123592:0;vi onnx_gen.py | |
: 1737123605:0;python onnx_gen.py | |
: 1737123607:0;ls | |
: 1737123616:0;python onnx_run.py | |
: 1737123709:0;vi onnx_gen.py | |
: 1737123717:0;python onnx_gen.py | |
: 1737123719:0;python onnx_run.py | |
: 1737123727:0;vi onnx_gen.py | |
: 1737123736:0;python onnx_run.py | |
: 1737123740:0;python onnx_gen.py | |
: 1737123742:0;python onnx_run.py | |
: 1737123798:0;vi onnx_gen.py | |
: 1737123813:0;python onnx_gen.py | |
: 1737123816:0;python onnx_run.py | |
: 1737123970:0;vi onnx_gen.py | |
: 1737124001:0;python onnx_gen.py | |
: 1737124005:0;python onnx_run.py | |
: 1737124078:0;vi onnx_run.py | |
: 1737124177:0;python onnx_run.py | |
: 1737124200:0;vi onnx_run.py | |
: 1737124205:0;vi onnx_gen.py | |
: 1737124303:0;python onnx_gen.py | |
: 1737124313:0;mv group_query_attention_updated.onnx group_query_attention.onnx | |
: 1737124318:0;python onnx_run.py | |
: 1737124385:0;vi onnx_run.py | |
: 1737124396:0;python onnx_run.py | |
: 1737124567:0;vi onnx_gen.py | |
: 1737124610:0;python onnx_gen.py | |
: 1737124664:0;vi onnx_gen.py | |
: 1737124980:0;python onnx_gen.py | |
: 1737124981:0;ls | |
: 1737124987:0;python onnx_run.py | |
: 1737125003:0;vi onnx_run.py | |
: 1737125056:0;vi onnx_gen.py | |
: 1737125263:0;python onnx_gen.py | |
: 1737125267:0;python onnx_run.py | |
: 1737125282:0;vi onnx_run.py | |
: 1737125353:0;python onnx_run.py | |
: 1737125357:0;python onnx_gen.py | |
: 1737125359:0;python onnx_run.py | |
: 1737125501:0;vi onnx_gen.py | |
: 1737125597:0;python onnx_gen.py | |
: 1737125600:0;vi onnx_gen.py | |
: 1737125607:0;python onnx_run.py | |
: 1737125630:0;vi onnx_gen.py | |
: 1737125679:0;python onnx_run.py | |
: 1737125688:0;vi onnx_gen.py | |
: 1737125790:0;python onnx_gen.py | |
: 1737125793:0;python onnx_run.py | |
: 1737125804:0;vi onnx_gen.py | |
: 1737125874:0;python onnx_gen.py | |
: 1737125877:0;vi onnx_run.py | |
: 1737125896:0;python onnx_run.py | |
: 1737125904:0;vi onnx_run.py | |
: 1737125924:0;source ~/iree/.iree_venv/bin/activate | |
: 1737125929:0;python onnx_gen.py | |
: 1737125932:0;python onnx_run.py | |
: 1737126298:0;ls | |
: 1737126378:0;cd .. | |
: 1737126379:0;ls | |
: 1737126383:0;mkdir tinyllama | |
: 1737126384:0;cd tinyllama | |
: 1737126385:0;clear | |
: 1737126386:0;ls | |
: 1737126389:0;wget https://gist.githubusercontent.com/NoumanAmir657/fdf8e41ba41f4439cc3b26df8fc7b099/raw/6f6a98359c59db932c274bbce7b0f82b1326b83e/chat_tinyllama_q8.mlir | |
: 1737126391:0;ls | |
: 1737126393:0;vi chat_tinyllama_q8.mlir | |
: 1737126488:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host chat_tinyllama_q8.mlir -o chat.vmfb --iree-hal-dump-executable-sources-to=dump/ | |
: 1737126497:0;ls | |
: 1737126509:0;vi chat_tinyllama_q8.mlir | |
: 1737126774:0;ls | |
: 1737126775:0;cd dump | |
: 1737126776:0;ls | |
: 1737126783:0;vi module_prefill_bs1\$async_dispatch_39.mlir | |
: 1737126947:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host module_prefill_bs1\$async_dispatch_39.mlir -o chat.vmfb --iree-hal-dump-executable-sources-to=dump/ --compile-from=executable-sources | |
: 1737126956:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host module_prefill_bs1\$async_dispatch_39.mlir -o chat.vmfb --iree-hal-dump-executable-sources-to=dump/ --compile-from=executable-sources --mlir-print-ir-after-all 2> xyz.txt | |
: 1737126961:0;vi xyz.txt | |
: 1737127319:0;gist-paste module_prefill_bs1\$async_dispatch_39.mlir | |
: 1737127852:0;git-clang-format HEAD~ | |
: 1737127867:0;clear | |
: 1737127867:0;ls | |
: 1737127871:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737128073:0;git-clang-format HEAD~ | |
: 1737128117:0;git stash | |
: 1737128120:0;git-clang-format HEAD~ | |
: 1737128133:0;git ppf | |
: 1737128833:0;vi xyz.txt | |
: 1737129294:0;git ppf | |
: 1737129301:0;git-clang-format HEAD~ | |
: 1737387341:0;clear\ | |
: 1737387342:0;ls | |
: 1737387347:0;tmux attach -t 0 | |
: 1737394275:0;clear | |
: 1737394276:0;ls | |
: 1737394280:0;tmux ls | |
: 1737394285:0;tmux attach -t shortfin | |
: 1737394291:0;clear | |
: 1737394291:0;ls | |
: 1737394294:0;cd .. | |
: 1737394295:0;ls | |
: 1737394297:0;cd .. | |
: 1737394297:0;ls | |
: 1737394298:0;clear | |
: 1737394298:0;ls | |
: 1737394309:0;cd test | |
: 1737394309:0;ls | |
: 1737394314:0;cd onnx_perf | |
: 1737394315:0;clear | |
: 1737394315:0;ls | |
: 1737394321:0;source ~/iree/.iree_venv/bin/activate | |
: 1737394322:0;clear | |
: 1737394323:0;ls | |
: 1737394331:0;cd ../test/onnx_perf | |
: 1737394331:0;clear | |
: 1737394332:0;ls | |
: 1737394336:0;source ~/iree/.iree_venv/bin/activate | |
: 1737394336:0;clear | |
: 1737394337:0;ls | |
: 1737394340:0;dz | |
: 1737394341:0;sz | |
: 1737394343:0;source ~/iree/.iree_venv/bin/activate | |
: 1737394344:0;clear | |
: 1737394344:0;ls | |
: 1737394346:0;clear | |
: 1737394347:0;ls | |
: 1737394347:0;sz | |
: 1737394349:0;source ~/iree/.iree_venv/bin/activate | |
: 1737394350:0;clear | |
: 1737394351:0;ls | |
: 1737394355:0;vi onnx_gen.py | |
: 1737394379:0;python onnx_gen.py | |
: 1737394383:0;vi onnx_run.py | |
: 1737394392:0;python onnx_run.py | |
: 1737394406:0;vi onnx_run.py | |
: 1737394446:0;VI | |
: 1737394449:0;vi onnx_run.py | |
: 1737394453:0;clear | |
: 1737394454:0;ls | |
: 1737394457:0;python onnx_run.py | |
: 1737394542:0;ls | |
: 1737394546:0;rm group_query_attention_updated.onnx | |
: 1737394548:0;rm group_query_attention.onnx | |
: 1737394552:0;python onnx_gen.py | |
: 1737394555:0;python onnx_run.py | |
: 1737394810:0;python onnx_gen.py | |
: 1737394812:0;python onnx_run.py | |
: 1737394869:0;python onnx_gen.py | |
: 1737394870:0;python onnx_run.py | |
: 1737394899:0;python onnx_gen.py | |
: 1737394900:0;python onnx_run.py | |
: 1737395055:0;python onnx_gen.py | |
: 1737395057:0;python onnx_run.py | |
: 1737395363:0;python onnx_gen.py | |
: 1737395365:0;python onnx_run.py | |
: 1737395484:0;python onnx_gen.py | |
: 1737395485:0;python onnx_run.py | |
: 1737395504:0;python onnx_gen.py | |
: 1737395505:0;python onnx_run.py | |
: 1737395535:0;cat onnx_run.py | |
: 1737395932:0;python onnx_run.py | |
: 1737396076:0;ls | |
: 1737396088:0;clear | |
: 1737396089:0;ls | |
: 1737396091:0;cd .. | |
: 1737396092:0;ls | |
: 1737396115:0;vi test.mlir | |
: 1737396176:0;cd onnx_perf | |
: 1737396177:0;ls | |
: 1737396188:0;vi attn_kernel.mlir | |
: 1737396788:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host attn_kernel.mlir -o attn.vmfb | |
: 1737396814:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-linalg-ext-convert-attention-to-online-attention,iree-linalg-ext-decompose-attention))" attn_kernel.mlir > decomposed_kernel.mlir | |
: 1737396816:0;vi decomposed_kernel.mlir | |
: 1737396834:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host decomposed_kernel.mlir -o attn.vmfb | |
: 1737396879:0;iree-benchmark-module --module=attn.vmfb --function=attention --input=1x32x128x512xf32--input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-sync | |
: 1737396888:0;iree-benchmark-module --module=attn.vmfb --function=attention --input=1x32x128x512xf32 --input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-sync | |
: 1737396921:0;iree-benchmark-module --module=attn.vmfb --function=attention --input=1x32x128x512xf32 --input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-task | |
: 1737396948:0;ls | |
: 1737396958:0;vi onnx_run.py | |
: 1737396969:0;python onnx_run.py | |
: 1737396985:0;ls | |
: 1737397019:0;iree-benchmark-module --module=attn.vmfb --function=attention --input=1x32x128x512xf32 --input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-task | |
: 1737397029:0;python onnx_run.py | |
: 1737397068:0;iree-benchmark-module --module=attn.vmfb --function=attention --input=1x32x128x512xf32 --input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-task | |
: 1737398118:0;gist-paste attn_kernel.mlir | |
: 1737398202:0;gist-paste decomposed_kernel.mlir | |
: 1737398452:0;iree-benchmark-module --module=attn.vmfb --function=attention --input=1x32x128x512xf32 --input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-task | |
: 1737398629:0;ls | |
: 1737398641:0;gist-paste onnx_gen.py onnx_run.py | |
: 1737399713:0;clear | |
: 1737399714:0;ls | |
: 1737399717:0;clear | |
: 1737399717:0;ls | |
: 1737399720:0;tmux attach -t 0 | |
: 1737399727:0;clear | |
: 1737399727:0;ls | |
: 1737399813:0;cd .. | |
: 1737399814:0;ls | |
: 1737399815:0;cd .. | |
: 1737399816:0;ls | |
: 1737399817:0;clear | |
: 1737399817:0;ls | |
: 1737399827:0;mkdir multireduction | |
: 1737399828:0;clear | |
: 1737399828:0;ls | |
: 1737399830:0;cd multireduction | |
: 1737399830:0;ls | |
: 1737399834:0;vi test.mlir | |
: 1737399865:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host test.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737399870:0;vi full.txt | |
: 1737400786:0;git o main | |
: 1737400788:0;git puom | |
: 1737400797:0;git submodule update --init | |
: 1737400812:0;git ob tilesoftmax | |
: 1737400813:0;clear | |
: 1737400814:0;ls | |
: 1737400818:0;riree | |
: 1737470049:0;tmux attach -t 0 | |
: 1737470063:0;clear | |
: 1737470063:0;ls | |
: 1737470064:0;riree | |
: 1737470068:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737470220:0;ls | |
: 1737470223:0;cd .. | |
: 1737470223:0;ls | |
: 1737470228:0;mkdir softmax | |
: 1737470230:0;cd softmax | |
: 1737470233:0;vi test.mlir | |
: 1737470245:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host test.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737470251:0;vi full.txt | |
: 1737470431:0;vi test.mlir | |
: 1737470437:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host test.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737470439:0;vi full.txt | |
: 1737471951:0;riree | |
: 1737471980:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host test.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737471993:0;vi full.txt | |
: 1737472124:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host test.mlir -o abc.vmfb | |
: 1737472130:0;ls | |
: 1737472474:0;riree | |
: 1737472772:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737472923:0;riree | |
: 1737472927:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737473140:0;vi new.mlir | |
: 1737473148:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb | |
: 1737473158:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1737473160:0;vi full.txt | |
: 1737473935:0;riree | |
: 1737473949:0;vi full.txt | |
: 1737473961:0;mv full.txt full_new.txt | |
: 1737473962:0;clear | |
: 1737473962:0;ls | |
: 1737473977:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_old.txt | |
: 1737473982:0;vi full_old.txt | |
: 1737474046:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737474851:0;git o main | |
: 1737474853:0;riree | |
: 1737474935:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737474940:0;vi full_new.txt | |
: 1737475065:0;riree | |
: 1737475098:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737475102:0;vi full_new.txt | |
: 1737475627:0;cat full_new.txt | |
: 1737475983:0;riree | |
: 1737476010:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737476014:0;vi full_new.txt | |
: 1737476092:0;riree | |
: 1737476115:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737476119:0;vi full_new.txt | |
: 1737476203:0;riree | |
: 1737476226:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737476229:0;vi full_new.txt | |
: 1737476249:0;git branch | |
: 1737476255:0;git o tilesoftmax | |
: 1737476258:0;git stash | |
: 1737476259:0;git o tilesoftmax | |
: 1737476617:0;riree | |
: 1737476636:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737476641:0;vi full_new.txt | |
: 1737476670:0;riree | |
: 1737476682:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737476685:0;vi full_new.txt | |
: 1737476838:0;riree | |
: 1737476857:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737476859:0;vi full_ | |
: 1737476862:0;vi full_new.txt | |
: 1737476926:0;riree | |
: 1737476967:0;vi full_ | |
: 1737476970:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737476973:0;vi full_new.txt | |
: 1737477011:0;riree | |
: 1737477043:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737477046:0;vi full_new.txt | |
: 1737477111:0;riree | |
: 1737477128:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737477132:0;vi full_new.txt | |
: 1737478983:0;git stash | |
: 1737478986:0;git o main | |
: 1737478987:0;clear | |
: 1737478987:0;ls | |
: 1737479085:0;git puom | |
: 1737479090:0;clear | |
: 1737479091:0;ls | |
: 1737479093:0;git submodule update --init | |
: 1737479117:0;git ob morescfforall | |
: 1737479177:0;riree | |
: 1737481841:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737481845:0;vi full_new.txt | |
: 1737482105:0;riree | |
: 1737482125:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737482129:0;vi full_new.txt | |
: 1737482411:0;riree | |
: 1737482446:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host new.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737482451:0;vi full_new.txt | |
: 1737482521:0;git stash | |
: 1737482545:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737482573:0;riree | |
: 1737482705:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737482936:0;git-clang-format HEAD~ | |
: 1737482937:0;git ppf | |
: 1737483051:0;riree | |
: 1737483071:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737483313:0;git ppf | |
: 1737483450:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737483763:0;iree-opt --split-input-file --iree-gpu-test-target=sm_60 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))" -iree-codegen-llvmgpu-use-wmma compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_pipeline_test.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_pipeline_test.mlir | |
: 1737483955:0;iree-opt --split-input-file --iree-gpu-test-target=sm_60 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))" -iree-codegen-llvmgpu-use-wmma compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_pipeline_test.mlir | |
: 1737550348:0;\ | |
: 1737550348:0;clear | |
: 1737550349:0;ls | |
: 1737550351:0;tmux attach -t 0 | |
: 1737550354:0;iree-opt --split-input-file --iree-gpu-test-target=sm_60 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-codegen-llvmgpu-configuration-pipeline), iree-codegen-linalg-to-nvvm-pipeline)))" -iree-codegen-llvmgpu-use-wmma compiler/src/iree/compiler/Codegen/LLVMGPU/test/nvvm_pipeline_test.mlir | |
: 1737550358:0;git o main | |
: 1737550361:0;git stash | |
: 1737550362:0;git o main | |
: 1737550364:0;git puom | |
: 1737550374:0;git submodule update --init | |
: 1737550375:0;clear | |
: 1737550375:0;ls | |
: 1737550382:0;git ob deprecatewarp | |
: 1737550383:0;clear | |
: 1737550383:0;ls | |
: 1737550384:0;riree | |
: 1737550523:0;ls | |
: 1737550525:0;cd .. | |
: 1737550525:0;ls | |
: 1737550529:0;mkdir warpreduction | |
: 1737550530:0;clear | |
: 1737550530:0;ls | |
: 1737550532:0;cd warpreduction | |
: 1737550533:0;clear | |
: 1737550533:0;ls | |
: 1737550535:0;vi test.mlir | |
: 1737550874:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-afer-all 2> full.txt | |
: 1737550877:0;vi full.txt | |
: 1737550887:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> full.txt | |
: 1737550890:0;vi full.txt | |
: 1737550895:0;ls | |
: 1737550896:0;vi full.txt | |
: 1737557761:0;ls | |
: 1737557764:0;cat test.mlir | |
: 1737557836:0;vi test2.mlir | |
: 1737557939:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test2.mlir -o abc.vmfb --mlir-print-ir-after-all 2> full.txt | |
: 1737557942:0;vi full.txt | |
: 1737557962:0;vi test2.mlir | |
: 1737557976:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test2.mlir -o abc.vmfb --mlir-print-ir-after-all 2> full.txt | |
: 1737557978:0;vi full.txt | |
: 1737558220:0;iree-compile --iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test2.mlir -o abc.vmfb --mlir-print-ir-after-all 2> full.txt | |
: 1737558223:0;vi full.txt | |
: 1737558431:0;wget https://sharkblobs.blob.core.windows.net/halo-models/flux/transformer/black-forest-labs--FLUX.1-dev--transformer-single-layer-b16.mlir | |
: 1737558504:0;ls | |
: 1737558516:0;cd iree | |
: 1737558516:0;ls | |
: 1737558522:0;cd .. | |
: 1737558522:0;ls | |
: 1737558525:0;cd test | |
: 1737558525:0;ls | |
: 1737558529:0;cd tinyllama | |
: 1737558530:0;ls | |
: 1737558534:0;vi chat_tinyllama_q8.mlir | |
: 1737558541:0;cd dump | |
: 1737558541:0;ls | |
: 1737558548:0;ag vector | |
: 1737558558:0;grep vectordistribute | |
: 1737558573:0;cd .. | |
: 1737558573:0;ls | |
: 1737558628:0;iree-compile --iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 chat_tinyllama_q8.mlir -o abc.vmfb iree-hal-dump-executable-sources-to=dump/ | |
: 1737558633:0;rm -rf dump | |
: 1737558638:0;iree-compile --iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 chat_tinyllama_q8.mlir -o abc.vmfb -iree-hal-dump-executable-sources-to=dump/ | |
: 1737558680:0;ls | |
: 1737558681:0;cd dump | |
: 1737558682:0;ls | |
: 1737558689:0;vi module_prefill_bs1\$async_dispatch_9.mlir | |
: 1737559058:0;cd .. | |
: 1737559058:0;ls | |
: 1737559063:0;cd .. | |
: 1737559063:0;ls | |
: 1737559066:0;cd warpreduction | |
: 1737559066:0;ls | |
: 1737559068:0;vi test2.mlir | |
: 1737559117:0;iree-compile --iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test2.mlir -o abc.vmfb --mlir-print-ir-after-all 2> full.txt | |
: 1737559120:0;vi full.txt | |
: 1737559531:0;vi test_vector_distribute.mlir | |
: 1737559579:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_vector_distribute.mlir --mlir-print-ir-after-all 2> vector_full.txt | |
: 1737559583:0;vi vector_full.txt | |
: 1737559945:0;ls | |
: 1737559951:0;git clone https://github.com/bjacob/hip-matmul.git | |
: 1737559955:0;cd hip-matmul | |
: 1737559955:0;ls | |
: 1737559962:0;g++ mfma_on_cpu_threads.cc | |
: 1737559977:0;clang++ mfma_on_cpu_threads.cc | |
: 1737559982:0;clang++-18 mfma_on_cpu_threads.cc | |
: 1737559991:0;clang mfma_on_cpu_threads.cc | |
: 1737559999:0;clang-18 mfma_on_cpu_threads.cc | |
: 1737560031:0;clang++ --std=c++20 mfma_on_cpu_threads.cc | |
: 1737560035:0;clang++-18 --std=c++20 mfma_on_cpu_threads.cc | |
: 1737560038:0;./a.out | |
: 1737560182:0;ls | |
: 1737560186:0;vi mfma_on_cpu_threads.cc | |
: 1737560680:0;ls | |
: 1737560690:0;cd test/warpreduction | |
: 1737560691:0;ls | |
: 1737560703:0;cd hip-matmul | |
: 1737560704:0;ls | |
: 1737560707:0;clang++-18 --std=c++20 mfma_on_cpu_threads.cc | |
: 1737560709:0;./a.out | |
: 1737562601:0;gist-paste vector_full.txt | |
: 1737562624:0;vi vector_full.txt | |
: 1737571471:0;ls | |
: 1737571476:0;vi test_vector_distribute.mlir | |
: 1737571572:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_vector_distribute.mlir --mlir-print-ir-after-all 2> vector_full.txt | |
: 1737571577:0;vi vector_full.txt | |
: 1737633317:0;clear | |
: 1737633317:0;ls | |
: 1737633321:0;cd .. | |
: 1737633328:0;git clone https://github.com/ROCm/amd_matrix_instruction_calculator.git | |
: 1737633330:0;ls | |
: 1737633333:0;cd amd_matrix_instruction_calculator | |
: 1737633333:0;ls | |
: 1737633340:0;source ~/iree/.iree_venv/bin/activate | |
: 1737633344:0;python matrix_calculator.py | |
: 1737633348:0;pip install tabulate | |
: 1737633353:0;python matrix_calculator.py | |
: 1737633407:0;./matrix_calculator.py --architecture rdna3 --instruction v_wmma_f32_16x16x16_f16 --matrix-layout --B-matrix | |
: 1737633419:0;./matrix_calculator.py --architecture rdna3 --instruction v_wmma_f32_16x16x16_f16 --matrix-layout --C-matrix | |
: 1737633423:0;./matrix_calculator.py --architecture rdna3 --instruction v_wmma_f32_16x16x16_f16 --matrix-layout --A-matrix | |
: 1737633455:0;./matrix_calculator.py --architecture rdna3 --instruction v_wmma_f32_16x16x16_f16 --matrix-layout --A-matrix -csv | |
: 1737633473:0;./matrix_calculator.py --architecture rdna3 --instruction v_wmma_f32_16x16x16_f16 --matrix-layout --A-matrix --csv | |
: 1737633616:0;./matrix_calculator.py --architecture rdna3 --instruction v_wmma_f32_16x16x16_f16 --matrix-layout --C-matrix --csv | |
: 1737633649:0;./matrix_calculator.py --architecture rdna3 --instruction v_wmma_f32_16x16x16_f16 --matrix-layout --A-matrix --csv | |
: 1737638428:0;riree | |
: 1737638797:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-afer-all 2> full.txt | |
: 1737638799:0;vi full.txt | |
: 1737638808:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> full.txt | |
: 1737638811:0;vi full.txt | |
: 1737640481:0;ls | |
: 1737640485:0;vi test_vector_distribute.mlir | |
: 1737640814:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_vector_distribute.mlir --mlir-print-ir-after-all 2> vecmat_full.txt | |
: 1737640817:0;vi vector_full.txt | |
: 1737640838:0;vi test_vector_distribute.mlir | |
: 1737640855:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_vector_distribute.mlir --mlir-print-ir-after-all 2> vecmat_full.txt | |
: 1737640857:0;vi vecmat_full.txt | |
: 1737640921:0;vi test_vector_distribute.mlir | |
: 1737640933:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_vector_distribute.mlir --mlir-print-ir-after-all 2> vecmat_full.txt | |
: 1737640938:0;vi vecmat_full.txt | |
: 1737641126:0;riree | |
: 1737641202:0;vi test_vector_distribute.mlir | |
: 1737641237:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_vector_distribute.mlir --mlir-print-ir-after-all 2> vecmat_full.txt | |
: 1737641246:0;vi vecmat_full.txt | |
: 1737641302:0;ls | |
: 1737641305:0;vi before_layouts.mlir | |
: 1737641348:0;iree-opt --split-input-file --pass-pipeline='builtin.module(func.func(iree-llvmgpu-configure-tensor-layouts, canonicalize, cse))' before_layouts.mlir | |
: 1737641356:0;riree | |
: 1737641374:0;iree-opt --split-input-file --pass-pipeline='builtin.module(func.func(iree-llvmgpu-configure-tensor-layouts, canonicalize, cse))' before_layouts.mlir | |
: 1737641415:0;vi before_layouts.mlir | |
: 1737641629:0;riree | |
: 1737641697:0;iree-opt --split-input-file --pass-pipeline='builtin.module(func.func(iree-llvmgpu-configure-tensor-layouts, canonicalize, cse))' before_layouts.mlir | |
: 1737641788:0;riree | |
: 1737641804:0;iree-opt --split-input-file --pass-pipeline='builtin.module(func.func(iree-llvmgpu-configure-tensor-layouts, canonicalize, cse))' before_layouts.mlir | |
: 1737641929:0;riree | |
: 1737641945:0;iree-opt --split-input-file --pass-pipeline='builtin.module(func.func(iree-llvmgpu-configure-tensor-layouts, canonicalize, cse))' before_layouts.mlir | |
: 1737642892:0;ls | |
: 1737642895:0;cat test_vector_distribute.mlir | |
: 1737644363:0;ls | |
: 1737644371:0;vi test_vector.mlir | |
: 1737644396:0;ls | |
: 1737644418:0;vi test_vector.mlir | |
: 1737644451:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 vector_full.txt -o abc.vmfb --mlir-print-ir-after-all 2> full.txt --compile-from=executable-sources | |
: 1737644454:0;vi full.txt | |
: 1737644472:0;vi vector_full.txt | |
: 1737644497:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test_vector.mlir -o abc.vmfb --mlir-print-ir-after-all 2> full.txt --compile-from=executable-sources | |
: 1737644500:0;vi full.txt | |
: 1737644542:0;vi test_vector | |
: 1737644545:0;vi test_vector.mlir | |
: 1737644669:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test_vector.mlir -o abc.vmfb --mlir-print-ir-after-all 2> full.txt | |
: 1737644672:0;vi full.txt | |
: 1737644778:0;iree-compile --iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test_vector.mlir -o abc.vmfb --mlir-print-ir-after-all 2> full.txt | |
: 1737644782:0;vi full.txt | |
: 1737644872:0;riree | |
: 1737644947:0;iree-compile --iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test_vector.mlir -o abc.vmfb --mlir-print-ir-after-all 2> full.txt | |
: 1737644950:0;vi full.txt | |
: 1737645158:0;vi test_vector.mlir | |
: 1737645170:0;iree-compile --iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test_vector.mlir -o abc.vmfb --mlir-print-ir-after-all 2> full.txt | |
: 1737645387:0;iree-opt --split-input-file --iree-gpu-test-taret=gfx942 --iree-codeen-llvmpu-use-vector-distribution --pass-pipeline="builtin.module(iree-llvmpu-select-lowerin-stratey)" test_vector.mlir | |
: 1737645395:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codeen-llvmpu-use-vector-distribution --pass-pipeline="builtin.module(iree-llvmpu-select-lowerin-stratey)" test_vector.mlir | |
: 1737645403:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmpu-use-vector-distribution --pass-pipeline="builtin.module(iree-llvmpu-select-lowerin-stratey)" test_vector.mlir | |
: 1737645416:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --pass-pipeline="builtin.module(iree-llvmpu-select-lowerin-stratey)" test_vector.mlir | |
: 1737645423:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --pass-pipeline="builtin.module(iree-llvmpu-select-lowering-stratey)" test_vector.mlir | |
: 1737645428:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-stratey)" test_vector.mlir | |
: 1737645442:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" test_vector.mlir | |
: 1737645457:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" test_vector.mlir --debug 2> debug.txt | |
: 1737645459:0;vi debug.txt | |
: 1737645657:0;riree | |
: 1737645678:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" test_vector.mlir --debug 2> debug.txt | |
: 1737645681:0;vi debug.txt | |
: 1737646203:0;riree | |
: 1737646223:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" test_vector.mlir --debug 2> debug.txt | |
: 1737646460:0;riree | |
: 1737646483:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" test_vector.mlir --debug 2> debug.txt | |
: 1737651132:0;\ | |
: 1737651134:0;clear | |
: 1737651134:0;ls | |
: 1737651136:0;tmux attach -t 0 | |
: 1737651179:0;ls | |
: 1737651186:0;vi test_vector_distribute.mlir | |
: 1737651286:0;vi dump.txt | |
: 1737652632:0;vi test_vector_distribute.mlir | |
: 1737652724:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_vector_distribute.mlir | |
: 1737652753:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_vector_distribute.mlir 2> vector_distribute_dump.txt | |
: 1737652763:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_vector_distribute.mlir 2> vector_distribute_dump.txt -mlir-print-ir-after-all | |
: 1737652767:0;vi vector_distribute_dump.txt | |
: 1737652777:0;vi test_vector_distribute.mlir | |
: 1737652978:0;cat test.mlir | |
: 1737653112:0;vi test.mlir | |
: 1737653212:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737653216:0;vi warp_reduction_dump.txt | |
: 1737653530:0;2 | |
: 1737713139:0;clear | |
: 1737713140:0;ls | |
: 1737713146:0;tmux attach -t 0 | |
: 1737717286:0;riree | |
: 1737717321:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737717325:0;vi warp_reduction_dump.txt | |
: 1737717368:0;iree-compile iree-codegen-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737717371:0;vi warp_reduction_dump.txt | |
: 1737717377:0;iree-compile -iree-codegen-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737717379:0;vi warp_reduction_dump.txt | |
: 1737717390:0;iree-compile -iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737717395:0;vi warp_reduction_dump.txt | |
: 1737717423:0;vi strategy.mlir | |
: 1737717450:0;vi warp_reduction_dump.txt | |
: 1737717492:0;iree-opt --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737717628:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737717655:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir --debug | |
: 1737717733:0;ree | |
: 1737717734:0;riree | |
: 1737717753:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir --debug | |
: 1737717799:0;riree | |
: 1737717843:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir --debug | |
: 1737718132:0;riree | |
: 1737718154:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir --debug | |
: 1737718236:0;riree | |
: 1737718253:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737718325:0;riree | |
: 1737718437:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737718448:0;ree | |
: 1737718449:0;riree | |
: 1737718457:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737718466:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir --debug | |
: 1737718486:0;riree | |
: 1737718504:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir --debug | |
: 1737718961:0;riree | |
: 1737718979:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir --debug | |
: 1737721369:0;cd .. | |
: 1737721372:0;cd iree | |
: 1737721385:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/Passes.cpp | |
: 1737721404:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1737721418:0;riree | |
: 1737721439:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir --debug | |
: 1737721482:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737722108:0;riree | |
: 1737722132:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737722252:0;riree | |
: 1737722270:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737722442:0;riree | |
: 1737722500:0;iree-opt -iree-codegen-llvmgpu-use-vector-distribution=true --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737722526:0;vi gen.mlir | |
: 1737722555:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" gen.mlir 2> vector_distribute_dump.txt -mlir-print-ir-after-all | |
: 1737722563:0;vi vector_distribute_dump.txt | |
: 1737722587:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" gen.mlir 2> vector_distribute_dump.txt -mlir-print-ir-after-all | |
: 1737722599:0;ls | |
: 1737722606:0;vi test.mlir | |
: 1737722618:0;iree-compile -iree-codegen-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737722622:0;vi warp_reduction_dump.txt | |
: 1737722640:0;iree-compile -iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737722643:0;vi warp_reduction_dump.txt | |
: 1737722695:0;iree-opt --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737722847:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_vector_distribute.mlir 2> vector_distribute_dump.txt -mlir-print-ir-after-all | |
: 1737722858:0;vi dump.txt vector_distribute_dump.txt | |
: 1737722983:0;vi vector_distribute_dump.txt | |
: 1737723154:0;git ppf | |
: 1737723745:0;riree | |
: 1737724207:0;iree-opt --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737724221:0;ls | |
: 1737724227:0;vi gen.mlir | |
: 1737724247:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" gen.mlir 2> vector_distribute_dump.txt -mlir-print-ir-after-all | |
: 1737724254:0;vi vector_distribute_dump.txt | |
: 1737724273:0;iree-compile -iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737724279:0;vi warp_reduction_dump.txt | |
: 1737725717:0;mv warp_reduction_dump.txt vec_new.txt | |
: 1737725721:0;vi vector_distribute_dump.txt | |
: 1737725731:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_vector_distribute.mlir 2> vector_distribute_dump.txt -mlir-print-ir-after-all | |
: 1737725735:0;vi vector_distribute_dump.txt | |
: 1737725968:0;gist-paste vector_distribute_dump.txt | |
: 1737725976:0;vi test.mlir | |
: 1737727573:0;clear | |
: 1737727573:0;ls | |
: 1737734916:0;tmux attach -t 0 | |
: 1737738107:0;riree | |
: 1737738183:0;iree-opt --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737739390:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1737739418:0;riree | |
: 1737739436:0;iree-opt --split-input-file --iree-gpu-test-target=gfx908 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' strategy.mlir | |
: 1737739738:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1737739755:0;git ppf | |
: 1737739835:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1737739848:0;git ppf | |
: 1737740507:0;clear | |
: 1737740508:0;ls | |
: 1737897544:0;\ | |
c | |
: 1737897545:0;clear | |
: 1737897546:0;ls | |
: 1737897551:0;tmux attach -t 0 | |
: 1737902981:0;\ | |
\ | |
\ | |
: 1737902983:0;tmux attach -t 0 | |
: 1737904543:0;riree | |
: 1737904552:0;ls | |
: 1737904553:0;vi test.mlir | |
: 1737904576:0;iree-compile -iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737904579:0;vi warp_reduction_dump.txt | |
: 1737904717:0;riree | |
: 1737904737:0;iree-compile -iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737904741:0;vi warp_reduction_dump.txt | |
: 1737904883:0;riree | |
: 1737904944:0;iree-compile -iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737904948:0;vi warp_reduction_dump.txt | |
: 1737905009:0;riree | |
: 1737905037:0;iree-compile -iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737905041:0;vi warp_reduction_dump.txt | |
: 1737905074:0;riree | |
: 1737905258:0;iree-compile -iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737905262:0;vi warp_reduction_dump.txt | |
: 1737905522:0;riree | |
: 1737905677:0;iree-compile -iree-codegen-llvmgpu-use-vector-distribution=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737905682:0;vi warp_reduction_dump.txt | |
: 1737906296:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737906652:0;iree-opt --split-input-file --iree-gpu-test-target=gfx1100 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir --check-prefix=CDNA3 | |
: 1737906962:0;rriree | |
: 1737906963:0;riree | |
: 1737906984:0;iree-opt --split-input-file --iree-gpu-test-target=gfx1100 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir --check-prefix=CDNA3 | |
: 1737907048:0;riree | |
: 1737907066:0;iree-opt --split-input-file --iree-gpu-test-target=gfx1100 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir --check-prefix=CDNA3 | |
: 1737907334:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-llvmgpu-select-lowering-strategy, func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/reduction_pipeline_rocm.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/reduction_pipeline_rocm.mlir | |
: 1737907448:0;iree-opt --split-input-file --iree-gpu-test-target=gfx1100 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-llvmgpu-select-lowering-strategy, func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/reduction_pipeline_rocm.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/reduction_pipeline_rocm.mlir --check-prefix=CDNA3 | |
: 1737907461:0;riree | |
: 1737908202:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(iree-llvmgpu-select-lowering-strategy, func.func(iree-llvmgpu-lower-executable-target)))))" compiler/src/iree/compiler/Codegen/LLVMGPU/test/reduction_pipeline_rocm.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/reduction_pipeline_rocm.mlir | |
: 1737908235:0;iree-opt --split-input-file --iree-gpu-test-target=gfx1100 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir --check-prefix=CDNA3 | |
: 1737908245:0;iree-opt --split-input-file --iree-gpu-test-target=gfx1100 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | |
: 1737911095:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | |
: 1737911710:0;git lg | |
: 1737911721:0;git o main | |
: 1737911723:0;git stash | |
: 1737911725:0;git o main | |
: 1737911743:0;git ob correcttile | |
: 1737911749:0;git cp 3c36fb479e | |
: 1737911751:0;git ppf | |
: 1737911804:0;git-clang-format HEAD~ | |
: 1737911822:0;git ppf | |
: 1737912041:0;vi test.mlir | |
: 1737912056:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737912060:0;vi warp_reduction_dump.txt | |
: 1737912124:0;riree | |
: 1737912168:0;iree-compile --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737912172:0;vi warp_reduction_dump.txt | |
: 1737912194:0;clear | |
: 1737912194:0;ls | |
: 1737912383:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737912845:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1737912885:0;git ppf | |
: 1737914301:0;git-clang-format HEAD~ | |
: 1737914309:0;git ppf | |
: 1737915676:0;iree-compile --iree-opt-generalize-matmul=true --iree-hal-target-backends=rocm --iree-hip-target=gfx942 test.mlir -o abc.vmfb --mlir-print-ir-after-all 2> warp_reduction_dump.txt | |
: 1737915681:0;vi warp_reduction_dump.txt | |
: 1737967365:0;tmux attach -t 0 | |
: 1737967369:0;clear | |
: 1737967369:0;ls | |
: 1737980425:0;clear | |
: 1737980425:0;ls | |
: 1737980427:0;tmux attach -t 0 | |
: 1737980818:0;cat compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1737982384:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1737982567:0;riree | |
: 1737982632:0;git-clang-format HEAD~ | |
: 1737982639:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1737983225:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737983505:0;riree | |
: 1737983580:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | |
: 1737983905:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1737983927:0;riree | |
: 1737983945:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | |
: 1737984035:0;riree | |
: 1737984056:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | |
: 1737984203:0;riree | |
: 1737984226:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | |
: 1737984295:0;riree | |
: 1737984314:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | |
: 1737984341:0;iree-opt --pass-pipeline='builtin.module(iree-llvmcpu-select-lowering-strategy)' -split-input-file compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMCPU/test/select_x86_64_lowering_strategy.mlir | |
: 1737984365:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | |
: 1737984662:0;riree | |
: 1737984670:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | |
: 1737984740:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | |
: 1737984876:0;riree | |
: 1737984894:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_matvec.mlir | |
: 1737984901:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737985259:0;git ppf | |
: 1737985806:0;git-clang-format HEAD~ | |
: 1737985828:0;git ppf | |
: 1737986232:0;git branch | |
: 1737986243:0;git o newtiling | |
: 1737986250:0;git o main | |
: 1737986251:0;git puom | |
: 1737986262:0;git submodule update --init | |
: 1737986266:0;git o newtiling | |
: 1737986270:0;git rebase main | |
: 1737986338:0;git o main | |
: 1737986343:0;git lg | |
: 1737986348:0;git o main | |
: 1737986354:0;git rebase --abort | |
: 1737986355:0;git o main | |
: 1737986358:0;git branch | |
: 1737986365:0;git o tilesoftmax | |
: 1737986374:0;git rebase main | |
: 1737986777:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMCPU/LLVMCPUTileRootAndFuseProducerConsumer.cpp | |
: 1737987017:0;ls | |
: 1737987019:0;cd .. | |
: 1737987021:0;cd softmax | |
: 1737987022:0;ls | |
: 1737987024:0;vi test.mlir | |
: 1737987126:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host test.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1737987134:0;vi full_new.txt | |
: 1737987283:0;vi test.mlir | |
: 1737987343:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1 only-fuse-producer-input-operands=false}), canonicalize)" test.mlir | |
: 1737987372:0;riree | |
: 1737989597:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=1 only-fuse-producer-input-operands=false}), canonicalize)" test.mlir | |
: 1737989639:0;vi test.mlir | |
: 1737989926:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0 only-fuse-producer-input-operands=false}), canonicalize)" compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir --split-input-file | FileCheck-18 compiler/src/iree/compiler/Codegen/LLVMCPU/test/tile-root-fuse-consumer-producer.mlir | |
: 1737990165:0;git ppf | |
: 1737990481:0;clear | |
: 1737990482:0;ls | |
: 1737990997:0;git-clang-format HEAD~ | |
: 1737991008:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMCPU/LLVMCPUTileRootAndFuseProducerConsumer.cpp | |
: 1737991023:0;git ppf | |
: 1737991668:0;git o main | |
: 1737991679:0;git ob deprecatetile | |
: 1737991747:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737992176:0;git lg | |
: 1737992198:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1737992308:0;riree | |
: 1737992364:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1738002345:0;tmux attach -t 0 | |
: 1738002349:0;git o correcttile | |
: 1738002362:0;git stash | |
: 1738002865:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1738003403:0;riree | |
: 1738003459:0;git rebase main | |
: 1738003482:0;git submodule update --init | |
: 1738003485:0;git rebase main | |
: 1738003488:0;git submodule update --init | |
: 1738003491:0;riree | |
: 1738003511:0;git-clang-format HEAD~ | |
: 1738003513:0;git ppf | |
: 1738003549:0;riree | |
: 1738003964:0;clear | |
: 1738003964:0;ls | |
: 1738003967:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1738005837:0;clear | |
: 1738005838:0;ls | |
: 1738005933:0;tmux attach -t 0 | |
: 1738005939:0;git o main | |
: 1738005941:0;git puom | |
: 1738005951:0;clear | |
: 1738005951:0;ls | |
: 1738005958:0;git submodule update --init | |
: 1738005965:0;git ob bumpllvm | |
: 1738005966:0;clear | |
: 1738005966:0;ls | |
: 1738005973:0;cd third_party/llvm-project | |
: 1738005974:0;git lg | |
: 1738005980:0;git remote | |
: 1738006011:0;git remote add upstream [email protected]:llvm/llvm-project.git | |
: 1738006014:0;git fetch upstream | |
: 1738006071:0;cd ~/iree | |
: 1738006075:0;git remote add mahesh https://github.com/MaheshRavishankar/iree.git | |
: 1738006080:0;git fetch mahesh | |
: 1738006094:0;git o aa34a6ab299027ac31929173287e42db0dbdb06b | |
: 1738006095:0;clear | |
: 1738006096:0;ls | |
: 1738006103:0;cd .. | |
: 1738006103:0;ls | |
: 1738006106:0;cd .. | |
: 1738006106:0;ls | |
: 1738006151:0;git cp 66c536ab20831e72511cdc9a3d101a2e66613d18 | |
: 1738006156:0;git cp b9863466ee4872aa955973b5ae02b45d19deda84 | |
: 1738006166:0;CTEST_PARALLEL_LEVEL=64 cmake --build ~/iree-build --target iree-run-tests -j 32 | |
: 1738006329:0;git ppf | |
: 1738006345:0;git lg | |
: 1738008320:0;git o correcttile | |
: 1738008349:0;git submodule update --init | |
: 1738008364:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1738008376:0;git ppf | |
: 1738008383:0;git ob bumpllvm | |
: 1738008387:0;git o bumpllvm | |
: 1738008391:0;git submodule update --init | |
: 1738008397:0;riree | |
: 1738009198:0;git ppf | |
: 1738049124:0;tmux attach -t 0 | |
: 1738049127:0;clear | |
: 1738049127:0;ls | |
: 1738049134:0;clear | |
: 1738049135:0;ls | |
: 1738049140:0;cd .. | |
: 1738049140:0;ls | |
: 1738049149:0;vi test.mlir | |
: 1738049356:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host test.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1738049360:0;clear | |
: 1738049360:0;ls | |
: 1738049362:0;vi full_new.txt | |
: 1738049499:0;iree-compile --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=znver4 --iree-dispatch-creation-experimental-data-tiling --iree-opt-data-tiling=false test.mlir -o out1.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1738049504:0;vi full_new.txt | |
: 1738049626:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host test.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1738049633:0;vi full_new.txt | |
: 1738049926:0;vi | |
: 1738050857:0;iree-compile --help | fzf | |
: 1738050888:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host test.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt --iree-llvmcpu-enable-ukernels=false | |
: 1738050894:0;vi full_new.txt | |
: 1738051462:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host test.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1738051467:0;vi full_new.txt | |
: 1738051704:0;gist-paste full_new.txt | |
: 1738249470:0;exit | |
: 1738684354:0;clear | |
: 1738684355:0;ls | |
: 1738684363:0;clear | |
: 1738684364:0;ls | |
: 1738684372:0;tmux attach -t 0 | |
: 1738684560:0;ls | |
: 1738922355:0;\ | |
\ | |
: 1738922356:0;clear | |
: 1738922357:0;ls | |
: 1738922360:0;tmux ls | |
: 1738922363:0;tmux attach -t 0 | |
: 1738922368:0;clear | |
: 1738922368:0;ls | |
: 1738922377:0;cd onnx_perf | |
: 1738922377:0;ls | |
: 1738922381:0;vi attn_kernel.mlir | |
: 1738922384:0;vi decomposed_kernel.mlir | |
: 1738922567:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host decomposed.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1738922573:0;vi full_new.txt | |
: 1738922576:0;ls | |
: 1738922582:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host decomposed_kernel.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt | |
: 1738922603:0;iree-benchmark-module --module=abc.vmfb --function=attention --input=1x32x128x512xf32 --input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-task | |
: 1738922612:0;vi full_new.txt | |
: 1738922755:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host decomposed_kernel.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt --iree-hal-dump-executable-sources-to=dump/ | |
: 1738922763:0;cd dump | |
: 1738922764:0;ls | |
: 1738922772:0;vi module_attention_dispatch_3.mlir | |
: 1738922815:0;vi module_attention_dispatch_2.mlir | |
: 1738922842:0;vi module_attention_dispatch_1 | |
: 1738922846:0;vi module_attention_dispatch_1.mlir | |
: 1738924158:0;clear | |
: 1738924158:0;ls | |
: 1738924161:0;cd .. | |
: 1738924162:0;ls | |
: 1738924182:0;vi attn_kernel.mlir | |
: 1738925296:0;ls | |
: 1738925301:0;vi attn_kernel.mlir | |
: 1738925390:0;vi decomposed_kernel.mlir | |
: 1738925496:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host decomposed_kernel.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt --iree-hal-dump-executable-sources-to=dump/ | |
: 1738925504:0;cd dump | |
: 1738925504:0;ls | |
: 1738925558:0;vi module_attention_dispatch_3.mlir | |
: 1738926101:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host module_attention_dispatch_3.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt --iree-hal-dump-executable-sources-to=dump/ --compile-from=executable-sources | |
: 1738926106:0;vi full_new.txt | |
: 1738927307:0;ls | |
: 1738927314:0;unzip -d abc.vmfb | |
: 1738927316:0;ls | |
: 1738927320:0;unzip abc.vmfb | |
: 1738927322:0;ls | |
: 1738927327:0;vi module.fb | |
: 1738927337:0;cd .. | |
: 1738927339:0;ls | |
: 1738927341:0;unzip abc.vmfb | |
: 1738927352:0;vi module.fb | |
: 1738927573:0;ls | |
: 1738927578:0;iree-benchmark-module --module=abc.vmfb --function=attention --input=1x32x128x512xf32 --input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-task | |
: 1738927591:0;iree-benchmark-module --module=abc.vmfb --function=attention --input=1x32x128x512xf32 --input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-sync | |
: 1739174333:0;\ | |
: 1739174335:0;omz update | |
: 1739174337:0;clear | |
: 1739174337:0;ls | |
: 1739174340:0;tmux ls | |
: 1739174343:0;tmux attach -t 0 | |
: 1739174345:0;clear | |
: 1739174345:0;ls | |
: 1739174355:0;cd .. | |
: 1739174356:0;ls | |
: 1739174365:0;pwd | |
: 1739174367:0;htop | |
: 1739174370:0;clear | |
: 1739174370:0;ls | |
: 1739174376:0;git puom | |
: 1739174412:0;clear | |
: 1739174412:0;ls | |
: 1739174416:0;git fetch orogin | |
: 1739174421:0;git fetch origin | |
: 1739174434:0;git o origin/main | |
: 1739174436:0;clear | |
: 1739174436:0;ls | |
: 1739174439:0;git submodule update --init | |
: 1739174442:0;clear | |
: 1739174443:0;ls | |
: 1739174513:0;git remote add chi https://github.com/AmosLewis/iree.git | |
: 1739174520:0;git fetch chi | |
: 1739174546:0;git o chi/negf_f8tof32 | |
: 1739174552:0;git rebase origin/main | |
: 1739174558:0;clear | |
: 1739174559:0;ls | |
: 1739174560:0;git lg | |
: 1739174563:0;clear | |
: 1739174563:0;ls | |
: 1739174565:0;riree | |
: 1739174693:0;ls | |
: 1739174694:0;cd .. | |
: 1739174695:0;ls | |
: 1739174696:0;cd llvm-project | |
: 1739174696:0;ls | |
: 1739174697:0;vi | |
: 1739189548:0;riree | |
: 1739192171:0;biree | |
: 1739192388:0;riree | |
: 1739193934:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithToF32.cpp | |
: 1739193952:0;clear | |
: 1739193952:0;ls | |
: 1739193955:0;riree | |
: 1739194338:0;iree-opt --convert-unsupported-float-arith-to-f32 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739194361:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739194437:0;riree | |
: 1739194456:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739195140:0;clear | |
: 1739195140:0;ls | |
: 1739195152:0;git ob exp_f8 | |
: 1739195342:0;git ppf | |
: 1739195478:0;build_tools/bazel_to_cmake/bazel_to_cmake.py compiler/src/iree/compiler/Codegen/Common/BUILD.bazel | |
: 1739195517:0;build_tools/bazel_to_cmake/bazel_to_cmake.py compiler/src/iree/compiler/Codegen/Common/test/BUILD.bazel | |
: 1739195554:0;git ppf | |
: 1739195570:0;biree | |
: 1739195724:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739195844:0;clear | |
: 1739195844:0;ls | |
: 1739195941:0;clear | |
: 1739195942:0;ls | |
: 1739198376:0;cd .. | |
: 1739198378:0;cd test | |
: 1739198378:0;ls | |
: 1739198384:0;mkdir err_test | |
: 1739198385:0;clear | |
: 1739198385:0;ls | |
: 1739198450:0;cd test_err | |
: 1739198451:0;ls | |
: 1739198458:0;vi xyz.mlir | |
: 1739198518:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir xyz.mlir | |
: 1739198526:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 xyz.mlir | |
: 1739198655:0;ls | |
: 1739198658:0;vi xyz.mlir | |
: 1739198749:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 -iree-convert-to-rocdl xyz.mlir | |
: 1739198769:0;iree-opt -iree-gpu-test-target=gfx940 --iree-convert-unsupported-float-arith-to-f32 -iree-convert-to-rocdl xyz.mlir | |
: 1739198893:0;riree | |
: 1739198921:0;iree-opt -iree-gpu-test-target=gfx940 --iree-convert-unsupported-float-arith-to-f32 -iree-convert-to-rocdl xyz.mlir | |
: 1739198928:0;ls | |
: 1739198932:0;vi xyz.mlir | |
: 1739198947:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 xyz.mlir | |
: 1739198957:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 xyz.mlir > full.mlir | |
: 1739198959:0;vi full.mlir | |
: 1739198986:0;riree | |
: 1739199003:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 xyz.mlir > full.mlir | |
: 1739199005:0;vi full.mlir | |
: 1739199034:0;riree | |
: 1739199050:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 xyz.mlir > full.mlir | |
: 1739199051:0;vi full.mlir | |
: 1739199077:0;riree | |
: 1739199094:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 xyz.mlir > full.mlir | |
: 1739199103:0;vi full.mlir | |
: 1739199138:0;riree | |
: 1739199152:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 xyz.mlir > full.mlir | |
: 1739199162:0;riree | |
: 1739199176:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 xyz.mlir > full.mlir | |
: 1739199187:0;riree | |
: 1739199242:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 xyz.mlir > full.mlir | |
: 1739199301:0;riree | |
: 1739199316:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 xyz.mlir > full.mlir | |
: 1739199318:0;vi full.mlir | |
: 1739199328:0;iree-opt -iree-gpu-test-target=gfx940 --iree-convert-unsupported-float-arith-to-f32 -iree-convert-to-rocdl xyz.mlir | |
: 1739199344:0;riree | |
: 1739199358:0;iree-opt -iree-gpu-test-target=gfx940 --iree-convert-unsupported-float-arith-to-f32 -iree-convert-to-rocdl xyz.mlir | |
: 1739199403:0;riree | |
: 1739199415:0;iree-opt -iree-gpu-test-target=gfx940 --iree-convert-unsupported-float-arith-to-f32 -iree-convert-to-rocdl xyz.mlir | |
: 1739199457:0;riree | |
: 1739199475:0;iree-opt -iree-gpu-test-target=gfx940 --iree-convert-unsupported-float-arith-to-f32 -iree-convert-to-rocdl xyz.mlir | |
: 1739199496:0;riree | |
: 1739199510:0;iree-opt -iree-gpu-test-target=gfx940 --iree-convert-unsupported-float-arith-to-f32 -iree-convert-to-rocdl xyz.mlir | |
: 1739199524:0;riree | |
: 1739199536:0;iree-opt -iree-gpu-test-target=gfx940 --iree-convert-unsupported-float-arith-to-f32 -iree-convert-to-rocdl xyz.mlir | |
: 1739199543:0;ls | |
: 1739199553:0;vi xyz.mlir | |
: 1739209060:0;exit | |
: 1739258171:0;tmux attach -t 0 | |
: 1739258178:0;ls | |
: 1739258179:0;cd .. | |
: 1739258181:0;ls | |
: 1739258189:0;cd onnx_perf | |
: 1739258190:0;ls | |
: 1739258208:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-linalg-ext-convert-attention-to-online-attention,iree-linalg-ext-decompose-attention))" attn_kernel.mlir | |
: 1739258434:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host decomposed_kernel.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full_new.txt --iree-hal-dump-executable-sources-to=dump/ | |
: 1739258610:0;iree-benchmark-module --module=abc.vmfb --function=attention --input=1x32x128x512xf32 --input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-sync | |
: 1739258614:0;iree-benchmark-module --module=abc.vmfb --function=attention --input=1x32x128x512xf32 --input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-task | |
: 1739258789:0;ls | |
: 1739258797:0;vi attn_kernel.mlir | |
: 1739259389:0;ls | |
: 1739259392:0;vi attn_kernel.mlir | |
: 1739259657:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-linalg-ext-convert-attention-to-online-attention,iree-linalg-ext-decompose-attention))" attn_kernel.mlir | |
: 1739259665:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-linalg-ext-convert-attention-to-online-attention,iree-linalg-ext-decompose-attention))" attn_kernel.mlir > decomposed.mlir | |
: 1739259673:0;gist-paste decomposed.mlir | |
: 1739260044:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host attn_kernel.mlir -o abc.vmfb | |
: 1739260397:0;iree-benchmark-module --module=abc.vmfb --function=attention --input=1x32x64x96xf32 --input=1x32x128x512xf32 --input=1x32x128x512xf32 --device=local-task | |
: 1739260403:0;vi attn_kernel.mlir | |
: 1739276812:0;clear | |
: 1739276812:0;ls | |
: 1739276817:0;clear | |
: 1739276818:0;ls | |
: 1739276821:0;htop | |
: 1739276824:0;exit | |
: 1739301589:0;clear | |
: 1739301589:0;ls | |
: 1739301592:0;tmux attach -t 0 | |
: 1739301637:0;riree | |
: 1739340838:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithToF32.cpp | |
: 1739341366:0;biree | |
: 1739341609:0;riree | |
: 1739345178:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithToF32.cpp | |
: 1739345371:0;riree | |
: 1739345442:0;biree | |
: 1739345539:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithToF32.cpp | |
: 1739345594:0;riree | |
: 1739345832:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir xyz.mlir | |
: 1739345842:0;iree-opt --iree-convert-unsupported-float-arith-to-f32 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739345942:0;iree-opt --split-input-file --iree-convert-unsupported-float-arith-to-f32 ="source-types=bf16,f8E4M3FNUZ target-type=f32"compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739345969:0;iree-opt --split-input-file --iree-convert-unsupported-float-arith-to-f32 ="source-types=bf16,f8E4M3FNUZ target-type=f32" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739345995:0;iree-opt --split-input-file --iree-convert-unsupported-float-arith-to-f32= "source-types=bf16,f8E4M3FNUZ target-type=f32" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739346008:0;iree-opt --split-input-file --iree-convert-unsupported-float-arith-to-f32="source-types=bf16,f8E4M3FNUZ target-type=f32" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739346066:0;riree | |
: 1739346180:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32="source-types=bf16,f8E4M3FNUZ target-type=f32", cse))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739346219:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=bf16,f8E4M3FNUZ target-type=f32}, cse))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739346266:0;riree | |
: 1739346304:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=bf16,f8E4M3FNUZ target-type=f32}, cse))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739346357:0;riree | |
: 1739346490:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32 ="source-types=f8E4M3NUZ target-type=f32"))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739346498:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32="source-types=f8E4M3NUZ target-type=f32"))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739346511:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{"source-types=f8E4M3NUZ target-type=f32"}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739346533:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3NUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739346701:0;riree | |
: 1739347636:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3NUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739347949:0;riree | |
: 1739348128:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=bf16, f8E4M3NUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739348162:0;iree-opt --pass-pipeline="builtin.module(func.func("iree-convert-unsupported-float-arith-to-f32 =source-types=bf16, f8E4M3NUZ target-type=f32"))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739348172:0;iree-opt --pass-pipeline="builtin.module(func.func("iree-convert-unsupported-float-arith-to-f32=source-types=bf16, f8E4M3NUZ target-type=f32"))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739348728:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3NUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739348754:0;riree | |
: 1739348773:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3NUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739349023:0;riree | |
: 1739349210:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3NUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739349251:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3FNUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739349275:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=bf16,f8E4M3FNUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739350438:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithToF32.cpp | |
: 1739350450:0;riree | |
: 1739350473:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=bf16,f8E4M3FNUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739350486:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3FNUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739350647:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3FNUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithToF32.cpp | |
: 1739350678:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithToF32.cpp | |
: 1739350693:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739350739:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3FNUZ target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739350755:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739351423:0;biree | |
: 1739351622:0;riree | |
: 1739351779:0;rm -rf ~/iree-build | |
: 1739351783:0;biree | |
: 1739351982:0;riree | |
: 1739355569:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith-to-f32{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739355585:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | FileCheck-18 compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith_to_f32.mlir | |
: 1739355596:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739355789:0;riree | |
: 1739355856:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithToF32.cpp | |
: 1739355885:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithPass.cpp | |
: 1739356022:0;riree | |
: 1739356046:0;ls | |
: 1739356083:0;wget https://sharkpublic.blob.core.windows.net/sharkpublic/chi/llama/atten/f8_attn_chi_castf32_roctorch.mlir | |
: 1739356112:0;iree-compile f8_attn_chi_castf32_roctorch.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--iree-opt-strip-assertions | |
: 1739356188:0;riree | |
: 1739356518:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/Passes.cpp | |
: 1739356528:0;riree | |
: 1739356550:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/Passes.cpp | |
: 1739356554:0;iree-compile f8_attn_chi_castf32_roctorch.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--iree-opt-strip-assertions | |
: 1739356595:0;riree | |
: 1739356617:0;iree-compile f8_attn_chi_castf32_roctorch.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--iree-opt-strip-assertions | |
: 1739356657:0;riree | |
: 1739356680:0;iree-compile f8_attn_chi_castf32_roctorch.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--iree-opt-strip-assertions | |
: 1739356734:0;iree-compile f8_attn_chi_castf32_roctorch.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--iree-opt-strip-assertions 2> err.txt | |
: 1739356743:0;vi err.txt | |
: 1739356862:0;vi disp.mlir | |
: 1739356883:0;iree-compile f8_attn_chi_castf32_roctorch.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--compile-from=executable-sources \\ | |
--iree-opt-strip-assertions 2> err.txt | |
: 1739356890:0;iree-compile disp.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--compile-from=executable-sources \\ | |
--iree-opt-strip-assertions 2> err.txt | |
: 1739356893:0;vi err.txt | |
: 1739356909:0;riree | |
: 1739356925:0;iree-compile f8_attn_chi_castf32_roctorch.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--compile-from=executable-sources \\ | |
--iree-opt-strip-assertions 2> err.txt | |
: 1739356935:0;iree-compile f8_attn_chi_castf32_roctorch.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--iree-opt-strip-assertions 2> err.txt | |
: 1739356944:0;vi err.txt | |
: 1739357033:0;git-clang-format HEAD~ | |
: 1739357037:0;git ppf | |
: 1739367234:0;build_tools/bazel_to_cmake/bazel_to_cmake.py compiler/src/iree/compiler/Codegen/Common/test/BUILD.bazel | |
: 1739367277:0;riree | |
: 1739367309:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739367322:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739367363:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith{source-types=f8E4M3FNUZ, bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739367454:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" %s compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739367473:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739367498:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | FileCheck third_party/llvm-project/mlir/test/Dialect/Arith/emulate-unsupported-floats.mlir | |
: 1739367520:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith{source-types=f8E4M3FNUZ,bf16 target-type=f32}))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739367564:0;git ppf | |
: 1739367768:0;clear | |
: 1739367768:0;ls | |
: 1739370993:0;git ppf | |
: 1739371066:0;clear | |
: 1739371066:0;ls | |
: 1739371080:0;exit | |
: 1739380064:0;tmux attach -t 0 | |
: 1739380065:0;ls | |
: 1739380075:0;vi test.mlir | |
: 1739380272:0;iree-opt --help | fzf | |
: 1739380307:0;iree-opt -enable-generalize-matmul test.mlir | |
: 1739380324:0;iree-opt -linalg-generalize-named-ops test.mlir | |
: 1739380710:0;vi disp.mlir | |
: 1739388827:0;riree | |
: 1739389462:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithPass.cpp | |
: 1739389616:0;riree | |
: 1739389948:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/Passes.td | |
: 1739390051:0;riree | |
: 1739390267:0;sz | |
: 1739390271:0;source ~/iree/.iree_venv/bin/activate | |
: 1739390272:0;clear | |
: 1739390273:0;ls | |
: 1739390291:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" third_party/llvm-project/mlir/test/Dialect/Arith/emulate-unsupported-floats.mlir | |
: 1739390412:0;riree | |
: 1739390430:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" third_party/llvm-project/mlir/test/Dialect/Arith/emulate-unsupported-floats.mlir | |
: 1739390492:0;riree | |
: 1739390509:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" third_party/llvm-project/mlir/test/Dialect/Arith/emulate-unsupported-floats.mlir | |
: 1739390714:0;ls | |
: 1739390721:0;vi f8_attn_chi_castf32_roctorch.mlir | |
: 1739390730:0;ls | |
: 1739390737:0;vi attn_kernel.mlir | |
: 1739391158:0;iree-compile attn_kernel.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
-mlir-print-ir-after-all \\ | |
--iree-opt-strip-assertions 2> err.txt | |
: 1739391163:0;vi err.txt | |
: 1739391248:0;iree-compile disp.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
-mlir-print-ir-after-all \\ | |
--iree-opt-strip-assertions 2> err.txt | |
: 1739391261:0;vi err.txt | |
: 1739391351:0;iree-compile attn_kernel.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
-mlir-print-ir-after-all \\ | |
--iree-opt-strip-assertions 2> err.txt | |
: 1739391355:0;vi err.txt | |
: 1739392305:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739392461:0;ls | |
: 1739392468:0;cat compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739392508:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739392709:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739392731:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739392841:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739393065:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithPass.cpp | |
: 1739393305:0;riree | |
: 1739393377:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739393384:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithPass.cpp | |
: 1739393456:0;git ppf | |
: 1739393814:0;riree | |
: 1739393984:0;git-clang-format HEAD~ | |
: 1739393987:0;git ppf | |
: 1739395293:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithPass.cpp | |
: 1739395333:0;riree | |
: 1739395434:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithPass.cpp | |
: 1739395510:0;riree | |
: 1739395535:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739395549:0;git ppf | |
: 1739395930:0;git-clang-format HEAD~ | |
: 1739395933:0;git ppf | |
: 1739396144:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithPass.cpp | |
: 1739396174:0;riree | |
: 1739396309:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739396337:0;git ppf | |
: 1739428177:0;tmux ls | |
: 1739428182:0;tmux attach -t 0 | |
: 1739431064:0;clang-format -i compiler/src/iree/compiler/Codegen/Common/ConvertUnsupportedFloatArithPass.cpp | |
: 1739431215:0;riree | |
: 1739431237:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739431335:0;buildifier compiler/src/iree/compiler/Codegen/Common/BUILD.bazel | |
: 1739431350:0;ls | |
: 1739431377:0;go install github.com/bazelbuild/buildtools/buildifier@latest\ | |
\ | |
: 1739431386:0;sudo apt-get install goland | |
: 1739431389:0;sudo apt-get install golangh | |
: 1739431391:0;sudo apt-get install golang | |
: 1739431405:0;gold dd | |
: 1739431414:0;sudo apt-get install --fix-broken | |
: 1739431431:0;sudo apt-get update | |
: 1739431444:0;sudo apt-get install golang | |
: 1739431449:0;sudo apt-get install golang --fix-broken | |
: 1739431466:0;pip install buildifier | |
: 1739431486:0;bazel build | |
: 1739431507:0;wget https://github.com/bazelbuild/buildtools/releases/download/v8.0.3/buildifier-linux-amd64 | |
: 1739431526:0;mv buildifier-linux-amd64 buildifier | |
: 1739431534:0;chmod +x buildifier | |
: 1739431534:0;clear | |
: 1739431535:0;ls | |
: 1739431544:0;./buildifier compiler/src/iree/compiler/Codegen/Common/BUILD.bazel | |
: 1739431587:0;mv buildifier ../ | |
: 1739431594:0;git-clang-format HEAD~ | |
: 1739431599:0;git ppf | |
: 1739431690:0;build_tools/bazel_to_cmake/bazel_to_cmake.py compiler/src/iree/compiler/Codegen/Common/BUILD.bazel | |
: 1739431702:0;git ppf | |
: 1739448176:0;tmux attach -t 0 | |
: 1739448247:0;git ppf | |
: 1739448253:0;git-clang-format HEAD~ | |
: 1739448272:0;git ppf | |
: 1739452052:0;iree-opt --split-input-file --pass-pipeline="builtin.module(func.func(iree-convert-unsupported-float-arith))" compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | FileCheck compiler/src/iree/compiler/Codegen/Common/test/convert_unsupported_float_arith.mlir | |
: 1739452067:0;git ppf | |
: 1739473401:0;exi\ | |
: 1739473411:0;exit | |
: 1739529139:0;tmux ls | |
: 1739529142:0;tmux attach -t 0 | |
: 1739529151:0;git fetch origin | |
: 1739529165:0;git o origin/main | |
: 1739529166:0;clear | |
: 1739529166:0;ls | |
: 1739529174:0;git submodule update --init | |
: 1739529177:0;riree | |
: 1739529693:0;ls | |
: 1739529765:0;iree-compile f8_attn_chi_castf32_roctorch.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
-mlir-print-ir-after-all \\ | |
--iree-hal-dump-executable-sources-to=dump/ \\ | |
--iree-opt-strip-assertions 2> err.txt | |
: 1739529777:0;iree-compile f8_attn_chi_castf32_roctorch.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--iree-hal-dump-executable-sources-to=dump/ \\ | |
--iree-opt-strip-assertions 2> err.txt | |
: 1739530012:0;vi err.txt | |
: 1739530038:0;cd dump | |
: 1739530039:0;ls | |
: 1739530043:0;vi module_decode_bs1\$async_dispatch_19.mlir | |
: 1739530060:0;cd .. | |
: 1739530061:0;ls | |
: 1739530064:0;vi err.txt | |
: 1739530106:0;cd dump | |
: 1739530106:0;ls | |
: 1739530109:0;vi module_decode_bs1\$async_dispatch_19.mlir | |
: 1739530129:0;gist-paste module_decode_bs1\$async_dispatch_19.mlir | |
: 1739530174:0;ls | |
: 1739530234:0;cd .. | |
: 1739530235:0;ls | |
: 1739530236:0;cd dump | |
: 1739530237:0;ls | |
: 1739530261:0;mv module_decode_bs1\$async_dispatch_19.mlir ../dmp.mlir | |
: 1739530263:0;cd .. | |
: 1739530263:0;ls | |
: 1739530283:0;iree-compile dmp.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--iree-opt-strip-assertions | |
: 1739530300:0;iree-compile dmp.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--compile-from=executable-sources \\ | |
--iree-opt-strip-assertions | |
: 1739530307:0;vi err.txt | |
: 1739530315:0;cd dump | |
: 1739530315:0;ls | |
: 1739530335:0;vi module_prefill_bs1\$async_dispatch_119.mlir | |
: 1739530345:0;vi ../err.txt | |
: 1739530358:0;cd .. | |
: 1739530359:0;ls | |
: 1739530365:0;rm -rf dump | |
: 1739530375:0;iree-compile f8_attn_chi_castf32_roctorch.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--iree-hal-dump-executable-sources-to=dump/ \\ | |
--iree-opt-strip-assertions 2> err.txt | |
: 1739530593:0;cd dump | |
: 1739530593:0;ls | |
: 1739530606:0;vi module_prefill_bs1\$async_dispatch_19.mlir | |
: 1739530772:0;iree-compile module_prefill_bs1\$async_dispatch_19.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--compile-from=executable-sources \\ | |
--iree-opt-strip-assertions | |
: 1739530817:0;gist-paste module_prefill_bs1\$async_dispatch_19.mlir | |
: 1739531082:0;iree-compile module_prefill_bs1\$async_dispatch_19.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=f8_attn_chi_castf32_roctorch.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--iree-dispatch-creation-enable-aggressive-fusion=true \\ | |
--iree-global-opt-propagate-transposes=true \\ | |
--iree-opt-aggressively-propagate-transposes=true \\ | |
--iree-opt-data-tiling=false \\ | |
--iree-preprocessing-pass-pipeline='builtin.module(util.func(iree-preprocessing-generalize-linalg-matmul-experimental))' \\ | |
--iree-hal-indirect-command-buffers=true \\ | |
--iree-stream-resource-memory-model=discrete \\ | |
--iree-hal-memoization=true \\ | |
--compile-from=executable-sources \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
--iree-opt-strip-assertions | |
: 1739531085:0;vi err.txt | |
: 1739531203:0;cd .. | |
: 1739531204:0;ls | |
: 1739531212:0;vi before_vector_distribute.mlir | |
: 1739531262:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmgpu-vector-lowering,canonicalize,cse))" --split-input-file before_vector_distribute.mlir | |
: 1739531492:0;ls | |
: 1739531493:0;cd dump | |
: 1739531494:0;ls | |
: 1739531496:0;vi err.txt | |
: 1739531522:0;cd .. | |
: 1739531522:0;ls | |
: 1739531532:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmgpu-vector-distribute,canonicalize,cse))" --split-input-file before_vector_distribute.mlir | |
: 1739531551:0;gist-paste before_vector_distribute.mlir | |
: 1739531601:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmgpu-vector-distribute,canonicalize,cse))" --split-input-file before_vector_distribute.mlir | |
: 1739531746:0;riree | |
: 1739531801:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmgpu-vector-distribute,canonicalize,cse))" --split-input-file before_vector_distribute.mlir 2> err.txt | |
: 1739531805:0;vi err.txt | |
: 1739531844:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmgpu-vector-distribute,canonicalize,cse))" --split-input-file before_vector_distribute.mlir --debug 2> err.txt | |
: 1739531849:0;vi err.txt | |
: 1739541929:0;clear | |
: 1739541929:0;ls | |
: 1739541935:0;clear | |
: 1739541935:0;ls | |
: 1739541944:0;exit | |
: 1739542036:0;clear | |
: 1739542037:0;ls | |
: 1739542038:0;tmux ls | |
: 1739542042:0;tmux attach -t 0 | |
: 1739542071:0;clear | |
: 1739542072:0;ls | |
: 1739542087:0;git fetch pashu | |
: 1739542130:0;git o pashu/deprecatewarp | |
: 1739542139:0;git rebase origin/main | |
: 1739542141:0;clear | |
: 1739542142:0;ls | |
: 1739542144:0;git ppf | |
: 1739542159:0;git ob deprecatewarp | |
: 1739542167:0;git branch -D deprecatewarp | |
: 1739542169:0;git ob deprecatewarp | |
: 1739542170:0;git ppf | |
: 1739542183:0;clear | |
: 1739542183:0;ls | |
: 1739542183:0;vi | |
: 1739542388:0;ls | |
: 1739542389:0;cd .. | |
: 1739542390:0;ls | |
: 1739542401:0;mkdir vectormulti | |
: 1739542403:0;cd vectormulti | |
: 1739542404:0;ls | |
: 1739542407:0;vi test.mlir | |
: 1739542465:0;clear | |
: 1739542465:0;ls | |
: 1739542568:0;riree | |
: 1739542705:0;iree-compile test.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--compile-from=executable-sources \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
--iree-opt-strip-assertions | |
: 1739542723:0;vi test.mlir | |
: 1739542729:0;vi err.txt | |
: 1739542790:0;vi test_new.mlir | |
: 1739542833:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739542865:0;riree | |
: 1739542887:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739542925:0;riree | |
: 1739543026:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739543114:0;riree | |
: 1739543136:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739543688:0;riree | |
: 1739544760:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739544804:0;riree | |
: 1739544971:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739545085:0;riree | |
: 1739545105:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739545118:0;riree | |
: 1739545139:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739545192:0;riree | |
: 1739545215:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739545502:0;riree | |
: 1739545529:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739547032:0;riree | |
: 1739552954:0;vi | |
: 1739552973:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739554368:0;riree | |
: 1739554405:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739554487:0;riree | |
: 1739554508:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739787705:0;tmux attach -t 0 | |
: 1739787775:0;ls | |
: 1739787779:0;vi make.mlir | |
: 1739787803:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir > make.mlir | |
: 1739787805:0;vi make.mlir | |
: 1739788729:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir | |
: 1739788755:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir --debug | |
: 1739788947:0;vi make.mlir | |
: 1739788965:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir --debug | |
: 1739788979:0;vi make.mlir | |
: 1739788989:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir --debug | |
: 1739789011:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir --debug -mlir-print-ir-after-all 2> full.txt | |
: 1739789013:0;vi full.txt | |
: 1739789020:0;riree | |
: 1739789047:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789049:0;vi full.txt | |
: 1739789077:0;iree-opt --iree-codegen-llvmgpu-use-vector-distribution --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789079:0;vi full.txt | |
: 1739789193:0;iree-opt --iree-codegen-llvmgpu-use-vector-distribution--pass-pipeline=builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target))))) make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789206:0;iree-opt --pass-pipeline=builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target))))) make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789216:0;iree-opt --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789226:0;vi full.txt | |
: 1739789283:0;vi make | |
: 1739789285:0;vi make.mlir | |
: 1739789300:0;iree-opt --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789309:0;iree-opt --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt -mlir-timing | |
: 1739789323:0;vi full.txt | |
: 1739789451:0;vi new.mlir | |
: 1739789464:0;iree-opt --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" new.mlir -mlir-print-ir-after-all 2> full.txt -mlir-timing | |
: 1739789482:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" new.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789489:0;vi make.mlir new.mlir | |
: 1739789626:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" makje.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789631:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789633:0;vi full.txt | |
: 1739789696:0;vi make.mlir | |
: 1739789718:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789720:0;vi full.txt | |
: 1739789729:0;vi make.mlir | |
: 1739789766:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789768:0;vi full.txt | |
: 1739789891:0;vi make.mlir | |
: 1739789915:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789917:0;vi full.txt | |
: 1739789936:0;vi make.mlir | |
: 1739789965:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739789968:0;vi full.txt | |
: 1739790126:0;vi make.mlir | |
: 1739790136:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739790138:0;vi full.txt | |
: 1739790302:0;vi make.mlir | |
: 1739790357:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739790365:0;vi make.mlir | |
: 1739790371:0;vi full.txt | |
: 1739790422:0;vi make.mlir | |
: 1739790485:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739790490:0;vi full.txt | |
: 1739792345:0;vi make.mlir | |
: 1739792361:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739792363:0;vi full.txt | |
: 1739792554:0;vi make.mlir | |
: 1739792616:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739792618:0;vi full.txt | |
: 1739792725:0;vi make.mlir | |
: 1739792736:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739792753:0;vi full.txt | |
: 1739792941:0;gist-paste make.mlir | |
: 1739792991:0;vi make.mlir | |
: 1739793123:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739793133:0;vi full.txt | |
: 1739793242:0;vi make.mlir | |
: 1739793361:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739793367:0;vi full.txt | |
: 1739793586:0;vi make.mlir | |
: 1739794262:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739794265:0;vi full.txt | |
: 1739794287:0;vi make.mlir | |
: 1739794326:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739794336:0;ls | |
: 1739794338:0;vi full.txt | |
: 1739794427:0;vi make.mlir | |
: 1739794551:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739794555:0;vi full.txt | |
: 1739794777:0;riree | |
: 1739794807:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739794883:0;vi make.mlir | |
: 1739795174:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739795206:0;ls | |
: 1739795208:0;vi make.mlir | |
: 1739795219:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739796083:0;vi make.mlir | |
: 1739800816:0;gist-paste make.mlir | |
: 1739801209:0;vi make.mlir | |
: 1739801762:0;cat make.mlir | |
: 1739801830:0;vi make.mlir | |
: 1739801924:0;vi ex.mlir | |
: 1739801982:0;iree-compile ex.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--compile-from=executable-sources \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1739801985:0;vi ex.mlir | |
: 1739801989:0;vi err.txt | |
: 1739802004:0;iree-compile ex.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1739802008:0;vi err.txt | |
: 1739802047:0;git stash | |
: 1739802052:0;riree | |
: 1739802076:0;iree-compile ex.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1739802079:0;vi err.txt | |
: 1739802418:0;vi make.mlir | |
: 1739802449:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739802722:0;git stash pop | |
: 1739803005:0;ls | |
: 1739803008:0;vi err.txt | |
: 1739805697:0;ls | |
: 1739805699:0;vi make.mlir | |
: 1739805757:0;clear | |
: 1739805757:0;ls | |
: 1739805920:0;vi err.txt | |
: 1739806194:0;riree | |
: 1739806346:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739806393:0;vi make.mlir | |
: 1739806427:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739806455:0;vi make.mlir | |
: 1739806514:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739806516:0;vi full.txt | |
: 1739806532:0;vi make.mlir | |
: 1739806564:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739806574:0;vi make.mlir | |
: 1739806584:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739806604:0;vi make.mlir | |
: 1739806683:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739807714:0;vi make.mlir | |
: 1739807783:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739807787:0;vi full.txt | |
: 1739807797:0;vi make.mlir | |
: 1739807836:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739807839:0;vi make.mlir | |
: 1739807849:0;vi full.txt | |
: 1739807941:0;vi make.mlir | |
: 1739807952:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739807954:0;vi full.txt | |
: 1739807968:0;vi make.mlir | |
: 1739808606:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739808622:0;vi make.mlir | |
: 1739808787:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739808790:0;vi make.mlir | |
: 1739808848:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739808851:0;vi full.txt | |
: 1739808863:0;vi make.mlir | |
: 1739808891:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739808896:0;vi full.txt | |
: 1739808956:0;vi make.mlir | |
: 1739808989:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739808991:0;vi full.txt | |
: 1739809041:0;vi make.mlir | |
: 1739809063:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739809100:0;vi make.mlir | |
: 1739809127:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739809157:0;vi make.mlir | |
: 1739809187:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739809190:0;vi make.mlir | |
: 1739809202:0;ree | |
: 1739809204:0;riree | |
: 1739809220:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739809226:0;vi full.txt | |
: 1739809233:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739809273:0;vi full.txt | |
: 1739809276:0;ls | |
: 1739809280:0;vi test.mlir | |
: 1739809283:0;ls | |
: 1739809289:0;vi make.mlir | |
: 1739811937:0;riree | |
: 1739813218:0;gist-paste make.mlir | |
: 1739857192:0;clear | |
: 1739857192:0;ls | |
: 1739857197:0;tmux attach -t 0 | |
: 1739857509:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1739857830:0;vi make.mlir | |
: 1739858045:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1739860574:0;vi make.mlir | |
: 1739860652:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739860658:0;vi full.txt | |
: 1739860672:0;vi make.mlir | |
: 1739860704:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739870703:0;vi make.mlir | |
: 1739871883:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1739873784:0;riree | |
: 1739874155:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739874240:0;riree | |
: 1739874259:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739874371:0;riree | |
: 1739874393:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739874437:0;riree | |
: 1739874457:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739874509:0;riree | |
: 1739874530:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739874724:0;riree | |
: 1739874744:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739878417:0;riree | |
: 1739878896:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739878952:0;riree | |
: 1739878998:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739879189:0;riree | |
: 1739879209:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739879281:0;riree | |
: 1739879336:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739879533:0;riree | |
: 1739879555:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739880083:0;riree | |
: 1739880104:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739880259:0;riree | |
: 1739880290:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739880698:0;ree | |
: 1739880699:0;riree | |
: 1739880718:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739880823:0;riree | |
: 1739880841:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739880911:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1739880997:0;riree | |
: 1739881031:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739881152:0;riree | |
: 1739881170:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739881203:0;riree | |
: 1739881222:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739881327:0;riree | |
: 1739881347:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739881386:0;riree | |
: 1739881405:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739881443:0;vi make.mlir | |
: 1739881520:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739881523:0;vi full.txt | |
: 1739881532:0;ls | |
: 1739881534:0;vi make.mlir | |
: 1739881551:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739881555:0;vi full.txt | |
: 1739881564:0;vi make.mlir | |
: 1739881735:0;riree | |
: 1739881757:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739881829:0;riree | |
: 1739881874:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739882072:0;riree | |
: 1739882097:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739882286:0;riree | |
: 1739882326:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739882699:0;riree | |
: 1739882717:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739882787:0;riree | |
: 1739882808:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739883016:0;riree | |
: 1739883051:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739883136:0;riree | |
: 1739883275:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739883994:0;riree | |
: 1739888669:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739888968:0;riree | |
: 1739889007:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739889601:0;vi make.mlir | |
: 1739889688:0;riree | |
: 1739889709:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739890252:0;riree | |
: 1739890335:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739890501:0;riree | |
: 1739890521:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739890912:0;riree | |
: 1739890931:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739890966:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir > new.mlir | |
: 1739890968:0;vi new.mlir | |
: 1739891000:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" new.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739891013:0;vi make.mlir new.mlir | |
: 1739891074:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" new.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1739891110:0;vi make.mlir | |
: 1739891433:0;ls | |
: 1739891446:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir 2> err.txt | |
: 1739891451:0;vi err.txt | |
: 1739891825:0;riree | |
: 1739891852:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739891912:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' new.mlir | |
: 1739891922:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test.mlir | |
: 1739891932:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1739891968:0;ls | |
: 1739891976:0;wget https://gist.github.com/IanWood1/948a753821f8aa8dc07288c903778fb5 | |
: 1739891981:0;ls | |
: 1739891983:0;vi 948a753821f8aa8dc07288c903778fb5 | |
: 1739891986:0;rm 948a753821f8aa8dc07288c903778fb5 | |
: 1739891997:0;wget https://gist.githubusercontent.com/IanWood1/948a753821f8aa8dc07288c903778fb5/raw/7f8460f76c92725ea50d0468af0985cdee3e8281/bad-uncollapsed.mlir | |
: 1739891999:0;ls | |
: 1739892027:0;iree-compile bad-uncollapsed.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1739892036:0;ls | |
: 1739892039:0;ls -lh | |
: 1739892045:0;vi err.txt | |
: 1739892726:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1739893111:0;riree | |
: 1739893268:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1739893344:0;rm full.txt | |
: 1739893388:0;git-clang-format HEAD~ | |
: 1739893399:0;riree | |
: 1739893459:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1739893463:0;vi err.txt | |
: 1739893549:0;riree | |
: 1739893587:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1739893590:0;vi err.txt | |
: 1739893626:0;git ppf | |
: 1739894023:0;vi orig.mlir | |
: 1739894038:0;iree-compile orig.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1739894042:0;vi err.txt | |
: 1739988173:0;\ | |
: 1739988178:0;tmux attach -t 0 | |
: 1739988186:0;wget https://gist.githubusercontent.com/IanWood1/e1a4fb466e382bb968c5cf9685924bca/raw/89b98a445be5bcb52f64d95ef2fc13e13479d669/model.mlir | |
: 1739988188:0;ls | |
: 1739988199:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1739988214:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip\ | |
: 1739988305:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1739988372:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1739988384:0;vi err.txt | |
: 1739988401:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1739988436:0;ls | |
: 1739988455:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1739988466:0;cd dump | |
: 1739988467:0;ls | |
: 1739988475:0;vi compiled_clip_encode_prompts\$async_dispatch_178.mlir | |
: 1739988512:0;gist-paste compiled_clip_encode_prompts\$async_dispatch_178.mlir | |
: 1739988531:0;ls | |
: 1739988548:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1739988564:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1739988567:0;vi err.txt | |
: 1740032953:0;\ | |
: 1740032955:0;tmux attach -t 0 | |
: 1740032959:0;ls | |
: 1740032971:0;wget hal.executable public @encode_prompts$async_dispatch_104 {\ | |
hal.executable.variant public @rocm_hsaco_fb target(<"rocm", "rocm-hsaco-fb", {abi = "hip", iree.gpu.target = #iree_gpu.target<arch = "gfx942", features = "", wgp = <compute = fp64|fp32|fp16|int64|int32|int16|int8, storage = b64|b32|b16|b8, subgroup = shuffle|arithmetic, dot = dp4xi8toi32, mma = [<MFMA_F32_16x16x4_F32>, <MFMA_F32_16x16x16_F16>, <MFMA_F32_32x32x8_F16>, <MFMA_F64_16x16x4_F64>, <MFMA_F32_16x16x16_BF16>, <MFMA_F32_32x32x8_BF16>, <MFMA_F32_16x16x32_F8E5M2FNUZ>, <MFMA_F32_16x16x32_F8E5M2FNUZ_F8E4M3FNUZ>, <MFMA_F32_16x16x32_F8E4M3FNUZ>, <MFMA_F32_16x16x32_F8E4M3FNUZ_F8E5M2FNUZ>, <MFMA_F32_32x32x16_F8E5M2FNUZ>, <MFMA_F32_32x32x16_F8E5M2FNUZ_F8E4M3FNUZ>, <MFMA_F32_32x32x16_F8E4M3FNUZ>, <MFMA_F32_32x32x16_F8E4M3FNUZ_F8E5M2FNUZ>, <MFMA_I32_16x16x32_I8>, <MFMA_I32_32x32x16_I8>], subgroup_size_choices = [64], max_workgroup_sizes = [1024, 1024, 1024], max_thread_count_per_workgroup = 1024, max_workgroup_memory_bytes = 65536, max_workgroup_counts = [2147483647, 2147483647, 2147483647], max_load_instruction_bits = 128, simds_per_wgp = 4, vgpr_space_bits = 16384>>, ukernels = "none", waves_per_eu = 2 : i64}>) {\ | |
hal.executable.export public @encode_prompts$async_dispatch_104_softmax_20x64x64xf32_generic ordinal(0) layout(#hal.pipeline.layout<constants = 2, bindings = [#hal.pipeline.binding<storage_buffer, "ReadOnly|Indirect">, #hal.pipeline.binding<storage_buffer, ReadOnly>, #hal.pipeline.binding<storage_buffer, Indirect>], flags = Indirect>) {\ | |
^bb0(%arg0: \ | |
%x, %y, %z = flow.dispatch.workgroup_count_from_slice \ | |
hal.return %x, %y, %z : index, index, index\ | |
}\ | |
builtin.module {\ | |
func.func @encode_prompts$async_dispatch_104_softmax_20x64x64xf32_generic() {\ | |
%c98304 = arith.constant 98304 : index\ | |
%0 = hal.interface.constant.load layout(<constants = 2, bindings = [#hal.pipeline.binding<storage_buffer, "ReadOnly|Indirect">, #hal.pipeline.binding<storage_buffer, ReadOnly>, #hal.pipeline.binding<storage_buffer, Indirect>], flags = Indirect>) ordinal(0) : i32\ | |
%1 = hal.interface.constant.load layout(<constants = 2, bindings = [#hal.pipeline.binding<storage_buffer, "ReadOnly|Indirect">, #hal.pipeline.binding<storage_buffer, ReadOnly>, #hal.pipeline.binding<storage_buffer, Indirect>], flags = Indirect>) ordinal(1) : i32\ | |
%2 = arith.index_castui %0 : i32 to index\ | |
%3 = arith.index_castui %1 : i32 to index\ | |
%4:2 = util.assume.int \ | |
%2[<umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>, <umin = 1277952, umax = 1277952, udiv = 1277952>], \ | |
%3[<umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 950272, umax = 950272, udiv = 950272>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>, <umin = 1114112, umax = 1114112, udiv = 1114112>]\ | |
: index, index\ | |
%5 = hal.interface.binding.subspan layout(<constants = 2, bindings = [#hal.pipeline.binding<storage_buffer, "ReadOnly|Indirect">, #hal.pipeline.binding<storage_buffer, ReadOnly>, #hal.pipeline.binding<storage_buffer, Indirect>], flags = Indirect>) binding(0) alignment(64) offset(%4#0) flags("ReadOnly|Indirect") : !flow.dispatch.tensor<readonly:tensor<20x64x64xf32>>\ | |
%6 = hal.interface.binding.subspan layout(<constants = 2, bindings = [#hal.pipeline.binding<storage_buffer, "ReadOnly|Indirect">, #hal.pipeline.binding<storage_buffer, ReadOnly>, #hal.pipeline.binding<storage_buffer, Indirect>], flags = Indirect>) binding(1) alignment(64) offset(%c98304) flags(ReadOnly) : !flow.dispatch.tensor<readonly:tensor<64x64xf16>>\ | |
%7 = hal.interface.binding.subspan layout(<constants = 2, bindings = [#hal.pipeline.binding<storage_buffer, "ReadOnly|Indirect">, #hal.pipeline.binding<storage_buffer, ReadOnly>, #hal.pipeline.binding<storage_buffer, Indirect>], flags = Indirect>) binding(2) alignment(64) offset(%4#1) flags(Indirect) : !flow.dispatch.tensor<writeonly:tensor<20x64x64xf16>>\ | |
%8 = flow.dispatch.tensor.load %5, offsets = [0, 0, 0], sizes = [20, 64, 64], strides = [1, 1, 1] : !flow.dispatch.tensor<readonly:tensor<20x64x64xf32>> -> tensor<20x64x64xf32>\ | |
%9 = flow.dispatch.tensor.load %6, offsets = [0, 0], sizes = [64, 64], strides = [1, 1] : !flow.dispatch.tensor<readonly:tensor<64x64xf16>> -> tensor<64x64xf16>\ | |
%10 = tensor.empty() : tensor<20x64x64xf16>\ | |
%11 = tensor.empty() : tensor<20x64x64xf32>\ | |
%12 = linalg.generic {indexing_maps = [affine_map<(d0, d1, d2) -> (d0, d1, d2)>, affine_map<(d0, d1, d2) -> (d1, d2)>, affine_map<(d0, d1, d2) -> (d0, d1, d2)>], iterator_types = ["parallel", "parallel", "parallel"]} ins(%8, %9 : tensor<20x64x64xf32>, tensor<64x64xf16>) outs(%11 : tensor<20x64x64xf32>) {\ | |
^bb0(%in: f32, %in_0: f16, %out: f32):\ | |
%15 = arith.truncf %in : f32 to f16\ | |
%16 = arith.addf %15, %in_0 : f16\ | |
%17 = arith.extf %16 : f16 to f32\ | |
linalg.yield %17 : f32\ | |
} -> tensor<20x64x64xf32>\ | |
%13 = linalg.softmax dimension(2) ins(%12 : tensor<20x64x64xf32>) outs(%11 : tensor<20x64x64xf32>) -> tensor<20x64x64xf32>\ | |
%14 = linalg.generic {indexing_maps = [affine_map<(d0, d1, d2) -> (d0, d1, d2)>, affine_map<(d0, d1, d2) -> (d0, d1, d2)>], iterator_types = ["parallel", "parallel", "parallel"]} ins(%13 : tensor<20x64x64xf32>) outs(%10 : tensor<20x64x64xf16>) {\ | |
^bb0(%in: f32, %out: f16):\ | |
%15 = arith.truncf %in : f32 to f16\ | |
linalg.yield %15 : f16\ | |
} -> tensor<20x64x64xf16>\ | |
flow.dispatch.tensor.store %14, %7, offsets = [0, 0, 0], sizes = [20, 64, 64], strides = [1, 1, 1] : tensor<20x64x64xf16> -> !flow.dispatch.tensor<writeonly:tensor<20x64x64xf16>>\ | |
return\ | |
}\ | |
}\ | |
}\ | |
} | |
: 1740032977:0;vi new.mlir | |
: 1740032990:0;iree-compile new.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740032993:0;vi err.txt | |
: 1740033472:0;iree-compile new.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740033476:0;vi err.txt | |
: 1740036600:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1740036802:0;riree | |
: 1740036942:0;iree-compile new.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740036945:0;vi err.txt | |
: 1740037411:0;riree | |
: 1740037433:0;iree-compile new.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740037436:0;vi err.txt | |
: 1740038737:0;riree | |
: 1740038757:0;iree-compile new.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740038760:0;vi err.txt | |
: 1740038954:0;riree | |
: 1740038974:0;iree-compile new.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740038976:0;vi err.txt | |
: 1740039018:0;iree-compile new.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--compile-from=executable-sources \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740039021:0;vi err.txt | |
: 1740039034:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1740039036:0;ls | |
: 1740039037:0;cd .. | |
: 1740039038:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1740039074:0;iree-opt -iree-codegen-vector-distribute-on-generics --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1740039096:0;iree-opt -iree-llvmgpu-codegen-test-vector-distribute-on-generics --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1740039105:0;iree-opt -iree-llvmgpu-codegen-test-vector-distribution-on-generics --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1740039117:0;iree-opt -iree-codegen-llvmgpu-test-vector-distribution-on-generics --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir | |
: 1740039178:0;iree-opt -iree-codegen-llvmgpu-test-vector-distribution-on-generics --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir > check_this.mlir | |
: 1740039208:0;ls | |
: 1740039219:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1740039226:0;vi err.txt | |
: 1740039317:0;ls | |
: 1740039319:0;cd dump | |
: 1740039320:0;ls | |
: 1740039328:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740039351:0;vi err.txt | |
: 1740039529:0;riree | |
: 1740039549:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740039572:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
: 1740039583:0;ls | |
: 1740039588:0;vi err.txt | |
: 1740039593:0;vi new.mlir | |
: 1740039603:0;iree-compile new.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--compile-from=executable-sources \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740039606:0;vi err.txt | |
: 1740039819:0;riree | |
: 1740039830:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1740039856:0;riree | |
: 1740040004:0;iree-compile new.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--compile-from=executable-sources \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740040007:0;vi err.txt | |
: 1740040068:0;ls | |
: 1740040069:0;cd .. | |
: 1740040069:0;ls | |
: 1740040077:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740040111:0;ls | |
: 1740040130:0;clear | |
: 1740040130:0;ls | |
: 1740041669:0;vi model.mlir | |
: 1740041940:0;riree | |
: 1740041947:0;ls | |
: 1740041949:0;cd test | |
: 1740041950:0;ls | |
: 1740041953:0;cd warpreduction | |
: 1740041954:0;ls | |
: 1740042355:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1740042597:0;riree | |
: 1740042620:0;ls | |
: 1740042630:0;cd .. | |
: 1740042630:0;ls | |
: 1740042632:0;cd vectormulti | |
: 1740042633:0;ls | |
: 1740042635:0;wget https://raw.githubusercontent.com/nod-ai/sdxl-scripts/refs/heads/vinayakdsci/add-other-batched-inputs/int8-model/base_ir/punet_07_18.mlir | |
: 1740042639:0;ls | |
: 1740042646:0;mv punet_07_18.mlir punet.mlir | |
: 1740042647:0;clear | |
: 1740042648:0;ls | |
: 1740042656:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740042784:0;htop | |
: 1740042798:0;iree-compile punet.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740042968:0;riree | |
: 1740042987:0;iree-compile punet.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740042993:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740043261:0;ls | |
: 1740043262:0;cd dump | |
: 1740043262:0;ls | |
: 1740043267:0;vi module_main\$async_dispatch_256.mlir | |
: 1740043301:0;exit | |
: 1740043307:0;vi module_main\$async_dispatch_248.mlir | |
: 1740043327:0;grep vectordistribute | |
: 1740043355:0;vi module_main\$async_dispatch_2589.mlir | |
: 1740043398:0;riree | |
: 1740043423:0;cd .. | |
: 1740043423:0;ls | |
: 1740043429:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740043472:0;riree | |
: 1740043487:0;rm -rf dump | |
: 1740043493:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740043669:0;ls | |
: 1740043670:0;cd dump | |
: 1740043671:0;ls | |
: 1740043677:0;vi module_main\$async_dispatch_2589.mlir | |
: 1740043691:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740043724:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
mlir-print-ir-after-all 2> err.txt | |
: 1740043726:0;vi err.txt | |
: 1740043732:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740043734:0;vi err.txt | |
: 1740043926:0;riree | |
: 1740043947:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740043948:0;vi err.txt | |
: 1740044273:0;riree | |
: 1740044297:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740044299:0;vi err.txt | |
: 1740044595:0;riree | |
: 1740044617:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740044619:0;vi err.txt | |
: 1740044666:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740044670:0;vi err.txt | |
: 1740044789:0;riree | |
: 1740044821:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740044823:0;vi err.txt | |
: 1740045293:0;riree | |
: 1740045315:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740045317:0;vi err.txt | |
: 1740045418:0;riree | |
: 1740045438:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740045440:0;vi err.txt | |
: 1740045474:0;riree | |
: 1740045494:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740045496:0;vi err.txt | |
: 1740132122:0;\ | |
: 1740132126:0;tmux attach -t 0 | |
: 1740132152:0;riree | |
: 1740132231:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740132233:0;vi err.txt | |
: 1740132849:0;riree | |
: 1740132869:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740132871:0;vi err.txt | |
: 1740133114:0;riree | |
: 1740133134:0;iree-compile module_main\$async_dispatch_2589.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740133136:0;vi err.txt | |
: 1740133174:0;riree | |
: 1740133202:0;cd .. | |
: 1740133202:0;ls | |
: 1740133215:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740133269:0;cd dump | |
: 1740133269:0;ls | |
: 1740133273:0;vi compiled_clip_encode_prompts\$async_dispatch_187.mlir | |
: 1740133290:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_187.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740133316:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_187.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> full.txt | |
: 1740133318:0;vi full.txt | |
: 1740133545:0;riree | |
: 1740133566:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_187.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> full.txt | |
: 1740133569:0;vi full.txt | |
: 1740133583:0;cd .. | |
: 1740133583:0;ls | |
: 1740133587:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740133635:0;cd dump | |
: 1740133635:0;ls | |
: 1740133644:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740133657:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1740133659:0;vi err.txt | |
: 1740133671:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740133673:0;vi err.txt | |
: 1740133680:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740133682:0;vi err.txt | |
: 1740134104:0;riree | |
: 1740134145:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
--mlir-print-ir-after-all 2> err.txt | |
: 1740134148:0;vi err.txt | |
: 1740134172:0;cd .. | |
: 1740134172:0;ls | |
: 1740134178:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740134214:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740134232:0;vi err.txt | |
: 1740134273:0;cd dump | |
: 1740134274:0;ls | |
: 1740134303:0;iree-compile module_main\$async_dispatch_1.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740134328:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740134330:0;vi err.txt | |
: 1740134346:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740134349:0;vi err.txt | |
: 1740134606:0;riree | |
: 1740134643:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740134647:0;vi err.txt | |
: 1740144649:0;tmux attach -t 0 | |
: 1740154833:0;ls | |
: 1740154835:0;cd .. | |
: 1740154835:0;ls | |
: 1740154838:0;vi test_this_now.mlir | |
: 1740154843:0;ls | |
: 1740154847:0;vi test_this_now.mlir | |
: 1740154872:0;iree-opt -iree-codegen-llvmgpu-test-vector-distribution-on-generics --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir > check_this.mlir | |
: 1740154874:0;vi check_this.mlir | |
: 1740154910:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1740154921:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1740154939:0;vi make.mlir | |
: 1740154955:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir | |
: 1740154969:0;vi test_this_now.mlir | |
: 1740155080:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir | |
: 1740155090:0;vi test_this_now.mlir | |
: 1740155126:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir | |
: 1740155138:0;vi test_this_now.mlir | |
: 1740155159:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir | |
: 1740155199:0;vi test_this_now.mlir | |
: 1740155209:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir | |
: 1740155212:0;vi test_this_now.mlir | |
: 1740155225:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir | |
: 1740155236:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1740155238:0;vi full.txt | |
: 1740155522:0;vi test_this_now.mlir | |
: 1740155838:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1740155841:0;vi full.txt | |
: 1740155884:0;vi test_this_now.mlir | |
: 1740156435:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1740156437:0;vi full.txt | |
: 1740156468:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1740156496:0;vi make.mlir test_this_now.mlir | |
: 1740156597:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1740156604:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1740156606:0;vi full.txt | |
: 1740156688:0;vi test_this_now.mlir | |
: 1740156709:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1740156711:0;vi full.txt | |
: 1740156719:0;vi make.mlir | |
: 1740156903:0;vi test_this_now.mlir | |
: 1740156974:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" make.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1740156981:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir -mlir-print-ir-after-all 2> full.txt | |
: 1740156984:0;vi full.txt | |
: 1740157015:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir --debug 2> full.txt | |
: 1740157017:0;vi full.txt | |
: 1740157282:0;riree | |
: 1740157309:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740157324:0;vi err.txt | |
: 1740157391:0;ls | |
: 1740157404:0;vi test_this_now.mlir | |
: 1740157441:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir --debug 2> full.txt | |
: 1740157468:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir | |
: 1740157517:0;ls | |
: 1740157542:0;riree | |
: 1740157582:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740157595:0;vi err.txt | |
: 1740157612:0;vi test_this_now.mlir | |
: 1740157619:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir | |
: 1740157625:0;vi test_this_now.mlir | |
: 1740157759:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir | |
: 1740157783:0;vi test_this_now.mlir | |
: 1740157808:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir | |
: 1740157834:0;vi make.mlir | |
: 1740157968:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir | |
: 1740158091:0;ls | |
: 1740158094:0;vi test_this_now.mlir | |
: 1740158114:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir | |
: 1740158180:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir --debug 2> full.txt | |
: 1740158182:0;vi full.txt | |
: 1740158663:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir --debug 2> full.txt -mlir-print-ir-after-all | |
: 1740158665:0;vi full.txt | |
: 1740158674:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full.txt -mlir-print-ir-after-all | |
: 1740158675:0;vi full.txt | |
: 1740159828:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740159831:0;vi full.txt | |
: 1740159913:0;gist-paste full.txt | |
: 1740160443:0;ls | |
: 1740160455:0;vi test_ | |
: 1740160458:0;vi test_this_now.mlir | |
: 1740160515:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740160518:0;vi full.txt | |
: 1740160544:0;vi test.mlir | |
: 1740160559:0;vi test_this_now.mlir | |
: 1740160593:0;iree-opt -iree-codegen-llvmgpu-test-vector-distribution-on-generics --split-input-file --iree-gpu-test-target=gfx942 --pass-pipeline='builtin.module(iree-llvmgpu-select-lowering-strategy)' test_new.mlir > check_this.mlir | |
: 1740160595:0;vi check_this.mlir | |
: 1740160620:0;vi test_this_now.mlir | |
: 1740160643:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740160645:0;vi full.txt | |
: 1740160930:0;riree | |
: 1740160943:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740161038:0;riree | |
: 1740161051:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740161054:0;vi full.txt | |
: 1740161068:0;vi test_this_now.mlir | |
: 1740161114:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740161116:0;vi ffull | |
: 1740161119:0;vi full.txt | |
: 1740161148:0;vi test_this_now.mlir | |
: 1740161167:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740161170:0;vi test_this_now.mlir | |
: 1740161173:0;vi full.txt | |
: 1740161745:0;vi test_this_now.mlir | |
: 1740161753:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740161755:0;vi full.txt | |
: 1740162213:0;cat full.txt | |
: 1740162412:0;vi test_this_now.mlir | |
: 1740162431:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740162491:0;vi test_this_now.mlir | |
: 1740162558:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740162561:0;vi full_err.txt | |
: 1740162741:0;riree | |
: 1740162761:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740162764:0;vi full_err.txt | |
: 1740162952:0;riree | |
: 1740162975:0;ls | |
: 1740162982:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740162994:0;vi err.txt | |
: 1740163021:0;rm -rf dump | |
: 1740163023:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740164212:0;vi err.txt | |
: 1740164271:0;cd dump | |
: 1740164271:0;ls | |
: 1740164274:0;vi compiled_clip_encode_prompts\$async_dispatch_179.mlir | |
: 1740164328:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_179.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740164330:0;vi err.txt | |
: 1740164362:0;riree | |
: 1740164381:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_179.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740164384:0;vi err.txt | |
: 1740164389:0;cd .. | |
: 1740164390:0;ls | |
: 1740164396:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740164409:0;vi err.txt | |
: 1740164426:0;cd dump | |
: 1740164426:0;ls | |
: 1740164434:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_187.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740164436:0;vi err.txt | |
: 1740164459:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_187.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740164461:0;vi err.txt | |
: 1740164839:0;vi compiled_clip_encode_prompts\$async_dispatch_187.mlir | |
: 1740164847:0;vi err.txt | |
: 1740165067:0;vi test_softmax.mlir | |
: 1740165079:0;mv test_softmax.mlir ../ | |
: 1740165081:0;cd .. | |
: 1740165081:0;ls | |
: 1740165089:0;vi test_softmax.mlir test_this_now.mlir | |
: 1740165159:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_softmax.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740165162:0;vi full | |
: 1740165165:0;vi full_err.txt | |
: 1740165172:0;vi test_softmax.mlir | |
: 1740165210:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_softmax.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740165317:0;ls | |
: 1740165321:0;vi bad-uncollapsed.mlir | |
: 1740165337:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" bad-uncollapsed.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740165342:0;ls | |
: 1740165351:0;vi test_softmax.mlir | |
: 1740165370:0;iree-compile test_softmax.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740165372:0;vi err.txt | |
: 1740165394:0;iree-compile test_this_now.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740165397:0;vi err.txt | |
: 1740165403:0;vi test_this_now.mlir | |
: 1740165412:0;vi err.txt | |
: 1740165768:0;riree | |
: 1740165791:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740165804:0;vi err.txt | |
: 1740165847:0;cd dump | |
: 1740165847:0;ls | |
: 1740165850:0;vi compiled_clip_encode_prompts\$async_dispatch_179.mlir | |
: 1740165876:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740165878:0;vi err.txt | |
: 1740165890:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt -mlir-print-ir-after-all | |
: 1740165894:0;vi err.txt | |
: 1740166090:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt -mlir-print-ir-after-all | |
: 1740166093:0;vi err.txt | |
: 1740166252:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt -mlir-print-ir-after-all | |
: 1740166254:0;vi err.txt | |
: 1740166842:0;riree | |
: 1740166931:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt -mlir-print-ir-after-all | |
: 1740166934:0;vi err.txt | |
: 1740167198:0;riree | |
: 1740167210:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt -mlir-print-ir-after-all | |
: 1740167219:0;vi err.txt | |
: 1740167292:0;cd .. | |
: 1740167292:0;ls | |
: 1740167296:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740167322:0;vi err.txt | |
: 1740167328:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ | |
: 1740167449:0;htop | |
: 1740167466:0;cd dump | |
: 1740167466:0;ls | |
: 1740167469:0;cd .. | |
: 1740167470:0;ls | |
: 1740167471:0;rm -rf dump | |
: 1740167499:0;ls | |
: 1740167518:0;riree | |
: 1740167544:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740167556:0;vi err.txt | |
: 1740167575:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740167621:0;vi err.txt | |
: 1740167638:0;vi test_softmax.mlir | |
: 1740167673:0;vi test_new.mlir | |
: 1740167678:0;vi test_this_now.mlir | |
: 1740167693:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740167697:0;vi full_err.txt | |
: 1740167704:0;vi test_softmax.mlir | |
: 1740167726:0;vi full_err.txt | |
: 1740167834:0;cd dump | |
: 1740167835:0;ls | |
: 1740167837:0;cd .. | |
: 1740167840:0;rm -rf dump | |
: 1740167852:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1740167889:0;vi err.txt | |
: 1740167915:0;ls | |
: 1740167917:0;cd dump | |
: 1740167917:0;ls | |
: 1740167922:0;vi compiled_clip_encode_prompts\$async_dispatch_2.mlir | |
: 1740167935:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt -mlir-print-ir-after-all | |
: 1740167948:0;cd .. | |
: 1740167948:0;ls | |
: 1740167951:0;vi err.txt | |
: 1740167996:0;cd dump | |
: 1740167996:0;ls | |
: 1740167998:0;vi err.txt | |
: 1740168221:0;cd .. | |
: 1740168221:0;ls | |
: 1740168222:0;vi err.txt | |
: 1740168395:0;ls | |
: 1740168400:0;vi err.txt | |
: 1740168406:0;ls | |
: 1740168410:0;vi test_this_now.mlir | |
: 1740168536:0;gist-paste test_this_now.mlir | |
: 1740168569:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740168574:0;vi test_this_now.mlir | |
: 1740168590:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740168852:0;cat test_this_now.mlir | |
: 1740169136:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740169420:0;vi test_this_now.mlir | |
: 1740169423:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1740169426:0;vi full | |
: 1740169430:0;vi full_err.txt | |
: 1740470371:0;\ | |
: 1740470373:0;clear | |
: 1740470373:0;ls | |
: 1740470376:0;s | |
: 1740470377:0;ls | |
: 1740470381:0;tmux ls | |
: 1740470383:0;tmux attach -t 0 | |
: 1741006295:0;ssh [email protected] | |
: 1741006302:0;ssh [email protected] | |
: 1741006312:0;htop | |
: 1741006314:0;clear | |
: 1741006314:0;ls | |
: 1741006317:0;tmux attach -t 0 | |
: 1741006707:0;riree | |
: 1741006951:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1741006956:0;vi full_err.txt | |
: 1741007064:0;riree | |
: 1741007437:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1741007440:0;vi full_err.txt | |
: 1741080961:0;riree | |
: 1741080970:0;vi test_ | |
: 1741080975:0;vi test_this_now.mlir | |
: 1741081002:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1741081039:0;vi test_this_now.mlir | |
: 1741081065:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-use-vector-distribution --iree-llvmgpu-enable-prefetch=true --pass-pipeline="builtin.module(hal.executable(hal.executable.variant(builtin.module(func.func(iree-llvmgpu-lower-executable-target)))))" test_this_now.mlir 2> full_err.txt -mlir-print-ir-after-all -mlir-disable-threading | |
: 1741081384:0;riree | |
: 1741081407:0;ls | |
: 1741081417:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741081430:0;vi err.txt | |
: 1741081460:0;ls | |
: 1741081462:0;cd dump | |
: 1741081462:0;ls | |
: 1741081465:0;vi compiled_clip_encode_prompts\$async_dispatch_10.mlir | |
: 1741081485:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741081512:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \ 2> err.txt | |
: 1741081516:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741081518:0;vi err.txt | |
: 1741081908:0;riree | |
: 1741081918:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741081920:0;vi err.txt | |
: 1741082079:0;riree | |
: 1741082098:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741082100:0;vi err.txt | |
: 1741082161:0;riree | |
: 1741082174:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741082176:0;vi err.txt | |
: 1741082511:0;riree | |
: 1741082531:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741082533:0;vi err.txt | |
: 1741082603:0;riree | |
: 1741082614:0;ls | |
: 1741082617:0;cd .. | |
: 1741082617:0;ls | |
: 1741082622:0;vi test_new.mlir | |
: 1741082646:0;iree-compile test_now.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1741082648:0;vi xyz.txt | |
: 1741082657:0;iree-compile test_new.mlir -o out1.vmfb --compile-from=executable-sources -mlir-print-ir-after-all 2> xyz.txt | |
: 1741082660:0;vi xyz.txt | |
: 1741082685:0;vi punet.mlir | |
: 1741082707:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741082996:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1741083001:0;vi err.txt | |
: 1741083091:0;ls | |
: 1741083093:0;cd dump | |
: 1741083094:0;ls | |
: 1741083095:0;cd .. | |
: 1741083095:0;ls | |
: 1741083097:0;vi test_softmax.mlir | |
: 1741083106:0;iree-compile test_softmax.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741083108:0;vi err.txt | |
: 1741083127:0;vi test_softmax.mlir | |
: 1741083137:0;cd .. | |
: 1741083139:0;cd vectormulti | |
: 1741083140:0;ls | |
: 1741083141:0;cd dump | |
: 1741083141:0;ls | |
: 1741083149:0;vi module_main\$async_dispatch_10.mlir | |
: 1741083161:0;vi compiled_clip_encode_prompts\$async_dispatch_10.mlir | |
: 1741083174:0;_ | |
: 1741083191:0;mv compiled_clip_encode_prompts\$async_dispatch_10.mlir ../ | |
: 1741083192:0;cd .. | |
: 1741083192:0;ls | |
: 1741083200:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741083202:0;vi err.txt | |
: 1741083918:0;riree | |
: 1741083941:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741083943:0;vi err.txt | |
: 1741084002:0;riree | |
: 1741084015:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741084017:0;vi err.txt | |
: 1741084366:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip | |
: 1741084723:0;ls | |
: 1741084727:0;vi test_softmax.mlir | |
: 1741085044:0;vi xyz.txt | |
: 1741085056:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741085058:0;vi err.txt | |
: 1741090293:0;cd .. | |
: 1741090294:0;ls | |
: 1741090299:0;vi now.mlir | |
: 1741090345:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' now.mlir | |
: 1741090354:0;vi now.mlir | |
: 1741090428:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host now.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1741090433:0;vi full.txt | |
: 1741090447:0;iree-compile --compile-from=executable-sources --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host now.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1741090449:0;vi full | |
: 1741090452:0;vi full.txt | |
: 1741090491:0;vi ir.mlir | |
: 1741090500:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups))' ir.mlir | |
: 1741090519:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall))' ir.mlir | |
: 1741090539:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-dispatch-using-forall))' ir.mlir | |
: 1741090573:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op))' ir.mlir | |
: 1741090966:0;riree | |
: 1741090986:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op))' ir.mlir | |
: 1741091198:0;riree | |
: 1741091820:0;iree-opt --pass-pipeline='builtin.module(func.func(iree-codegen-tile-and-distribute-to-workgroups-using-forall-op))' ir.mlir | |
: 1741091834:0;iree-compile --compile-from=executable-sources --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host now.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1741091909:0;git-clang-format HEAD~ | |
: 1741091956:0;git ppf | |
: 1741096036:0;cd vectormulti | |
: 1741096037:0;ls | |
: 1741096052:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741096055:0;vi err.txt | |
: 1741096964:0;riree | |
: 1741096979:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741096982:0;vi err.txt | |
: 1741097030:0;riree | |
: 1741097039:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741097041:0;vi err.txt | |
: 1741097090:0;vi send.mlir | |
: 1741097094:0;gist-paste send.mlir | |
: 1741099173:0;vi err.txt | |
: 1741104695:0;riree | |
: 1741104717:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741104720:0;vi err.txt | |
: 1741104798:0;ls | |
: 1741104802:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1741104807:0;vi err.txt | |
: 1741104815:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741104827:0;vi err.txt | |
: 1741104851:0;ls | |
: 1741104853:0;cd dump | |
: 1741104853:0;ls | |
: 1741104855:0;cd .. | |
: 1741104856:0;ls | |
: 1741104858:0;rm -rf dump | |
: 1741104859:0;clear | |
: 1741104860:0;ls | |
: 1741104862:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741105580:0;vi err.txt | |
: 1741166816:0;riree | |
: 1741166839:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1741166841:0;vi err.txt | |
: 1741166996:0;riree | |
: 1741167007:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1741167011:0;vi err.txt | |
: 1741167279:0;riree | |
: 1741167299:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1741167303:0;vi err.txt | |
: 1741167325:0;riree | |
: 1741167329:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1741167335:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741167348:0;vi err.txt | |
: 1741167365:0;cd dump | |
: 1741167365:0;ls | |
: 1741167368:0;vi compiled_clip_encode_prompts\$async_dispatch_178.mlir | |
: 1741167403:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741167405:0;vi err.txt | |
: 1741168052:0;riree | |
: 1741168061:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741168064:0;vi err.txt | |
: 1741168538:0;riree | |
: 1741168558:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741168560:0;vi err.txt | |
: 1741168754:0;riree | |
: 1741168775:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741168778:0;vi err.txt | |
: 1741168848:0;cd .. | |
: 1741168849:0;ls | |
: 1741168859:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_10.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt | |
: 1741168863:0;vi err.txt | |
: 1741168886:0;cd dump | |
: 1741168887:0;ls | |
: 1741168910:0;vi compiled_clip_encode_prompts\$async_dispatch_1.mlir | |
: 1741168924:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741168927:0;vi err.txt | |
: 1741169040:0;riree | |
: 1741169071:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741169073:0;vi err.txt | |
: 1741169091:0;riree | |
: 1741169113:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741169116:0;vi err.txt | |
: 1741169203:0;vi txt.txt | |
: 1741169207:0;cat txt.txt | |
: 1741169317:0;riree | |
: 1741169366:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741169368:0;vi err.txt | |
: 1741169398:0;rireee | |
: 1741169399:0;riree | |
: 1741169407:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741169416:0;vi err.txt | |
: 1741169422:0;cd .. | |
: 1741169423:0;ls | |
: 1741169428:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741169441:0;vi err.txt | |
: 1741169470:0;riree | |
: 1741170039:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741170052:0;vi err.txt | |
: 1741170079:0;ls | |
: 1741170080:0;cd dump | |
: 1741170081:0;ls | |
: 1741170088:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741170091:0;vi err.txt | |
: 1741170172:0;riree | |
: 1741170200:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741170202:0;vi err.txt | |
: 1741170244:0;riree | |
: 1741170263:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741170267:0;vi err.txt | |
: 1741170357:0;riree | |
: 1741170376:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741170379:0;vi err.txt | |
: 1741170405:0;riree | |
: 1741170429:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741170431:0;vi err.txt | |
: 1741171451:0;riree | |
: 1741171472:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741171474:0;vi err.txt | |
: 1741171540:0;riree | |
: 1741171549:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741171552:0;vi err.txt | |
: 1741171610:0;riree | |
: 1741171630:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741171636:0;vi err.txt | |
: 1741171662:0;riree | |
: 1741171683:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741171685:0;vi err.txt | |
: 1741172547:0;cd .. | |
: 1741172547:0;ls | |
: 1741172551:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1741172555:0;vi err.txt | |
: 1741172668:0;ls | |
: 1741172670:0;cd dump | |
: 1741172674:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741172677:0;vi err.txt | |
: 1741173044:0;riree | |
: 1741173065:0;cd .. | |
: 1741173065:0;ls | |
: 1741173068:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1741173071:0;vi err.txt | |
: 1741173127:0;riree | |
: 1741173141:0;iree-compile bad-uncollapsed.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all 2> err.txt \\ | |
: 1741173145:0;cd dump | |
: 1741173146:0;ls | |
: 1741173153:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741173156:0;vi err.txt | |
: 1741188636:0;riree | |
: 1741190025:0;cat err.txt | |
: 1741260376:0;git ppf | |
: 1741260383:0;git o main | |
: 1741260386:0;git puom | |
: 1741260394:0;git submodule update --init | |
: 1741260404:0;riree | |
: 1741260414:0;git ob typo | |
: 1741260504:0;git-clang-format HEAD~ | |
: 1741260507:0;git ppf | |
: 1741260968:0;git o deprecatewarp | |
: 1741261085:0;git submodule update --init | |
: 1741261088:0;riree | |
: 1741261098:0;ls | |
: 1741261101:0;vi err.txt | |
: 1741263208:0;ls | |
: 1741263236:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741263239:0;vi err.txt | |
: 1741263342:0;riree | |
: 1741263361:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741263369:0;vi err.txt | |
: 1741263517:0;riree | |
: 1741263546:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741263551:0;vi err.txt | |
: 1741263786:0;riree | |
: 1741263902:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741263905:0;vi err.txt | |
: 1741263949:0;riree | |
: 1741263968:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741263971:0;vi err.txt | |
: 1741265911:0;clear | |
: 1741265911:0;ls | |
: 1741265927:0;git stash | |
: 1741265933:0;git o main | |
: 1741265936:0;git submodule update --init | |
: 1741265943:0;git ob first_iter | |
: 1741265944:0;celar | |
: 1741265945:0;clear | |
: 1741265946:0;ls | |
: 1741265965:0;riree | |
: 1741267272:0;vi | |
: 1741269916:0;riree | |
: 1741270093:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741270095:0;vi err.txt | |
: 1741270104:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_178.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741270108:0;vi err.txt | |
: 1741270197:0;cd .. | |
: 1741270197:0;ls | |
: 1741270202:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741270205:0;vi err.txt | |
: 1741270210:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741270223:0;vi err.txt | |
: 1741270262:0;riree | |
: 1741270284:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741270302:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-generics \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip | |
: 1741270308:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip | |
: 1741270466:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1741270684:0;riree | |
: 1741270505:52;iree-compile punet.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip | |
: 1741270712:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip | |
: 1741271016:0;cat compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_reduction_vector_distribute.mlir | |
: 1741271027:0;ls | |
: 1741271032:0;cd dump | |
: 1741271032:0;ls | |
: 1741271037:0;vi compiled_clip_encode_prompts\$async_dispatch_178.mlir | |
: 1741271070:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" compiled_clip_encode_prompts\$async_dispatch_178.mlir | |
: 1741271081:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" compiled_clip_encode_prompts\$async_dispatch_178.mlir | |
: 1741271127:0;vi test_this.mlir | |
: 1741271137:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" test_this.mlir | |
: 1741271208:0;riree | |
: 1741271232:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" test_this.mlir | |
: 1741271246:0;ls | |
: 1741271248:0;cd .. | |
: 1741271248:0;ls | |
: 1741271252:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip | |
: 1741271356:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741271369:0;vi err.txt | |
: 1741271394:0;ls | |
: 1741271396:0;cd dump | |
: 1741271396:0;ls | |
: 1741271402:0;vi compiled_clip_encode_prompts\$async_dispatch_692.mlir | |
: 1741271511:0;riree | |
: 1741271551:0;cd .. | |
: 1741271551:0;ls | |
: 1741271554:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741271566:0;vi err.txt | |
: 1741271578:0;cd dump | |
: 1741271579:0;ls | |
: 1741271583:0;vi compiled_clip_encode_prompts\$async_dispatch_2.mlir | |
: 1741271627:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741271629:0;vi err.txt | |
: 1741271648:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741271650:0;vi err.txt | |
: 1741271905:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" test_this.mlir | |
: 1741271947:0;cat test_this.mlir | |
: 1741271994:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" test_this.mlir | |
: 1741272105:0;vi test_this.mlir | |
: 1741272119:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" test_this.mlir | |
: 1741272408:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_reduction_vector_distribute.mlir | |
: 1741272424:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_reduction_vector_distribute.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_reduction_vector_distribute.mlir | |
: 1741272825:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_reduction_vector_distribute.mlir | |
: 1741272868:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_reduction_vector_distribute.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_reduction_vector_distribute.mlir | |
: 1741273070:0;git ppf | |
: 1741273142:0;git-clang-format HEAD~ | |
: 1741273149:0;git ppf | |
: 1741273191:0;ls | |
: 1741273192:0;riree | |
: 1741273203:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741273205:0;vi err.txt | |
: 1741273732:0;riree | |
: 1741273753:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741273756:0;vi err.txt | |
: 1741273905:0;riree | |
: 1741273961:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip | |
: 1741273986:0;riree | |
: 1741274033:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip | |
: 1741274062:0;vi compiled_clip_encode_prompts\$async_dispatch_2.mlir | |
: 1741274182:0;riree | |
: 1741274201:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip | |
: 1741274253:0;vi compiled_clip_encode_prompts\$async_dispatch_2.mlir | |
: 1741274304:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip | |
: 1741274311:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741274313:0;vi err.txt | |
: 1741274379:0;riree | |
: 1741274428:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741274430:0;vi err.txt | |
: 1741274481:0;riree | |
: 1741274503:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741274506:0;vi err.txt | |
: 1741274673:0;riree | |
: 1741274689:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741274699:0;vi err.txt | |
: 1741274735:0;riree | |
: 1741274747:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741274755:0;vi err.txt | |
: 1741274810:0;cd .. | |
: 1741274811:0;ls | |
: 1741274815:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741275141:0;vi err.txt | |
: 1741275156:0;cd dump | |
: 1741275157:0;ls | |
: 1741275161:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741275169:0;vi err.txt | |
: 1741277948:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741277951:0;vi err.txt | |
: 1741353596:0;\ | |
\ | |
\ | |
: 1741353599:0;tmux attach -t 0 | |
: 1741353651:0;riree | |
: 1741353660:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741353673:0;vi err.txt | |
: 1741353691:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741353695:0;vi err.txt | |
: 1741357317:0;riree | |
: 1741357503:0;iree-compile compiled_clip_encode_prompts\$async_dispatch_2.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-mlir-print-ir-after-all \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741357508:0;cd .. | |
: 1741357509:0;ls | |
: 1741357513:0;iree-compile model.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip \\ | |
-iree-hal-dump-executable-sources-to=dump/ 2> err.txt | |
: 1741357530:0;iree-compile punet.mlir \\ | |
-iree-codegen-llvmgpu-test-vector-distribution-on-reduction \\ | |
--iree-hip-target=gfx942 \\ | |
-o=abc.vmfb \\ | |
--iree-hal-target-device=hip | |
: 1741357717:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1741357795:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_reduction_vector_distribute.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_reduction_vector_distribute.mlir | |
: 1741357800:0;riree | |
: 1741357820:0;iree-opt --split-input-file --iree-gpu-test-target=gfx942 --iree-codegen-llvmgpu-test-vector-distribution-on-reduction --pass-pipeline="builtin.module(iree-llvmgpu-select-lowering-strategy)" compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_reduction_vector_distribute.mlir | FileCheck compiler/src/iree/compiler/Codegen/LLVMGPU/test/config_reduction_vector_distribute.mlir | |
: 1741358277:0;clang-format -i compiler/src/iree/compiler/Codegen/LLVMGPU/KernelConfig.cpp | |
: 1741358452:0;build_tools/bazel_to_cmake/bazel_to_cmake.py compiler/src/iree/compiler/Codegen/LLVMGPU/test/BUILD.bazel | |
: 1741358477:0;./buildifier compiler/src/iree/compiler/Codegen/LLVMGPU/test/BUILD.bazel | |
: 1741358481:0;ls | |
: 1741358484:0;cd .. | |
: 1741358484:0;ls | |
: 1741358491:0;./buildifier iree/compiler/src/iree/compiler/Codegen/LLVMGPU/test/BUILD.bazel | |
: 1741358494:0;cd iree | |
: 1741358494:0;ls | |
: 1741358536:0;git ppf | |
: 1741361875:0;riree | |
: 1741369835:0;git ppf | |
: 1741372026:0;clear | |
: 1741372026:0;ls | |
: 1741372027:0;riree | |
: 1741372044:0;clear | |
: 1741372045:0;ls | |
: 1741372209:0;git ppf | |
: 1741372751:0;git-clang-format HEAD~ | |
: 1741511985:0;\ | |
\ | |
: 1741511988:0;tmux ls | |
: 1741511994:0;tmux attach -t shortfin | |
: 1741511997:0;clear | |
: 1741511997:0;ls | |
: 1741512000:0;lks | |
: 1741512002:0;ls | |
: 1741512008:0;cd .. | |
: 1741512008:0;ls | |
: 1741512013:0;mkdir attention | |
: 1741512014:0;cd attention | |
: 1741512015:0;ls | |
: 1741512018:0;vi np_attn.py | |
: 1741512093:0;cd ../attention | |
: 1741512094:0;ls | |
: 1741512094:0;vi | |
: 1741512100:0;python np_attn.py | |
: 1741513737:0;cat np_attn.py | |
: 1741513860:0;python np_attn.py | |
: 1741514034:0;black -i np_attn.py | |
: 1741514038:0;pip install black | |
: 1741514040:0;black -i np_attn.py | |
: 1741514043:0;black np_attn.py | |
: 1741515378:0;python np_attn.py | |
: 1741598926:0;\ | |
: 1741598928:0;tmux attach -t shortfin | |
: 1741611907:0;ls | |
: 1741611912:0;clear | |
: 1741611913:0;ls | |
: 1741611914:0;cd test | |
: 1741611915:0;ls | |
: 1741611919:0;vi check.mlir | |
: 1741612034:0;cd .. | |
: 1741612037:0;vi iree | |
: 1741612144:0;iree-compile --output-format=vm-bytecode --iree-hal-target-backends=llvm-cpu --iree-llvmcpu-target-cpu=host check.mlir -o abc.vmfb -mlir-print-ir-after-all 2> full.txt | |
: 1741612150:0;vi full.txt | |
: 1741612207:0;cat check.mlir | |
: 1741612392:0;ls | |
: 1741612395:0;vi check.mlir | |
: 1741612578:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" --split-input-file check.mlir | |
: 1741612629:0;cd .. | |
: 1741612630:0;ls | |
: 1741612631:0;cd .. | |
: 1741612631:0;ls | |
: 1741612632:0;cd iree | |
: 1741612633:0;ls | |
: 1741612635:0;cd third_party/llvm-project | |
: 1741612635:0;ls | |
: 1741612646:0;git cp 191008bdb7952e028b806f98d4db28db80399bcb | |
: 1741612650:0;git fetch pashyu | |
: 1741612652:0;git fetch pashu | |
: 1741612664:0;git remote add pashu [email protected]:pashu123/llvm-project.git | |
: 1741612666:0;git fetch pashu | |
: 1741612678:0;git cp 191008bdb7952e028b806f98d4db28db80399bcb | |
: 1741612882:0;riree | |
: 1741612902:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" --split-input-file check.mlir | |
: 1741612925:0;git cherry-pick --continue | |
: 1741612931:0;riree | |
: 1741612943:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" --split-input-file check.mlir | |
: 1741612975:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile-root-and-fuse-producer-consumer{tiling-level=0}), canonicalize)" --split-input-file check.mlir -debug | |
: 1741613017:0;vi check.mlir | |
: 1741613062:0;iree-opt --pass-pipeline="builtin.module(func.func(iree-llvmcpu-tile{tiling-level=0}))" --split-input-file check.mlir | |
: 1741613101:0;ls | |
: 1741613103:0;vi check.mlir | |
: 1741613167:0;iree-opt check.mlir | |
: 1741613175:0;vi check.mlir | |
: 1741613340:0;iree-opt --transform-interpreter --cse --split-input-file check.mlir | |
: 1741613354:0;mlir-opt --transform-interpreter --cse --split-input-file check.mlir | |
: 1741613379:0;vi check.mlir | |
: 1741613389:0;mlir-opt --transform-interpreter --cse --split-input-file check.mlir | |
: 1741613400:0;cd ../llvm-project | |
: 1741613401:0;ls | |
: 1741613409:0;git branch | |
: 1741613424:0;git remote -vv | |
: 1741613434:0;git remote add pashu [email protected]:pashu123/llvm-project.git | |
: 1741613438:0;git fetch pashu | |
: 1741613469:0;git o pashu/cons_fuse | |
: 1741613479:0;git ob cons_fuse | |
: 1741613480:0;clear | |
: 1741613480:0;ls | |
: 1741613486:0;source ~/iree/.iree_venv/bin/activate | |
: 1741613488:0;bm | |
: 1741614678:0;ls | |
: 1741614680:0;cd .. | |
: 1741614680:0;ls | |
: 1741614682:0;cd test | |
: 1741614682:0;ls | |
: 1741614685:0;mlir-opt --transform-interpreter --cse --split-input-file check.mlir | |
: 1741615675:0;vi check.mlir | |
: 1741615938:0;mlir-opt --transform-interpreter --cse --split-input-file check.mlir | |
: 1741615939:0;cd .. | |
: 1741615939:0;ls | |
: 1741615945:0;cd llvm-project | |
: 1741615946:0;ls | |
: 1741615960:0;mlir-opt --transform-interpreter --cse --split-input-file mlir/test/Interfaces/TilingInterface/tile-and-fuse-consumer.mlir | |
: 1741615984:0;mlir-opt --transform-interpreter --cse -canonicalize --split-input-file mlir/test/Interfaces/TilingInterface/tile-and-fuse-consumer.mlir | |
: 1741616011:0;cd llvm-project | |
: 1741616012:0;ls | |
: 1741616012:0;vi | |
: 1741616299:0;ls | |
: 1741616306:0;cp ~/test/check.mlir . | |
: 1741616312:0;mlir-opt --transform-interpreter --cse --split-input-file check.mlir | |
: 1741616314:0;vi check.mlir | |
: 1741616324:0;mlir-opt --transform-interpreter --cse --split-input-file check.mlir | |
: 1741616335:0;vi check.mlir | |
: 1741616371:0;mlir-opt --transform-interpreter --cse --split-input-file check.mlir | |
: 1741616375:0;vi check.mlir | |
: 1741616384:0;mlir-opt --transform-interpreter --cse --split-input-file check.mlir | |
: 1741616404:0;vi check.mlir | |
: 1741616421:0;mlir-opt --transform-interpreter --cse --split-input-file check.mlir | |
: 1741625360:0;ebd | |
: 1741625378:0;cat ~/build_commands/build_iree.sh | |
: 1741625891:0;clear | |
: 1741625891:0;ls | |
: 1741625895:0;tmux ls | |
: 1741625898:0;tmux attach -t 0 | |
: 1741625899:0;ls | |
: 1741625905:0;pwd | |
: 1741625920:0;clear | |
: 1741625920:0;ls | |
: 1741625931:0;gist-paste punet.mlir | |
: 1741625966:0;ls | |
: 1741625969:0;cd .. | |
: 1741625970:0;ls | |
: 1741625975:0;vi ~/.zsh_history | |
: 1741625986:0;gist-paste ~/.zsh_history |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment