Skip to content

Instantly share code, notes, and snippets.

View mdboom's full-sized avatar

Michael Droettboom mdboom

View GitHub Profile
/*
gcc -o nvml_process_name nvml_process_name.c \
-I/usr/local/cuda/include \
-L/usr/local/cuda/lib64/stubs \
-lcuda -lnvidia-ml
*/
#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <cuda.h>
#include <nvml.h>
#define BUF_LEN 1024
#define MAX_PROCS 64
static int check_cu(CUresult r, const char *what) {
import pyperf
from cuda.bindings._internal._fast_enum import FastEnum
class BenchEnum(FastEnum):
ELEM_0 = 0
ELEM_1 = 1
ELEM_2 = 2
ELEM_3 = 3
ELEM_4 = 4
# cython: language_level=3
# distutils: language = c
# distutils: libraries = cuda
"""
Minimal Cython wrapper for cuTensorMapEncodeTiled benchmark.
This isolates Cython binding overhead from cuda-python's extra functionality.
"""
from libc.stdint cimport uint32_t, uint64_t
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
<!-- kind:binary;verdict:compatible;affected:0;added:0;removed:0;type_problems_high:0;type_problems_medium:0;type_problems_low:0;interface_problems_high:0;interface_problems_medium:0;interface_problems_low:0;changed_constants:0;tool_version:2.3 -->
<!-- kind:source;verdict:incompatible;affected:0.2;added:0;removed:0;type_problems_high:13;type_problems_medium:0;type_problems_low:17;interface_problems_high:0;interface_problems_medium:0;interface_problems_low:0;changed_constants:0;type_changes_other:1;tool_version:2.3 -->
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<meta name="viewport" content="width=device-width,initial-scale=1" />
<meta name="keywords" content="NAME, compatibility, API, ABI, report" />
<meta name="description" content="API/ABI compatibility report for the NAME object betwee
============================= test session starts ==============================
platform linux -- Python 3.13.6, pytest-8.4.1, pluggy-1.6.0
benchmark: 5.1.0 (defaults: timer=time.perf_counter disable_gc=False min_rounds=5 min_time=0.000005 max_time=1.0 calibration_precision=10 warmup=False warmup_iterations=100000)
rootdir: /home/mdboom/Work/builds/cuda-python/cuda_core/tests
configfile: pytest.ini
plugins: benchmark-5.1.0
collected 423 items
cuda_core/tests/example_tests/test_basic_examples.py s....s..s.. [ 2%]
cuda_core/tests/test_context.py . [ 2%]
#!/usr/bin/env python3
import sys
import pyperf
runner = pyperf.Runner()
runner.bench_command('cuda.bindings.nvrtc import', [sys.executable, '-c', 'import cuda.bindings.nvrtc'])
====
Benchmark: django_template
Object method cache dunder misses: 2353.294117647059
Object method cache collisions: 2287.504761904762
Object method cache misses: 2225.3703703703704
Object immortal increfs: 1.0039206501770555
Object immortal decrefs: 1.0034565222003073
Object mortal decrefs: 1.0009515004198075
Object mortal increfs: 1.0008433608988452