Skip to content

Instantly share code, notes, and snippets.

View makslevental's full-sized avatar
💩

Maksim Levental makslevental

💩
View GitHub Profile
//===--- ItaniumMangle.cpp - Itanium C++ Name Mangling ----------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// Implements C++ name mangling according to the Itanium C++ ABI,
// which is used in GCC 3.2 and newer (and many compilers that are
@makslevental
makslevental / lc_cluster_soln_strats.py
Created May 30, 2025 18:21
cluster lc by soln strat
import re
import time
from collections import defaultdict
from pprint import pprint
import hdbscan
import leetcode
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.preprocessing import normalize
@makslevental
makslevental / gen.py
Last active May 12, 2025 21:57
gen conundrum
import dis
import inspect
def my_generator():
frame = inspect.currentframe()
print(frame.f_code.co_consts)
x = yield
frame = inspect.currentframe()
print(frame.f_code.co_consts)
%1085 = tail call <16 x float> @llvm.amdgcn.mfma.f32.32x32x16.f16(<8 x half> %1056, <8 x half> %1052, <16 x float> %1084, i32 0, i32 0, i32 0), !dbg !62
%1947 = shufflevector <2 x float> %1478, <2 x float> poison, <16 x i32> zeroinitializer, !dbg !62
%1948 = fmul <16 x float> %1085, %1947, !dbg !62
%1949 = tail call <16 x float> @llvm.amdgcn.mfma.f32.32x32x16.f16(<8 x half> %1931, <8 x half> %1906, <16 x float> %1948, i32 0, i32 0, i32 0), !dbg !62
/*===- TableGen'erated file -------------------------------------*- C++ -*-===*\
|* *|
|* Target Register Enum Values *|
|* *|
|* Automatically generated file, do not edit! *|
|* *|
\*===----------------------------------------------------------------------===*/
#ifdef GET_REGINFO_ENUM
@makslevental
makslevental / v_pk_add_f32.s
Last active April 25, 2025 04:13
unpack v_pk_add_f32
.section .AMDGPU.config,"",@progbits
.long 47176
.long 11468865
.long 47180
.long 5008
.long 47200
.long 0
.long 4
.long 0
.long 8
from enum import Flag
from pprint import pprint
class SchedGroupMask(Flag):
NONE = 0
ALU = 1 << 0
VALU = 1 << 1
SALU = 1 << 2
MFMA = 1 << 3
; Function Attrs: mustprogress nofree norecurse nosync nounwind willreturn memory(argmem: readwrite)
define amdgpu_kernel void @add_kernel(ptr addrspace(1) nocapture readonly %0, ptr addrspace(1) nocapture readonly %1, ptr addrspace(1) nocapture writeonly %2, i32 %3) local_unnamed_addr #0 {
%5 = tail call i32 @llvm.amdgcn.workgroup.id.x()
%6 = shl i32 %5, 10
%7 = tail call i32 @llvm.amdgcn.workitem.id.x()
%8 = shl i32 %7, 2
%9 = and i32 %8, 1020
%10 = or disjoint i32 %9, %6
%11 = icmp slt i32 %10, %3
br i1 %11, label %.critedge, label %.critedge2
diff --git a/CMakeLists.txt b/CMakeLists.txt
--- a/CMakeLists.txt (revision 7fb35319d38e57f7341e8434a4f5b2049aec8657)
+++ b/CMakeLists.txt (date 1744728290525)
@@ -318,6 +318,9 @@
endif()
target_link_options(triton PRIVATE ${PYTHON_LDFLAGS})
+ set_target_properties(triton PROPERTIES ARCHIVE_OUTPUT_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}/python/triton/_C)
+ set_target_properties(triton PROPERTIES LIBRARY_OUTPUT_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}/python/triton/_C)
+ set_target_properties(triton PROPERTIES RUNTIME_OUTPUT_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}/python/triton/_C)
W20250414 14:53:24.356304 132475353552832 metadata.cpp:186] rocprofiler_iterate_agent_supported_counters returned ROCPROFILER_STATUS_ERROR_AGENT_ARCH_NOT_SUPPORTED for agent 1 (gfx1150) :: Agent HW architecture is not supported, no counter metrics found.
W20250414 14:53:24.651769 131105783740352 metadata.cpp:186] rocprofiler_iterate_agent_supported_counters returned ROCPROFILER_STATUS_ERROR_AGENT_ARCH_NOT_SUPPORTED for agent 1 (gfx1150) :: Agent HW architecture is not supported, no counter metrics found.
F20250414 14:53:24.970933 131105783740352 agent.cpp:1069] rocprofiler was only able to map 2 rocprofiler agents to HSA agents, expected 3
@ 0x773d72612360 (unknown)
@ 0x773d72613297 (unknown)
@ 0x773d7205d18a (unknown)
@ 0x773d72098ed5 rocprofiler_set_api_table
@ 0x773d71ad5afc rocprofiler_register_library_api_table
@ 0x773d660a2229 (unknown)
@ 0x773d660a3c58 (unknown)