This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| module { | |
| func.func @_attn_fwd(%arg0: memref<?xi8>, %arg1: memref<?xi8>, %arg2: memref<?xf16> {tt.divisibility = 16 : i32, tt.tensor_kind = 0 : i32}, %arg3: memref<?xf16> {tt.divisibility = 16 : i32, tt.tensor_kind = 0 : i32}, %arg4: memref<?xf16> {tt.divisibility = 16 : i32, tt.tensor_kind = 0 : i32}, %arg5: memref<?xf32> {tt.divisibility = 16 : i32, tt.tensor_kind = 1 : i32}, %arg6: memref<?xf16> {tt.divisibility = 16 : i32, tt.tensor_kind = 1 : i32}, %arg7: memref<?xf32> {tt.divisibility = 16 : i32}, %arg8: f32, %arg9: i32, %arg10: i32, %arg11: i32, %arg12: i32, %arg13: i32, %arg14: i32) attributes {SyncBlockLockArgIdx = 0 : i64, WorkspaceArgIdx = 1 : i64, global_kernel = "local", mix_mode = "mix"} { | |
| %c128 = arith.constant 128 : index | |
| %c4_i32 = arith.constant 4 : i32 | |
| %c16384_i64 = arith.constant 16384 : i64 | |
| %c32_i32 = arith.constant 32 : i32 | |
| %c128_i32 = arith.constant 128 : i32 | |
| %c20_i32 = arith.constant 20 : i32 | |
| %cst = arith.constant 0xFF800000 : f32 | |
| %cst_0 = arith.constant |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| # Project bootstrap: minimum CMake version, default toolchain, project declaration | |
| # and the global C++ language/flag settings. | |
| # Must be the first command so policy defaults are in place before anything else runs. | |
| cmake_minimum_required(VERSION 3.18) | |
| # Default to clang/clang++, but only when no compiler has been chosen yet via | |
| # -DCMAKE_<LANG>_COMPILER=... or the CC/CXX environment variables. | |
| # These defaults have to be set before project(), which performs compiler detection. | |
| if(NOT DEFINED CMAKE_C_COMPILER AND NOT DEFINED ENV{CC}) | |
|   set(CMAKE_C_COMPILER clang) | |
| endif() | |
| if(NOT DEFINED CMAKE_CXX_COMPILER AND NOT DEFINED ENV{CXX}) | |
|   set(CMAKE_CXX_COMPILER clang++) | |
| endif() | |
| set(APP_NAME "example-app") | |
| project("${APP_NAME}") | |
| # Let CMake emit the standard flag instead of hard-coding -std=c++20 in CMAKE_CXX_FLAGS. | |
| # EXTENSIONS OFF requests -std=c++20 rather than -std=gnu++20, matching the flag that | |
| # used to be written out by hand. | |
| set(CMAKE_CXX_STANDARD 20) | |
| set(CMAKE_CXX_STANDARD_REQUIRED ON) | |
| set(CMAKE_CXX_EXTENSIONS OFF) | |
| # Remaining global flags: optimisation level and no multi-character-constant warnings. | |
| string(APPEND CMAKE_CXX_FLAGS " -O3 -Wno-multichar") |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| # FFmpeg location. The values are cache entries so they can be overridden at configure | |
| # time (-DFFMPEG_INCLUDE_PATH=... -DFFMPEG_LIB_PATH=...) instead of editing this file; | |
| # the defaults are the same directories as before. | |
| # Forward slashes are CMake's native path form and avoid backslash-escaping problems. | |
| set(FFMPEG_INCLUDE_PATH "C:/Users/cola/LOCAL/ffmpeg/include" CACHE PATH "Directory containing the FFmpeg headers") | |
| set(FFMPEG_LIB_PATH "C:/Users/cola/LOCAL/ffmpeg/lib" CACHE PATH "Directory containing the FFmpeg libraries") | |
| # Quoted so that a path containing spaces stays a single argument. | |
| include_directories("${FFMPEG_INCLUDE_PATH}") | |
| link_directories("${FFMPEG_LIB_PATH}") |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| CMakeLists: | |
| # Boost location. BOOST_ROOT is a cache entry so it can be overridden with | |
| # -DBOOST_ROOT=... at configure time; every other path below is derived from it, | |
| # so the install prefix is written down exactly once. | |
| set(BOOST_ROOT "C:/local/boost_1_78_0" CACHE PATH "Boost installation prefix") | |
| # Alternate spelling of the same hint, kept in sync with BOOST_ROOT. | |
| set(BOOSTROOT "${BOOST_ROOT}") | |
| # REQUIRED stops the configure step with a clear error if Boost 1.78.0 or newer | |
| # cannot be found, instead of failing later at compile or link time. | |
| find_package(Boost 1.78.0 REQUIRED) | |
| # Header and library directories: headers at the Boost root, libraries under | |
| # stage/lib, the same layout as before. | |
| set(Boost_INCLUDE_DIR "${BOOST_ROOT}") | |
| set(Boost_LIBRARY_DIR "${BOOST_ROOT}/stage/lib") | |
| # Quoted so that a path containing spaces stays a single argument. | |
| include_directories("${Boost_INCLUDE_DIR}") | |
| link_directories("${Boost_LIBRARY_DIR}") |