Skip to content

Commit 2735bc2

Browse files
committed
2 parents c9ca974 + 3980887 commit 2735bc2

File tree

3 files changed

+102
-0
lines changed

3 files changed

+102
-0
lines changed
+22
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,22 @@
1+
cmake_minimum_required(VERSION 3.28)
2+
project(tanh)
3+
4+
set(FILENAME "gpu.h")
5+
6+
get_filename_component(PROJECT_ROOT ${CMAKE_CURRENT_SOURCE_DIR} DIRECTORY)
7+
get_filename_component(PROJECT_ROOT ${PROJECT_ROOT} DIRECTORY)
8+
9+
# Construct potential paths
10+
set(FILEPATH_CURRENT_DIR "${CMAKE_CURRENT_SOURCE_DIR}/${FILENAME}")
11+
set(FILEPATH_PROJECT_ROOT "${PROJECT_ROOT}/${FILENAME}")
12+
13+
# Check if the file exists in the current directory
14+
if(EXISTS ${FILEPATH_CURRENT_DIR})
15+
set(TARGET_FILE_PATH ${CMAKE_CURRENT_SOURCE_DIR})
16+
elseif(EXISTS ${FILEPATH_PROJECT_ROOT})
17+
set(TARGET_FILE_PATH ${PROJECT_ROOT})
18+
else()
19+
message(FATAL_ERROR "File ${FILENAME} not found in either ${CMAKE_CURRENT_SOURCE_DIR} or ${CMAKE_CURRENT_SOURCE_DIR}/../../")
20+
endif()
21+
22+
include("${TARGET_FILE_PATH}/cmake/example.cmake")

experimental/kernels/tanh/Makefile

+29
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
CXX=clang++
2+
GPUCPP ?= $(PWD)/../../..
3+
LIBDIR ?= $(GPUCPP)/third_party/lib
4+
LIBSPEC ?= . $(GPUCPP)/source
5+
NUM_JOBS?=$(shell nproc)
6+
TARGET=tanh
7+
ifeq ($(shell $(CXX) -std=c++17 -x c++ -E -include array - < /dev/null > /dev/null 2>&1 ; echo $$?),0)
8+
STDLIB :=
9+
else
10+
STDLIB := -stdlib=libc++
11+
endif
12+
FLAGS=-std=c++17 $(STDLIB) -I$(GPUCPP) -I$(GPUCPP)/third_party/headers -L$(GPUCPP)/third_party/lib run.cpp -ldl -ldawn
13+
14+
run: ./build/$(TARGET) dawnlib
15+
$(LIBSPEC) && ./build/$(TARGET)
16+
17+
dawnlib: $(if $(wildcard $(GPUCPP)/third_party/lib/libdawn.so $(GPUCPP)/third_party/lib/libdawn.dylib),,run_setup)
18+
19+
run_setup: check-python
20+
cd $(GPUCPP) && python3 setup.py
21+
22+
build/$(TARGET): run.cpp
23+
mkdir -p build && $(CXX) $(FLAGS) -DNDEBUG -o ./build/$(TARGET)
24+
25+
clean:
26+
read -r -p "This will delete the contents of build/*. Are you sure? [CTRL-C to abort] " response && rm -rf build/*
27+
28+
check-python:
29+
@command -v python3 >/dev/null 2>&1 || { echo >&2 "Python needs to be installed and in your path."; exit 1; }

experimental/kernels/tanh/run.cpp

+51
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,51 @@
1+
#include "gpu.h"
2+
#include <array>
3+
#include <cstdio>
4+
#include <future>
5+
6+
using namespace gpu; // createContext, createTensor, createKernel,
7+
// createShader, dispatchKernel, wait, toCPU
8+
// Tensor, Kernel, Context, Shape, kf32
9+
10+
static const char *kTan = R"(
11+
@group(0) @binding(0) var<storage, read_write> inp: array<{{precision}}>;
12+
@group(0) @binding(1) var<storage, read_write> out: array<{{precision}}>;
13+
@compute @workgroup_size({{workgroupSize}})
14+
fn main(
15+
@builtin(global_invocation_id) GlobalInvocationID: vec3<u32>) {
16+
let i: u32 = GlobalInvocationID.x;
17+
if (i < arrayLength(&inp)) {
18+
let x: f32 = inp[i];
19+
out[i] = tan(x);
20+
}
21+
}
22+
)";
23+
24+
int main(int argc, char **argv) {
25+
printf("\033[2J\033[1;1H");
26+
printf("\nHello gpu.cpp!\n");
27+
printf("--------------\n\n");
28+
29+
Context ctx = createContext();
30+
static constexpr size_t N = 100000;
31+
std::array<float, N> inputArr, outputArr;
32+
for (int i = 0; i < N; ++i) {
33+
inputArr[i] = static_cast<float>(i) / 10.0; // dummy input data
34+
}
35+
Tensor input = createTensor(ctx, Shape{N}, kf32, inputArr.data());
36+
Tensor output = createTensor(ctx, Shape{N}, kf32);
37+
std::promise<void> promise;
38+
std::future<void> future = promise.get_future();
39+
Kernel op = createKernel(ctx, {kTan, 256, kf32},
40+
Bindings{input, output},
41+
/* nWorkgroups */ {cdiv(N, 256), 1, 1});
42+
dispatchKernel(ctx, op, promise);
43+
wait(ctx, future);
44+
toCPU(ctx, output, outputArr.data(), sizeof(outputArr));
45+
for (int i = 0; i < 1000; ++i) {
46+
printf(" tan(%.2f) = %.10f\n", inputArr[i], outputArr[i]);
47+
}
48+
printf(" ...\n\n");
49+
printf("Computed %zu values of tan(x)\n\n", N);
50+
return 0;
51+
}

0 commit comments

Comments
 (0)