Skip to content
Snippets Groups Projects
Commit 05d8b236 authored by Russel Arbore
Browse files

matmul32

parent 7a03a821
No related branches found
No related tags found
No related merge requests found
Pipeline #202691 failed
......@@ -12,3 +12,8 @@ fn matmul<n : usize, m : usize, l : usize>(a : f32[n, m], b : f32[m, l]) -> f32[
return res;
}
// Entry point (marked `#[entry]`): a fixed-size wrapper that takes two
// 32x32 f32 arrays and forwards them to the generic `matmul`, with all three
// of its dimension parameters (n, m, l) set to 32, returning the 32x32 result.
#[entry]
fn matmul32(a: f32[32, 32], b: f32[32, 32]) -> f32[32, 32] {
return matmul::<32, 32, 32>(a, b);
}
\ No newline at end of file
......@@ -11,16 +11,32 @@ macro simpl!(X) {
infer-schedules(X);
}
// NOTE(review): this text comes from a diff view whose +/- markers were lost.
// The `(*)` pipeline directly below and the `(matmul)` pipeline further down
// apply the same steps in the same order, so they are presumably the
// before/after versions of one pipeline — confirm against the commit.
simpl!(*);
// Pipeline over every function (`*`): each pass is followed by a simpl! run.
forkify(*);
fork-guard-elim(*);
simpl!(*);
reduce-slf(*);
simpl!(*);
fork-coalesce(*);
simpl!(*);
reduce-slf(*);
simpl!(*);
// Steps that only run when the "cuda" feature is enabled.
if feature("cuda") {
// Inline within matmul32, then simplify it.
inline(matmul32);
simpl!(matmul32);
// Outline `matmul32@outer` into a new function bound to `func`
// (presumably `outer` is a label inside the inlined body — TODO confirm).
let func = outline(matmul32@outer);
// Apply no-memset to `matmul32@res` (presumably the result array — TODO confirm).
no-memset(matmul32@res);
// Apply the gpu pass to the outlined function, then simplify both functions.
gpu(func);
simpl!(matmul32, func);
// Fork passes on the outlined function only.
forkify(func);
fork-guard-elim(func);
simpl!(func);
// fork-coalesce is applied twice in a row here.
// NOTE(review): presumably intentional (one nesting level per call) — confirm.
fork-coalesce(func);
fork-coalesce(func);
simpl!(func);
// NOTE(review): xdot looks like a debug visualization step — confirm whether
// it should remain in the committed schedule.
xdot[true](func);
}
// Same pipeline as the `(*)` sequence above, restricted to `matmul`.
simpl!(matmul);
forkify(matmul);
fork-guard-elim(matmul);
simpl!(matmul);
reduce-slf(matmul);
simpl!(matmul);
fork-coalesce(matmul);
simpl!(matmul);
reduce-slf(matmul);
simpl!(matmul);
if feature("cuda") {
// Base
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment