I hereby claim:
- I am cchan on github.
- I am cchan3141 (https://keybase.io/cchan3141) on keybase.
- I have a public key ASDXngTLj1owbE-s6GMjagRzspT_u0dDisSc627G2J4Q0wo
To claim this, I am signing this object:
I hereby claim:
To claim this, I am signing this object:
--- syscall.c | |
+++ syscall.c | |
@@ -48,6 +48,39 @@ | |
* Copyright (C) 1994-2003 by Todd M. Austin, Ph.D. and SimpleScalar, LLC. | |
*/ | |
+#ifdef __APPLE__ | |
+ | |
+#define __unix__ | |
+#define unix |
import time | |
import torch | |
torch.backends.cuda.matmul.allow_tf32 = False | |
GROUPS = 64 | |
for k in [3, 5, 7]: | |
x = torch.rand(16,64,1024,1024, device="cuda", dtype=torch.float32) | |
weight = torch.rand(64,64//GROUPS,k,k, device="cuda", dtype=torch.float32) |