You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
18 lines
591 B
18 lines
591 B
from tinygrad import Tensor, dtypes, Context, GlobalCounters
|
|
dtypes.default_float = dtypes.float16
|
|
from tinygrad.dtype import to_dtype
|
|
from tinygrad.helpers import getenv
|
|
from test.test_softmax_fusion import single_kernel_softmax
|
|
|
|
if __name__ == "__main__":
|
|
# softmax in bert layers
|
|
BS = getenv("BS", 96//6)
|
|
acc_dtype = to_dtype(getenv("ACC_DTYPE", "half"))
|
|
t = Tensor.empty(BS, 16, 512, 512)
|
|
t.softmax(-1, dtype="half").realize()
|
|
|
|
# test single kernel softmax
|
|
GlobalCounters.reset()
|
|
with Context(DONT_GROUP_REDUCES=1):
|
|
single_kernel_softmax(t, -1, acc_dtype).realize()
|
|
|
|
|