import unittest
import numpy as np
from tinygrad.helpers import getenv, DType, DEBUG, CI
from tinygrad.lazy import Device
from tinygrad.tensor import Tensor, dtypes
from typing import List, Optional
from extra.utils import OSX, temp
import copy

def _test_to_np(a:Tensor, np_dtype, target):
  if DEBUG >= 2: print(a)
  na = a.numpy()
  if DEBUG >= 2: print(na, na.dtype, a.lazydata.realized)
  try:
    assert na.dtype == np_dtype
    np.testing.assert_allclose(na, target)
  except AssertionError as e:
    raise AssertionError(f"\ntensor {a.numpy()} does not match target {target} with np_dtype {np_dtype}") from e

def _assert_eq(tensor:Tensor, target_dtype:DType, target):
  if DEBUG >= 2: print(tensor.numpy())
  try:
    assert tensor.dtype == target_dtype
    np.testing.assert_allclose(tensor.numpy(), target)
  except AssertionError as e:
    raise AssertionError(f"\ntensor {tensor.numpy()} dtype {tensor.dtype} does not match target {target} with dtype {target_dtype}") from e

def _test_op(fxn, target_dtype:DType, target): _assert_eq(fxn(), target_dtype, target)
def _test_cast(a:Tensor, target_dtype:DType, target): _test_op(lambda: a.cast(target_dtype), target_dtype, target)

# tests no-op casts from source_dtype to target_dtypes
def _test_casts_from(tensor_contents:List, source_dtype:DType, target_dtypes:List[DType], target_contents:Optional[List]=None):
  if target_contents is None: target_contents = copy.deepcopy(tensor_contents)
  list(map(
    lambda t_dtype: _test_cast(Tensor(tensor_contents, dtype=source_dtype), t_dtype, target_contents),
    target_dtypes
  ))
# tests no-op casts from source_dtypes to target_dtype
def _test_casts_to(tensor_contents:List, source_dtypes:List[DType], target_dtype:DType, target_contents:Optional[List]=None):
  if target_contents is None: target_contents = copy.deepcopy(tensor_contents)
  list(map(
    lambda s_dtype: _test_cast(Tensor(tensor_contents, dtype=s_dtype), target_dtype, target_contents),
    source_dtypes
  ))
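
# tests that binary ops (add, mul, matmul) on mixed dtypes return the expected result dtype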
def _test_ops(a_dtype:DType, b_dtype:DType, target_dtype:DType):
  _assert_eq(Tensor([1,2,3,4], dtype=a_dtype)+Tensor([1,2,3,4], dtype=b_dtype), target_dtype, [2,4,6,8])
  _assert_eq(Tensor([1,2,3,4], dtype=a_dtype)*Tensor([1,2,3,4], dtype=b_dtype), target_dtype, [1,4,9,16])
  _assert_eq(Tensor([[1,2],[3,4]], dtype=a_dtype)@Tensor.eye(2, dtype=b_dtype), target_dtype, [[1,2],[3,4]])

class TestBFloat16DType(unittest.TestCase):
  def test_bf16_to_float(self):
    with self.assertRaises(AssertionError):
      _test_cast(Tensor([100000], dtype=dtypes.bfloat16), dtypes.float32, [100000])

  def test_float_to_bf16(self):
    with self.assertRaises(AssertionError):
      _test_cast(Tensor([100000], dtype=dtypes.float32), dtypes.bfloat16, [100000])

  # torch.tensor([10000, -1, -1000, -10000, 20]).type(torch.bfloat16)
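  # bfloat16 keeps only 8 bits of significand precision, so 10000 and -10000 round to 9984 and -9984 below
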
  @unittest.skipIf(Device.DEFAULT not in ["LLVM"], "bf16 only on LLVM")
  def test_bf16(self):
    t = Tensor([10000, -1, -1000, -10000, 20]).cast(dtypes.bfloat16)
    t.realize()
    back = t.cast(dtypes.float32)
    assert tuple(back.numpy().tolist()) == (9984., -1, -1000, -9984, 20)

  @unittest.skipIf(Device.DEFAULT not in ["LLVM"], "bf16 only on LLVM")
  def test_bf16_disk_write_read(self):
    t = Tensor([10000, -1, -1000, -10000, 20]).cast(dtypes.float32)
    t.to(f"disk:{temp('f32')}").realize()

    # hack to "cast" f32 -> bf16
    dat = open(temp('f32'), "rb").read()
    adat = b''.join([dat[i+2:i+4] for i in range(0, len(dat), 4)])
    with open(temp('bf16'), "wb") as f: f.write(adat)

    t = Tensor.empty(5, dtype=dtypes.bfloat16, device=f"disk:{temp('bf16')}").llvm().realize()
    back = t.cast(dtypes.float32)
    assert tuple(back.numpy().tolist()) == (9984., -1, -1000, -9984, 20)

# for GPU, cl_khr_fp16 isn't supported (except now we don't need it!)
# for LLVM, it segfaults because it can't link to the casting function
@unittest.skipIf((getenv("CI", "") != "" and Device.DEFAULT in ["LLVM"]) or Device.DEFAULT == "WEBGPU", "float16 broken in some CI backends")
class TestHalfDtype(unittest.TestCase):
  def test_float16_to_np(self): _test_to_np(Tensor([1,2,3,4], dtype=dtypes.float16), np.float16, [1,2,3,4])
  def test_casts_to_half(self): _test_casts_to([1,2,3,4], source_dtypes=[dtypes.float32, dtypes.int8, dtypes.uint8], target_dtype=dtypes.float16)
  def test_casts_from_half(self): _test_casts_from([1,2,3,4], source_dtype=dtypes.float16, target_dtypes=[dtypes.int8, dtypes.uint8, dtypes.float32, dtypes.int32, dtypes.int64])
  def test_half_upcast_ops(self): _test_ops(a_dtype=dtypes.float16, b_dtype=dtypes.float32, target_dtype=dtypes.float32)
  def test_upcast_to_half_ops(self): _test_ops(a_dtype=dtypes.int8, b_dtype=dtypes.float16, target_dtype=dtypes.float16)

@unittest.skipIf(Device.DEFAULT == "WEBGPU", "webgpu does not support int8")
class TestInt8Dtype(unittest.TestCase):
  def test_int8_to_np(self): _test_to_np(Tensor([1,2,3,4], dtype=dtypes.int8), np.int8, [1,2,3,4])
  def test_uint8_to_np(self): _test_to_np(Tensor([1,2,3,4], dtype=dtypes.uint8), np.uint8, [1,2,3,4])
  def test_int64_to_np(self): _test_to_np(Tensor([1,2,3,4], dtype=dtypes.int64), np.int64, [1,2,3,4])

  def test_casts_to_int8(self): _test_casts_from([1,2,3,4], source_dtype=dtypes.float32, target_dtypes=[dtypes.int8, dtypes.uint8, dtypes.int32, dtypes.int64])
  def test_casts_from_int8(self): _test_casts_from([1,2,3,4], source_dtype=dtypes.int8, target_dtypes=[dtypes.float32, dtypes.uint8, dtypes.int32, dtypes.int64])
  def test_casts_from_uint8(self): _test_casts_from([1,2,3,4], source_dtype=dtypes.uint8, target_dtypes=[dtypes.float32, dtypes.int8, dtypes.int32, dtypes.int64])

  def test_int8_ops(self): _test_ops(a_dtype=dtypes.int8, b_dtype=dtypes.int8, target_dtype=dtypes.int8)
  def test_int64_ops(self): _test_ops(a_dtype=dtypes.int64, b_dtype=dtypes.int64, target_dtype=dtypes.int64)
  def test_int8_upcast_float(self): _test_ops(a_dtype=dtypes.int8, b_dtype=dtypes.float32, target_dtype=dtypes.float32)
  def test_int8_upcast_int64(self): _test_ops(a_dtype=dtypes.int8, b_dtype=dtypes.int64, target_dtype=dtypes.int64)
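
  # int8 <-> uint8 casts wrap modulo 256 (e.g. -1 -> 255, 255 -> -1); skipped on CUDA, where saturation works differently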
  @unittest.skipIf(getenv("CUDA",0)==1, "cuda saturation works differently")
  def test_int8_to_uint8_negative(self): _test_op(lambda: Tensor([-1, -2, -3, -4], dtype=dtypes.int8).cast(dtypes.uint8), dtypes.uint8, [255, 254, 253, 252])

  def test_uint8_to_int8_overflow(self): _test_op(lambda: Tensor([255, 254, 253, 252], dtype=dtypes.uint8).cast(dtypes.int8), dtypes.int8, [-1, -2, -3, -4])

class TestInt32Dtype(unittest.TestCase):
  def test_int32_to_np(self): _test_to_np(Tensor([1,2,3,4], dtype=dtypes.int32), np.int32, [1,2,3,4])

  def test_casts_to_int32(self): _test_casts_to([1,2,3,4], source_dtypes=[dtypes.float32, dtypes.int64], target_dtype=dtypes.int32)
  def test_casts_from_int32(self): _test_casts_from([1,2,3,4], source_dtype=dtypes.int32, target_dtypes=[dtypes.float32, dtypes.int64])

  def test_int32_ops(self): _test_ops(a_dtype=dtypes.int32, b_dtype=dtypes.int32, target_dtype=dtypes.int32)
  def test_int32_upcast_float32(self): _test_ops(a_dtype=dtypes.int32, b_dtype=dtypes.float32, target_dtype=dtypes.float32)
  def test_int32_upcast_int64(self): _test_ops(a_dtype=dtypes.int32, b_dtype=dtypes.int64, target_dtype=dtypes.int64)

if __name__ == '__main__':
  unittest.main()