import unittest
import numpy as np
from tinygrad.helpers import getenv
from tinygrad.lazy import Device
from tinygrad.tensor import Tensor, dtypes

# for GPU, cl_khr_fp16 isn't supported (except now we don't need it!)
# for LLVM, it segfaults because it can't link to the casting function
@unittest.skipIf(getenv("CI", "") != "" and Device.DEFAULT in ["LLVM"], "float16 broken in some CI backends")
class TestDtype(unittest.TestCase):
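  # float16 tensors should keep their dtype through realization, numpy conversion, and half-only ops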
  def test_half_to_np(self):
    a = Tensor([1,2,3,4], dtype=dtypes.float16)
    print(a)
    na = a.numpy()
    print(na, na.dtype, a.lazydata.realized)
    assert na.dtype == np.float16
    np.testing.assert_allclose(na, [1,2,3,4])

  def test_half_add(self):
    a = Tensor([1,2,3,4], dtype=dtypes.float16)
    b = Tensor([1,2,3,4], dtype=dtypes.float16)
    c = a+b
    print(c.numpy())
    assert c.dtype == dtypes.float16
    np.testing.assert_allclose(c.numpy(), [2,4,6,8])

  def test_half_mul(self):
    a = Tensor([1,2,3,4], dtype=dtypes.float16)
    b = Tensor([1,2,3,4], dtype=dtypes.float16)
    c = a*b
    print(c.numpy())
    assert c.dtype == dtypes.float16
    np.testing.assert_allclose(c.numpy(), [1,4,9,16])

  def test_half_matmul(self):
    a = Tensor([[1,2],[3,4]], dtype=dtypes.float16)
    b = Tensor.eye(2, dtype=dtypes.float16)
    c = a@b
    print(c.numpy())
    assert c.dtype == dtypes.float16
    np.testing.assert_allclose(c.numpy(), [[1,2],[3,4]])

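  # .float()/.half() casts should change only the dtype, preserving device and requires_grad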
  def test_upcast_float(self):
    a = Tensor([1,2,3,4], dtype=dtypes.float16)
    print(a)
    fa = a.float()
    assert a.device == fa.device
    assert a.requires_grad == fa.requires_grad
    na = fa.numpy()
    print(na, na.dtype)
    assert na.dtype == np.float32
    np.testing.assert_allclose(na, [1,2,3,4])

  def test_downcast_float(self):
    a = Tensor([1,2,3,4], dtype=dtypes.float32, requires_grad=False)
    print(a)
    ha = a.half()
    assert a.device == ha.device
    assert a.requires_grad == ha.requires_grad
    na = ha.numpy()
    print(na, na.dtype)
    assert na.dtype == np.float16
    np.testing.assert_allclose(na, [1,2,3,4])

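  # ops mixing float16 and float32 operands should upcast the result to float32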
  def test_half_add_upcast(self):
    a = Tensor([1,2,3,4], dtype=dtypes.float16)
    b = Tensor([1,2,3,4], dtype=dtypes.float32)
    c = a+b
    print(c.numpy())
    assert c.dtype == dtypes.float32
    np.testing.assert_allclose(c.numpy(), [2,4,6,8])

  def test_half_mul_upcast(self):
    a = Tensor([1,2,3,4], dtype=dtypes.float16)
    b = Tensor([1,2,3,4], dtype=dtypes.float32)
    c = a*b
    print(c.numpy())
    assert c.dtype == dtypes.float32
    np.testing.assert_allclose(c.numpy(), [1,4,9,16])

  def test_half_matmul_upcast(self):
    a = Tensor([[1,2],[3,4]], dtype=dtypes.float16)
    b = Tensor.eye(2, dtype=dtypes.float32)
    c = a@b
    print(c.numpy())
    assert c.dtype == dtypes.float32
    np.testing.assert_allclose(c.numpy(), [[1,2],[3,4]])

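# Run this file directly to exercise the suite against Device.DEFAULT; in tinygrad the backend
# is typically selected via environment variables (e.g. GPU=1 or LLVM=1).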
if __name__ == '__main__':
  unittest.main()