Data Core

Main NumPy and time series functions used throughout the library.

from tsai.data.external import get_UCR_data

dsid = 'OliveOil'
# pre-split arrays
X_train, y_train, X_valid, y_valid = get_UCR_data(dsid, on_disk=True, force_download=True)
# unsplit data as on-disk memmaps, plus the (train, valid) split indices
X_on_disk, y_on_disk, splits = get_UCR_data(dsid, on_disk=True, return_split=False, force_download=True)
# same data fully loaded in memory
X_in_memory, y_in_memory, splits = get_UCR_data(dsid, on_disk=False, return_split=False, force_download=True)
y_tensor = cat2int(y_on_disk)  # map category labels to integer ids
y_array = y_tensor.numpy()
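
A quick sanity check of what was just loaded (the shapes below match the TSTensor reprs shown later on this page):

print(X_train.shape, X_valid.shape)                     # (30, 1, 570) (30, 1, 570)
print(X_on_disk.shape, len(splits[0]), len(splits[1]))  # (60, 1, 570) 30 30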

source

ToNumpyTensor

 ToNumpyTensor (enc=None, dec=None, split_idx=None, order=None)

Transforms an object into NumpyTensor
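
A minimal usage sketch, mirroring the ToTSTensor example further below: calling the transform on an array returns a NumpyTensor.

a = np.random.rand(8, 3)
t = ToNumpyTensor()(a)  # encodes an np.ndarray as a NumpyTensor
assert isinstance(t, NumpyTensor)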


source

NumpyTensor

 NumpyTensor (o, dtype=None, device=None, copy=None, requires_grad=False,
              **kwargs)

Returns a tensor with subclass NumpyTensor that has a show method


source

TSTensor

 TSTensor (o, dtype=None, device=None, copy=None, requires_grad=False,
           **kwargs)

Returns a tensor with subclass TSTensor that has a show method


source

show_tuple

 show_tuple (tup, nrows:int=1, ncols:int=1,
             sharex:Union[bool,Literal['none','all','row','col']]=False,
             sharey:Union[bool,Literal['none','all','row','col']]=False,
             squeeze:bool=True,
             width_ratios:Optional[Sequence[float]]=None,
             height_ratios:Optional[Sequence[float]]=None,
             subplot_kw:Optional[dict[str,Any]]=None,
             gridspec_kw:Optional[dict[str,Any]]=None)

Display a timeseries plot from a decoded tuple

| | Type | Default | Details |
|---|---|---|---|
| tup | | | |
| nrows | int | 1 | |
| ncols | int | 1 | |
| sharex | bool \| Literal['none', 'all', 'row', 'col'] | False | |
| sharey | bool \| Literal['none', 'all', 'row', 'col'] | False | |
| squeeze | bool | True | If True, extra dimensions are squeezed out from the returned array of ~matplotlib.axes.Axes: if only one subplot is constructed (nrows=ncols=1), the resulting single Axes object is returned as a scalar; for Nx1 or 1xM subplots, the returned object is a 1D numpy object array of Axes objects; for NxM subplots with N>1 and M>1, a 2D array is returned. If False, no squeezing at all is done: the returned Axes object is always a 2D array containing Axes instances, even if it ends up being 1x1. |
| width_ratios | Sequence[float] \| None | None | Defines the relative widths of the columns. Each column gets a relative width of width_ratios[i] / sum(width_ratios). If not given, all columns will have the same width. Equivalent to gridspec_kw={'width_ratios': [...]}. |
| height_ratios | Sequence[float] \| None | None | Defines the relative heights of the rows. Each row gets a relative height of height_ratios[i] / sum(height_ratios). If not given, all rows will have the same height. Convenience for gridspec_kw={'height_ratios': [...]}. |
| subplot_kw | dict[str, Any] \| None | None | Dict with keywords passed to the ~matplotlib.figure.Figure.add_subplot call used to create each subplot. |
| gridspec_kw | dict[str, Any] \| None | None | Dict with keywords passed to the ~matplotlib.gridspec.GridSpec constructor used to create the grid the subplots are placed on. |

source

ToTSTensor

 ToTSTensor (enc=None, dec=None, split_idx=None, order=None)

Transforms an object into TSTensor

# NumpyTensor and TSTensor reuse the memory of the input array or tensor:
a = np.random.randn(2, 3, 4).astype(np.float16)
assert np.shares_memory(a, NumpyTensor(a))
assert np.shares_memory(a, TSTensor(a))
a = np.random.randn(2, 3, 4).astype(np.float32)
assert np.shares_memory(a, NumpyTensor(a))
assert np.shares_memory(a, TSTensor(a))
a = np.random.randint(10, size=10).astype(np.int64)
assert np.shares_memory(a, NumpyTensor(a))
assert np.shares_memory(a, TSTensor(a))
a = np.random.randint(10, size=10).astype(np.int32)
assert np.shares_memory(a, NumpyTensor(a))
assert np.shares_memory(a, TSTensor(a))
a = torch.rand(2, 3, 4).float()
assert np.shares_memory(a, NumpyTensor(a))
assert np.shares_memory(a, TSTensor(a))
a = torch.randint(3, (10,))
assert np.shares_memory(a, NumpyTensor(a))
assert np.shares_memory(a, TSTensor(a))
t = TSTensor(torch.randn(2, 3, 4))
p = torch.tensor(3., requires_grad=True)
test = torch.add(t, p)
test_eq(test.requires_grad, True)
test_eq(type(t.data), torch.Tensor)
test_eq(type(t), TSTensor)
l = L([0,1,2,3], [4,5,6,7], [8, 9, 10, 11])
TSTensor(l), TSTensor(l).data
(TSTensor(vars:3, len:4, device=cpu, dtype=torch.int64),
 tensor([[ 0,  1,  2,  3],
         [ 4,  5,  6,  7],
         [ 8,  9, 10, 11]]))
t = TSTensor(X_train)
for i in range(4):
    print(t, t.ndim, torch.is_tensor(t))
    if i < 3: t = t[0]
TSTensor(samples:30, vars:1, len:570, device=cpu, dtype=torch.float32) 3 True
TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32) 2 True
TSTensor(len:570, device=cpu, dtype=torch.float32) 1 True
TSTensor([-0.6113752722740173], device=cpu, dtype=torch.float32) 0 True
TSTensor(X_on_disk)
TSTensor(samples:60, vars:1, len:570, device=cpu, dtype=torch.float32)
ToTSTensor()(X_on_disk)
TSTensor(samples:60, vars:1, len:570, device=cpu, dtype=torch.float32)
TSTensor(X_train).show();

TSTensor(X_train).show(title='1');

show_tuple((TSTensor(X_train), ['1', '2']))

show_tuple((TSTensor(np.arange(10).reshape(2,5)), 1))

show_tuple((TSTensor(np.arange(10).reshape(2,5)), '1'))

show_tuple((TSTensor(np.arange(10).reshape(2,5)), [1,2]))

show_tuple((TSTensor(np.arange(10).reshape(2,5)), ['1', '2']))


source

TSMaskTensor

 TSMaskTensor (o, dtype=None, device=None, copy=None, requires_grad=False,
               **kwargs)

Returns a tensor with subclass TSMaskTensor that has a show method


source

TSLabelTensor

 TSLabelTensor (o, dtype=None, device=None, copy=None,
                requires_grad=False, **kwargs)

Returns a tensor with subclass TSLabelTensor that has a show method

t = TSLabelTensor(torch.randint(0,10,(1, 2, 3)))
t, t[0], t[0][0], t[0][0][0]
(TSLabelTensor(shape:(1, 2, 3), device=cpu, dtype=torch.int64),
 TSLabelTensor(shape:(2, 3), device=cpu, dtype=torch.int64),
 TSLabelTensor(shape:(3,), device=cpu, dtype=torch.int64),
 7)
t = TSMaskTensor(torch.randint(0,10,(1, 2, 3)))
t, t[0], t[0][0], t[0][0][0]
(TSMaskTensor(shape:(1, 2, 3), device=cpu, dtype=torch.int64),
 TSMaskTensor(shape:(2, 3), device=cpu, dtype=torch.int64),
 TSMaskTensor(shape:(3,), device=cpu, dtype=torch.int64),
 1)

source

TSClassification

 TSClassification (vocab=None, sort=True)

Vectorized, reversible transform of category string to vocab id
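
A minimal sketch of the setup/encode/decode round trip (the full example on real labels appears after ToFloat below):

y_toy = np.array(['a', 'b', 'a'])
tfm = TSClassification()
tfm.setup(y_toy)
enc = tfm(y_toy)                  # e.g. TensorCategory([0, 1, 0])
test_eq(tfm.decodes(enc), y_toy)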


source

ToInt

 ToInt (enc=None, dec=None, split_idx=None, order=None)

Transforms an object dtype to int


source

ToFloat

 ToFloat (enc=None, dec=None, split_idx=None, order=None)

Transforms an object dtype to float (vectorized)

a = np.random.randint(0, 2, 10)
b = np.array(['1', '2', '3'])
c = np.array(['1.0', '2.0', '3.0'])
t = torch.randint(0, 2, (10, ))
test_eq(ToFloat()(a).dtype, 'float32')
test_eq(ToFloat()(b).dtype, 'float32')
test_eq(ToFloat()(c).dtype, 'float32')
test_eq(ToFloat()(t).dtype, torch.float32)
a = np.random.rand(10)*10
b = np.array(['1.0', '2.0', '3.0'])
t = torch.rand(10)*10
test_eq(ToInt()(a).dtype, 'int64')
test_eq(ToInt()(b).dtype, 'int64')
test_eq(ToInt()(t).dtype, torch.long)
t = TSClassification()
t.setup(y_on_disk[splits[0]])
y_encoded = t(y_on_disk)
print(y_encoded)
test_eq(t.decodes(y_encoded), y_on_disk)
TensorCategory([0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3,
                3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1,
                1, 1, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3])
# `alphabet` (an array of letter labels) is provided by tsai's utilities
y_multi = np.random.randint(0, 3, 20)
y_multi = np.asarray(alphabet[y_multi]).reshape(4, 5)
tfm = TSClassification()
tfm.setup(y_multi)
enc_y_multi = tfm(y_multi)
test_eq(y_multi, tfm.decode(enc_y_multi))
enc_y_multi
TensorCategory([[0, 1, 1, 1, 2],
                [0, 1, 2, 1, 0],
                [2, 1, 0, 1, 2],
                [0, 2, 0, 2, 2]])

source

TSMultiLabelClassification

 TSMultiLabelClassification (c=None, vocab=None, add_na=False, sort=True)

Reversible combined transform of multi-category strings to one-hot encoded vocab id
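
Each sample's labels are given as a list. A minimal sketch, assuming the transform follows the same setup/encode pattern as TSClassification above (a full example on real data appears near the end of this page):

y_ml = np.array([['a'], ['a', 'b'], ['b', 'c']], dtype=object)
tfm = TSMultiLabelClassification()
tfm.setup(y_ml)
enc = tfm(y_ml)  # one-hot encoded over the vocab ['a', 'b', 'c']
print(enc)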


source

TSTensorBlock

 TSTensorBlock (type_tfms=None, item_tfms=None, batch_tfms=None,
                dl_type=None, dls_kwargs=None)

Initialize self. See help(type(self)) for accurate signature.


source

NumpyTensorBlock

 NumpyTensorBlock (type_tfms=None, item_tfms=None, batch_tfms=None,
                   dl_type=None, dls_kwargs=None)

Initialize self. See help(type(self)) for accurate signature.

test_eq(NumpyTensorBlock().item_tfms[0].__name__, 'ToNumpyTensor')
test_eq(TSTensorBlock().item_tfms[0].__name__, 'ToTSTensor')

source

TSDataset

 TSDataset (X, y=None, split=None, sel_vars=None, sel_steps=None,
            types=None, dtype=None, device=None)

Initialize self. See help(type(self)) for accurate signature.


source

NumpyDataset

 NumpyDataset (X, y=None, types=None)

Initialize self. See help(type(self)) for accurate signature.


source

TorchDataset

 TorchDataset (X, y=None)

Initialize self. See help(type(self)) for accurate signature.
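
A quick sketch paralleling the NumpyDataset example below, assuming TorchDataset indexes the same way but on tensors:

a = torch.rand(5, 6, 7)
b = torch.rand(5)
ds = TorchDataset(a, b)
xb, yb = ds[[0, 4]]
test_eq(xb.shape, (2, 6, 7))
test_eq(yb.shape, (2,))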

a = np.random.rand(5,6,7)
b = np.random.rand(5)
ds = NumpyDataset(a,b)
xb, yb = ds[[0,4]]
test_eq(xb.shape, (2,6,7))
test_eq(yb.shape, (2,))

source

TSTfmdLists

 TSTfmdLists (items=None, *rest, use_list=False, match=None)

A Pipeline of tfms applied to a collection of items

| | Type | Default | Details |
|---|---|---|---|
| items | list | | Items to apply Transforms to |
| use_list | bool | None | Use list in L |

source

NoTfmLists

 NoTfmLists (items=None, *rest, use_list=False, match=None)

A Pipeline of tfms applied to a collection of items

items = X_on_disk
tl = TfmdLists(items, tfms=None, splits=splits)
test_eq(len(tl), len(X_on_disk))
test_eq(len(tl.train), len(splits[0]))
test_eq(len(tl.valid), len(splits[1]))
test_eq(tl[[0,4,7]], X_on_disk[[0,4,7]])
test_eq(tl.train[[0,4,7]], X_on_disk[splits[0][0,4,7]])
test_eq(tl.valid[[0,4,7]], X_on_disk[splits[1][0,4,7]])
test_eq(tl[0], items[0])
test_eq(tl[[0,1]], items[[0,1]])
test_eq(tl.decode(tl[0]), tl[0])
test_eq((tl.split_idx, tl.train.split_idx, tl.valid.split_idx), (None, 0, 1))
items = X_on_disk
tl = TSTfmdLists(items, tfms=None, splits=splits)
test_eq(len(tl), len(X_on_disk))
test_eq(len(tl.train), len(splits[0]))
test_eq(len(tl.valid), len(splits[1]))
test_eq(tl[[0,4,7]], X_on_disk[[0,4,7]])
test_eq(tl.train[[0,4,7]], X_on_disk[splits[0][0,4,7]])
test_eq(tl.valid[[0,4,7]], X_on_disk[splits[1][0,4,7]])
test_eq(tl[0], items[0])
test_eq(tl[[0,1]], items[[0,1]])
test_eq(tl.decode(tl[0]), tl[0])
test_eq((tl.split_idx, tl.train.split_idx, tl.valid.split_idx), (None, 0, 1))
items = X_on_disk
ntl = NoTfmLists(items, splits=splits)
test_eq(len(ntl), len(X_on_disk))
test_eq(len(ntl.train), len(splits[0]))
test_eq(len(ntl.valid), len(splits[1]))
test_eq(ntl._splits, np.arange(len(X_on_disk)))
test_eq(ntl.train._splits, np.arange(len(splits[0])))
test_eq(ntl.valid._splits, np.arange(len(splits[0]), len(X_on_disk)))
print(ntl)
print(ntl.train)
print(ntl.valid)
test_eq(ntl[[0,4,7]], X_on_disk[[0,4,7]])
test_eq(ntl.train[[0,4,7]], X_on_disk[splits[0][0,4,7]])
test_eq(ntl.valid[[0,4,7]], X_on_disk[splits[1][0,4,7]])
test_eq(ntl[0], items[0])
test_eq(ntl[[0,1]], items[[0,1]])
test_eq(ntl[:], X_on_disk)
ntl[0].shape, stack(ntl[[0,1]]).shape
test_eq(ntl.decode(ntl[0]), ntl[0])
assert id(items) == id(ntl.items) == id(ntl.train.items) == id(ntl.valid.items)
test_eq((ntl.split_idx, ntl.train.split_idx, ntl.valid.split_idx), (None, 0, 1))
NoTfmLists: memmap(60, 1, 570)
NoTfmLists: memmap(30, 1, 570)
NoTfmLists: memmap(30, 1, 570)
subitems = X_on_disk
new_ntl = ntl._new(X_on_disk)
test_eq(new_ntl[:], X_on_disk)
idxs = random_choice(len(X_on_disk), 10, False)
new_ntl = ntl._new(X_on_disk[idxs])
test_eq(new_ntl[:], X_on_disk[idxs])
idxs = random_choice(len(X_on_disk), 10, False)
new_ntl = ntl.valid._new(X_on_disk[idxs])
test_eq(new_ntl[:], X_on_disk[idxs])

source

tscoll_repr

 tscoll_repr (c, max_n=10)

String repr of up to max_n items of (possibly lazy) collection c
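
A minimal sketch on a plain list, assuming any sized collection works: only the first max_n items appear in the repr.

print(tscoll_repr(list(range(100)), max_n=3))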


source

NumpyDatasets

 NumpyDatasets (items:list=None, tfms:MutableSequence|Pipeline=None,
                tls:TfmdLists=None, n_inp:int=None, dl_type=None,
                use_list:bool=None, do_setup:bool=True,
                split_idx:int=None, train_setup:bool=True,
                splits:list=None, types=None, verbose:bool=False)

A dataset that creates tuples from X (and y) and applies tfms of type item_tfms

| | Type | Default | Details |
|---|---|---|---|
| items | list | | Items to apply Transforms to |
| tfms | MutableSequence \| Pipeline | | Transform(s) or Pipeline to apply |
| tls | NoneType | None | |
| n_inp | NoneType | None | |
| dl_type | TfmdDL | None | Type of DataLoader |
| use_list | bool | None | Use list in L |
| do_setup | bool | True | Call setup() for Transform |
| split_idx | int | None | Apply Transform(s) to training or validation set: 0 for the training set, 1 for the validation set |
| train_setup | bool | True | Apply Transform(s) only on training DataLoader |
| splits | list | None | Indices for training and validation sets |
| types | NoneType | None | Types of data in items |
| verbose | bool | False | Print verbose output |
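
A minimal sketch of NumpyDatasets, assuming it mirrors the TSDatasets API demonstrated below:

a = np.random.rand(10, 3, 20)
b = np.random.randint(0, 2, 10)
splits_toy = (np.arange(8), np.arange(8, 10))
dsets = NumpyDatasets(a, b, tfms=None, splits=splits_toy)
x0, y0 = dsets.train[0]
test_eq(x0.shape, (3, 20))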

source

TSDatasets

 TSDatasets (items:list=None, tfms:MutableSequence|Pipeline=None,
             tls:TfmdLists=None, n_inp:int=None, dl_type=None,
             use_list:bool=None, do_setup:bool=True, split_idx:int=None,
             train_setup:bool=True, splits:list=None, types=None,
             verbose:bool=False)

A dataset that creates tuples from X (and optionally y) and applies item_tfms

| | Type | Default | Details |
|---|---|---|---|
| items | list | | Items to apply Transforms to |
| tfms | MutableSequence \| Pipeline | | Transform(s) or Pipeline to apply |
| tls | NoneType | None | |
| n_inp | NoneType | None | |
| dl_type | TfmdDL | None | Type of DataLoader |
| use_list | bool | None | Use list in L |
| do_setup | bool | True | Call setup() for Transform |
| split_idx | int | None | Apply Transform(s) to training or validation set: 0 for the training set, 1 for the validation set |
| train_setup | bool | True | Apply Transform(s) only on training DataLoader |
| splits | list | None | Indices for training and validation sets |
| types | NoneType | None | Types of data in items |
| verbose | bool | False | Print verbose output |

dsets = TSDatasets(X_on_disk, y_on_disk, splits=splits, tfms=[None, TSClassification()], inplace=True)
i = random_choice(len(splits[0]), 10, False).tolist()
test_eq(dsets.subset(i), dsets.train.subset(i))
dsets.valid.subset(i)
dsets.valid.subset(i)[[0,6,8]]
test_eq(dsets.subset(i)[[0,6,8]], dsets.train.subset(i)[[0,6,8]])
dsets.subset([0,7,3])
dsets.subset(i), dsets.train.subset(i), dsets.valid.subset(i)
((#10) [(TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(2)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3))] ...],
 (#10) [(TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(2)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3))] ...],
 (#10) [(TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(2)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(3))] ...])
tfms = [None, TSClassification()]
dsets = TSDatasets(X_on_disk, y_on_disk, splits=splits, tfms=tfms, inplace=False)
assert id(X_on_disk) == id(dsets.ptls[0].items) == id(dsets.train.ptls[0].items) == id(dsets.valid.ptls[0].items)

tfms = None
dsets = TSDatasets(X_on_disk, splits=splits, tfms=tfms, inplace=False)
assert id(X_on_disk) == id(dsets.ptls[0].items) == id(dsets.train.ptls[0].items) == id(dsets.valid.ptls[0].items)

source

TSDatasets.add_unlabeled

 TSDatasets.add_unlabeled (X, inplace=True)

source

TSDatasets.add_test

 TSDatasets.add_test (X, y=None, inplace=True)

source

TSDatasets.add_dataset

 TSDatasets.add_dataset (X, y=None, inplace=True)

source

NumpyDatasets.add_unlabeled

 NumpyDatasets.add_unlabeled (X, inplace=True)

source

NumpyDatasets.add_test

 NumpyDatasets.add_test (X, y=None, inplace=True)

source

NumpyDatasets.add_dataset

 NumpyDatasets.add_dataset (X, y=None, inplace=True)

source

add_ds

 add_ds (dsets, X, y=None, inplace=True)

Create test datasets from X (and y) using validation transforms of dsets

dsets = TSDatasets(X_on_disk, y_on_disk, splits=splits, tfms=[None, TSClassification()], inplace=True)
print(dsets.train[0][0].shape, dsets.train[[0,1]][0].shape)
print(dsets.split_idx, dsets.train.split_idx, dsets.valid.split_idx)
print(dsets.new_empty())
dsets
torch.Size([1, 570]) torch.Size([2, 1, 570])
None 0 1
(#0) []
(#60) [(TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory(1))] ...]
dsets = TSDatasets(X_on_disk, y_on_disk, splits=splits, tfms=[None, TSClassification()], inplace=False)
print(dsets.train[0][0].shape, dsets.train[[0,1]][0].shape)
print(dsets.split_idx, dsets.train.split_idx, dsets.valid.split_idx)
print(dsets.new_empty())
dsets
torch.Size([1, 570]) torch.Size([2, 1, 570])
None 0 1
(#0) []
(#60) [(TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory([0])), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory([0])), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory([0])), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory([0])), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory([0])), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory([1])), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory([1])), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory([1])), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory([1])), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), TensorCategory([1]))] ...]
dsets = TSDatasets(X_on_disk, y_on_disk, tfms=[None, TSClassification()], splits=splits, inplace=True)

idxs = random_choice(len(dsets), 10, False)
test_eq(dsets[idxs][0].numpy(), X_on_disk[idxs])
test_eq(dsets[idxs][1].numpy(), y_array[idxs])

idxs = random_choice(len(dsets.train), 10, False)
test_eq(dsets.train[idxs][0].numpy(), X_on_disk[splits[0][idxs]])
test_eq(dsets.train[idxs][1].numpy(), y_array[splits[0][idxs]])

idxs = random_choice(len(dsets.valid), 10, False)
test_eq(dsets.valid[idxs][0].numpy(), X_on_disk[splits[1][idxs]])
test_eq(dsets.valid[idxs][1].numpy(), y_array[splits[1][idxs]])
dsets = TSDatasets(X_on_disk, y_on_disk, tfms=[None, TSClassification()], splits=splits, inplace=False)
assert id(X_on_disk) == id(dsets.tls[0].items) == id(dsets.ptls[0].items)
assert id(X_on_disk) == id(dsets.train.tls[0].items) == id(dsets.train.ptls[0].items)
assert id(X_on_disk) == id(dsets.valid.tls[0].items) == id(dsets.valid.ptls[0].items)

idxs = random_choice(len(dsets), 10, False)
test_eq(dsets[idxs][0].numpy(), X_on_disk[idxs])
test_eq(dsets[idxs][1].numpy(), y_array[idxs])


idxs = random_choice(len(dsets.train), 10, False)
test_eq(dsets.train[idxs][0].numpy(), X_on_disk[splits[0][idxs]])
test_eq(dsets.train[idxs][1].numpy(), y_array[splits[0][idxs]])

idxs = random_choice(len(dsets.valid), 10, False)
test_eq(dsets.valid[idxs][0].numpy(), X_on_disk[splits[1][idxs]])
test_eq(dsets.valid[idxs][1].numpy(), y_array[splits[1][idxs]])
dsets = TSDatasets(X_on_disk, splits=splits, inplace=True)

idxs = random_choice(len(dsets), 10, False)
test_eq(dsets[idxs][0].numpy(), X_on_disk[idxs])

idxs = random_choice(len(dsets.train), 10, False)
test_eq(dsets.train[idxs][0].numpy(), X_on_disk[splits[0][idxs]])

idxs = random_choice(len(dsets.valid), 10, False)
test_eq(dsets.valid[idxs][0].numpy(), X_on_disk[splits[1][idxs]])
dsets = TSDatasets(X_on_disk, splits=splits, inplace=False)
assert np.shares_memory(X_on_disk, dsets.tls[0].items)
assert np.shares_memory(X_on_disk, dsets.ptls[0].items)
assert np.shares_memory(X_on_disk, dsets.train.tls[0].items)
assert np.shares_memory(X_on_disk, dsets.train.ptls[0].items)
assert np.shares_memory(X_on_disk, dsets.valid.tls[0].items)
assert np.shares_memory(X_on_disk, dsets.valid.ptls[0].items)

idxs = random_choice(len(dsets), 10, False)
test_eq(dsets[idxs][0].numpy(), X_on_disk[idxs])

idxs = random_choice(len(dsets.train), 10, False)
test_eq(dsets.train[idxs][0].numpy(), X_on_disk[splits[0][idxs]])

idxs = random_choice(len(dsets.valid), 10, False)
test_eq(dsets.valid[idxs][0].numpy(), X_on_disk[splits[1][idxs]])
dsets = TSDatasets(X_on_disk, y_array, tfms=None, splits=splits, inplace=True)

idxs = random_choice(len(dsets), 10, False)
test_eq(dsets[idxs][0].numpy(), X_on_disk[idxs])
test_eq(dsets[idxs][1].numpy(), y_array[idxs])

idxs = random_choice(len(dsets.train), 10, False)
test_eq(dsets.train[idxs][0].numpy(), X_on_disk[splits[0][idxs]])
test_eq(dsets.train[idxs][1].numpy(), y_array[splits[0][idxs]])

idxs = random_choice(len(dsets.valid), 10, False)
test_eq(dsets.valid[idxs][0].numpy(), X_on_disk[splits[1][idxs]])
test_eq(dsets.valid[idxs][1].numpy(), y_array[splits[1][idxs]])
dsets = TSDatasets(X_on_disk, y_array, tfms=None, splits=splits, inplace=False)
assert np.shares_memory(X_on_disk, dsets.tls[0].items)
assert np.shares_memory(X_on_disk, dsets.ptls[0].items)
assert np.shares_memory(X_on_disk, dsets.train.tls[0].items)
assert np.shares_memory(X_on_disk, dsets.train.ptls[0].items)
assert np.shares_memory(X_on_disk, dsets.valid.tls[0].items)
assert np.shares_memory(X_on_disk, dsets.valid.ptls[0].items)

idxs = random_choice(len(dsets), 10, False)
test_eq(dsets[idxs][0].numpy(), X_on_disk[idxs])
test_eq(dsets[idxs][1].numpy(), y_array[idxs])

idxs = random_choice(len(dsets.train), 10, False)
test_eq(dsets.train[idxs][0].numpy(), X_on_disk[splits[0][idxs]])
test_eq(dsets.train[idxs][1].numpy(), y_array[splits[0][idxs]])

idxs = random_choice(len(dsets.valid), 10, False)
test_eq(dsets.valid[idxs][0].numpy(), X_on_disk[splits[1][idxs]])
test_eq(dsets.valid[idxs][1].numpy(), y_array[splits[1][idxs]])
dsets = TSDatasets(X_on_disk, y_on_disk, tfms=[None, TSClassification()], splits=None, inplace=True)

idxs = random_choice(len(dsets), 10, False)
test_eq(dsets[idxs][0].numpy(), X_on_disk[idxs])
test_eq(dsets[idxs][1].numpy(), y_array[idxs])
dsets = TSDatasets(X_on_disk, y_on_disk, tfms=[None, TSClassification()], splits=None, inplace=False)
assert id(X_on_disk) == id(dsets.tls[0].items) == id(dsets.ptls[0].items)
assert id(X_on_disk) == id(dsets.train.tls[0].items) == id(dsets.train.ptls[0].items)

idxs = random_choice(len(dsets), 10, False)
test_eq(dsets[idxs][0].numpy(), X_on_disk[idxs])
test_eq(dsets[idxs][1].numpy(), y_array[idxs])
dsets = TSDatasets(X_on_disk, y_array, tfms=None, splits=splits)
test_eq(dsets.train[0:10], dsets.add_dataset(X_on_disk[0:10], y_array[0:10])[:])
test_eq(dsets.train[0:10][0], dsets.add_dataset(X_on_disk[0:10])[:][0])
dsets = TSDatasets(X_on_disk, y_array, tfms=None, splits=splits)
torch.save(dsets, 'export/dsets.pth')
del dsets
dsets = torch.load('export/dsets.pth')
dsets
(#60) [(TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(1))] ...]
dsets = TSDatasets(X_on_disk, y_array, tfms=None, splits=splits)
torch.save(dsets.train, 'export/dsets.pth')
del dsets
dsets = torch.load('export/dsets.pth')
dsets
(#30) [(TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(0)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(1)), (TSTensor(vars:1, len:570, device=cpu, dtype=torch.float32), tensor(1))] ...]
dsets = TSDatasets(X_on_disk, y_array, tfms=None, splits=splits)
test_eq(len(dsets.train), len(X_train))
dsets = TSDatasets(X_on_disk, y_array, tfms=None, splits=splits)
test_eq(len(dsets.train), len(X_train))
dsets = TSDatasets(X_on_disk, y_array, tfms=[add(1), TSCategorize()], splits=splits)
test_eq(len(dsets.train), len(X_train))
# test_eq(dsets.train[0][0].data, tensor(X_train[0] + 1))
test_eq(dsets.train[0][1].item(), y_tensor[0])
dsets = TSDatasets(X_on_disk, y_on_disk, tfms=[None, TSCategorize()], splits=splits)
test_eq(len(dsets.add_test(X_train, y_train)), len(X_train))
test_eq(len(dsets.add_unlabeled(X_train)), len(X_train))
X_tensor = torch.randn(100, 4, 50)
y_tensor = torch.randint(0, 2, size=(len(X_tensor),))
tensor_splits = (np.arange(80), np.arange(80, 100))
dsets = TSDatasets(X_tensor, y_tensor, tfms=[None, TSClassification()], splits=tensor_splits)
test_eq(type(dsets[0][0]), TSTensor)

source

TSDataLoader

 TSDataLoader (dataset, bs=64, shuffle=False, drop_last=False,
               num_workers=0, verbose=False, do_setup=True, vocab=None,
               sort=False, weights=None, partial_n=None, sampler=None,
               pin_memory=False, timeout=0, batch_size=None, indexed=None,
               n=None, device=None, persistent_workers=False,
               pin_memory_device='', wif=None, before_iter=None,
               after_item=None, before_batch=None, after_batch=None,
               after_iter=None, create_batches=None, create_item=None,
               create_batch=None, retain=None, get_idxs=None, sample=None,
               shuffle_fn=None, do_batch=None)

Transformed DataLoader

| | Type | Default | Details |
|---|---|---|---|
| dataset | | | Map- or iterable-style dataset from which to load the data |
| bs | int | 64 | Size of batch |
| shuffle | bool | False | Whether to shuffle data |
| drop_last | bool | False | |
| num_workers | int | None | Number of CPU cores to use in parallel (default: all available, up to 16) |
| verbose | bool | False | Whether to print verbose logs |
| do_setup | bool | True | Whether to run setup() for batch transform(s) |
| vocab | NoneType | None | |
| sort | bool | False | |
| weights | NoneType | None | |
| partial_n | NoneType | None | |
| sampler | NoneType | None | |
| pin_memory | bool | False | |
| timeout | int | 0 | |
| batch_size | NoneType | None | |
| indexed | NoneType | None | |
| n | NoneType | None | |
| device | NoneType | None | |
| persistent_workers | bool | False | |
| pin_memory_device | str | '' | |
| wif | NoneType | None | |
| before_iter | NoneType | None | |
| after_item | NoneType | None | |
| before_batch | NoneType | None | |
| after_batch | NoneType | None | |
| after_iter | NoneType | None | |
| create_batches | NoneType | None | |
| create_item | NoneType | None | |
| create_batch | NoneType | None | |
| retain | NoneType | None | |
| get_idxs | NoneType | None | |
| sample | NoneType | None | |
| shuffle_fn | NoneType | None | |
| do_batch | NoneType | None | |

source

NumpyDataLoader

 NumpyDataLoader (dataset, bs=64, shuffle=False, drop_last=False,
                  num_workers=0, verbose=False, do_setup=True, vocab=None,
                  sort=False, weights=None, partial_n=None, sampler=None,
                  pin_memory=False, timeout=0, batch_size=None,
                  indexed=None, n=None, device=None,
                  persistent_workers=False, pin_memory_device='',
                  wif=None, before_iter=None, after_item=None,
                  before_batch=None, after_batch=None, after_iter=None,
                  create_batches=None, create_item=None,
                  create_batch=None, retain=None, get_idxs=None,
                  sample=None, shuffle_fn=None, do_batch=None)

Transformed DataLoader

| | Type | Default | Details |
|---|---|---|---|
| dataset | | | Map- or iterable-style dataset from which to load the data |
| bs | int | 64 | Size of batch |
| shuffle | bool | False | Whether to shuffle data |
| drop_last | bool | False | |
| num_workers | int | None | Number of CPU cores to use in parallel (default: all available, up to 16) |
| verbose | bool | False | Whether to print verbose logs |
| do_setup | bool | True | Whether to run setup() for batch transform(s) |
| vocab | NoneType | None | |
| sort | bool | False | |
| weights | NoneType | None | |
| partial_n | NoneType | None | |
| sampler | NoneType | None | |
| pin_memory | bool | False | |
| timeout | int | 0 | |
| batch_size | NoneType | None | |
| indexed | NoneType | None | |
| n | NoneType | None | |
| device | NoneType | None | |
| persistent_workers | bool | False | |
| pin_memory_device | str | '' | |
| wif | NoneType | None | |
| before_iter | NoneType | None | |
| after_item | NoneType | None | |
| before_batch | NoneType | None | |
| after_batch | NoneType | None | |
| after_iter | NoneType | None | |
| create_batches | NoneType | None | |
| create_item | NoneType | None | |
| create_batch | NoneType | None | |
| retain | NoneType | None | |
| get_idxs | NoneType | None | |
| sample | NoneType | None | |
| shuffle_fn | NoneType | None | |
| do_batch | NoneType | None | |

source

TSDataLoaders

 TSDataLoaders (*loaders, path='.', device=None)

Basic wrapper around several DataLoaders.


source

NumpyDataLoaders

 NumpyDataLoaders (*loaders, path='.', device=None)

Basic wrapper around several DataLoaders.


source

StratifiedSampler

 StratifiedSampler (y, bs:int=64, shuffle:bool=False,
                    drop_last:bool=False)

Sampler where batches preserve the percentage of samples for each class

| | Type | Default | Details |
|---|---|---|---|
| y | | | The target variable for supervised learning problems. Stratification is done based on the y labels. |
| bs | int | 64 | Batch size |
| shuffle | bool | False | Flag to shuffle each class's samples before splitting into batches. |
| drop_last | bool | False | Flag to drop the last incomplete batch. |

a = np.concatenate([np.zeros(90), np.ones(10)])
sampler = StratifiedSampler(a, bs=32, shuffle=True, drop_last=True)
idxs = np.array(list(iter(sampler)))
print(idxs[:32])
print(a[idxs][:32])
test_eq(a[idxs][:32].mean(), .1)
[[ 0  2  8 17 18 21 27 29 34 38 39 43 45 48 52 54 55 60 61 63 66 67 68 69
  71 73 78 80 81 84 90 92 95 99  1  6 11 12 15 16 20 23 24 28 30 33 36 37
  40 41 42 44 49 59 62 64 65 74 75 76 77 79 86 87 91 93 96  3  4  5  7  9
  10 13 14 19 22 25 26 31 32 35 46 47 50 51 53 56 57 58 70 72 82 83 85 88
  89 94 97 98]]
[[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
  0. 0. 0. 0. 0. 0. 1. 1. 1. 1. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
  0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 1. 1. 1. 0. 0. 0. 0. 0.
  0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
  0. 1. 1. 1.]]

source

get_c

 get_c (dls)
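
get_c has no docstring here; presumably it returns the number of target classes inferred from the dataloaders (dls.c). A minimal sketch under that assumption, using get_ts_dls (documented just below):

X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSClassification()], splits=splits)
print(get_c(dls))  # expected 4, since OliveOil has 4 classes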

source

get_best_dls_params

 get_best_dls_params (dls, n_iters=10, num_workers=[0, 1, 2, 4, 8],
                      pin_memory=[True, False], prefetch_factor=[2, 4, 8],
                      return_best=True, verbose=True)

source

get_best_dl_params

 get_best_dl_params (dl, n_iters=10, num_workers=[0, 1, 2, 4, 8],
                     pin_memory=[True, False], prefetch_factor=[2, 4, 8],
                     return_best=True, verbose=True)

source

get_ts_dls

 get_ts_dls (X, y=None, splits=None, sel_vars=None, sel_steps=None,
             tfms=None, inplace=True, path='.', bs=64, batch_tfms=None,
             num_workers=0, device=None, shuffle_train=True,
             drop_last=True, weights=None, partial_n=None, sampler=None,
             sort=False, **kwargs)

# Tests for the internal _check_splits helper used by get_ts_dls
a = np.arange(10)

for s in [None, np.arange(10), np.arange(10).tolist(), L(np.arange(10).tolist()), (np.arange(10).tolist(), None), (np.arange(10).tolist(), L())]:
    test_eq(_check_splits(a, s), (L(np.arange(10).tolist()), L()))

source

get_subset_dl

 get_subset_dl (dl, idxs)

source

get_ts_dl

 get_ts_dl (X, y=None, split=None, sel_vars=None, sel_steps=None,
            tfms=None, inplace=True, path='.', bs=64, batch_tfms=None,
            num_workers=0, device=None, shuffle_train=True,
            drop_last=True, weights=None, partial_n=None, sampler=None,
            sort=False, **kwargs)
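
get_ts_dl builds a single dataloader rather than a train/valid pair. A minimal sketch, assuming split takes a single list of indices:

X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
dl = get_ts_dl(X, y, tfms=[None, TSClassification()], split=splits[0], bs=8)
xb, yb = dl.one_batch()
test_eq(xb.shape, (8, 1, 570))
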
X, y, splits = get_UCR_data(dsid, on_disk=False, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSClassification()], splits=splits, bs=8)
dls = get_best_dls_params(dls, prefetch_factor=[2, 4, 8, 16])

Dataloader 0

   num_workers:  0  pin_memory: True   prefetch_factor:  2  -  time:    1.400 ms/iter
   num_workers:  0  pin_memory: False  prefetch_factor:  2  -  time:    0.620 ms/iter

   best dl params:
       best num_workers    : 0
       best pin_memory     : False
       best prefetch_factor: 2
       return_best         : True



Dataloader 1

   num_workers:  0  pin_memory: True   prefetch_factor:  2  -  time:    0.261 ms/iter
   num_workers:  0  pin_memory: False  prefetch_factor:  2  -  time:    0.306 ms/iter

   best dl params:
       best num_workers    : 0
       best pin_memory     : True
       best prefetch_factor: 2
       return_best         : True

y_int = np.random.randint(0, 4, size=len(X))
dls = get_ts_dls(X, y_int, splits=splits, bs=8)
test_eq(hasattr(dls, "vocab"), False)

dls = get_ts_dls(X, y_int, splits=splits, bs=8, vocab=[0,1,2,3])
test_eq(dls.vocab, [0,1,2,3])
test_eq(dls.c, 4)
test_eq(dls.cat, True)
X, y, splits = get_UCR_data(dsid, on_disk=False, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSClassification()], splits=splits, bs=8)
b=first(dls.train)
dls.decode(b)
test_eq(X.shape[1], dls.vars)
test_eq(X.shape[-1], dls.len)
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSClassification()], splits=splits, bs=64, inplace=True)

idxs = random_choice(len(dls.valid_ds), 10, False)
new_dl = get_subset_dl(dls.train, idxs)

idxs = random_choice(len(dls.valid_ds), 10, False)
new_dl = get_subset_dl(dls.valid, idxs)
test_eq(new_dl.one_batch()[0].cpu().numpy(), X[splits[1][idxs]])
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
weights = np.random.rand(len(X))
dls = get_ts_dls(X, y, tfms=[None, TSClassification()], splits=splits, bs=64, inplace=True, weights=weights)
weights2 = weights[splits[0]] / weights[splits[0]].sum()
test_eq(dls.train.weights, weights2)
test_eq(dls.valid.weights, None)
partial_n = 12
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
dls = get_ts_dls(X, y, splits=splits, tfms=[None, TSClassification()], bs=64, inplace=True, partial_n=partial_n)
test_eq(len(dls.train.one_batch()[0]), partial_n)

partial_n = .1
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSClassification()], bs=64, inplace=True, partial_n=partial_n)
test_eq(len(dls.train.one_batch()[0]), int(round(len(dls.train.dataset) * partial_n)))

You can now pass a sampler to a tsai dataloader.

Pass one sampler for the train set and one for the validation set. Each sampler must be built on an object with the same length as the corresponding dataset; in the example below, the splits are used.

⚠️ Remember to set shuffle=False when using a sampler, since the two are mutually exclusive. The sampler controls whether the indices are shuffled (for example, RandomSampler shuffles while SequentialSampler doesn't), so the dataloader's shuffle must always be False.

drop_last, however, is still managed by the dataloader.

X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
train_sampler = torch.utils.data.sampler.RandomSampler(splits[0])
valid_sampler = torch.utils.data.sampler.SequentialSampler(splits[1])
dls = get_ts_dls(X, y, splits=splits, tfms=[None, TSClassification()], bs=8, inplace=True,
                 shuffle=False, drop_last=True, sampler=[train_sampler, valid_sampler])
print('train')
for _ in dls.train:
    print(dls.train.idxs)
print('valid')
for _ in dls.valid:
    print(dls.valid.idxs)
train
[22, 25, 16, 3, 26, 28, 7, 18]
[5, 4, 12, 27, 29, 24, 9, 11]
[0, 2, 8, 17, 21, 20, 23, 10]
valid
[0, 1, 2, 3, 4, 5, 6, 7]
[8, 9, 10, 11, 12, 13, 14, 15]
[16, 17, 18, 19, 20, 21, 22, 23]
[24, 25, 26, 27, 28, 29]
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
train_sampler = torch.utils.data.sampler.SequentialSampler(splits[0])
valid_sampler = torch.utils.data.sampler.SequentialSampler(splits[1])
dls = get_ts_dls(X, y, splits=splits, tfms=[None, TSClassification()], bs=64, inplace=True,
                 shuffle=False, sampler=[train_sampler, valid_sampler])
test_eq(dls.get_idxs(), np.arange(len(splits[0])))
test_eq(dls.train.get_idxs(), np.arange(len(splits[0])))
test_eq(dls.valid.get_idxs(), np.arange(len(splits[1])))
xb = dls.valid.one_batch()[0].cpu().numpy()
test_close(xb, X[dls.valid.split_idxs])

X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
train_sampler = torch.utils.data.sampler.RandomSampler(splits[0])
valid_sampler = torch.utils.data.sampler.SequentialSampler(splits[1])
dls = get_ts_dls(X, y, splits=splits, tfms=[None, TSClassification()], bs=32, inplace=True,
                 shuffle=False, drop_last=True, sampler=[train_sampler, valid_sampler])
test_ne(dls.train.get_idxs(), np.arange(len(splits[0])))
test_eq(np.sort(dls.train.get_idxs()), np.arange(len(splits[0])))
test_eq(dls.valid.get_idxs(), np.arange(len(splits[1])))
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSClassification()], splits=splits, bs=64, inplace=False)

idxs = random_choice(len(dls.valid_ds), 10, False)
new_dl = get_subset_dl(dls.train, idxs)

idxs = random_choice(len(dls.valid_ds), 10, False)
new_dl = get_subset_dl(dls.valid, idxs)
test_eq(new_dl.one_batch()[0].cpu().numpy(), X[splits[1][idxs]])
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSClassification()], splits=splits, bs=8)
b = dls.one_batch()
input_idxs = dls.input_idxs
test_eq(b[0].cpu().numpy(), X[input_idxs])
b = dls.train.one_batch()
input_idxs = dls.train.input_idxs
test_eq(b[0].cpu().numpy(), X[input_idxs])
assert max(input_idxs) < len(splits[0])
b = dls.valid.one_batch()
input_idxs = dls.valid.input_idxs
test_eq(b[0].cpu().numpy(), X[input_idxs])
assert min(input_idxs) >= len(splits[0])
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSCategorize()], splits=splits, bs=8)
b=first(dls.train)
dls.decode(b)
test_eq(X.shape[1], dls.vars)
test_eq(X.shape[-1], dls.len)
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSCategorize()], splits=splits, bs=8, weights=np.random.randint(0, 3, len(y)))
b=first(dls.train)
dls.decode(b)
test_eq(X.shape[1], dls.vars)
test_eq(X.shape[-1], dls.len)
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
dsets = TSDatasets(X, y, tfms=[None, TSCategorize()], splits=splits)
ts_dls = TSDataLoaders.from_dsets(dsets.train, dsets.valid, device=default_device(), bs=4)
torch.save(ts_dls, 'export/ts_dls.pth')
del ts_dls
ts_dls = torch.load('export/ts_dls.pth')
for xb,yb in ts_dls.train:
    test_eq(tensor(X[ts_dls.train.idxs]), xb.cpu())
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSCategorize()], splits=splits, bs=4)
for xb,yb in dls.train:
    test_eq(xb.cpu().numpy(), X[dls.train.input_idxs])
for xb,yb in dls.valid:
    test_eq(xb.cpu().numpy(), X[dls.valid.input_idxs])
test_eq((ts_dls.train.shuffle, ts_dls.valid.shuffle, ts_dls.train.drop_last, ts_dls.valid.drop_last), (True, False, True, False))
dsid = 'OliveOil'
X, y, splits = get_UCR_data(dsid, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSCategorize()], splits=splits, bs=8, num_workers=0)
xb, yb = first(dls.train)
test_eq(tensor(X[dls.train.idxs]), xb.cpu())
test_eq((dls.train.shuffle, dls.valid.shuffle, dls.train.drop_last, dls.valid.drop_last), (True, False, True, False))
# multiclass
dsid = 'OliveOil'
X, y, splits = get_UCR_data(dsid, on_disk=True, split_data=False)
dls = get_ts_dls(X, y, tfms=[None, TSCategorize()], splits=splits, inplace=True)
dls.show_dist()
dls.train.show_dist()
xb,yb = first(dls.train)
test_eq((dls.cat, dls.c), (True, 4))
test_ne(dls.cws.cpu().numpy(), None)
dls.decoder((xb, ))
dls.decoder((xb[0], ))
dls.decoder((xb, yb))
dls.decoder((xb[0], yb[0]))
dls.decoder(yb)
dls.decoder(yb[0])

'1'
new_dl = dls.new_dl(X)
first(new_dl)
(TSTensor(samples:60, vars:1, len:570, device=cpu, dtype=torch.float32),)
new_dl = dls.new_dl(X, y=y)
first(new_dl)
(TSTensor(samples:60, vars:1, len:570, device=cpu, dtype=torch.float32),
 TensorCategory([2, 3, 2, 2, 0, 1, 1, 3, 3, 1, 2, 0, 0, 3, 0, 1, 0, 3, 3, 3, 1,
                 3, 3, 3, 3, 3, 0, 3, 1, 1, 3, 3, 2, 3, 3, 3, 1, 1, 3, 2, 3, 0,
                 3, 0, 3, 1, 1, 2, 1, 1, 1, 3, 3, 1, 2, 1, 1, 3, 0, 0]))
dls.train.dataset.split_idxs, dls.train.dataset.splits, dls.valid.split_idxs
(array([ 0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15, 16,
        17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29], dtype=int8),
 (#30) [0,1,2,3,4,5,6,7,8,9...],
 array([30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46,
        47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59], dtype=int8))
# a 2d input array whose X transform is None (tfms[0] is None) returns a NoTfmLists object
X, y, splits = get_UCR_data('OliveOil', on_disk=False, split_data=False)
X = X[:, 0]
tfms=[None, TSCategorize()]
dls = get_ts_dls(X, y, splits=splits, tfms=tfms, bs=8)
test_eq(1, dls.vars)
test_eq(X.shape[-1], dls.len)
test_eq(type(dls.tls[0]).__name__, 'NoTfmLists')
dls = get_ts_dls(X, y, splits=splits, tfms=tfms, bs=8, inplace=False)
test_eq(1, dls.vars)
test_eq(X.shape[-1], dls.len)
test_eq(type(dls.tls[0]).__name__, 'NoTfmLists')
# regression
dsid = 'OliveOil'
X, y, splits = get_UCR_data(dsid, on_disk=True, split_data=False)
dls = get_ts_dls(X, np.random.rand(60, ), tfms=[None, ToNumpyTensor], splits=splits)
dls.show_dist()
dls.train.show_dist()
xb,yb = first(dls.train)
dls.decoder((xb, ))
dls.decoder((xb[0], ))
dls.decoder((xb, yb))
dls.decoder((xb[0], yb[0]))
dls.decoder(yb)
dls.decoder(yb[0])
test_eq((dls.cat, dls.c), (False, 1))
test_eq(dls.cws, None)

# regression, multilabel
dsid = 'OliveOil'
X, y, splits = get_UCR_data(dsid, on_disk=True, split_data=False)
dls = get_ts_dls(X, np.random.rand(60, 3) * 5, tfms=[None, ToNumpyTensor], splits=splits)
dls.show_dist()
dls.train.show_dist()
xb,yb = first(dls.train)
dls.decoder((xb, ))
dls.decoder((xb[0], ))
dls.decoder((xb, yb))
dls.decoder((xb[0], yb[0]))
dls.decoder(yb)
dls.decoder(yb[0])
test_eq((dls.cat, dls.c, dls.d),(False, 1, 3))
test_eq(dls.cws, None)

# multiclass, multilabel
dsid = 'OliveOil'
X, y, splits = get_UCR_data(dsid, on_disk=True, split_data=False)
cm = {
    '1': 'A',
    '2': ['B', 'C'],
    '3': ['B', 'D'],
    '4': 'E',
    }
keys = cm.keys()
# normalize every value to a list of labels
new_cm = {k: listify(v) for k, v in cm.items()}
y_multi = np.array([new_cm[yi] if yi in keys else listify(yi) for yi in y], dtype=object)
dls = get_ts_dls(X, y_multi, tfms=[None, TSMultiLabelClassification()], splits=splits)
dls.show_dist()
dls.train.show_dist()
xb,yb = first(dls.train)
dls.decoder((xb, ))
dls.decoder((xb[0], ))
dls.decoder((xb, yb))
dls.decoder((xb[0], yb[0]))
dls.decoder(yb)
dls.decoder(yb[0])
test_eq((dls.cat, dls.c), (True, 5))
test_ne(dls.cws.cpu().numpy(), None)

dsid = 'OliveOil'
X, y, splits = get_UCR_data(dsid, on_disk=True, split_data=False)
cm = {
    '1': 'A',
    '2': ['B', 'C'],
    '3': ['B', 'D'],
    '4': 'E',
    }
keys = cm.keys()
# normalize every value to a list of labels
new_cm = {k: listify(v) for k, v in cm.items()}
y_multi = np.array([new_cm[yi] if yi in keys else listify(yi) for yi in y], dtype=object)
dls = get_ts_dls(X, y_multi, tfms=[None, TSMultiLabelClassification()], splits=splits)
test_eq(dls.new(X[0]).one_batch().shape, (1, 570))
test_eq(dls.new(X[:15]).one_batch().shape, (15, 1, 570))
test_eq(dls.train.new(X[0]).one_batch().shape, (1, 570))
test_eq(dls.valid.new(X[:15]).one_batch().shape, (15, 1, 570))
bs = 25
dsets = TSDatasets(X, y, tfms=[None, TSCategorize()], splits=splits)
dls   = TSDataLoaders.from_dsets(dsets.train, dsets.valid, bs=[bs, bs*2], batch_tfms=add(1), num_workers=0)
xb,yb = dls.train.one_batch()
test_eq(xb.cpu().data, tensor(X_on_disk[splits[0]][dls.train.idxs]) + 1)
dsets = TSDatasets(X, y, tfms=[None, TSCategorize()], splits=splits)
dls   = TSDataLoaders.from_dsets(dsets.train, dsets.valid, bs=[bs, bs*2])
xb,yb = dls.train.one_batch()
test_eq(xb.shape, (min(bs, len(splits[0])), X.shape[1], X.shape[-1]))
it = iter(dls.valid)
for xb,yb in it:
    test_close(xb.cpu(), TSTensor(X[splits[1]][dls.valid.idxs]))
bs = 64
dsets = TSDatasets(X, y, tfms=[add(1), TSCategorize()], splits=RandomSplitter(valid_pct=.3)(y_array))
dls = TSDataLoaders.from_dsets(dsets.train, dsets.valid, bs=[bs, bs*2])
xb,yb = dls.train.one_batch()
test_eq(xb.shape, (min(bs, len(dsets.train)), X_on_disk.shape[1], X_on_disk.shape[-1]))
xb,yb = dls.valid.one_batch()
test_eq(xb.shape, (min(bs*2, len(dsets.valid)), X_on_disk.shape[1], X_on_disk.shape[-1]))
dsets = TSDatasets(X_on_disk, y_array, tfms=[None, TSCategorize()], splits=splits)
dls   = TSDataLoaders.from_dsets(dsets.train, dsets.valid, bs=[32, 64])
for i in range(10):
    dl = dls.train if random.random() < .5 else dls.valid
    xb,yb = dl.one_batch()
    torch.equal(xb.cpu(), TSTensor(X_on_disk[dl.input_idxs]))

dsets = TSDatasets(X_on_disk, y_array, tfms=[None, TSCategorize()])
dls   = TSDataLoaders.from_dsets(dsets, bs=32)
for i in range(10):
    xb,yb = dls.one_batch()
    torch.equal(xb.cpu(), TSTensor(X_on_disk[dls.input_idxs]))

dsets = TSDatasets(X_on_disk, tfms=None)
dls   = TSDataLoaders.from_dsets(dsets, bs=32)
for i in range(10):
    xb = dls.one_batch()
    torch.equal(xb[0].cpu(), TSTensor(X_on_disk[dls.input_idxs]))
dsets = TSDatasets(X_on_disk, y_array, tfms=[None, TSCategorize()])
dls   = TSDataLoaders.from_dsets(dsets, bs=32)
test_eq(dls.split_idxs, L(np.arange(len(X_on_disk)).tolist()))
X, y, splits = get_UCR_data('NATOPS', return_split=False)
tfms  = [None, [TSCategorize()]]
dls = get_ts_dls(X, y, tfms=tfms, splits=splits, bs=[64, 128])
dls.show_batch()
dls.show_dist()

# test passing a list with categories instead of a numpy array
dsid = 'NATOPS'
bs = 64
X2, y2, splits2 = get_UCR_data(dsid, return_split=False)
vocab = sorted(set(y))
tfms = [None, [TSCategorize(vocab=vocab)]]
dsets = TSDatasets(X2, y2, tfms=tfms, splits=splits2)
dls = TSDataLoaders.from_dsets(dsets.train, dsets.valid, bs=[bs, bs*2])
dls.train.one_batch()
(TSTensor(samples:64, vars:24, len:51, device=cpu, dtype=torch.float32),
 TensorCategory([0, 3, 0, 5, 0, 0, 5, 3, 3, 1, 2, 0, 0, 2, 5, 2, 2, 4, 5, 3, 2,
                 4, 2, 1, 1, 0, 1, 2, 0, 4, 4, 4, 4, 2, 0, 0, 3, 3, 0, 5, 4, 3,
                 2, 5, 5, 2, 2, 4, 3, 0, 2, 4, 4, 5, 5, 0, 5, 3, 2, 1, 0, 3, 4,
                 2]))
# MultiCategory
bs = 64
n_epochs = 100
tfms = [None, [MultiCategorize()]]
dsets = TSDatasets(X2, y2, tfms=tfms, splits=splits2)
dls = TSDataLoaders.from_dsets(dsets.train, dsets.valid, bs=bs)
dls.train.one_batch()
(TSTensor(samples:64, vars:24, len:51, device=cpu, dtype=torch.float32),
 TensorMultiCategory([[7, 0, 1],
                      [4, 0, 1],
                      [7, 0, 1],
                      [5, 0, 1],
                      [2, 0, 1],
                      [2, 0, 1],
                      [2, 0, 1],
                      [7, 0, 1],
                      [5, 0, 1],
                      [3, 0, 1],
                      [6, 0, 1],
                      [7, 0, 1],
                      [3, 0, 1],
                      [6, 0, 1],
                      [7, 0, 1],
                      [7, 0, 1],
                      [6, 0, 1],
                      [7, 0, 1],
                      [5, 0, 1],
                      [3, 0, 1],
                      [3, 0, 1],
                      [7, 0, 1],
                      [7, 0, 1],
                      [2, 0, 1],
                      [4, 0, 1],
                      [4, 0, 1],
                      [2, 0, 1],
                      [4, 0, 1],
                      [6, 0, 1],
                      [2, 0, 1],
                      [2, 0, 1],
                      [5, 0, 1],
                      [2, 0, 1],
                      [5, 0, 1],
                      [4, 0, 1],
                      [7, 0, 1],
                      [2, 0, 1],
                      [3, 0, 1],
                      [4, 0, 1],
                      [6, 0, 1],
                      [2, 0, 1],
                      [7, 0, 1],
                      [2, 0, 1],
                      [3, 0, 1],
                      [4, 0, 1],
                      [5, 0, 1],
                      [5, 0, 1],
                      [2, 0, 1],
                      [5, 0, 1],
                      [2, 0, 1],
                      [3, 0, 1],
                      [5, 0, 1],
                      [6, 0, 1],
                      [7, 0, 1],
                      [5, 0, 1],
                      [2, 0, 1],
                      [7, 0, 1],
                      [4, 0, 1],
                      [5, 0, 1],
                      [6, 0, 1],
                      [7, 0, 1],
                      [4, 0, 1],
                      [7, 0, 1],
                      [3, 0, 1]]))

The combination of splits, sel_vars and sel_steps is very powerful, as it allows you to perform advanced indexing of the array-like X.

from tsai.data.validation import TSSplitter
X = np.arange(16*5*50).reshape(16,5,50)
y = alphabet[np.random.randint(0,3, 16)]
splits = TSSplitter(show_plot=False)(y)
tfms = [None, TSCategorize()]
batch_tfms = None
dls = get_ts_dls(X, y, splits=splits, sel_vars=[0, 1, 3], sel_steps=slice(-10, None), tfms=tfms, batch_tfms=batch_tfms)
xb,yb=dls.train.one_batch()
test_close(X[dls.input_idxs][:, [0, 1, 3]][...,slice(-10, None)], xb.cpu().numpy())
new_dl = dls.train.new_dl(X[:5], y[:5])
print(new_dl.one_batch())
new_empty_dl = dls.new_empty() # when exported
dl = new_empty_dl.new_dl(X[:10], y[:10], bs=64) # after export
dl.one_batch()
(TSTensor(samples:5, vars:3, len:10, device=cpu, dtype=torch.int64), TensorCategory([2, 2, 2, 2, 2]))
(TSTensor(samples:10, vars:3, len:10, device=cpu, dtype=torch.int64),
 TensorCategory([2, 2, 2, 0, 2, 2, 0, 2, 1, 1]))

source

get_dl_percent_per_epoch

 get_dl_percent_per_epoch (dl, model, n_batches=None)

source

get_time_per_batch

 get_time_per_batch (dl, model=None, n_batches=None)
X, y, splits = get_UCR_data('NATOPS', split_data=False)
tfms  = [None, [TSCategorize()]]
dls = get_ts_dls(X, y, tfms=tfms, splits=splits)
train_dl = dls.train
xb, _ = train_dl.one_batch()
model = nn.Linear(xb.shape[-1], 2).to(xb.device)
t = get_dl_percent_per_epoch(train_dl, model, n_batches=10)
print(t)
93.70%
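
get_time_per_batch can be used in the same way to benchmark batch-loading (and, optionally, forward-pass) speed. A minimal sketch reusing the dataloader and model above, assuming it returns an average time per batch:

t = get_time_per_batch(train_dl, model=model, n_batches=10)
print(t)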