cpdbench.examples.ExampleDatasets

 1import pathlib
 2
 3import numpy as np
 4
 5from cpdbench.dataset.CPD2DFromFileDataset import CPD2DFromFileDataset
 6from cpdbench.dataset.CPDNdarrayDataset import CPDNdarrayDataset
 7
 8
 9def get_extreme_large_dataset_from_file(validation_amount=-1):
10    path = pathlib.Path(__file__).parent.resolve()
11    path = path.joinpath("data", "very_big_numpy_file.dat")
12    dataset = CPD2DFromFileDataset(str(path), "float32", [5, 245, 255, 256, 25], validation_amount)
13    return dataset
14
15
def dataset_get_apple_dataset():
    """Load the bundled ``apple.npy`` example as a ``CPDNdarrayDataset``.

    Only column 0 of the stored array is used; it is reshaped to a single
    row of shape ``(1, n)`` before being wrapped in the dataset.

    Returns:
        A ``CPDNdarrayDataset`` built from the reshaped series and the index
        list ``[337]``.
    """
    module_dir = pathlib.Path(__file__).parent.resolve()
    loaded = np.load(str(module_dir / "data" / "apple.npy"))
    first_column = loaded[:, 0]
    single_row = np.reshape(first_column, (1, first_column.size))
    # NOTE(review): 337 is presumably the annotated change point of this
    # series -- confirm against CPDNdarrayDataset.
    return CPDNdarrayDataset(single_row, [337])
23
24
def dataset_get_bitcoin_dataset():
    """Load the bundled ``bitcoin.npy`` example as a ``CPDNdarrayDataset``.

    Only column 0 of the stored array is used; it is reshaped to a single
    row of shape ``(1, n)`` before being wrapped in the dataset.

    Returns:
        A ``CPDNdarrayDataset`` built from the reshaped series and the index
        list ``[569]``.
    """
    module_dir = pathlib.Path(__file__).parent.resolve()
    loaded = np.load(str(module_dir / "data" / "bitcoin.npy"))
    first_column = loaded[:, 0]
    single_row = np.reshape(first_column, (1, first_column.size))
    # NOTE(review): 569 is presumably the annotated change point of this
    # series -- confirm against CPDNdarrayDataset.
    return CPDNdarrayDataset(single_row, [569])
def get_extreme_large_dataset_from_file(validation_amount=-1):
    """Create the example dataset backed by ``very_big_numpy_file.dat``.

    The file is resolved relative to this module's own directory
    (``<module dir>/data/very_big_numpy_file.dat``).

    Args:
        validation_amount: Passed through unchanged to
            ``CPD2DFromFileDataset``; its semantics are defined there.

    Returns:
        A ``CPD2DFromFileDataset`` constructed with the file path, the dtype
        string ``"float32"`` and the index list ``[5, 245, 255, 256, 25]``.
    """
    data_file = pathlib.Path(__file__).parent.resolve() / "data" / "very_big_numpy_file.dat"
    return CPD2DFromFileDataset(
        str(data_file),
        "float32",
        [5, 245, 255, 256, 25],
        validation_amount,
    )
def dataset_get_apple_dataset():
    """Load the bundled ``apple.npy`` example as a ``CPDNdarrayDataset``.

    Column 0 of the stored array is extracted and reshaped to ``(1, n)``
    before it is handed to the dataset class together with ``[337]``.

    Returns:
        The resulting ``CPDNdarrayDataset``.
    """
    npy_file = pathlib.Path(__file__).parent.resolve() / "data" / "apple.npy"
    values = np.load(str(npy_file))[:, 0]
    return CPDNdarrayDataset(np.reshape(values, (1, values.size)), [337])
def dataset_get_bitcoin_dataset():
    """Load the bundled ``bitcoin.npy`` example as a ``CPDNdarrayDataset``.

    Column 0 of the stored array is extracted and reshaped to ``(1, n)``
    before it is handed to the dataset class together with ``[569]``.

    Returns:
        The resulting ``CPDNdarrayDataset``.
    """
    npy_file = pathlib.Path(__file__).parent.resolve() / "data" / "bitcoin.npy"
    values = np.load(str(npy_file))[:, 0]
    return CPDNdarrayDataset(np.reshape(values, (1, values.size)), [569])