Dataset Base and Meta

Base Classes for Datasets

Base DataFrame Dataset (DFSet)


source

BaseDataFrameDataset

 BaseDataFrameDataset (df:pandas.core.frame.DataFrame=<factory>)

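Example

Build a small frame with a non-unique index, wrap it in a trivial subclass, and compare the three indexers. As the outputs below show, `iloc` selects by row position; `loc` selects by index label and keeps the matching rows in their original order; `cloc` selects whole categories (by position in `cloc.cindex.categories`, or by a `pd.Index` of labels) and returns the rows grouped by category. The data is random and no seed is set in this snippet, so re-running it will produce different values.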

df = pd.DataFrame(
    np.random.randint(0, 10, (10, 3)), 
    index=np.random.choice('a b c'.split(), 10),
    columns='x y z'.split()
)
df.head()
x y z
b 7 5 7
a 0 9 0
c 5 6 9
a 1 3 9
b 8 2 4
class DataFrameDataSetTest(BaseDataFrameDataset):
    pass
ds = DataFrameDataSetTest(df)
ds.iloc[0]
x    7
y    5
z    7
Name: b, dtype: int64
ds.cloc[0]
x y z
a 0 9 0
a 1 3 9
ds.cloc.cindex.get_indexer_for(['a'])
array([1, 3])
ds.cloc.icat(0)
['a']
ds.loc['a']
x y z
a 0 9 0
a 1 3 9
ds.iloc[:2]
x y z
b 7 5 7
a 0 9 0
ds.cloc.cindex.categories[:2]
Index(['a', 'b'], dtype='object')
ds.loc[['a', 'b']]
x y z
b 7 5 7
a 0 9 0
a 1 3 9
b 8 2 4
b 0 9 2
b 2 3 4
ds.loc[pd.Index(['a', 'b'])]
x y z
b 7 5 7
a 0 9 0
a 1 3 9
b 8 2 4
b 0 9 2
b 2 3 4
ds.loc[['a', 'b']]
x y z
b 7 5 7
a 0 9 0
a 1 3 9
b 8 2 4
b 0 9 2
b 2 3 4
ds.df.iloc[ds.cloc.cindex.get_indexer_for(['a', 'b'])]
x y z
a 0 9 0
a 1 3 9
b 7 5 7
b 8 2 4
b 0 9 2
b 2 3 4
ds.cloc[pd.Index(['a', 'b'])]
x y z
a 0 9 0
a 1 3 9
b 7 5 7
b 8 2 4
b 0 9 2
b 2 3 4
ds.cloc[:2]
x y z
a 0 9 0
a 1 3 9
b 7 5 7
b 8 2 4
b 0 9 2
b 2 3 4