Source code for tic

'''Top-level package for TIC.'''

__author__ = '''Tom Martensen'''
__email__ = '[email protected]'
__version__ = '0.2.0'

import pandas as pd
from sklearn.datasets import load_breast_cancer
from sklearn.model_selection import train_test_split


[docs]def load_test_data(): ''' Loads the breast cancer test dataset from sklearn and prepares it for the examples. ''' data = load_breast_cancer() X = pd.DataFrame(data.data, columns=data.feature_names) y = pd.Series(data.target, name=data.target_names[1]) X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=42) dataset = dict(zip( ['X_train', 'X_test', 'y_train', 'y_test'], [X_train, X_test, y_train, y_test] )) return { 'target_names': data.target_names, 'feature_names': data.feature_names, 'dataset': dataset }