in sagemaker/source/dl_utils/dataset.py [0:0]
def select_data(self, **kwargs):
    '''
    Select the rows whose vehicle properties match every given criterion.

    Each keyword argument names a column of ``self.vehicle_properties`` and
    gives the value that column must equal. Criteria are combined with a
    logical AND. When no criteria are given, every row is selected.

    Parameters:
    -----------
    **kwargs: {}
        Dictionary where keys are the column names and values are the
        target selection.

    Returns:
    --------
    named_tuple with data, labels, and vehicle_properties, each restricted
    to the rows that satisfy all criteria.

    Usage:
    ------
    To select freightliners,
    > train_ds.select_data(make="FREIGHTLINER")
    To select 2016 freightliners that use diesel
    > train_ds.select_data(make="FREIGHTLINER", model_year=2016, fuel_type="diesel")
    To select everything,
    > train_ds.select_data()
    '''
    # Seed the mask as boolean, not the float64 that np.ones defaults to:
    # with no criteria the seed itself is used as the index, and a float
    # array is rejected as an index.
    row_mask = np.ones(shape=(self.vehicle_properties.shape[0]), dtype=bool)
    for header, selection in kwargs.items():
        matches = self.vehicle_properties[header] == selection
        row_mask = np.logical_and(row_mask, matches)

    # NOTE(review): assumes data, labels and vehicle_properties are aligned
    # row-for-row along their first axis -- confirm against the loader.
    Selected_data = collections.namedtuple('Selected_data', 'data labels vehicle_properties')
    return Selected_data(data=self.data[row_mask],
                         labels=self.labels[row_mask],
                         vehicle_properties=self.vehicle_properties[row_mask])