@@ -76,7 +76,7 @@ def __init__(self, dataset_id=None, name=None, version=None, description=None,
7676 self .features = features
7777
7878 if data_file is not None :
79- if ( self ._data_contains_string_features () == False ):
79+ if self ._data_features_supported ( ):
8080 self .data_pickle_file = data_file .replace ('.arff' , '.pkl' )
8181
8282 if os .path .exists (self .data_pickle_file ):
@@ -137,7 +137,7 @@ def _get_arff(self, format):
137137 # 32 bit system...currently 120mb (just a little bit more than covtype)
138138 import struct
139139
140- if ( self ._data_contains_string_features () ):
140+ if not self ._data_features_supported ( ):
141141 raise PyOpenMLError ('Dataset not compatible, PyOpenML cannot handle string features' )
142142
143143 filename = self .data_file
@@ -180,7 +180,7 @@ def get_data(self, target=None, target_dtype=int, include_row_id=False,
180180 """
181181 rval = []
182182
183- if ( self ._data_contains_string_features () ):
183+ if not self ._data_features_supported ( ):
184184 raise PyOpenMLError ('Dataset not compatible, PyOpenML cannot handle string features' )
185185
186186 path = self .data_pickle_file
@@ -348,10 +348,10 @@ def _to_xml(self):
348348 xml_dataset += "</oml:data_set_description>"
349349 return xml_dataset
350350
351- def _data_contains_string_features (self ):
352- if ( self .features is not None ) :
351+ def _data_features_supported (self ):
352+ if self .features is not None :
353353 for feature in self .features ['oml:feature' ]:
354- if ( feature ['oml:data_type' ] == 'string' ) :
355- return True
356- return False
357- return False
354+ if feature ['oml:data_type' ] not in [ 'numeric' , 'nominal' ] :
355+ return False
356+ return True
357+ return True
0 commit comments