in ml-tools-python/awspyml.py [0:0]
def _guess_variable_type(self, samples):
    """Guess a variable type name from a collection of sample values.

    Every sample is tallied into one or more buckets:

    * a sample accepted by ``float()`` counts as ``"NUMERIC"``, and also
      as ``"BINARY"`` when its value equals 0 or 1;
    * any other sample is split on runs of whitespace; it counts as
      ``"TEXT"`` when the number of resulting pieces is greater than
      ``self.text_words_threshold`` and as ``"CATEGORICAL"`` otherwise.

    Args:
        samples: Iterable of sample values (NOTE(review): presumably
            strings read from a data file -- confirm against the caller).

    Returns:
        One of ``"NUMERIC"``, ``"BINARY"``, ``"TEXT"`` or ``"CATEGORICAL"``:
        the bucket with the highest count.  ``"BINARY"`` is returned when
        the numeric bucket wins and every numeric sample was 0 or 1.
        With no samples at all the result is ``"NUMERIC"``.

    Raises:
        TypeError: If a sample is neither convertible by ``float()`` nor
            usable as input to ``re.split``.
    """
    counts = {
        "NUMERIC": 0,
        "BINARY": 0,
        "TEXT": 0,
        "CATEGORICAL": 0,
    }
    for sample in samples:
        try:
            num = float(sample)
        except (TypeError, ValueError):
            # Non-numeric: classify by the number of whitespace-separated
            # pieces.
            word_count = len(re.split(r"\s+", sample))
            if word_count > self.text_words_threshold:
                counts["TEXT"] += 1
            else:
                counts["CATEGORICAL"] += 1
        else:
            counts["NUMERIC"] += 1
            if num in (0, 1):
                counts["BINARY"] += 1

    # max() returns the first key with the highest count, following the
    # dict's insertion order above.
    best = max(counts, key=counts.get)

    # BINARY is only ever incremented together with NUMERIC, so it can at
    # best tie with it and would never be selected by max() alone.  When
    # every numeric sample was 0 or 1, report the more specific type.
    if (
        best == "NUMERIC"
        and counts["NUMERIC"] > 0
        and counts["BINARY"] == counts["NUMERIC"]
    ):
        return "BINARY"
    return best