def _guess_variable_type()

in ml-tools-python/awspyml.py [0:0]


    def _guess_variable_type(self, samples):
        counts = {
            "NUMERIC": 0,
            "BINARY": 0,
            "TEXT": 0,
            "CATEGORICAL": 0,
        }
        for sample in samples:
            try:
                num = float(sample)
                counts["NUMERIC"] += 1
                if num == 0 or num == 1:
                    counts["BINARY"] += 1
            except:
                # Non-numeric
                word_count = len(re.split("\s+", sample))
                if word_count > self.text_words_threshold:
                    counts["TEXT"] += 1
                else:
                    counts["CATEGORICAL"] += 1
        return max(counts, key=counts.get)