core/src/main/scala/com/microsoft/azure/synapse/ml/stages/SummarizeData.scala (4 lines): - line 227: //TODO: StructField("Range", DoubleType, true), - line 228: //TODO: StructField("Mean", DoubleType, true), - line 229: //TODO: StructField("Mean Deviation", DoubleType, true), - line 231: //TODO: StructField("Mode", StringType, true)) deep-learning/src/main/scala/com/microsoft/azure/synapse/ml/cntk/CNTKModel.scala (4 lines): - line 56: val fvv = new FloatVectorVector() //TODO try re-using - line 62: val dvv = new DoubleVectorVector() //TODO try re-using - line 165: // TODO: investigate using destroy() - line 504: // TODO: The cache call is a workaround for issue 1075: core/src/main/scala/com/microsoft/azure/synapse/ml/train/ComputeModelStatistics.scala (3 lines): - line 258: // TODO: We call cache in order to avoid a bug with catalyst where CMS seems to get stuck in a loop - line 282: // TODO: We call cache in order to avoid a bug with catalyst where CMS seems to get stuck in a loop - line 312: // TODO: We call cache in order to avoid a bug with catalyst where CMS seems to get stuck in a loop core/src/main/scala/com/microsoft/azure/synapse/ml/train/TrainRegressor.scala (2 lines): - line 73: // TODO: Handle DateType, TimestampType and DecimalType for label - line 159: // Update the schema - TODO: create method that would generate GUID and add it to the scored model pipeline.yaml (2 lines): - line 588: PACKAGE: "flaky" #TODO fix flaky test so isolation is not needed - line 591: PACKAGE: "lightgbm.split1" #TODO speed up LGBM Tests and remove split core/src/main/scala/org/apache/spark/sql/execution/streaming/DistributedHTTPSource.scala (2 lines): - line 223: // TODO do this by hooking deeper into spark, - line 224: // TODO allow for dynamic allocation core/src/main/scala/com/microsoft/azure/synapse/ml/codegen/Wrappable.scala (2 lines): - line 61: //case _: Param[String] => StringInfo //TODO fix erasure issues - line 124: // TODO add default values core/src/main/scala/com/microsoft/azure/synapse/ml/core/schema/Categoricals.scala (2 lines): - line 157: val numLevels: Int = levels.length //TODO: add the maximum possible number of levels? - line 208: //TODO: add tests to ensure deep-learning/src/main/scala/com/microsoft/azure/synapse/ml/cntk/ImageFeaturizer.scala (1 line): - line 110: //TODO make nulls pass through deep-learning/src/main/scala/com/microsoft/azure/synapse/ml/cntk/CNTKFunctionParam.scala (1 line): - line 40: // TODO make this check more robust vw/src/main/scala/com/microsoft/azure/synapse/ml/vw/featurizer/StringSplitFeaturizer.scala (1 line): - line 31: * TODO: expose as user configurable parameter core/src/main/scala/com/microsoft/azure/synapse/ml/nn/BallTree.scala (1 line): - line 61: //TODO: Check if not using squared euclidean distance is ok core/src/main/scala/com/microsoft/azure/synapse/ml/io/http/HTTPSchema.scala (1 line): - line 51: case _: SocketException => Array() //TODO investigate why sockets fail sometimes cognitive/src/main/scala/com/microsoft/azure/synapse/ml/cognitive/MultivariateAnomalyDetection.scala (1 line): - line 287: // TODO: do we have to worry about locale? core/src/main/scala/com/microsoft/azure/synapse/ml/core/metrics/MetricUtils.scala (1 line): - line 41: // TODO: evaluate all models; for now, get first model name found opencv/src/main/scala/com/microsoft/azure/synapse/ml/opencv/ImageTransformer.scala (1 line): - line 607: // TODO: figure out more elegant way vw/src/main/scala/com/microsoft/azure/synapse/ml/vw/VowpalWabbitBaseModel.scala (1 line): - line 102: // TODO: surface prediction confidence cognitive/src/main/scala/com/microsoft/azure/synapse/ml/cognitive/SpeechToText.scala (1 line): - line 119: //TODO figure out why build machines don't have proper codecs project/build.scala (1 line): - line 53: //TODO figure out why this doesent work core/src/main/scala/com/microsoft/azure/synapse/ml/exploratory/FeatureBalanceMeasure.scala (1 line): - line 95: // TODO (for v2): support regression scenarios vw/src/main/scala/com/microsoft/azure/synapse/ml/vw/VowpalWabbitFeaturizer.scala (1 line): - line 167: // TODO: list types cognitive/src/main/scala/com/microsoft/azure/synapse/ml/cognitive/SpeechToTextSDK.scala (1 line): - line 529: // TODO fix this spelling in 1.15 update core/src/main/scala/com/microsoft/azure/synapse/ml/train/ComputePerInstanceStatistics.scala (1 line): - line 109: // TODO: This should be based on the retrieved score value kind core/src/main/scala/org/apache/spark/ml/ComplexParamsSerializer.scala (1 line): - line 145: * TODO: Consider adding check for correct class name. core/src/main/scala/com/microsoft/azure/synapse/ml/core/utils/ClusterUtil.scala (1 line): - line 156: //TODO make this less brittle core/src/main/scala/com/microsoft/azure/synapse/ml/image/UnrollImage.scala (1 line): - line 49: //TODO: is there a better way to convert to unsigned byte? core/src/main/scala/com/microsoft/azure/synapse/ml/train/TrainClassifier.scala (1 line): - line 313: // Update the schema - TODO: create method that would generate GUID and add it to the scored model cognitive/src/main/scala/com/microsoft/azure/synapse/ml/cognitive/RESTHelpers.scala (1 line): - line 47: //TODO use this elsewhere cognitive/src/main/scala/com/microsoft/azure/synapse/ml/cognitive/TextAnalytics.scala (1 line): - line 545: // TODO refactor to remove duplicate from TextAnalyticsBase core/src/main/python/synapse/ml/io/http/HTTPFunctions.py (1 line): - line 23: # TODO figure out why we cannot just grab from SparkContext on databricks core/src/main/scala/com/microsoft/azure/synapse/ml/exploratory/DistributionBalanceMeasure.scala (1 line): - line 92: // TODO (for v2): Introduce a referenceDistribution function param for user to override the uniform distribution