diff --git a/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/BucketizerTests.cs b/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/BucketizerTests.cs
index 48c7fdf89..11037bc6d 100644
--- a/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/BucketizerTests.cs
+++ b/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/BucketizerTests.cs
@@ -3,6 +3,8 @@
 // See the LICENSE file in the project root for more information.
 
 using System.Collections.Generic;
+using System.IO;
+using Microsoft.Spark.E2ETest.Utils;
 using Microsoft.Spark.ML.Feature;
 using Microsoft.Spark.Sql;
 using Xunit;
@@ -47,6 +49,15 @@ public void TestBucketizer()
             Assert.Equal(expectedInputCol, bucketizer.GetInputCol());
             Assert.Equal(expectedOutputCol, bucketizer.GetOutputCol());
             Assert.Equal(expectedSplits, bucketizer.GetSplits());
+
+            using (var tempDirectory = new TemporaryDirectory())
+            {
+                string savePath = Path.Join(tempDirectory.Path, "bucket");
+                bucketizer.Save(savePath);
+
+                Bucketizer loadedBucketizer = Bucketizer.Load(savePath);
+                Assert.Equal(bucketizer.Uid(), loadedBucketizer.Uid());
+            }
         }
 
         [Fact]
diff --git a/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/HashingTFTests.cs b/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/HashingTFTests.cs
new file mode 100644
index 000000000..7b6882bea
--- /dev/null
+++ b/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/HashingTFTests.cs
@@ -0,0 +1,65 @@
+// Licensed to the .NET Foundation under one or more agreements.
+// The .NET Foundation licenses this file to you under the MIT license.
+// See the LICENSE file in the project root for more information.
+
+using System;
+using System.Collections.Generic;
+using System.IO;
+using System.Linq;
+using Microsoft.Spark.E2ETest.Utils;
+using Microsoft.Spark.ML.Feature;
+using Microsoft.Spark.Sql;
+using Xunit;
+
+namespace Microsoft.Spark.E2ETest.IpcTests.ML.Feature
+{
+    [Collection("Spark E2E Tests")]
+    public class HashingTFTests
+    {
+        private readonly SparkSession _spark;
+
+        public HashingTFTests(SparkFixture fixture)
+        {
+            _spark = fixture.Spark;
+        }
+
+        [Fact]
+        public void TestHashingTF()
+        {
+            string expectedInputCol = "input_col";
+            string expectedOutputCol = "output_col";
+            int expectedFeatures = 10;
+
+            Assert.IsType<HashingTF>(new HashingTF());
+
+            HashingTF hashingTf = new HashingTF("my-unique-id")
+                .SetNumFeatures(expectedFeatures)
+                .SetInputCol(expectedInputCol)
+                .SetOutputCol(expectedOutputCol);
+
+            Assert.Equal(expectedFeatures, hashingTf.GetNumFeatures());
+            Assert.Equal(expectedInputCol, hashingTf.GetInputCol());
+            Assert.Equal(expectedOutputCol, hashingTf.GetOutputCol());
+
+            DataFrame input = _spark.Sql("SELECT array('this', 'is', 'a', 'string', 'a', 'a')" +
+                " as input_col");
+
+            DataFrame output = hashingTf.Transform(input);
+            DataFrame outputVector = output.Select(expectedOutputCol);
+
+            Assert.Contains(expectedOutputCol, outputVector.Columns());
+
+            using (var tempDirectory = new TemporaryDirectory())
+            {
+                string savePath = Path.Join(tempDirectory.Path, "hashingTF");
+                hashingTf.Save(savePath);
+
+                HashingTF loadedHashingTf = HashingTF.Load(savePath);
+                Assert.Equal(hashingTf.Uid(), loadedHashingTf.Uid());
+            }
+
+            hashingTf.SetBinary(true);
+            Assert.True(hashingTf.GetBinary());
+        }
+    }
+}
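The SetBinary(true) call at the end of the test above switches HashingTF into binary mode, which, per the class documentation added later in this diff, clamps every non-zero term count to 1. A rough plain-C# sketch of that effect (the counts are made up for illustration):

    using System;

    double[] termCounts = { 3.0, 0.0, 2.0, 1.0 };
    // Binary mode: any non-zero count becomes 1, zeros stay 0.
    double[] binaryCounts = Array.ConvertAll(termCounts, c => c > 0 ? 1.0 : 0.0);
    // binaryCounts == { 1.0, 0.0, 1.0, 1.0 }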
diff --git a/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/IDFModelTests.cs b/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/IDFModelTests.cs
new file mode 100644
index 000000000..623b7322c
--- /dev/null
+++ b/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/IDFModelTests.cs
@@ -0,0 +1,70 @@
+// Licensed to the .NET Foundation under one or more agreements.
+// The .NET Foundation licenses this file to you under the MIT license.
+// See the LICENSE file in the project root for more information.
+
+using System.IO;
+using Microsoft.Spark.E2ETest.Utils;
+using Microsoft.Spark.ML.Feature;
+using Microsoft.Spark.Sql;
+using Xunit;
+
+namespace Microsoft.Spark.E2ETest.IpcTests.ML.Feature
+{
+    [Collection("Spark E2E Tests")]
+    public class IDFModelTests
+    {
+        private readonly SparkSession _spark;
+
+        public IDFModelTests(SparkFixture fixture)
+        {
+            _spark = fixture.Spark;
+        }
+
+        [Fact]
+        public void TestIDFModel()
+        {
+            int expectedDocFrequency = 1980;
+            string expectedInputCol = "rawFeatures";
+            string expectedOutputCol = "features";
+
+            DataFrame sentenceData =
+                _spark.Sql("SELECT 0.0 as label, 'Hi I heard about Spark' as sentence");
+
+            Tokenizer tokenizer = new Tokenizer()
+                .SetInputCol("sentence")
+                .SetOutputCol("words");
+
+            DataFrame wordsData = tokenizer.Transform(sentenceData);
+
+            HashingTF hashingTF = new HashingTF()
+                .SetInputCol("words")
+                .SetOutputCol(expectedInputCol)
+                .SetNumFeatures(20);
+
+            DataFrame featurizedData = hashingTF.Transform(wordsData);
+
+            IDF idf = new IDF()
+                .SetInputCol(expectedInputCol)
+                .SetOutputCol(expectedOutputCol)
+                .SetMinDocFreq(expectedDocFrequency);
+
+            IDFModel idfModel = idf.Fit(featurizedData);
+
+            DataFrame rescaledData = idfModel.Transform(featurizedData);
+            Assert.Contains(expectedOutputCol, rescaledData.Columns());
+
+            Assert.Equal(expectedInputCol, idfModel.GetInputCol());
+            Assert.Equal(expectedOutputCol, idfModel.GetOutputCol());
+            Assert.Equal(expectedDocFrequency, idfModel.GetMinDocFreq());
+
+            using (var tempDirectory = new TemporaryDirectory())
+            {
+                string modelPath = Path.Join(tempDirectory.Path, "idfModel");
+                idfModel.Save(modelPath);
+
+                IDFModel loadedModel = IDFModel.Load(modelPath);
+                Assert.Equal(idfModel.Uid(), loadedModel.Uid());
+            }
+        }
+    }
+}
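The expectedDocFrequency of 1980 above is deliberately larger than the one-document corpus, so every feature is filtered to zero. The IDF class added later in this diff documents the formula idf = log((m + 1) / (d(t) + 1)) together with the minDocFreq cutoff; a small stand-alone sketch of both (plain C#, names illustrative, no Spark involved):

    using System;

    // idf per the documented formula, with the minDocFreq filter applied
    static double Idf(long numDocs, long docFreq, int minDocFreq) =>
        docFreq < minDocFreq ? 0.0 : Math.Log((numDocs + 1.0) / (docFreq + 1.0));

    Console.WriteLine(Idf(1, 1, 1980));  // 0 — the term is under the cutoff
    Console.WriteLine(Idf(100, 10, 1));  // log(101 / 11) ≈ 2.22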
diff --git a/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/IDFTests.cs b/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/IDFTests.cs
new file mode 100644
index 000000000..3dea63de7
--- /dev/null
+++ b/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/IDFTests.cs
@@ -0,0 +1,49 @@
+// Licensed to the .NET Foundation under one or more agreements.
+// The .NET Foundation licenses this file to you under the MIT license.
+// See the LICENSE file in the project root for more information.
+
+using System.IO;
+using Microsoft.Spark.E2ETest.Utils;
+using Microsoft.Spark.ML.Feature;
+using Microsoft.Spark.Sql;
+using Xunit;
+
+namespace Microsoft.Spark.E2ETest.IpcTests.ML.Feature
+{
+    [Collection("Spark E2E Tests")]
+    public class IDFTests
+    {
+        private readonly SparkSession _spark;
+
+        public IDFTests(SparkFixture fixture)
+        {
+            _spark = fixture.Spark;
+        }
+
+        [Fact]
+        public void TestIDFModel()
+        {
+            string expectedInputCol = "rawFeatures";
+            string expectedOutputCol = "features";
+            int expectedDocFrequency = 100;
+
+            IDF idf = new IDF()
+                .SetInputCol(expectedInputCol)
+                .SetOutputCol(expectedOutputCol)
+                .SetMinDocFreq(expectedDocFrequency);
+
+            Assert.Equal(expectedInputCol, idf.GetInputCol());
+            Assert.Equal(expectedOutputCol, idf.GetOutputCol());
+            Assert.Equal(expectedDocFrequency, idf.GetMinDocFreq());
+
+            using (var tempDirectory = new TemporaryDirectory())
+            {
+                string savePath = Path.Join(tempDirectory.Path, "IDF");
+                idf.Save(savePath);
+
+                IDF loadedIdf = IDF.Load(savePath);
+                Assert.Equal(idf.Uid(), loadedIdf.Uid());
+            }
+        }
+    }
+}
diff --git a/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/TokenizerTests.cs b/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/TokenizerTests.cs
new file mode 100644
index 000000000..8cdb4e03a
--- /dev/null
+++ b/src/csharp/Microsoft.Spark.E2ETest/IpcTests/ML/Feature/TokenizerTests.cs
@@ -0,0 +1,55 @@
+// Licensed to the .NET Foundation under one or more agreements.
+// The .NET Foundation licenses this file to you under the MIT license.
+// See the LICENSE file in the project root for more information.
+
+using System.IO;
+using Microsoft.Spark.E2ETest.Utils;
+using Microsoft.Spark.ML.Feature;
+using Microsoft.Spark.Sql;
+using Xunit;
+
+namespace Microsoft.Spark.E2ETest.IpcTests.ML.Feature
+{
+    [Collection("Spark E2E Tests")]
+    public class TokenizerTests
+    {
+        private readonly SparkSession _spark;
+
+        public TokenizerTests(SparkFixture fixture)
+        {
+            _spark = fixture.Spark;
+        }
+
+        [Fact]
+        public void TestTokenizer()
+        {
+            string expectedUid = "theUid";
+            string expectedInputCol = "input_col";
+            string expectedOutputCol = "output_col";
+
+            DataFrame input = _spark.Sql("SELECT 'hello I AM a string TO, TOKENIZE' as input_col" +
+                " from range(100)");
+
+            Tokenizer tokenizer = new Tokenizer(expectedUid)
+                .SetInputCol(expectedInputCol)
+                .SetOutputCol(expectedOutputCol);
+
+            DataFrame output = tokenizer.Transform(input);
+
+            Assert.Contains(output.Schema().Fields, f => f.Name == expectedOutputCol);
+            Assert.Equal(expectedInputCol, tokenizer.GetInputCol());
+            Assert.Equal(expectedOutputCol, tokenizer.GetOutputCol());
+
+            using (var tempDirectory = new TemporaryDirectory())
+            {
+                string savePath = Path.Join(tempDirectory.Path, "Tokenizer");
+                tokenizer.Save(savePath);
+
+                Tokenizer loadedTokenizer = Tokenizer.Load(savePath);
+                Assert.Equal(tokenizer.Uid(), loadedTokenizer.Uid());
+            }
+
+            Assert.Equal(expectedUid, tokenizer.Uid());
+        }
+    }
+}
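Tokenizer is documented later in this diff as lowercasing the input and splitting it on whitespace, so the test input above tokenizes deterministically; a rough plain-C# equivalent of that behaviour (an approximation for intuition, not the actual JVM-side implementation):

    string text = "hello I AM a string TO, TOKENIZE";
    string[] tokens = text.ToLowerInvariant().Split(' ');
    // ["hello", "i", "am", "a", "string", "to,", "tokenize"] — punctuation is kept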
diff --git a/src/csharp/Microsoft.Spark/ML/Feature/Bucketizer.cs b/src/csharp/Microsoft.Spark/ML/Feature/Bucketizer.cs
index 4eefd119d..823f13c1a 100644
--- a/src/csharp/Microsoft.Spark/ML/Feature/Bucketizer.cs
+++ b/src/csharp/Microsoft.Spark/ML/Feature/Bucketizer.cs
@@ -8,7 +8,6 @@
 using Microsoft.Spark.Interop;
 using Microsoft.Spark.Interop.Ipc;
 using Microsoft.Spark.Sql;
-using Microsoft.Spark.Sql.Types;
 
 namespace Microsoft.Spark.ML.Feature
 {
@@ -23,18 +22,17 @@
     /// </summary>
     public class Bucketizer : IJvmObjectReferenceProvider
     {
-        internal Bucketizer(JvmObjectReference jvmObject)
-        {
-            _jvmObject = jvmObject;
-        }
+        private static readonly string s_bucketizerClassName =
+            "org.apache.spark.ml.feature.Bucketizer";
+
+        private readonly JvmObjectReference _jvmObject;
 
         /// <summary>
         /// Create a <see cref="Bucketizer"/> without any parameters
         /// </summary>
         public Bucketizer()
         {
-            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(
-                "org.apache.spark.ml.feature.Bucketizer");
+            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(s_bucketizerClassName);
         }
@@ -44,11 +42,14 @@ public Bucketizer()
         /// </summary>
         /// <param name="uid">An immutable unique ID for the object and its derivatives.</param>
         public Bucketizer(string uid)
         {
-            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(
-                "org.apache.spark.ml.feature.Bucketizer", uid);
+            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(s_bucketizerClassName, uid);
         }
 
-        private readonly JvmObjectReference _jvmObject;
+        internal Bucketizer(JvmObjectReference jvmObject)
+        {
+            _jvmObject = jvmObject;
+        }
+
         JvmObjectReference IJvmObjectReferenceProvider.Reference => _jvmObject;
@@ -70,7 +71,7 @@ public double[] GetSplits()
         /// bucket, which also includes y. The splits should be of length >= 3 and strictly
         /// increasing. Values outside the splits specified will be treated as errors.
         /// </summary>
-        /// <returns></returns>
+        /// <returns>New <see cref="Bucketizer"/> object</returns>
         public Bucketizer SetSplits(double[] value)
         {
             return WrapAsBucketizer(_jvmObject.Invoke("setSplits", value));
         }
@@ -95,7 +96,7 @@ public double[][] GetSplitsArray()
         /// by splits x,y holds values in the range [x,y) except the last bucket, which also
         /// includes y. The splits should be of length >= 3 and strictly increasing.
         /// Values outside the splits specified will be treated as errors.
         /// </summary>
-        /// <returns></returns>
+        /// <returns>New <see cref="Bucketizer"/> object</returns>
         public Bucketizer SetSplitsArray(double[][] value)
         {
             return WrapAsBucketizer(_jvmObject.Invoke("setSplitsArray", (object)value));
         }
@@ -116,7 +117,7 @@ public string GetInputCol()
         /// buckets
         /// </summary>
         /// <param name="value">The name of the column to use as the source of the buckets</param>
-        /// <returns></returns>
+        /// <returns>New <see cref="Bucketizer"/> object</returns>
         public Bucketizer SetInputCol(string value)
         {
             return WrapAsBucketizer(_jvmObject.Invoke("setInputCol", value));
         }
@@ -140,7 +141,7 @@ public IEnumerable<string> GetInputCols()
         /// sets of buckets and two output columns.
         /// </summary>
         /// <param name="value">List of input columns to use as sources for buckets</param>
-        /// <returns></returns>
+        /// <returns>New <see cref="Bucketizer"/> object</returns>
         public Bucketizer SetInputCols(IEnumerable<string> value)
         {
             return WrapAsBucketizer(_jvmObject.Invoke("setInputCols", value));
         }
@@ -161,7 +162,7 @@ public string GetOutputCol()
         /// name of the new column.
         /// </summary>
         /// <param name="value">The name of the new column which contains the bucket ID</param>
-        /// <returns></returns>
+        /// <returns>New <see cref="Bucketizer"/> object</returns>
         public Bucketizer SetOutputCol(string value)
         {
             return WrapAsBucketizer(_jvmObject.Invoke("setOutputCol", value));
         }
@@ -181,36 +182,47 @@ public IEnumerable<string> GetOutputCols()
         /// The list of columns that the <see cref="Bucketizer"/> will create in the DataFrame.
         /// </summary>
         /// <param name="value">List of column names which will contain the bucket ID</param>
-        /// <returns></returns>
+        /// <returns>New <see cref="Bucketizer"/> object</returns>
         public Bucketizer SetOutputCols(List<string> value)
         {
             return WrapAsBucketizer(_jvmObject.Invoke("setOutputCols", value));
         }
+
+        /// <summary>
+        /// Loads the <see cref="Bucketizer"/> that was previously saved using Save
+        /// </summary>
+        /// <param name="path">The path the previous <see cref="Bucketizer"/> was saved to</param>
+        /// <returns>New <see cref="Bucketizer"/> object</returns>
+        public static Bucketizer Load(string path)
+        {
+            return WrapAsBucketizer(
+                SparkEnvironment.JvmBridge.CallStaticJavaMethod(
+                    s_bucketizerClassName, "load", path));
+        }
+
+        /// <summary>
+        /// Saves the <see cref="Bucketizer"/> so that it can be loaded later using Load
+        /// </summary>
+        /// <param name="path">The path to save the <see cref="Bucketizer"/> to</param>
+        /// <returns>New <see cref="Bucketizer"/> object</returns>
+        public Bucketizer Save(string path)
+        {
+            return WrapAsBucketizer(_jvmObject.Invoke("save", path));
+        }
 
         /// <summary>
         /// Executes the <see cref="Bucketizer"/> and transforms the DataFrame to include the new
         /// column or columns with the bucketed data.
         /// </summary>
         /// <param name="source">The DataFrame to add the bucketed data to</param>
-        /// <returns><see cref="DataFrame"/> containing the original data and the new bucketed
-        /// columns</returns>
+        /// <returns>
+        /// <see cref="DataFrame"/> containing the original data and the new bucketed columns
+        /// </returns>
         public DataFrame Transform(DataFrame source)
         {
             return new DataFrame((JvmObjectReference)_jvmObject.Invoke("transform", source));
         }
-
-        /// <summary>
-        /// The reference we get back from each call isn't usable unless we wrap it in a new dotnet
-        /// <see cref="Bucketizer"/>
-        /// </summary>
-        /// <param name="obj">The <see cref="JvmObjectReference"/> to convert into a dotnet
-        /// <see cref="Bucketizer"/></param>
-        /// <returns><see cref="Bucketizer"/></returns>
-        private static Bucketizer WrapAsBucketizer(object obj)
-        {
-            return new Bucketizer((JvmObjectReference)obj);
-        }
 
         /// <summary>
         /// The uid that was used to create the <see cref="Bucketizer"/>. If no UID is passed in
         /// when creating the <see cref="Bucketizer"/> then a random UID is created when the
         /// <see cref="Bucketizer"/> is created.
@@ -238,10 +250,13 @@ public string GetHandleInvalid()
         /// Choices are "skip", "error" or "keep". Default is "error"
         /// </summary>
         /// <param name="value">"skip", "error" or "keep"</param>
-        /// <returns></returns>
+        /// <returns>New <see cref="Bucketizer"/> object</returns>
         public Bucketizer SetHandleInvalid(string value)
         {
             return WrapAsBucketizer(_jvmObject.Invoke("setHandleInvalid", value.ToString()));
         }
+
+        private static Bucketizer WrapAsBucketizer(object obj) =>
+            new Bucketizer((JvmObjectReference)obj);
     }
 }
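For reference, a hedged usage sketch of the splits semantics documented above — n+1 split points produce n buckets, each covering [x, y) except the last, which includes y; unbounded outer splits are a common way to avoid the "values outside the splits are errors" behaviour (column names and the input DataFrame are illustrative):

    Bucketizer bucketizer = new Bucketizer()
        .SetSplits(new[] { double.NegativeInfinity, 0.0, 10.0, double.PositiveInfinity })
        .SetInputCol("value")      // assumed numeric column
        .SetOutputCol("bucket")    // receives the bucket index: 0, 1 or 2
        .SetHandleInvalid("keep"); // "skip", "error" or "keep", per SetHandleInvalid above
    DataFrame bucketed = bucketizer.Transform(inputDataFrame);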
diff --git a/src/csharp/Microsoft.Spark/ML/Feature/HashingTF.cs b/src/csharp/Microsoft.Spark/ML/Feature/HashingTF.cs
new file mode 100644
index 000000000..50b4fe04a
--- /dev/null
+++ b/src/csharp/Microsoft.Spark/ML/Feature/HashingTF.cs
@@ -0,0 +1,184 @@
+// Licensed to the .NET Foundation under one or more agreements.
+// The .NET Foundation licenses this file to you under the MIT license.
+// See the LICENSE file in the project root for more information.
+
+using System;
+using System.Collections.Generic;
+using Microsoft.Spark.Interop;
+using Microsoft.Spark.Interop.Ipc;
+using Microsoft.Spark.Sql;
+using Microsoft.Spark.Sql.Types;
+
+namespace Microsoft.Spark.ML.Feature
+{
+    /// <summary>
+    /// A <see cref="HashingTF"/> maps a sequence of terms to their term frequencies using the
+    /// hashing trick. Currently we use Austin Appleby's MurmurHash 3 algorithm
+    /// (MurmurHash3_x86_32) to calculate the hash code value for the term object. Since a simple
+    /// modulo is used to transform the hash function to a column index, it is advisable to use a
+    /// power of two as the numFeatures parameter; otherwise the features will not be mapped
+    /// evenly to the columns.
+    /// </summary>
+    public class HashingTF : IJvmObjectReferenceProvider
+    {
+        private static readonly string s_hashingTfClassName =
+            "org.apache.spark.ml.feature.HashingTF";
+
+        private readonly JvmObjectReference _jvmObject;
+
+        /// <summary>
+        /// Create a <see cref="HashingTF"/> without any parameters
+        /// </summary>
+        public HashingTF()
+        {
+            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(s_hashingTfClassName);
+        }
+
+        /// <summary>
+        /// Create a <see cref="HashingTF"/> with a UID that is used to give the
+        /// <see cref="HashingTF"/> a unique ID
+        /// </summary>
+        /// <param name="uid">An immutable unique ID for the object and its derivatives.</param>
+        public HashingTF(string uid)
+        {
+            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(s_hashingTfClassName, uid);
+        }
+
+        internal HashingTF(JvmObjectReference jvmObject)
+        {
+            _jvmObject = jvmObject;
+        }
+
+        JvmObjectReference IJvmObjectReferenceProvider.Reference => _jvmObject;
+
+        /// <summary>
+        /// Loads the <see cref="HashingTF"/> that was previously saved using Save
+        /// </summary>
+        /// <param name="path">The path the previous <see cref="HashingTF"/> was saved to</param>
+        /// <returns>New <see cref="HashingTF"/> object</returns>
+        public static HashingTF Load(string path)
+        {
+            return WrapAsHashingTF(
+                SparkEnvironment.JvmBridge.CallStaticJavaMethod(
+                    s_hashingTfClassName, "load", path));
+        }
+
+        /// <summary>
+        /// Saves the <see cref="HashingTF"/> so that it can be loaded later using Load
+        /// </summary>
+        /// <param name="path">The path to save the <see cref="HashingTF"/> to</param>
+        /// <returns>New <see cref="HashingTF"/> object</returns>
+        public HashingTF Save(string path)
+        {
+            return WrapAsHashingTF(_jvmObject.Invoke("save", path));
+        }
+
+        /// <summary>
+        /// Gets the binary toggle that controls term frequency counts
+        /// </summary>
+        /// <returns>Flag showing whether the binary toggle is on or off</returns>
+        public bool GetBinary()
+        {
+            return (bool)_jvmObject.Invoke("getBinary");
+        }
+
+        /// <summary>
+        /// Binary toggle to control term frequency counts.
+        /// If true, all non-zero counts are set to 1. This is useful for discrete probabilistic
+        /// models that model binary events rather than integer counts
+        /// </summary>
+        /// <param name="value">binary toggle, default is false</param>
+        /// <returns>New <see cref="HashingTF"/> object</returns>
+        public HashingTF SetBinary(bool value)
+        {
+            return WrapAsHashingTF(_jvmObject.Invoke("setBinary", value));
+        }
+
+        /// <summary>
+        /// Gets the column that the <see cref="HashingTF"/> should read from
+        /// </summary>
+        /// <returns>string, the name of the input column</returns>
+        public string GetInputCol()
+        {
+            return (string)_jvmObject.Invoke("getInputCol");
+        }
+
+        /// <summary>
+        /// Sets the column that the <see cref="HashingTF"/> should read from
+        /// </summary>
+        /// <param name="value">The name of the column to use as the source</param>
+        /// <returns>New <see cref="HashingTF"/> object</returns>
+        public HashingTF SetInputCol(string value)
+        {
+            return WrapAsHashingTF(_jvmObject.Invoke("setInputCol", value));
+        }
+
+        /// <summary>
+        /// The <see cref="HashingTF"/> will create a new column in the <see cref="DataFrame"/>,
+        /// this is the name of the new column.
+        /// </summary>
+        /// <returns>string, the name of the output col</returns>
+        public string GetOutputCol()
+        {
+            return (string)_jvmObject.Invoke("getOutputCol");
+        }
+
+        /// <summary>
+        /// The <see cref="HashingTF"/> will create a new column in the <see cref="DataFrame"/>,
+        /// this is the name of the new column.
+        /// </summary>
+        /// <param name="value">The name of the new column</param>
+        /// <returns>New <see cref="HashingTF"/> object</returns>
+        public HashingTF SetOutputCol(string value)
+        {
+            return WrapAsHashingTF(_jvmObject.Invoke("setOutputCol", value));
+        }
+
+        /// <summary>
+        /// Gets the number of features that should be used. Since a simple modulo is used to
+        /// transform the hash function to a column index, it is advisable to use a power of two
+        /// as the numFeatures parameter; otherwise the features will not be mapped evenly to the
+        /// columns.
+        /// </summary>
+        /// <returns>The number of features to be used</returns>
+        public int GetNumFeatures()
+        {
+            return (int)_jvmObject.Invoke("getNumFeatures");
+        }
+
+        /// <summary>
+        /// Sets the number of features that should be used. Since a simple modulo is used to
+        /// transform the hash function to a column index, it is advisable to use a power of two as
+        /// the numFeatures parameter; otherwise the features will not be mapped evenly to the
+        /// columns.
+        /// </summary>
+        /// <param name="value">int, the number of features to be used</param>
+        /// <returns>New <see cref="HashingTF"/> object</returns>
+        public HashingTF SetNumFeatures(int value)
+        {
+            return WrapAsHashingTF(_jvmObject.Invoke("setNumFeatures", value));
+        }
+
+        /// <summary>
+        /// An immutable unique ID for the object and its derivatives.
+        /// </summary>
+        /// <returns>string, unique ID for the object</returns>
+        public string Uid()
+        {
+            return (string)_jvmObject.Invoke("uid");
+        }
+
+        /// <summary>
+        /// Executes the <see cref="HashingTF"/> and transforms the DataFrame to include the new
+        /// column or columns with the term-frequency vectors.
+        /// </summary>
+        /// <param name="source">The <see cref="DataFrame"/> to add the term frequencies to</param>
+        /// <returns>
+        /// <see cref="DataFrame"/> containing the original data and the term frequencies
+        /// </returns>
+        public DataFrame Transform(DataFrame source)
+        {
+            return new DataFrame((JvmObjectReference)_jvmObject.Invoke("transform", source));
+        }
+
+        private static HashingTF WrapAsHashingTF(object obj) =>
+            new HashingTF((JvmObjectReference)obj);
+    }
+}
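The class summary above explains why numFeatures should be a power of two: the term's hash is reduced to a column index with a simple modulo. A rough sketch of that mapping (GetHashCode stands in for Spark's MurmurHash3_x86_32 purely for brevity, so the indices will not match Spark's):

    static int TermIndex(string term, int numFeatures)
    {
        int hash = term.GetHashCode(); // stand-in; Spark uses MurmurHash3_x86_32
        return ((hash % numFeatures) + numFeatures) % numFeatures; // non-negative index
    }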
diff --git a/src/csharp/Microsoft.Spark/ML/Feature/IDF.cs b/src/csharp/Microsoft.Spark/ML/Feature/IDF.cs
new file mode 100644
index 000000000..5c2259aaf
--- /dev/null
+++ b/src/csharp/Microsoft.Spark/ML/Feature/IDF.cs
@@ -0,0 +1,154 @@
+// Licensed to the .NET Foundation under one or more agreements.
+// The .NET Foundation licenses this file to you under the MIT license.
+// See the LICENSE file in the project root for more information.
+
+using Microsoft.Spark.Interop;
+using Microsoft.Spark.Interop.Ipc;
+using Microsoft.Spark.Sql;
+
+namespace Microsoft.Spark.ML.Feature
+{
+    /// <summary>
+    /// Inverse document frequency (IDF). The standard formulation is used:
+    /// idf = log((m + 1) / (d(t) + 1)), where m is the total number of documents and d(t) is
+    /// the number of documents that contain term t.
+    ///
+    /// This implementation supports filtering out terms which do not appear in a minimum number
+    /// of documents (controlled by the variable minDocFreq). For terms that are not in at least
+    /// minDocFreq documents, the IDF is found as 0, resulting in TF-IDFs of 0.
+    /// </summary>
+    public class IDF : IJvmObjectReferenceProvider
+    {
+        private static readonly string s_IDFClassName = "org.apache.spark.ml.feature.IDF";
+
+        private readonly JvmObjectReference _jvmObject;
+
+        /// <summary>
+        /// Create a <see cref="IDF"/> without any parameters
+        /// </summary>
+        public IDF()
+        {
+            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(s_IDFClassName);
+        }
+
+        /// <summary>
+        /// Create a <see cref="IDF"/> with a UID that is used to give the
+        /// <see cref="IDF"/> a unique ID
+        /// </summary>
+        /// <param name="uid">An immutable unique ID for the object and its derivatives.</param>
+        public IDF(string uid)
+        {
+            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(s_IDFClassName, uid);
+        }
+
+        internal IDF(JvmObjectReference jvmObject)
+        {
+            _jvmObject = jvmObject;
+        }
+
+        JvmObjectReference IJvmObjectReferenceProvider.Reference => _jvmObject;
+
+        /// <summary>
+        /// Gets the column that the <see cref="IDF"/> should read from
+        /// </summary>
+        /// <returns>string, input column</returns>
+        public string GetInputCol()
+        {
+            return (string)(_jvmObject.Invoke("getInputCol"));
+        }
+
+        /// <summary>
+        /// Sets the column that the <see cref="IDF"/> should read from
+        /// </summary>
+        /// <param name="value">The name of the column to use as the source</param>
+        /// <returns>New <see cref="IDF"/> object</returns>
+        public IDF SetInputCol(string value)
+        {
+            return WrapAsIDF(_jvmObject.Invoke("setInputCol", value));
+        }
+
+        /// <summary>
+        /// The <see cref="IDF"/> will create a new column in the DataFrame, this is the
+        /// name of the new column.
+        /// </summary>
+        /// <returns>string, the output column</returns>
+        public string GetOutputCol()
+        {
+            return (string)(_jvmObject.Invoke("getOutputCol"));
+        }
+
+        /// <summary>
+        /// The <see cref="IDF"/> will create a new column in the DataFrame, this is the
+        /// name of the new column.
+        /// </summary>
+        /// <param name="value">The name of the new column</param>
+        /// <returns>New <see cref="IDF"/> object</returns>
+        public IDF SetOutputCol(string value)
+        {
+            return WrapAsIDF(_jvmObject.Invoke("setOutputCol", value));
+        }
+
+        /// <summary>
+        /// Minimum number of documents in which a term should appear for filtering
+        /// </summary>
+        /// <returns>int, minimum number of documents in which a term should appear</returns>
+        public int GetMinDocFreq()
+        {
+            return (int)_jvmObject.Invoke("getMinDocFreq");
+        }
+
+        /// <summary>
+        /// Minimum number of documents in which a term should appear for filtering
+        /// </summary>
+        /// <param name="value">int, the minimum number of documents a term should appear in</param>
+        /// <returns>New <see cref="IDF"/> object</returns>
+        public IDF SetMinDocFreq(int value)
+        {
+            return WrapAsIDF(_jvmObject.Invoke("setMinDocFreq", value));
+        }
+
+        /// <summary>
+        /// Fits a model to the input data.
+        /// </summary>
+        /// <param name="source">The <see cref="DataFrame"/> to fit the model to</param>
+        /// <returns>New <see cref="IDFModel"/> object</returns>
+        public IDFModel Fit(DataFrame source)
+        {
+            return new IDFModel((JvmObjectReference)_jvmObject.Invoke("fit", source));
+        }
+
+        /// <summary>
+        /// The uid that was used to create the <see cref="IDF"/>. If no UID is passed in
+        /// when creating the <see cref="IDF"/> then a random UID is created when the
+        /// <see cref="IDF"/> is created.
+        /// </summary>
+        /// <returns>string UID identifying the <see cref="IDF"/></returns>
+        public string Uid()
+        {
+            return (string)_jvmObject.Invoke("uid");
+        }
+
+        /// <summary>
+        /// Loads the <see cref="IDF"/> that was previously saved using Save
+        /// </summary>
+        /// <param name="path">The path the previous <see cref="IDF"/> was saved to</param>
+        /// <returns>New <see cref="IDF"/> object, loaded from path</returns>
+        public static IDF Load(string path)
+        {
+            return WrapAsIDF(
+                SparkEnvironment.JvmBridge.CallStaticJavaMethod(s_IDFClassName, "load", path));
+        }
+
+        /// <summary>
+        /// Saves the <see cref="IDF"/> so that it can be loaded later using Load
+        /// </summary>
+        /// <param name="path">The path to save the <see cref="IDF"/> to</param>
+        /// <returns>New <see cref="IDF"/> object</returns>
+        public IDF Save(string path)
+        {
+            return WrapAsIDF(_jvmObject.Invoke("save", path));
+        }
+
+        private static IDF WrapAsIDF(object obj) => new IDF((JvmObjectReference)obj);
+    }
+}
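IDF follows Spark's estimator pattern: Fit learns the per-term document frequencies and returns the IDFModel defined next, which performs the actual transformation. A composition sketch (the DataFrame name is assumed from a prior featurizing step such as HashingTF.Transform):

    IDFModel model = new IDF()
        .SetInputCol("rawFeatures")
        .SetOutputCol("features")
        .Fit(featurizedData);                     // estimator -> fitted model
    DataFrame rescaled = model.Transform(featurizedData);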
diff --git a/src/csharp/Microsoft.Spark/ML/Feature/IDFModel.cs b/src/csharp/Microsoft.Spark/ML/Feature/IDFModel.cs
new file mode 100644
index 000000000..4fc8a4f30
--- /dev/null
+++ b/src/csharp/Microsoft.Spark/ML/Feature/IDFModel.cs
@@ -0,0 +1,145 @@
+// Licensed to the .NET Foundation under one or more agreements.
+// The .NET Foundation licenses this file to you under the MIT license.
+// See the LICENSE file in the project root for more information.
+
+using Microsoft.Spark.Interop;
+using Microsoft.Spark.Interop.Ipc;
+using Microsoft.Spark.Sql;
+
+namespace Microsoft.Spark.ML.Feature
+{
+    /// <summary>
+    /// A <see cref="IDFModel"/> that is fitted by an <see cref="IDF"/> and rescales
+    /// term-frequency vectors by each term's inverse document frequency.
+    /// </summary>
+    public class IDFModel : IJvmObjectReferenceProvider
+    {
+        private static readonly string s_IDFModelClassName =
+            "org.apache.spark.ml.feature.IDFModel";
+
+        private readonly JvmObjectReference _jvmObject;
+
+        /// <summary>
+        /// Create a <see cref="IDFModel"/> without any parameters
+        /// </summary>
+        public IDFModel()
+        {
+            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(s_IDFModelClassName);
+        }
+
+        /// <summary>
+        /// Create a <see cref="IDFModel"/> with a UID that is used to give the
+        /// <see cref="IDFModel"/> a unique ID
+        /// </summary>
+        /// <param name="uid">An immutable unique ID for the object and its derivatives.</param>
+        public IDFModel(string uid)
+        {
+            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(s_IDFModelClassName, uid);
+        }
+
+        internal IDFModel(JvmObjectReference jvmObject)
+        {
+            _jvmObject = jvmObject;
+        }
+
+        JvmObjectReference IJvmObjectReferenceProvider.Reference => _jvmObject;
+
+        /// <summary>
+        /// Gets the column that the <see cref="IDFModel"/> should read from
+        /// </summary>
+        /// <returns>string, input column</returns>
+        public string GetInputCol()
+        {
+            return (string)(_jvmObject.Invoke("getInputCol"));
+        }
+
+        /// <summary>
+        /// Sets the column that the <see cref="IDFModel"/> should read from
+        /// </summary>
+        /// <param name="value">The name of the column to use as the source</param>
+        /// <returns>New <see cref="IDFModel"/> object</returns>
+        public IDFModel SetInputCol(string value)
+        {
+            return WrapAsIDFModel(_jvmObject.Invoke("setInputCol", value));
+        }
+
+        /// <summary>
+        /// The <see cref="IDFModel"/> will create a new column in the <see cref="DataFrame"/>,
+        /// this is the name of the new column.
+        /// </summary>
+        /// <returns>string, the output column</returns>
+        public string GetOutputCol()
+        {
+            return (string)(_jvmObject.Invoke("getOutputCol"));
+        }
+
+        /// <summary>
+        /// The <see cref="IDFModel"/> will create a new column in the DataFrame, this is the
+        /// name of the new column.
+        /// </summary>
+        /// <param name="value">
+        /// The name of the new column which contains the rescaled features
+        /// </param>
+        /// <returns>New <see cref="IDFModel"/> object</returns>
+        public IDFModel SetOutputCol(string value)
+        {
+            return WrapAsIDFModel(_jvmObject.Invoke("setOutputCol", value));
+        }
+
+        /// <summary>
+        /// Minimum number of documents in which a term should appear for filtering
+        /// </summary>
+        /// <returns>Minimum number of documents a term should appear in</returns>
+        public int GetMinDocFreq()
+        {
+            return (int)_jvmObject.Invoke("getMinDocFreq");
+        }
+
+        /// <summary>
+        /// Executes the <see cref="IDFModel"/> and transforms the <see cref="DataFrame"/> to
+        /// include the new column or columns with the rescaled features.
+        /// </summary>
+        /// <param name="source">The <see cref="DataFrame"/> to add the rescaled features to</param>
+        /// <returns>
+        /// <see cref="DataFrame"/> containing the original data and the rescaled features
+        /// </returns>
+        public DataFrame Transform(DataFrame source)
+        {
+            return new DataFrame((JvmObjectReference)_jvmObject.Invoke("transform", source));
+        }
+
+        /// <summary>
+        /// The uid that was used to create the <see cref="IDFModel"/>. If no UID is passed in
+        /// when creating the <see cref="IDFModel"/> then a random UID is created when the
+        /// <see cref="IDFModel"/> is created.
+        /// </summary>
+        /// <returns>string UID identifying the <see cref="IDFModel"/></returns>
+        public string Uid()
+        {
+            return (string)_jvmObject.Invoke("uid");
+        }
+
+        /// <summary>
+        /// Loads the <see cref="IDFModel"/> that was previously saved using Save
+        /// </summary>
+        /// <param name="path">The path the previous <see cref="IDFModel"/> was saved to</param>
+        /// <returns>New <see cref="IDFModel"/> object, loaded from path</returns>
+        public static IDFModel Load(string path)
+        {
+            return WrapAsIDFModel(
+                SparkEnvironment.JvmBridge.CallStaticJavaMethod(
+                    s_IDFModelClassName, "load", path));
+        }
+
+        /// <summary>
+        /// Saves the <see cref="IDFModel"/> so that it can be loaded later using Load
+        /// </summary>
+        /// <param name="path">The path to save the <see cref="IDFModel"/> to</param>
+        /// <returns>New <see cref="IDFModel"/> object</returns>
+        public IDFModel Save(string path)
+        {
+            return WrapAsIDFModel(_jvmObject.Invoke("save", path));
+        }
+
+        private static IDFModel WrapAsIDFModel(object obj) =>
+            new IDFModel((JvmObjectReference)obj);
+    }
+}
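Every class in this diff exposes the same Save/Load pair — an instance method that invokes the JVM object's save and a static load on the Java class — which is what the E2E tests round-trip through a temporary directory. In isolation the pattern looks like this (the path is illustrative):

    idfModel.Save("/tmp/idfModel");               // persists JVM-side metadata and data
    IDFModel restored = IDFModel.Load("/tmp/idfModel");
    // restored.Uid() equals idfModel.Uid(), which is what the tests assert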
diff --git a/src/csharp/Microsoft.Spark/ML/Feature/Tokenizer.cs b/src/csharp/Microsoft.Spark/ML/Feature/Tokenizer.cs
new file mode 100644
index 000000000..c411309dc
--- /dev/null
+++ b/src/csharp/Microsoft.Spark/ML/Feature/Tokenizer.cs
@@ -0,0 +1,136 @@
+// Licensed to the .NET Foundation under one or more agreements.
+// The .NET Foundation licenses this file to you under the MIT license.
+// See the LICENSE file in the project root for more information.
+
+using Microsoft.Spark.Interop;
+using Microsoft.Spark.Interop.Ipc;
+using Microsoft.Spark.Sql;
+
+namespace Microsoft.Spark.ML.Feature
+{
+    /// <summary>
+    /// A <see cref="Tokenizer"/> that converts the input string to lowercase and then splits it
+    /// by white spaces.
+    /// </summary>
+    public class Tokenizer : IJvmObjectReferenceProvider
+    {
+        private static readonly string s_tokenizerClassName =
+            "org.apache.spark.ml.feature.Tokenizer";
+
+        private readonly JvmObjectReference _jvmObject;
+
+        /// <summary>
+        /// Create a <see cref="Tokenizer"/> without any parameters
+        /// </summary>
+        public Tokenizer()
+        {
+            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(s_tokenizerClassName);
+        }
+
+        /// <summary>
+        /// Create a <see cref="Tokenizer"/> with a UID that is used to give the
+        /// <see cref="Tokenizer"/> a unique ID
+        /// </summary>
+        /// <param name="uid">An immutable unique ID for the object and its derivatives.</param>
+        public Tokenizer(string uid)
+        {
+            _jvmObject = SparkEnvironment.JvmBridge.CallConstructor(s_tokenizerClassName, uid);
+        }
+
+        internal Tokenizer(JvmObjectReference jvmObject)
+        {
+            _jvmObject = jvmObject;
+        }
+
+        JvmObjectReference IJvmObjectReferenceProvider.Reference => _jvmObject;
+
+        /// <summary>
+        /// Gets the column that the <see cref="Tokenizer"/> should read from
+        /// </summary>
+        /// <returns>string, input column</returns>
+        public string GetInputCol()
+        {
+            return (string)(_jvmObject.Invoke("getInputCol"));
+        }
+
+        /// <summary>
+        /// Sets the column that the <see cref="Tokenizer"/> should read from
+        /// </summary>
+        /// <param name="value">The name of the column to use as the source</param>
+        /// <returns>New <see cref="Tokenizer"/> object</returns>
+        public Tokenizer SetInputCol(string value)
+        {
+            return WrapAsTokenizer(_jvmObject.Invoke("setInputCol", value));
+        }
+
+        /// <summary>
+        /// The <see cref="Tokenizer"/> will create a new column in the DataFrame, this is the
+        /// name of the new column.
+        /// </summary>
+        /// <returns>string, the output column</returns>
+        public string GetOutputCol()
+        {
+            return (string)(_jvmObject.Invoke("getOutputCol"));
+        }
+
+        /// <summary>
+        /// The <see cref="Tokenizer"/> will create a new column in the DataFrame, this is the
+        /// name of the new column.
+        /// </summary>
+        /// <param name="value">The name of the new column</param>
+        /// <returns>New <see cref="Tokenizer"/> object</returns>
+        public Tokenizer SetOutputCol(string value)
+        {
+            return WrapAsTokenizer(_jvmObject.Invoke("setOutputCol", value));
+        }
+
+        /// <summary>
+        /// Executes the <see cref="Tokenizer"/> and transforms the DataFrame to include the new
+        /// column
+        /// </summary>
+        /// <param name="source">The DataFrame to transform</param>
+        /// <returns>
+        /// New <see cref="DataFrame"/> object with the source transformed
+        /// </returns>
+        public DataFrame Transform(DataFrame source)
+        {
+            return new DataFrame((JvmObjectReference)_jvmObject.Invoke("transform", source));
+        }
+
+        /// <summary>
+        /// The uid that was used to create the <see cref="Tokenizer"/>. If no UID is passed in
+        /// when creating the <see cref="Tokenizer"/> then a random UID is created when the
+        /// <see cref="Tokenizer"/> is created.
+        /// </summary>
+        /// <returns>string UID identifying the <see cref="Tokenizer"/></returns>
+        public string Uid()
+        {
+            return (string)_jvmObject.Invoke("uid");
+        }
+
+        /// <summary>
+        /// Loads the <see cref="Tokenizer"/> that was previously saved using Save
+        /// </summary>
+        /// <param name="path">The path the previous <see cref="Tokenizer"/> was saved to</param>
+        /// <returns>New <see cref="Tokenizer"/> object, loaded from path</returns>
+        public static Tokenizer Load(string path)
+        {
+            return WrapAsTokenizer(
+                SparkEnvironment.JvmBridge.CallStaticJavaMethod(
+                    s_tokenizerClassName, "load", path));
+        }
+
+        /// <summary>
+        /// Saves the <see cref="Tokenizer"/> so that it can be loaded later using Load
+        /// </summary>
+        /// <param name="path">The path to save the <see cref="Tokenizer"/> to</param>
+        /// <returns>New <see cref="Tokenizer"/> object</returns>
+        public Tokenizer Save(string path)
+        {
+            return WrapAsTokenizer(_jvmObject.Invoke("save", path));
+        }
+
+        private static Tokenizer WrapAsTokenizer(object obj) =>
+            new Tokenizer((JvmObjectReference)obj);
+    }
+}
diff --git a/src/csharp/Microsoft.Spark/Sql/Types/DataType.cs b/src/csharp/Microsoft.Spark/Sql/Types/DataType.cs
index 3bf4173c3..4de1f4ded 100644
--- a/src/csharp/Microsoft.Spark/Sql/Types/DataType.cs
+++ b/src/csharp/Microsoft.Spark/Sql/Types/DataType.cs
@@ -160,6 +160,14 @@ internal static DataType ParseDataType(JToken json)
             }
             else if (typeName == "udt")
             {
+                if (typeJObject.TryGetValue("class", out JToken classToken))
+                {
+                    if (typeJObject.TryGetValue("sqlType", out JToken sqlTypeToken))
+                    {
+                        return new StructType((JObject)sqlTypeToken);
+                    }
+                }
+
                 throw new NotImplementedException();
             }
         }
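The new branch in ParseDataType recognises UDT JSON that carries both a class name and an inner sqlType struct, returning the struct's schema instead of throwing. A plausible input shape (VectorUDT is a real Spark type, but the exact fields of its sqlType are abridged here for illustration):

    // {
    //     "type": "udt",
    //     "class": "org.apache.spark.ml.linalg.VectorUDT",
    //     "sqlType": { "type": "struct", "fields": [ ... ] }
    // }
    //
    // ParseDataType on such a token now returns new StructType((JObject)sqlTypeToken)
    // built from "sqlType"; a udt entry missing either key still throws
    // NotImplementedException.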