diff --git a/build-tools/repositories.gradle b/build-tools/repositories.gradle
index 8993a5d367..e72fc8a8cc 100644
--- a/build-tools/repositories.gradle
+++ b/build-tools/repositories.gradle
@@ -7,5 +7,6 @@ repositories {
     mavenLocal()
     maven { url "https://aws.oss.sonatype.org/content/repositories/snapshots" }
     mavenCentral()
+    maven {url 'https://oss.sonatype.org/content/repositories/snapshots/'}
     maven { url "https://d1nvenhzbhpy0q.cloudfront.net/snapshots/lucene/" }
 }
\ No newline at end of file
diff --git a/client/src/main/java/org/opensearch/ml/client/MachineLearningNodeClient.java b/client/src/main/java/org/opensearch/ml/client/MachineLearningNodeClient.java
index f08abb85aa..3538797478 100644
--- a/client/src/main/java/org/opensearch/ml/client/MachineLearningNodeClient.java
+++ b/client/src/main/java/org/opensearch/ml/client/MachineLearningNodeClient.java
@@ -13,7 +13,7 @@
 import org.opensearch.action.delete.DeleteResponse;
 import org.opensearch.action.search.SearchRequest;
 import org.opensearch.action.search.SearchResponse;
-import org.opensearch.client.node.NodeClient;
+import org.opensearch.client.Client;
 import org.opensearch.ml.common.input.MLInput;
 import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.output.MLOutput;
@@ -38,17 +38,16 @@
 @RequiredArgsConstructor
 public class MachineLearningNodeClient implements MachineLearningClient {
 
-    NodeClient client;
+    Client client;
 
     @Override
     public void predict(String modelId, MLInput mlInput, ActionListener<MLOutput> listener) {
         validateMLInput(mlInput, true);
 
         MLPredictionTaskRequest predictionRequest = MLPredictionTaskRequest.builder()
-            .mlInput(mlInput)
-            .modelId(modelId)
-            .build();
-
+                .mlInput(mlInput)
+                .modelId(modelId)
+                .build();
         client.execute(MLPredictionTaskAction.INSTANCE, predictionRequest, getMlPredictionTaskResponseActionListener(listener));
     }
 
@@ -80,9 +79,18 @@ public void getModel(String modelId, ActionListener<MLModel> listener) {
                 .modelId(modelId)
                 .build();
 
-        client.execute(MLModelGetAction.INSTANCE, mlModelGetRequest, ActionListener.wrap(response -> {
-            listener.onResponse(MLModelGetResponse.fromActionResponse(response).getMlModel());
-        }, listener::onFailure));
+        client.execute(MLModelGetAction.INSTANCE, mlModelGetRequest, getMlGetModelResponseActionListener(listener));
+    }
+
+    private ActionListener<MLModelGetResponse> getMlGetModelResponseActionListener(ActionListener<MLModel> listener) {
+        ActionListener<MLModelGetResponse> internalListener = ActionListener.wrap(predictionResponse -> {
+            listener.onResponse(predictionResponse.getMlModel());
+        }, listener::onFailure);
+        ActionListener<MLModelGetResponse> actionListener = wrapActionListener(internalListener, res -> {
+            MLModelGetResponse getResponse = MLModelGetResponse.fromActionResponse(res);
+            return getResponse;
+        });
+        return actionListener;
     }
 
     @Override
diff --git a/common/src/main/java/org/opensearch/ml/common/MLModel.java b/common/src/main/java/org/opensearch/ml/common/MLModel.java
index 5ecf2afa2b..0549a5b43d 100644
--- a/common/src/main/java/org/opensearch/ml/common/MLModel.java
+++ b/common/src/main/java/org/opensearch/ml/common/MLModel.java
@@ -95,13 +95,6 @@ public MLModel(String name, FunctionName algorithm, Integer version, String cont
         this.totalChunks = totalChunks;
     }
 
-    public MLModel(FunctionName algorithm, Model model) {
-        this.name = model.getName();
-        this.algorithm = algorithm;
-        this.version = model.getVersion();
-        this.content = Base64.getEncoder().encodeToString(model.getContent());
-    }
-
     public MLModel(StreamInput input) throws IOException{
         name = input.readOptionalString();
         algorithm = input.readEnum(FunctionName.class);
diff --git a/common/src/main/java/org/opensearch/ml/common/exception/MLException.java b/common/src/main/java/org/opensearch/ml/common/exception/MLException.java
index 8994678401..fea47dc826 100644
--- a/common/src/main/java/org/opensearch/ml/common/exception/MLException.java
+++ b/common/src/main/java/org/opensearch/ml/common/exception/MLException.java
@@ -33,7 +33,7 @@ public MLException(Throwable cause) {
     }
 
     /**
-     * Constructor with specified error message adn cause.
+     * Constructor with specified error message and cause.
      * @param message error message
      * @param cause exception cause
      */
diff --git a/common/src/main/java/org/opensearch/ml/common/input/MLInput.java b/common/src/main/java/org/opensearch/ml/common/input/MLInput.java
index 47437f91eb..a58fa09f97 100644
--- a/common/src/main/java/org/opensearch/ml/common/input/MLInput.java
+++ b/common/src/main/java/org/opensearch/ml/common/input/MLInput.java
@@ -42,11 +42,17 @@ public class MLInput implements Input {
     public static final String INPUT_INDEX_FIELD = "input_index";
     public static final String INPUT_QUERY_FIELD = "input_query";
     public static final String INPUT_DATA_FIELD = "input_data";
+
     // For trained model
+    // Return bytes in model output
     public static final String RETURN_BYTES_FIELD = "return_bytes";
+    // Return number in model output. This can be used together with return_bytes.
     public static final String RETURN_NUMBER_FIELD = "return_number";
+    // Filter target response with name in model output
     public static final String TARGET_RESPONSE_FIELD = "target_response";
+    // Filter target response with position in model output
     public static final String TARGET_RESPONSE_POSITIONS_FIELD = "target_response_positions";
+    // Input text sentences for text embedding model
     public static final String TEXT_DOCS_FIELD = "text_docs";
 
     // Algorithm name
diff --git a/common/src/main/java/org/opensearch/ml/common/output/model/ModelTensors.java b/common/src/main/java/org/opensearch/ml/common/output/model/ModelTensors.java
index 06899dd05f..6e57f46b6c 100644
--- a/common/src/main/java/org/opensearch/ml/common/output/model/ModelTensors.java
+++ b/common/src/main/java/org/opensearch/ml/common/output/model/ModelTensors.java
@@ -66,12 +66,12 @@ public void writeTo(StreamOutput out) throws IOException {
 
     public void filter(ModelResultFilter resultFilter) {
         boolean returnBytes = resultFilter.isReturnBytes();
-        boolean returnNUmber = resultFilter.isReturnNumber();
+        boolean returnNumber = resultFilter.isReturnNumber();
         List<String> targetResponse = resultFilter.getTargetResponse();
         List<Integer> targetResponsePositions = resultFilter.getTargetResponsePositions();
         if ((targetResponse == null || targetResponse.size() == 0)
                 && (targetResponsePositions == null || targetResponsePositions.size() == 0)) {
-            mlModelTensors.forEach(output -> filter(output, returnBytes,  returnNUmber));
+            mlModelTensors.forEach(output -> filter(output, returnBytes,  returnNumber));
             return;
         }
         List<ModelTensor> targetOutput = new ArrayList<>();
@@ -79,10 +79,10 @@ public void filter(ModelResultFilter resultFilter) {
             for (int i = 0 ; i<mlModelTensors.size(); i++) {
                 ModelTensor output = mlModelTensors.get(i);
                 if (targetResponse != null && targetResponse.contains(output.getName())) {
-                    filter(output, returnBytes,  returnNUmber);
+                    filter(output, returnBytes,  returnNumber);
                     targetOutput.add(output);
                 } else if (targetResponsePositions != null && targetResponsePositions.contains(i)) {
-                    filter(output, returnBytes,  returnNUmber);
+                    filter(output, returnBytes,  returnNumber);
                     targetOutput.add(output);
                 }
             }
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/MLEngine.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/MLEngine.java
index 95cc8fe505..3df57142fb 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/MLEngine.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/MLEngine.java
@@ -5,37 +5,47 @@
 
 package org.opensearch.ml.engine;
 
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.DataFrame;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.input.Input;
 import org.opensearch.ml.common.input.parameter.MLAlgoParams;
 import org.opensearch.ml.common.input.MLInput;
 import org.opensearch.ml.common.output.MLOutput;
-import org.opensearch.ml.common.Model;
 import org.opensearch.ml.common.output.Output;
 
+import java.util.Map;
+
 /**
  * This is the interface to all ml algorithms.
  */
 public class MLEngine {
 
-    public static Model train(Input input) {
+    public static MLModel train(Input input) {
         validateMLInput(input);
         MLInput mlInput = (MLInput) input;
         Trainable trainable = MLEngineClassLoader.initInstance(mlInput.getAlgorithm(), mlInput.getParameters(), MLAlgoParams.class);
         if (trainable == null) {
             throw new IllegalArgumentException("Unsupported algorithm: " + mlInput.getAlgorithm());
         }
-        return trainable.train(mlInput.getDataFrame());
+        return trainable.train(mlInput.getInputDataset());
+    }
+
+    public static Predictable load(MLModel mlModel, Map<String, Object> params) {
+        Predictable predictable = MLEngineClassLoader.initInstance(mlModel.getAlgorithm(), null, MLAlgoParams.class);
+        predictable.initModel(mlModel, params);
+        return predictable;
     }
 
-    public static MLOutput predict(Input input, Model model) {
+    public static MLOutput predict(Input input, MLModel model) {
         validateMLInput(input);
         MLInput mlInput = (MLInput) input;
         Predictable predictable = MLEngineClassLoader.initInstance(mlInput.getAlgorithm(), mlInput.getParameters(), MLAlgoParams.class);
         if (predictable == null) {
             throw new IllegalArgumentException("Unsupported algorithm: " + mlInput.getAlgorithm());
         }
-        return predictable.predict(mlInput.getDataFrame(), model);
+        return predictable.predict(mlInput.getInputDataset(), model);
     }
 
     public static MLOutput trainAndPredict(Input input) {
@@ -45,7 +55,7 @@ public static MLOutput trainAndPredict(Input input) {
         if (trainAndPredictable == null) {
             throw new IllegalArgumentException("Unsupported algorithm: " + mlInput.getAlgorithm());
         }
-        return trainAndPredictable.trainAndPredict(mlInput.getDataFrame());
+        return trainAndPredictable.trainAndPredict(mlInput.getInputDataset());
     }
 
     public static Output execute(Input input) {
@@ -63,9 +73,15 @@ private static void validateMLInput(Input input) {
             throw new IllegalArgumentException("Input should be MLInput");
         }
         MLInput mlInput = (MLInput) input;
-        DataFrame dataFrame = mlInput.getDataFrame();
-        if (dataFrame == null || dataFrame.size() == 0) {
-            throw new IllegalArgumentException("Input data frame should not be null or empty");
+        MLInputDataset inputDataset = mlInput.getInputDataset();
+        if (inputDataset == null) {
+            throw new IllegalArgumentException("Input data set should not be null");
+        }
+        if (inputDataset instanceof DataFrameInputDataset) {
+            DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
+            if (dataFrame == null || dataFrame.size() == 0) {
+                throw new IllegalArgumentException("Input data frame should not be null or empty");
+            }
         }
     }
 
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/Predictable.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/Predictable.java
index a40b791adc..df19bf5823 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/Predictable.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/Predictable.java
@@ -5,9 +5,11 @@
 
 package org.opensearch.ml.engine;
 
-import org.opensearch.ml.common.dataframe.DataFrame;
+import org.opensearch.ml.common.MLModel;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.output.MLOutput;
-import org.opensearch.ml.common.Model;
+
+import java.util.Map;
 
 /**
  * This is machine learning algorithms predict interface.
@@ -15,11 +17,30 @@
 public interface Predictable {
 
     /**
-     * Predict with given features and model (optional).
-     * @param dataFrame features data
+     * Predict with given input data and model (optional).
+     * Will reload model into memory with model content.
+     * @param inputDataset input data set
      * @param model the java serialized model
      * @return predicted results
      */
-    MLOutput predict(DataFrame dataFrame, Model model);
+    MLOutput predict(MLInputDataset inputDataset, MLModel model);
+
+    /**
+     * Predict with given input data with loaded model.
+     * @param inputDataset input data set
+     * @return predicted results
+     */
+    MLOutput predict(MLInputDataset inputDataset);
 
+    /**
+     * Init model (load model into memory) with ML model content and params.
+     * @param model ML model
+     * @param params other parameters
+     */
+    void initModel(MLModel model, Map<String, Object> params);
+
+    /**
+     * Close resources like loaded model.
+     */
+    void close();
 }
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/TrainAndPredictable.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/TrainAndPredictable.java
index d67d685b2e..f6d761bb9b 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/TrainAndPredictable.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/TrainAndPredictable.java
@@ -5,20 +5,20 @@
 
 package org.opensearch.ml.engine;
 
-import org.opensearch.ml.common.dataframe.DataFrame;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.output.MLOutput;
 
 
 /**
- * This is machine learning algorithms train interface.
+ * This is machine learning algorithms train and predict interface.
  */
 public interface TrainAndPredictable extends Trainable, Predictable {
 
     /**
-     * Train model with given features. Then predict with the same data.
-     * @param dataFrame training data
-     * @return the java serialized model
+     * Train model with given input data. Then predict with the same data.
+     * @param inputDataset training data
+     * @return predicted results
      */
-    MLOutput trainAndPredict(DataFrame dataFrame);
+    MLOutput trainAndPredict(MLInputDataset inputDataset);
 
 }
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/Trainable.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/Trainable.java
index 755b365144..397b64c19e 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/Trainable.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/Trainable.java
@@ -5,8 +5,8 @@
 
 package org.opensearch.ml.engine;
 
-import org.opensearch.ml.common.dataframe.DataFrame;
-import org.opensearch.ml.common.Model;
+import org.opensearch.ml.common.MLModel;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 
 /**
  * This is machine learning algorithms train interface.
@@ -15,9 +15,9 @@ public interface Trainable {
 
     /**
      * Train model with given features.
-     * @param dataFrame training data
-     * @return the java serialized model
+     * @param inputDataset training data
+     * @return ML model with serialized model content
      */
-    Model train(DataFrame dataFrame);
+    MLModel train(MLInputDataset inputDataset);
 
 }
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/ad/AnomalyDetectionLibSVM.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/ad/AnomalyDetectionLibSVM.java
index d145c5d1aa..2c6c6c44be 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/ad/AnomalyDetectionLibSVM.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/ad/AnomalyDetectionLibSVM.java
@@ -5,14 +5,16 @@
 
 package org.opensearch.ml.engine.algorithms.ad;
 
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DataFrameBuilder;
 import org.opensearch.ml.common.FunctionName;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.input.parameter.ad.AnomalyDetectionLibSVMParams;
 import org.opensearch.ml.common.input.parameter.MLAlgoParams;
 import org.opensearch.ml.common.output.MLOutput;
 import org.opensearch.ml.common.output.MLPredictionOutput;
-import org.opensearch.ml.common.Model;
 import org.opensearch.ml.engine.Predictable;
 import org.opensearch.ml.engine.Trainable;
 import org.opensearch.ml.engine.annotation.Function;
@@ -48,6 +50,7 @@ public class AnomalyDetectionLibSVM implements Trainable, Predictable {
     private static KernelType DEFAULT_KERNEL_TYPE = KernelType.RBF;
 
     private AnomalyDetectionLibSVMParams parameters;
+    private LibSVMModel libSVMAnomalyModel = null;
 
     public AnomalyDetectionLibSVM() {}
 
@@ -69,15 +72,24 @@ private void validateParameters() {
     }
 
     @Override
-    public MLOutput predict(DataFrame dataFrame, Model model) {
-        if (model == null) {
-            throw new IllegalArgumentException("No model found for KMeans prediction.");
-        }
+    public void initModel(MLModel model, Map<String, Object> params) {
+        this.libSVMAnomalyModel = (LibSVMModel) ModelSerDeSer.deserialize(model);
+    }
 
+    @Override
+    public void close() {
+        this.libSVMAnomalyModel = null;
+    }
+
+    @Override
+    public MLOutput predict(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
+        if (libSVMAnomalyModel == null) {
+            throw new IllegalArgumentException("model not loaded");
+        }
         List<Prediction<Event>> predictions;
         MutableDataset<Event> predictionDataset = TribuoUtil.generateDataset(dataFrame, new AnomalyFactory(),
                 "Anomaly detection LibSVM prediction data from OpenSearch", TribuoOutputType.ANOMALY_DETECTION_LIBSVM);
-        LibSVMModel libSVMAnomalyModel = (LibSVMModel) ModelSerDeSer.deserialize(model.getContent());
         predictions = libSVMAnomalyModel.predict(predictionDataset);
 
         List<Map<String, Object>> adResults = new ArrayList<>();
@@ -92,7 +104,18 @@ public MLOutput predict(DataFrame dataFrame, Model model) {
     }
 
     @Override
-    public Model train(DataFrame dataFrame) {
+    public MLOutput predict(MLInputDataset inputDataset, MLModel model) {
+        if (model == null) {
+            throw new IllegalArgumentException("No model found for anomaly detection LibSVM prediction.");
+        }
+        // Cache the deserialized model in the field that predict(MLInputDataset) reads.
+        libSVMAnomalyModel = (LibSVMModel) ModelSerDeSer.deserialize(model);
+        return predict(inputDataset);
+    }
+
+    @Override
+    public MLModel train(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         KernelType kernelType = parseKernelType();
         SVMParameters params = new SVMParameters<>(new SVMAnomalyType(SVMAnomalyType.SVMMode.ONE_CLASS), kernelType);
         Double gamma = Optional.ofNullable(parameters.getGamma()).orElse(DEFAULT_GAMMA);
@@ -118,10 +141,13 @@ public Model train(DataFrame dataFrame) {
 
         LibSVMModel libSVMModel = trainer.train(data);
         ((LibSVMAnomalyModel)libSVMModel).getNumberOfSupportVectors();
-        Model model = new Model();
-        model.setName(FunctionName.AD_LIBSVM.name());
-        model.setVersion(VERSION);
-        model.setContent(ModelSerDeSer.serialize(libSVMModel));
+
+        MLModel model = MLModel.builder()
+                .name(FunctionName.AD_LIBSVM.name())
+                .algorithm(FunctionName.AD_LIBSVM)
+                .version(VERSION)
+                .content(ModelSerDeSer.serializeToBase64(libSVMModel))
+                .build();
         return model;
     }
 
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/clustering/KMeans.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/clustering/KMeans.java
index f789c4078f..9c7de99fa5 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/clustering/KMeans.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/clustering/KMeans.java
@@ -5,14 +5,16 @@
 
 package org.opensearch.ml.engine.algorithms.clustering;
 
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DataFrameBuilder;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.input.parameter.clustering.KMeansParams;
 import org.opensearch.ml.common.FunctionName;
 import org.opensearch.ml.common.input.parameter.MLAlgoParams;
 import org.opensearch.ml.common.output.MLOutput;
 import org.opensearch.ml.common.output.MLPredictionOutput;
-import org.opensearch.ml.common.Model;
 import org.opensearch.ml.engine.TrainAndPredictable;
 import org.opensearch.ml.engine.annotation.Function;
 import org.opensearch.ml.engine.utils.ModelSerDeSer;
@@ -42,11 +44,12 @@ public class KMeans implements TrainAndPredictable {
 
     //The number of threads.
     private int numThreads = Math.max(Runtime.getRuntime().availableProcessors() / 2, 1); //Assume cpu-bound.
-    
+
     //The random seed.
     private long seed = System.currentTimeMillis();
     private KMeansTrainer.Distance distance;
 
+    private KMeansModel kMeansModel;
     public KMeans() {}
 
     public KMeans(MLAlgoParams parameters) {
@@ -83,17 +86,21 @@ private void createDistance() {
     }
 
     @Override
-    public MLOutput predict(DataFrame dataFrame, Model model) {
-        if (model == null) {
-            throw new IllegalArgumentException("No model found for KMeans prediction.");
-        }
+    public void initModel(MLModel model, Map<String, Object> params) {
+        this.kMeansModel = (KMeansModel) ModelSerDeSer.deserialize(model);
+    }
+
+    @Override
+    public void close() {
+        this.kMeansModel = null;
+    }
 
-        List<Prediction<ClusterID>> predictions;
+    @Override
+    public MLOutput predict(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         MutableDataset<ClusterID> predictionDataset = TribuoUtil.generateDataset(dataFrame, new ClusteringFactory(),
                 "KMeans prediction data from opensearch", TribuoOutputType.CLUSTERID);
-        KMeansModel kMeansModel = (KMeansModel) ModelSerDeSer.deserialize(model.getContent());
-        predictions = kMeansModel.predict(predictionDataset);
-
+        List<Prediction<ClusterID>> predictions = kMeansModel.predict(predictionDataset);
         List<Map<String, Object>> listClusterID = new ArrayList<>();
         predictions.forEach(e -> listClusterID.add(Collections.singletonMap("ClusterID", e.getOutput().getID())));
 
@@ -101,23 +108,36 @@ public MLOutput predict(DataFrame dataFrame, Model model) {
     }
 
     @Override
-    public Model train(DataFrame dataFrame) {
+    public MLOutput predict(MLInputDataset inputDataset, MLModel model) {
+        if (model == null) {
+            throw new IllegalArgumentException("No model found for KMeans prediction.");
+        }
+        this.kMeansModel = (KMeansModel) ModelSerDeSer.deserialize(model);
+        return predict(inputDataset);
+    }
+
+    @Override
+    public MLModel train(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         MutableDataset<ClusterID> trainDataset = TribuoUtil.generateDataset(dataFrame, new ClusteringFactory(),
                 "KMeans training data from opensearch", TribuoOutputType.CLUSTERID);
         Integer centroids = Optional.ofNullable(parameters.getCentroids()).orElse(DEFAULT_CENTROIDS);
         Integer iterations = Optional.ofNullable(parameters.getIterations()).orElse(DEFAULT_ITERATIONS);
         KMeansTrainer trainer = new KMeansTrainer(centroids, iterations, distance, numThreads, seed);
         KMeansModel kMeansModel = trainer.train(trainDataset);
-        Model model = new Model();
-        model.setName(FunctionName.KMEANS.name());
-        model.setVersion(1);
-        model.setContent(ModelSerDeSer.serialize(kMeansModel));
 
+        MLModel model = MLModel.builder()
+                .name(FunctionName.KMEANS.name())
+                .algorithm(FunctionName.KMEANS)
+                .version(1)
+                .content(ModelSerDeSer.serializeToBase64(kMeansModel))
+                .build();
         return model;
     }
 
     @Override
-    public MLOutput trainAndPredict(DataFrame dataFrame) {
+    public MLOutput trainAndPredict(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         MutableDataset<ClusterID> trainDataset = TribuoUtil.generateDataset(dataFrame, new ClusteringFactory(),
                 "KMeans training and predicting data from opensearch", TribuoOutputType.CLUSTERID);
         Integer centroids = Optional.ofNullable(parameters.getCentroids()).orElse(DEFAULT_CENTROIDS);
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/clustering/RCFSummarize.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/clustering/RCFSummarize.java
index 43e28c777b..48810db810 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/clustering/RCFSummarize.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/clustering/RCFSummarize.java
@@ -5,15 +5,17 @@
 
 package org.opensearch.ml.engine.algorithms.clustering;
 
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DataFrameBuilder;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.input.parameter.clustering.RCFSummarizeParams;
 import org.opensearch.common.collect.Tuple;
 import org.opensearch.ml.common.FunctionName;
 import org.opensearch.ml.common.input.parameter.MLAlgoParams;
 import org.opensearch.ml.common.output.MLOutput;
 import org.opensearch.ml.common.output.MLPredictionOutput;
-import org.opensearch.ml.common.Model;
 import org.opensearch.ml.engine.TrainAndPredictable;
 import org.opensearch.ml.engine.annotation.Function;
 import org.opensearch.ml.engine.utils.MathUtil;
@@ -21,7 +23,6 @@
 import org.opensearch.ml.engine.utils.TribuoUtil;
 import com.amazon.randomcutforest.returntypes.SampleSummary;
 import com.amazon.randomcutforest.summarization.Summarizer;
-import org.opensearch.ml.engine.algorithms.clustering.SerializableSummary;
 
 import java.util.ArrayList;
 import java.util.Arrays;
@@ -43,6 +44,7 @@ public class RCFSummarize implements TrainAndPredictable {
     // Parameters
     private RCFSummarizeParams parameters;
     private BiFunction<float[], float[], Double> distance;
+    private SampleSummary summary;
 
     public RCFSummarize() {}
 
@@ -109,32 +111,40 @@ private void createDistance() {
     }
 
     @Override
-    public Model train(DataFrame dataFrame) {
+    public MLModel train(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         Tuple<String[], float[][]> featureNamesValues = TribuoUtil.transformDataFrameFloat(dataFrame);
-        SampleSummary summary = Summarizer.summarize(featureNamesValues.v2(), 
-            parameters.getMaxK(), 
-            parameters.getInitialK(), 
-            parameters.getPhase1Reassign(), 
-            distance, 
-            rnd.nextLong(), 
-            parameters.getParallel());
-
-        Model model = new Model();
-        model.setName(FunctionName.RCF_SUMMARIZE.name());
-        model.setVersion(1);
-        model.setContent(ModelSerDeSer.serialize(new SerializableSummary(summary)));
-
+        SampleSummary summary = Summarizer.summarize(featureNamesValues.v2(),
+                parameters.getMaxK(),
+                parameters.getInitialK(),
+                parameters.getPhase1Reassign(),
+                distance,
+                rnd.nextLong(),
+                parameters.getParallel());
+
+        MLModel model = MLModel.builder()
+                .name(FunctionName.RCF_SUMMARIZE.name())
+                .algorithm(FunctionName.RCF_SUMMARIZE)
+                .version(1)
+                .content(ModelSerDeSer.serializeToBase64(new SerializableSummary(summary)))
+                .build();
         return model;
     }
 
     @Override
-    public MLOutput predict(DataFrame dataFrame, Model model) {
-        if (model == null) {
-            throw new IllegalArgumentException("No model found for RCFSummarize prediction.");
-        }
+    public void initModel(MLModel model, Map<String, Object> params) {
+        this.summary = ((SerializableSummary)ModelSerDeSer.deserialize(model)).getSummary();
+    }
 
-        SampleSummary summary = ((SerializableSummary)ModelSerDeSer.deserialize(model.getContent())).getSummary();
+    @Override
+    public void close() {
+        this.summary = null;
+    }
+
+    @Override
+    public MLOutput predict(MLInputDataset inputDataset) {
         Iterable<float[]> centroidsLst = Arrays.asList(summary.summaryPoints);
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         Tuple<String[], float[][]> featureNamesValues = TribuoUtil.transformDataFrameFloat(dataFrame);
         List<Integer> predictions = new ArrayList<>();
         Arrays.stream(featureNamesValues.v2()).forEach(e->predictions.add(MathUtil.findNearest(e, centroidsLst, distance)));
@@ -146,16 +156,27 @@ public MLOutput predict(DataFrame dataFrame, Model model) {
     }
 
     @Override
-    public MLOutput trainAndPredict(DataFrame dataFrame) {
+    public MLOutput predict(MLInputDataset inputDataset, MLModel model) {
+        if (model == null) {
+            throw new IllegalArgumentException("No model found for RCFSummarize prediction.");
+        }
+
+        summary = ((SerializableSummary)ModelSerDeSer.deserialize(model)).getSummary();
+        return predict(inputDataset);
+    }
+
+    @Override
+    public MLOutput trainAndPredict(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         Tuple<String[], float[][]> featureNamesValues = TribuoUtil.transformDataFrameFloat(dataFrame);
-        SampleSummary summary = Summarizer.summarize(featureNamesValues.v2(), 
-            parameters.getMaxK(), 
-            parameters.getInitialK(), 
-            parameters.getPhase1Reassign(), 
-            distance, 
-            rnd.nextLong(), 
-            parameters.getParallel());
-        
+        SampleSummary summary = Summarizer.summarize(featureNamesValues.v2(),
+                parameters.getMaxK(),
+                parameters.getInitialK(),
+                parameters.getPhase1Reassign(),
+                distance,
+                rnd.nextLong(),
+                parameters.getParallel());
+
         Iterable<float[]> centroidsLst = Arrays.asList(summary.summaryPoints);
         List<Integer> predictions = new ArrayList<>();
         Arrays.stream(featureNamesValues.v2()).forEach(e->predictions.add(MathUtil.findNearest(e, centroidsLst, distance)));
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/BatchRandomCutForest.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/BatchRandomCutForest.java
index 4446e816fd..ba9e8f432c 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/BatchRandomCutForest.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/BatchRandomCutForest.java
@@ -10,12 +10,14 @@
 import com.amazon.randomcutforest.state.RandomCutForestState;
 import lombok.extern.log4j.Log4j2;
 import org.opensearch.ml.common.FunctionName;
-import org.opensearch.ml.common.Model;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.ColumnMeta;
 import org.opensearch.ml.common.dataframe.ColumnValue;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DataFrameBuilder;
 import org.opensearch.ml.common.dataframe.Row;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.input.parameter.MLAlgoParams;
 import org.opensearch.ml.common.input.parameter.rcf.BatchRCFParams;
 import org.opensearch.ml.common.output.MLOutput;
@@ -29,6 +31,9 @@
 import java.util.Map;
 import java.util.Optional;
 
+import static org.opensearch.ml.engine.utils.ModelSerDeSer.decodeBase64;
+import static org.opensearch.ml.engine.utils.ModelSerDeSer.encodeBase64;
+
 /**
  * Use RCF to detect non-time-series data.
  */
@@ -48,6 +53,8 @@ public class BatchRandomCutForest implements TrainAndPredictable {
 
     private static final RandomCutForestMapper rcfMapper = new RandomCutForestMapper();
 
+    private RandomCutForest forest;
+
     public BatchRandomCutForest(){}
 
     public BatchRandomCutForest(MLAlgoParams parameters) {
@@ -63,31 +70,53 @@ public BatchRandomCutForest(MLAlgoParams parameters) {
     }
 
     @Override
-    public MLOutput predict(DataFrame dataFrame, Model model) {
+    public void initModel(MLModel model, Map<String, Object> params) {
+        // params is not read here; the forest is rebuilt from the model's serialized RCF state.
+        this.forest = rcfMapper.toModel(RCFModelSerDeSer.deserializeRCF(model));
+    }
+
+    @Override
+    public void close() {
+        this.forest = null; // drop the forest set by initModel or predict(inputDataset, model)
+    }
+
+    @Override
+    public MLOutput predict(MLInputDataset inputDataset) {
+        if (forest == null) { throw new IllegalArgumentException("model not loaded"); } // same guard as LinearRegression.predict
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
+        return MLPredictionOutput.builder().predictionResult(DataFrameBuilder.load(process(dataFrame, forest, 0))).build();
+    }
+
+    @Override
+    public MLOutput predict(MLInputDataset inputDataset, MLModel model) {
         if (model == null) {
             throw new IllegalArgumentException("No model found for batch RCF prediction.");
         }
-        RandomCutForestState state = RCFModelSerDeSer.deserializeRCF(model.getContent());
-        RandomCutForest forest = rcfMapper.toModel(state);
-        List<Map<String, Object>> predictResult = process(dataFrame, forest, 0);
-        return MLPredictionOutput.builder().predictionResult(DataFrameBuilder.load(predictResult)).build();
+        RandomCutForestState state = RCFModelSerDeSer.deserializeRCF(model);
+        forest = rcfMapper.toModel(state);
+        return predict(inputDataset);
     }
 
     @Override
-    public Model train(DataFrame dataFrame) {
+    public MLModel train(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         RandomCutForest forest = createRandomCutForest(dataFrame);
         Integer actualTrainingDataSize = trainingDataSize == null ? dataFrame.size() : trainingDataSize;
         process(dataFrame, forest, actualTrainingDataSize);
-        Model model = new Model();
-        model.setName(FunctionName.BATCH_RCF.name());
-        model.setVersion(1);
+
         RandomCutForestState state = rcfMapper.toState(forest);
-        model.setContent(RCFModelSerDeSer.serializeRCF(state));
+        MLModel model = MLModel.builder()
+                .name(FunctionName.BATCH_RCF.name())
+                .algorithm(FunctionName.BATCH_RCF)
+                .version(1)
+                .content(encodeBase64(RCFModelSerDeSer.serializeRCF(state)))
+                .build();
         return model;
     }
 
     @Override
-    public MLOutput trainAndPredict(DataFrame dataFrame) {
+    public MLOutput trainAndPredict(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         RandomCutForest forest = createRandomCutForest(dataFrame);
         Integer actualTrainingDataSize = trainingDataSize == null ? dataFrame.size() : trainingDataSize;
         List<Map<String, Object>> predictResult = process(dataFrame, forest, actualTrainingDataSize);
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/FixedInTimeRandomCutForest.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/FixedInTimeRandomCutForest.java
index bd881e7beb..c2754d6eee 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/FixedInTimeRandomCutForest.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/FixedInTimeRandomCutForest.java
@@ -13,13 +13,15 @@
 import com.amazon.randomcutforest.parkservices.state.ThresholdedRandomCutForestState;
 import lombok.extern.log4j.Log4j2;
 import org.opensearch.ml.common.FunctionName;
-import org.opensearch.ml.common.Model;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.ColumnMeta;
 import org.opensearch.ml.common.dataframe.ColumnType;
 import org.opensearch.ml.common.dataframe.ColumnValue;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DataFrameBuilder;
 import org.opensearch.ml.common.dataframe.Row;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.exception.MLValidationException;
 import org.opensearch.ml.common.input.parameter.MLAlgoParams;
 import org.opensearch.ml.common.input.parameter.rcf.FitRCFParams;
@@ -38,6 +40,8 @@
 import java.util.Optional;
 import java.util.TimeZone;
 
+import static org.opensearch.ml.engine.utils.ModelSerDeSer.encodeBase64;
+
 /**
  * MLCommons doesn't support update trained model. So the trained RCF model in MLCommons
  * will be fixed in some time rather than updated by prediction data. We call it FIT(fixed
@@ -67,6 +71,8 @@ public class FixedInTimeRandomCutForest implements TrainAndPredictable {
     private DateFormat simpleDateFormat;
     private static final ThresholdedRandomCutForestMapper trcfMapper = new ThresholdedRandomCutForestMapper();
 
+    private ThresholdedRandomCutForest forest;
+
     public FixedInTimeRandomCutForest(){}
 
     public FixedInTimeRandomCutForest(MLAlgoParams parameters) {
@@ -93,31 +99,54 @@ public FixedInTimeRandomCutForest(MLAlgoParams parameters) {
         }
     }
 
+
+    @Override
+    public void initModel(MLModel model, Map<String, Object> params) {
+        // params is not read here; the thresholded forest is rebuilt from the model's serialized state.
+        forest = trcfMapper.toModel(RCFModelSerDeSer.deserializeTRCF(model));
+    }
+
+    @Override
+    public void close() {
+        forest = null; // drop the forest set by initModel or predict(inputDataset, model)
+    }
+
     @Override
-    public MLOutput predict(DataFrame dataFrame, Model model) {
+    public MLOutput predict(MLInputDataset inputDataset) {
+        if (forest == null) { throw new IllegalArgumentException("model not loaded"); } // same guard as LinearRegression.predict
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
+        return MLPredictionOutput.builder().predictionResult(DataFrameBuilder.load(process(dataFrame, forest))).build();
+    }
+
+    @Override
+    public MLOutput predict(MLInputDataset inputDataset, MLModel model) {
         if (model == null) {
             throw new IllegalArgumentException("No model found for FIT RCF prediction.");
         }
-        ThresholdedRandomCutForestState state = RCFModelSerDeSer.deserializeTRCF(model.getContent());
-        ThresholdedRandomCutForest forest = trcfMapper.toModel(state);
-        List<Map<String, Object>> predictResult = process(dataFrame, forest);
-        return MLPredictionOutput.builder().predictionResult(DataFrameBuilder.load(predictResult)).build();
+        ThresholdedRandomCutForestState state = RCFModelSerDeSer.deserializeTRCF(model);
+        forest = trcfMapper.toModel(state);
+        return predict(inputDataset);
     }
 
     @Override
-    public Model train(DataFrame dataFrame) {
+    public MLModel train(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         ThresholdedRandomCutForest forest = createThresholdedRandomCutForest(dataFrame);
         process(dataFrame, forest);
-        Model model = new Model();
-        model.setName(FunctionName.FIT_RCF.name());
-        model.setVersion(1);
+
         ThresholdedRandomCutForestState state = trcfMapper.toState(forest);
-        model.setContent(RCFModelSerDeSer.serializeTRCF(state));
+        MLModel model = MLModel.builder()
+                .name(FunctionName.FIT_RCF.name())
+                .algorithm(FunctionName.FIT_RCF)
+                .version(1)
+                .content(encodeBase64(RCFModelSerDeSer.serializeTRCF(state)))
+                .build();
         return model;
     }
 
     @Override
-    public MLOutput trainAndPredict(DataFrame dataFrame) {
+    public MLOutput trainAndPredict(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         ThresholdedRandomCutForest forest = createThresholdedRandomCutForest(dataFrame);
         List<Map<String, Object>> predictResult = process(dataFrame, forest);
         return MLPredictionOutput.builder().predictionResult(DataFrameBuilder.load(predictResult)).build();
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/RCFModelSerDeSer.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/RCFModelSerDeSer.java
index 8079268297..2e0d6dfc9c 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/RCFModelSerDeSer.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/rcf/RCFModelSerDeSer.java
@@ -12,10 +12,13 @@
 import io.protostuff.Schema;
 import io.protostuff.runtime.RuntimeSchema;
 import lombok.experimental.UtilityClass;
+import org.opensearch.ml.common.MLModel;
 
 import java.security.AccessController;
 import java.security.PrivilegedAction;
 
+import static org.opensearch.ml.engine.utils.ModelSerDeSer.decodeBase64;
+
 @UtilityClass
 public class RCFModelSerDeSer {
     private static final int SERIALIZATION_BUFFER_BYTES = 512;
@@ -34,10 +37,18 @@ public static byte[] serializeTRCF(ThresholdedRandomCutForestState model) {
         return serialize(model, trcfSchema);
     }
 
+    public static RandomCutForestState deserializeRCF(MLModel model) {
+        return deserialize(decodeBase64(model.getContent()), rcfSchema); // content is decoded from Base64 first
+    }
+
     public static RandomCutForestState deserializeRCF(byte[] bytes) {
         return deserialize(bytes, rcfSchema);
     }
 
+    public static ThresholdedRandomCutForestState deserializeTRCF(MLModel model) {
+        return deserialize(decodeBase64(model.getContent()), trcfSchema); // content is decoded from Base64 first
+    }
+
     public static ThresholdedRandomCutForestState deserializeTRCF(byte[] bytes) {
         return deserialize(bytes, trcfSchema);
     }
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LinearRegression.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LinearRegression.java
index db524e5b63..6d06174911 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LinearRegression.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LinearRegression.java
@@ -5,14 +5,16 @@
 
 package org.opensearch.ml.engine.algorithms.regression;
 
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DataFrameBuilder;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.input.parameter.regression.LinearRegressionParams;
 import org.opensearch.ml.common.FunctionName;
 import org.opensearch.ml.common.input.parameter.MLAlgoParams;
 import org.opensearch.ml.common.output.MLOutput;
 import org.opensearch.ml.common.output.MLPredictionOutput;
-import org.opensearch.ml.common.Model;
 import org.opensearch.ml.engine.Predictable;
 import org.opensearch.ml.engine.Trainable;
 import org.opensearch.ml.engine.annotation.Function;
@@ -42,6 +44,8 @@
 import java.util.Map;
 import java.util.Optional;
 
+import static org.opensearch.ml.engine.utils.ModelSerDeSer.serializeToBase64;
+
 @Function(FunctionName.LINEAR_REGRESSION)
 public class LinearRegression implements Trainable, Predictable {
 
@@ -71,6 +75,7 @@ public class LinearRegression implements Trainable, Predictable {
     private int loggingInterval;
     private int minibatchSize;
     private long seed;
+    private org.tribuo.Model<Regressor> regressionModel;
 
     public LinearRegression() {}
 
@@ -191,13 +196,23 @@ private void validateParameters() {
         seed = Optional.ofNullable(parameters.getSeed()).orElse(DEFAULT_SEED);
     }
 
+
     @Override
-    public MLOutput predict(DataFrame dataFrame, Model model) {
-        if (model == null) {
-            throw new IllegalArgumentException("No model found for linear regression prediction.");
-        }
+    public void initModel(MLModel model, Map<String, Object> params) {
+        regressionModel = (org.tribuo.Model<Regressor>) ModelSerDeSer.deserialize(model); // params is not read
+    }
+
+    @Override
+    public void close() {
+        regressionModel = null; // after this, predict(inputDataset) throws "model not loaded"
+    }
 
-        org.tribuo.Model<Regressor> regressionModel = (org.tribuo.Model<Regressor>) ModelSerDeSer.deserialize(model.getContent());
+    @Override
+    public MLOutput predict(MLInputDataset inputDataset) {
+        if (regressionModel == null) {
+            throw new IllegalArgumentException("model not loaded");
+        }
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         MutableDataset<Regressor> predictionDataset = TribuoUtil.generateDataset(dataFrame, new RegressionFactory(),
                 "Linear regression prediction data from opensearch", TribuoOutputType.REGRESSOR);
         List<Prediction<Regressor>> predictions = regressionModel.predict(predictionDataset);
@@ -208,16 +223,29 @@ public MLOutput predict(DataFrame dataFrame, Model model) {
     }
 
     @Override
-    public Model train(DataFrame dataFrame) {
+    public MLOutput predict(MLInputDataset inputDataset, MLModel model) {
+        if (model == null) {
+            throw new IllegalArgumentException("No model found for linear regression prediction.");
+        }
+        // Store the deserialized model in the field, then reuse the single-argument predict.
+        this.regressionModel = (org.tribuo.Model<Regressor>) ModelSerDeSer.deserialize(model);
+        return predict(inputDataset);
+    }
+
+    @Override
+    public MLModel train(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         MutableDataset<Regressor> trainDataset = TribuoUtil.generateDatasetWithTarget(dataFrame, new RegressionFactory(),
                 "Linear regression training data from opensearch", TribuoOutputType.REGRESSOR, parameters.getTarget());
         Integer epochs = Optional.ofNullable(parameters.getEpochs()).orElse(DEFAULT_EPOCHS);
         LinearSGDTrainer linearSGDTrainer = new LinearSGDTrainer(objective, optimiser, epochs, loggingInterval, minibatchSize, seed);
         org.tribuo.Model<Regressor> regressionModel = linearSGDTrainer.train(trainDataset);
-        Model model = new Model();
-        model.setName(FunctionName.LINEAR_REGRESSION.name());
-        model.setVersion(1);
-        model.setContent(ModelSerDeSer.serialize(regressionModel));
+        MLModel model = MLModel.builder()
+                .name(FunctionName.LINEAR_REGRESSION.name())
+                .algorithm(FunctionName.LINEAR_REGRESSION)
+                .version(1)
+                .content(serializeToBase64(regressionModel))
+                .build();
 
         return model;
     }
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
index de6faed9c0..e7c766af08 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
@@ -5,10 +5,12 @@
 
 package org.opensearch.ml.engine.algorithms.regression;
 
-import org.opensearch.ml.common.Model;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.FunctionName;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DataFrameBuilder;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.input.parameter.MLAlgoParams;
 import org.opensearch.ml.common.input.parameter.regression.LogisticRegressionParams;
 import org.opensearch.ml.common.output.MLOutput;
@@ -41,6 +43,8 @@
 import java.util.Map;
 import java.util.Optional;
 
+import static org.opensearch.ml.engine.utils.ModelSerDeSer.serializeToBase64;
+
 @Function(FunctionName.LOGISTIC_REGRESSION)
 public class LogisticRegression implements Trainable, Predictable {
 
@@ -69,6 +73,8 @@ public class LogisticRegression implements Trainable, Predictable {
     private LogisticRegressionParams parameters;
     private StochasticGradientOptimiser optimiser;
     private LabelObjective objective;
+    private org.tribuo.Model<Label> classificationModel;
+
     /**
      * Initialize a linear regression algorithm.
      * @param parameters the parameters for linear regression algorithm
@@ -166,27 +172,36 @@ private void createOptimiser() {
     }
 
     @Override
-    public Model train(DataFrame dataFrame) {
+    public MLModel train(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         MutableDataset<Label> trainDataset = TribuoUtil.generateDatasetWithTarget(dataFrame, new LabelFactory(),
                 "Logistic regression training data from OpenSearch", TribuoOutputType.LABEL, parameters.getTarget());
         // LinearSGDTrainer(objective=LogMulticlass,optimiser=AdaGrad(initialLearningRate=1.0,epsilon=0.1,initialValue=0.0),epochs=5,minibatchSize=1,seed=12345)
         Trainer<Label> logisticRegressionTrainer = new LinearSGDTrainer(objective, optimiser, epochs, loggingInterval, minibatchSize, seed);
         org.tribuo.Model<Label> classificationModel = logisticRegressionTrainer.train(trainDataset);
-        Model model = new Model();
-        model.setName(FunctionName.LOGISTIC_REGRESSION.name());
-        model.setVersion(1);
-        model.setContent(ModelSerDeSer.serialize(classificationModel));
 
+        MLModel model = MLModel.builder()
+                .name(FunctionName.LOGISTIC_REGRESSION.name())
+                .algorithm(FunctionName.LOGISTIC_REGRESSION)
+                .version(1)
+                .content(serializeToBase64(classificationModel))
+                .build();
         return model;
     }
 
     @Override
-    public MLOutput predict(DataFrame dataFrame, Model model) {
-        if (model == null) {
-            throw new IllegalArgumentException("No model found for logistic regression prediction.");
-        }
+    public void initModel(MLModel model, Map<String, Object> params) {
+        classificationModel = (org.tribuo.Model<Label>) ModelSerDeSer.deserialize(model); // params is not read
+    }
+
+    @Override
+    public void close() {
+        classificationModel = null; // drop the model set by initModel or predict(inputDataset, model)
+    }
 
-        org.tribuo.Model<Label> classificationModel = (org.tribuo.Model<Label>)ModelSerDeSer.deserialize(model.getContent());
+    @Override
+    public MLOutput predict(MLInputDataset inputDataset) {
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         MutableDataset<Label> predictionDataset = TribuoUtil.generateDataset(dataFrame, new LabelFactory(),
                 "Logistic regression prediction data from OpenSearch", TribuoOutputType.LABEL);
 
@@ -196,4 +211,14 @@ public MLOutput predict(DataFrame dataFrame, Model model) {
 
         return MLPredictionOutput.builder().predictionResult(DataFrameBuilder.load(listPrediction)).build();
     }
+
+    @Override
+    public MLOutput predict(MLInputDataset inputDataset, MLModel model) {
+        if (model == null) {
+            throw new IllegalArgumentException("No model found for logistic regression prediction.");
+        }
+        // Store the deserialized model in the field, then reuse the single-argument predict.
+        this.classificationModel = (org.tribuo.Model<Label>) ModelSerDeSer.deserialize(model);
+        return predict(inputDataset);
+    }
 }
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/sample/SampleAlgo.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/sample/SampleAlgo.java
index 0b408c93ad..3c87cb13cf 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/sample/SampleAlgo.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/sample/SampleAlgo.java
@@ -5,18 +5,22 @@
 
 package org.opensearch.ml.engine.algorithms.sample;
 
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.FunctionName;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
+import org.opensearch.ml.common.dataset.MLInputDataset;
+import org.opensearch.ml.common.exception.MLException;
 import org.opensearch.ml.common.input.parameter.MLAlgoParams;
 import org.opensearch.ml.common.output.MLOutput;
 import org.opensearch.ml.common.output.sample.SampleAlgoOutput;
 import org.opensearch.ml.common.input.parameter.sample.SampleAlgoParams;
-import org.opensearch.ml.common.Model;
 import org.opensearch.ml.engine.Predictable;
 import org.opensearch.ml.engine.Trainable;
 import org.opensearch.ml.engine.annotation.Function;
 import org.opensearch.ml.engine.utils.ModelSerDeSer;
 
+import java.util.Map;
 import java.util.Optional;
 import java.util.concurrent.atomic.AtomicReference;
 
@@ -32,11 +36,19 @@ public SampleAlgo(MLAlgoParams parameters) {
     }
 
     @Override
-    public MLOutput predict(DataFrame dataFrame, Model model) {
-        if (model == null) {
-            throw new IllegalArgumentException("No model found for sample algo.");
-        }
+    public void initModel(MLModel model, Map<String, Object> params) {
+        throw new MLException("Sample Algo doesn't support init model"); // always thrown; both arguments are ignored
+    }
+
+    @Override
+    public void close() {
+        sampleParam = DEFAULT_SAMPLE_PARAM; // reset the parameter to its default value
+    }
+
+    @Override
+    public MLOutput predict(MLInputDataset inputDataset) {
         AtomicReference<Double> sum = new AtomicReference<>((double) 0);
+        DataFrame dataFrame = ((DataFrameInputDataset)inputDataset).getDataFrame();
         dataFrame.forEach(row -> {
             row.forEach(item -> sum.updateAndGet(v -> v + item.doubleValue()));
         });
@@ -44,11 +56,21 @@ public MLOutput predict(DataFrame dataFrame, Model model) {
     }
 
     @Override
-    public Model train(DataFrame dataFrame) {
-        Model model = new Model();
-        model.setName(FunctionName.SAMPLE_ALGO.name());
-        model.setVersion(1);
-        model.setContent(ModelSerDeSer.serialize("This is a sample testing model with parameter: " + sampleParam));
+    public MLOutput predict(MLInputDataset inputDataset, MLModel model) {
+        if (model == null) {
+            throw new IllegalArgumentException("No model found for sample algo.");
+        }
+        return predict(inputDataset); // only the model's presence is checked; its content is never read
+    }
+
+    @Override
+    public MLModel train(MLInputDataset inputDataset) {
+        MLModel model = MLModel.builder()
+                .name(FunctionName.SAMPLE_ALGO.name())
+                .algorithm(FunctionName.SAMPLE_ALGO)
+                .version(1)
+                .content(ModelSerDeSer.serializeToBase64("This is a sample testing model with parameter: " + sampleParam))
+                .build();
         return model;
     }
 }
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/ModelSerDeSer.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/ModelSerDeSer.java
index 4d477928b8..98241b2e76 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/ModelSerDeSer.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/ModelSerDeSer.java
@@ -7,28 +7,35 @@
 
 import lombok.experimental.UtilityClass;
 import org.apache.commons.io.serialization.ValidatingObjectInputStream;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.engine.exceptions.ModelSerDeSerException;
 
 import java.io.ByteArrayInputStream;
 import java.io.ByteArrayOutputStream;
 import java.io.IOException;
 import java.io.ObjectOutputStream;
+import java.util.Base64;
 
 @UtilityClass
 public class ModelSerDeSer {
     // Welcome list includes OpenSearch ml plugin classes, JDK common classes and Tribuo libraries.
     public static final String[] ACCEPT_CLASS_PATTERNS = {
-        "java.lang.*",
-        "java.util.*",
-        "java.time.*",
-        "org.opensearch.ml.*",
-        "*org.tribuo.*",
-        "libsvm.*",
-        "com.oracle.labs.*",
-        "[*",
-        "com.amazon.randomcutforest.*"
+            "java.lang.*",
+            "java.util.*",
+            "java.time.*",
+            "org.opensearch.ml.*",
+            "*org.tribuo.*",
+            "libsvm.*",
+            "com.oracle.labs.*",
+            "[*",
+            "com.amazon.randomcutforest.*"
     };
 
+    public static String serializeToBase64(Object model) {
+        // Java-serialize to bytes, then Base64-encode so the result can be carried as a String.
+        return encodeBase64(serialize(model));
+    }
+
     public static byte[] serialize(Object model) {
         try (ByteArrayOutputStream byteArrayOutputStream = new ByteArrayOutputStream();
              ObjectOutputStream objectOutputStream = new ObjectOutputStream(byteArrayOutputStream)) {
@@ -50,4 +57,17 @@ public static Object deserialize(byte[] modelBin) {
             throw new ModelSerDeSerException("Failed to deserialize model.", e.getCause());
         }
     }
+
+    public static Object deserialize(MLModel model) {
+        // The model content is Base64 text; decode it and hand the bytes to the byte[] overload.
+        return deserialize(decodeBase64(model.getContent()));
+    }
+
+    public static byte[] decodeBase64(String base64Str) {
+        return Base64.getDecoder().decode(base64Str); // JDK basic decoder; inverse of encodeBase64
+    }
+
+    public static String encodeBase64(byte[] bytes) {
+        return Base64.getEncoder().encodeToString(bytes); // JDK basic encoder; inverse of decodeBase64
+    }
 }
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/MLEngineTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/MLEngineTest.java
index aa154d62bb..2c494d8e01 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/MLEngineTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/MLEngineTest.java
@@ -13,7 +13,10 @@
 import org.mockito.Mockito;
 import org.opensearch.common.io.stream.StreamOutput;
 import org.opensearch.common.xcontent.XContentBuilder;
+import org.opensearch.ml.common.MLModel;
+import org.opensearch.ml.common.dataframe.ColumnMeta;
 import org.opensearch.ml.common.dataframe.DataFrame;
+import org.opensearch.ml.common.dataframe.DefaultDataFrame;
 import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.input.Input;
@@ -24,8 +27,8 @@
 import org.opensearch.ml.common.output.execute.samplecalculator.LocalSampleCalculatorOutput;
 import org.opensearch.ml.common.input.parameter.MLAlgoParams;
 import org.opensearch.ml.common.input.MLInput;
-import org.opensearch.ml.common.Model;
 import org.opensearch.ml.common.output.MLPredictionOutput;
+import org.opensearch.ml.engine.algorithms.regression.LinearRegression;
 
 import java.io.IOException;
 import java.util.Arrays;
@@ -40,7 +43,7 @@ public class MLEngineTest {
 
     @Test
     public void predictKMeans() {
-        Model model = trainKMeansModel();
+        MLModel model = trainKMeansModel();
         DataFrame predictionDataFrame = constructTestDataFrame(10);
         MLInputDataset inputDataset = DataFrameInputDataset.builder().dataFrame(predictionDataFrame).build();
         Input mlInput = MLInput.builder().algorithm(FunctionName.KMEANS).inputDataset(inputDataset).build();
@@ -52,7 +55,7 @@ public void predictKMeans() {
 
     @Test
     public void predictLinearRegression() {
-        Model model = trainLinearRegressionModel();
+        MLModel model = trainLinearRegressionModel();
         DataFrame predictionDataFrame = constructLinearRegressionPredictionDataFrame();
         MLInputDataset inputDataset = DataFrameInputDataset.builder().dataFrame(predictionDataFrame).build();
         Input mlInput = MLInput.builder().algorithm(FunctionName.LINEAR_REGRESSION).inputDataset(inputDataset).build();
@@ -61,19 +64,41 @@ public void predictLinearRegression() {
         Assert.assertEquals(2, predictions.size());
     }
 
+
+    @Test
+    public void loadLinearRegressionModel() {
+        // Train, load the model into a predictor, then predict without passing the model again.
+        Predictable loaded = MLEngine.load(trainLinearRegressionModel(), null);
+        MLInputDataset input = DataFrameInputDataset.builder()
+                .dataFrame(constructLinearRegressionPredictionDataFrame())
+                .build();
+        MLPredictionOutput result = (MLPredictionOutput) loaded.predict(input);
+        Assert.assertEquals(2, result.getPredictionResult().size());
+    }
+
+    @Test
+    public void loadLinearRegressionModel_NullModel() {
+        exceptionRule.expect(IllegalArgumentException.class);
+        exceptionRule.expectMessage("model not loaded");
+        Predictable untrained = new LinearRegression();
+        MLInputDataset input = DataFrameInputDataset.builder()
+                .dataFrame(constructLinearRegressionPredictionDataFrame()).build();
+        untrained.predict(input); // no initModel call was made, so predict must reject the request
+    }
+
     @Test
     public void trainKMeans() {
-        Model model = trainKMeansModel();
+        MLModel model = trainKMeansModel();
         Assert.assertEquals(FunctionName.KMEANS.name(), model.getName());
-        Assert.assertEquals(1, model.getVersion());
+        Assert.assertEquals(1, model.getVersion().intValue());
         Assert.assertNotNull(model.getContent());
     }
 
     @Test
     public void trainLinearRegression() {
-        Model model = trainLinearRegressionModel();
+        MLModel model = trainLinearRegressionModel();
         Assert.assertEquals(FunctionName.LINEAR_REGRESSION.name(), model.getName());
-        Assert.assertEquals(1, model.getVersion());
+        Assert.assertEquals(1, model.getVersion().intValue());
         Assert.assertNotNull(model.getContent());
     }
 
@@ -88,6 +113,17 @@ public void train_NullInput() {
         }
     }
 
+    @Test
+    public void train_NullInputDataSet() {
+        exceptionRule.expect(IllegalArgumentException.class);
+        exceptionRule.expectMessage("Input data set should not be null");
+        final FunctionName function = FunctionName.LINEAR_REGRESSION;
+        try (MockedStatic<MLEngineClassLoader> mockedLoader = Mockito.mockStatic(MLEngineClassLoader.class)) {
+            mockedLoader.when(() -> MLEngineClassLoader.initInstance(function, null, MLAlgoParams.class)).thenReturn(null);
+            MLEngine.train(MLInput.builder().algorithm(function).build()); // input is built without a dataset
+        }
+    }
+
     @Test
     public void train_NullDataFrame() {
         exceptionRule.expect(IllegalArgumentException.class);
@@ -95,7 +131,8 @@ public void train_NullDataFrame() {
         FunctionName algoName = FunctionName.LINEAR_REGRESSION;
         try (MockedStatic<MLEngineClassLoader> loader = Mockito.mockStatic(MLEngineClassLoader.class)) {
             loader.when(() -> MLEngineClassLoader.initInstance(algoName, null, MLAlgoParams.class)).thenReturn(null);
-            MLEngine.train(MLInput.builder().algorithm(algoName).build());
+            DataFrame dataFrame = new DefaultDataFrame(new ColumnMeta[0]);
+            MLEngine.train(MLInput.builder().inputDataset(new DataFrameInputDataset(dataFrame)).algorithm(algoName).build());
         }
     }
 
@@ -210,7 +247,8 @@ public XContentBuilder toXContent(XContentBuilder xContentBuilder, Params params
         MLEngine.execute(input);
     }
 
-    private Model trainKMeansModel() {
+    // Test helper: builds KMeans params (2 centroids, 10 iterations) and returns the model from MLEngine.train.
+    private MLModel trainKMeansModel() {
         KMeansParams parameters = KMeansParams.builder()
                 .centroids(2)
                 .iterations(10)
@@ -222,7 +260,7 @@ private Model trainKMeansModel() {
         return MLEngine.train(mlInput);
     }
 
-    private Model trainLinearRegressionModel() {
+    private MLModel trainLinearRegressionModel() {
         LinearRegressionParams parameters = LinearRegressionParams.builder()
                 .objectiveType(LinearRegressionParams.ObjectiveType.SQUARED_LOSS)
                 .optimizerType(LinearRegressionParams.OptimizerType.ADAM)
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/ModelSerDeSerTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/ModelSerDeSerTest.java
index ebff98035b..7c92196736 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/ModelSerDeSerTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/ModelSerDeSerTest.java
@@ -8,7 +8,7 @@
 import org.junit.Rule;
 import org.junit.Test;
 import org.junit.rules.ExpectedException;
-import org.opensearch.ml.common.Model;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.input.parameter.clustering.KMeansParams;
 import org.opensearch.ml.common.input.parameter.regression.LinearRegressionParams;
 import org.opensearch.ml.engine.algorithms.clustering.KMeans;
@@ -18,7 +18,7 @@
 import org.tribuo.regression.sgd.linear.LinearSGDModel;
 
 import static org.junit.Assert.assertNotNull;
-import static org.opensearch.ml.engine.helper.MLTestHelper.constructTestDataFrame;
+import static org.opensearch.ml.engine.helper.MLTestHelper.concstructDataFrameInputDataSet;
 
 public class ModelSerDeSerTest {
     @Rule
@@ -28,9 +28,9 @@ public class ModelSerDeSerTest {
     public void testModelSerDeSerKMeans() {
         KMeansParams params = KMeansParams.builder().build();
         KMeans kMeans = new KMeans(params);
-        Model model = kMeans.train(constructTestDataFrame(100));
+        MLModel model = kMeans.train(concstructDataFrameInputDataSet(100));
 
-        KMeansModel deserializedModel = (KMeansModel) ModelSerDeSer.deserialize(model.getContent());
+        KMeansModel deserializedModel = (KMeansModel) ModelSerDeSer.deserialize(model);
         assertNotNull(deserializedModel);
     }
 
@@ -38,9 +38,9 @@ public void testModelSerDeSerKMeans() {
     public void testModelSerDeSerLinearRegression() {
         LinearRegressionParams params = LinearRegressionParams.builder().target("f2").build();
         LinearRegression linearRegression = new LinearRegression(params);
-        Model model = linearRegression.train(constructTestDataFrame(100));
+        MLModel model = linearRegression.train(concstructDataFrameInputDataSet(100));
 
-        LinearSGDModel deserializedModel = (LinearSGDModel) ModelSerDeSer.deserialize(model.getContent());
+        LinearSGDModel deserializedModel = (LinearSGDModel) ModelSerDeSer.deserialize(model);
         assertNotNull(deserializedModel);
     }
 
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/ad/AnomalyDetectionLibSVMTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/ad/AnomalyDetectionLibSVMTest.java
index 4af15f72e6..bc65d0719b 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/ad/AnomalyDetectionLibSVMTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/ad/AnomalyDetectionLibSVMTest.java
@@ -11,6 +11,7 @@
 import org.junit.Rule;
 import org.junit.Test;
 import org.junit.rules.ExpectedException;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.ColumnMeta;
 import org.opensearch.ml.common.dataframe.ColumnType;
 import org.opensearch.ml.common.dataframe.ColumnValue;
@@ -18,10 +19,10 @@
 import org.opensearch.ml.common.dataframe.DefaultDataFrame;
 import org.opensearch.ml.common.dataframe.DoubleValue;
 import org.opensearch.ml.common.dataframe.Row;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.input.parameter.ad.AnomalyDetectionLibSVMParams;
 import org.opensearch.ml.common.FunctionName;
 import org.opensearch.ml.common.output.MLPredictionOutput;
-import org.opensearch.ml.common.Model;
 import org.tribuo.Dataset;
 import org.tribuo.Example;
 import org.tribuo.Feature;
@@ -37,7 +38,9 @@ public class AnomalyDetectionLibSVMTest {
     private AnomalyDetectionLibSVMParams parameters;
     private AnomalyDetectionLibSVM anomalyDetection;
     private DataFrame trainDataFrame;
+    private DataFrameInputDataset trainDataFrameInputDataset;
     private DataFrame predictionDataFrame;
+    private DataFrameInputDataset predictionDataFrameInputDataset;
     private List<Event.EventType> predictionLabels;
     private double gamma = 1.0;
     private double nu = 0.1;
@@ -54,8 +57,10 @@ public void setUp() {
         Dataset<Event> data = pair.getA();
         Dataset<Event> test = pair.getB();
         trainDataFrame = constructDataFrame(data, true, null);
+        trainDataFrameInputDataset = new DataFrameInputDataset(trainDataFrame);
         predictionLabels = new ArrayList<>();
         predictionDataFrame = constructDataFrame(test, false, predictionLabels);
+        predictionDataFrameInputDataset = new DataFrameInputDataset(predictionDataFrame);
     }
 
     private DataFrame constructDataFrame(Dataset<Event> data, boolean training, List<Event.EventType> labels) {
@@ -101,9 +106,9 @@ private void addRow(List<ColumnValue> columnValues, boolean training, Example<Ev
 
     @Test
     public void train() {
-        Model model = anomalyDetection.train(trainDataFrame);
+        MLModel model = anomalyDetection.train(trainDataFrameInputDataset);
         Assert.assertEquals(FunctionName.AD_LIBSVM.name(), model.getName());
-        Assert.assertEquals(AnomalyDetectionLibSVM.VERSION, model.getVersion());
+        Assert.assertEquals(AnomalyDetectionLibSVM.VERSION, model.getVersion().intValue());
         Assert.assertNotNull(model.getContent());
     }
 
@@ -111,24 +116,24 @@ public void train() {
     public void trainWithFullParams() {
         AnomalyDetectionLibSVMParams parameters = AnomalyDetectionLibSVMParams.builder().gamma(gamma).nu(nu).cost(1.0).coeff(0.01).epsilon(0.001).degree(1).kernelType(AnomalyDetectionLibSVMParams.ADKernelType.LINEAR).build();
         AnomalyDetectionLibSVM anomalyDetection = new AnomalyDetectionLibSVM(parameters);
-        Model model = anomalyDetection.train(trainDataFrame);
+        MLModel model = anomalyDetection.train(trainDataFrameInputDataset);
         Assert.assertEquals(FunctionName.AD_LIBSVM.name(), model.getName());
-        Assert.assertEquals(AnomalyDetectionLibSVM.VERSION, model.getVersion());
+        Assert.assertEquals(AnomalyDetectionLibSVM.VERSION, model.getVersion().intValue());
         Assert.assertNotNull(model.getContent());
 
         parameters = parameters.toBuilder().kernelType(AnomalyDetectionLibSVMParams.ADKernelType.POLY).build();
         anomalyDetection = new AnomalyDetectionLibSVM(parameters);
-        model = anomalyDetection.train(trainDataFrame);
+        model = anomalyDetection.train(trainDataFrameInputDataset);
         Assert.assertEquals(FunctionName.AD_LIBSVM.name(), model.getName());
 
         parameters = parameters.toBuilder().kernelType(AnomalyDetectionLibSVMParams.ADKernelType.RBF).build();
         anomalyDetection = new AnomalyDetectionLibSVM(parameters);
-        model = anomalyDetection.train(trainDataFrame);
+        model = anomalyDetection.train(trainDataFrameInputDataset);
         Assert.assertEquals(FunctionName.AD_LIBSVM.name(), model.getName());
 
         parameters = parameters.toBuilder().kernelType(AnomalyDetectionLibSVMParams.ADKernelType.SIGMOID).build();
         anomalyDetection = new AnomalyDetectionLibSVM(parameters);
-        model = anomalyDetection.train(trainDataFrame);
+        model = anomalyDetection.train(trainDataFrameInputDataset);
         Assert.assertEquals(FunctionName.AD_LIBSVM.name(), model.getName());
     }
 
@@ -136,13 +141,13 @@ public void trainWithFullParams() {
     public void predict_NullModel() {
         exceptionRule.expect(IllegalArgumentException.class);
         exceptionRule.expectMessage("No model found for KMeans prediction");
-        anomalyDetection.predict(predictionDataFrame, null);
+        anomalyDetection.predict(predictionDataFrameInputDataset, null);
     }
 
     @Test
     public void predict() {
-        Model model = anomalyDetection.train(trainDataFrame);
-        MLPredictionOutput output = (MLPredictionOutput) anomalyDetection.predict(predictionDataFrame, model);
+        MLModel model = anomalyDetection.train(trainDataFrameInputDataset);
+        MLPredictionOutput output = (MLPredictionOutput) anomalyDetection.predict(predictionDataFrameInputDataset, model);
         DataFrame predictions = output.getPredictionResult();
         int i = 0;
         int truePositive = 0;
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/clustering/KMeansTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/clustering/KMeansTest.java
index 9ef7630f07..bc4dd01fbb 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/clustering/KMeansTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/clustering/KMeansTest.java
@@ -10,11 +10,12 @@
 import org.junit.Rule;
 import org.junit.Test;
 import org.junit.rules.ExpectedException;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.DataFrame;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.input.parameter.clustering.KMeansParams;
 import org.opensearch.ml.common.FunctionName;
 import org.opensearch.ml.common.output.MLPredictionOutput;
-import org.opensearch.ml.common.Model;
 
 import static org.opensearch.ml.engine.helper.MLTestHelper.constructTestDataFrame;
 
@@ -25,7 +26,9 @@ public class KMeansTest {
     private KMeansParams parameters;
     private KMeans kMeans;
     private DataFrame trainDataFrame;
+    private DataFrameInputDataset trainDataFrameInputDataSet;
     private DataFrame predictionDataFrame;
+    private DataFrameInputDataset predictionDataFrameInputDataSet;
     private int trainSize = 100;
     private int predictionSize = 10;
 
@@ -44,8 +47,8 @@ public void setUp() {
 
     @Test
     public void predict() {
-        Model model = kMeans.train(trainDataFrame);
-        MLPredictionOutput output = (MLPredictionOutput) kMeans.predict(predictionDataFrame, model);
+        MLModel model = kMeans.train(trainDataFrameInputDataSet);
+        MLPredictionOutput output = (MLPredictionOutput) kMeans.predict(predictionDataFrameInputDataSet, model);
         DataFrame predictions = output.getPredictionResult();
         Assert.assertEquals(predictionSize, predictions.size());
         predictions.forEach(row -> Assert.assertTrue(row.getValue(0).intValue() == 0 || row.getValue(0).intValue() == 1));
@@ -55,14 +58,14 @@ public void predict() {
     public void predictWithNullModel() {
         exceptionRule.expect(IllegalArgumentException.class);
         exceptionRule.expectMessage("No model found for KMeans prediction");
-        kMeans.predict(predictionDataFrame, null);
+        kMeans.predict(predictionDataFrameInputDataSet, null);
     }
 
     @Test
     public void train() {
-        Model model = kMeans.train(trainDataFrame);
+        MLModel model = kMeans.train(trainDataFrameInputDataSet);
         Assert.assertEquals(FunctionName.KMEANS.name(), model.getName());
-        Assert.assertEquals(1, model.getVersion());
+        Assert.assertEquals(1, model.getVersion().intValue());
         Assert.assertNotNull(model.getContent());
     }
 
@@ -74,20 +77,20 @@ public void trainAndPredict() {
                 .centroids(2)
                 .build();
         KMeans kMeans = new KMeans(parameters);
-        MLPredictionOutput output = (MLPredictionOutput) kMeans.trainAndPredict(trainDataFrame);
+        MLPredictionOutput output = (MLPredictionOutput) kMeans.trainAndPredict(trainDataFrameInputDataSet);
         DataFrame predictions = output.getPredictionResult();
         Assert.assertEquals(trainSize, predictions.size());
         predictions.forEach(row -> Assert.assertTrue(row.getValue(0).intValue() == 0 || row.getValue(0).intValue() == 1));
 
         parameters = parameters.toBuilder().distanceType(KMeansParams.DistanceType.COSINE).build();
         kMeans = new KMeans(parameters);
-        output = (MLPredictionOutput) kMeans.trainAndPredict(trainDataFrame);
+        output = (MLPredictionOutput) kMeans.trainAndPredict(trainDataFrameInputDataSet);
         predictions = output.getPredictionResult();
         Assert.assertEquals(trainSize, predictions.size());
 
         parameters = parameters.toBuilder().distanceType(KMeansParams.DistanceType.L1).build();
         kMeans = new KMeans(parameters);
-        output = (MLPredictionOutput) kMeans.trainAndPredict(trainDataFrame);
+        output = (MLPredictionOutput) kMeans.trainAndPredict(trainDataFrameInputDataSet);
         predictions = output.getPredictionResult();
         Assert.assertEquals(trainSize, predictions.size());
     }
@@ -108,10 +111,12 @@ public void constructorWithNegtiveIterations() {
 
     private void constructKMeansPredictionDataFrame() {
         predictionDataFrame = constructTestDataFrame(predictionSize);
+        predictionDataFrameInputDataSet = new DataFrameInputDataset(predictionDataFrame);
     }
 
     private void constructKMeansTrainDataFrame() {
         trainDataFrame = constructTestDataFrame(trainSize);
+        trainDataFrameInputDataSet = new DataFrameInputDataset(trainDataFrame);
     }
 
 }
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/clustering/RCFSummarizeTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/clustering/RCFSummarizeTest.java
index 9fb214e8b9..2ab9e89c50 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/clustering/RCFSummarizeTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/clustering/RCFSummarizeTest.java
@@ -10,11 +10,12 @@
 import org.junit.Rule;
 import org.junit.Test;
 import org.junit.rules.ExpectedException;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.DataFrame;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.input.parameter.clustering.RCFSummarizeParams;
 import org.opensearch.ml.common.FunctionName;
 import org.opensearch.ml.common.output.MLPredictionOutput;
-import org.opensearch.ml.common.Model;
 
 import static org.opensearch.ml.engine.helper.MLTestHelper.constructTestDataFrame;
 
@@ -26,19 +27,21 @@ public class RCFSummarizeTest {
     private RCFSummarizeParams parameters;
     private RCFSummarize rcfSummarize;
     private DataFrame trainDataFrame;
+    private DataFrameInputDataset trainDataFrameInputDataSet;
     private DataFrame predictionDataFrame;
+    private DataFrameInputDataset predictionDataFrameInputDataSet;
     private int trainSize = 100;
     private int predictionSize = 10;
 
     @Before
     public void setUp() {
         parameters = RCFSummarizeParams.builder()
-            .distanceType(RCFSummarizeParams.DistanceType.L2)
-            .maxK(2)
-            .initialK(20)
-            .phase1Reassign(true)
-            .parallel(false)
-            .build();
+                .distanceType(RCFSummarizeParams.DistanceType.L2)
+                .maxK(2)
+                .initialK(20)
+                .phase1Reassign(true)
+                .parallel(false)
+                .build();
 
         rcfSummarize = new RCFSummarize(parameters);
 
@@ -48,8 +51,8 @@ public void setUp() {
 
     @Test
     public void predictWithTrivalModelExpectBoNorminalOutput() {
-        Model model = rcfSummarize.train(trainDataFrame);
-        MLPredictionOutput output = (MLPredictionOutput) rcfSummarize.predict(predictionDataFrame, model);
+        MLModel model = rcfSummarize.train(trainDataFrameInputDataSet);
+        MLPredictionOutput output = (MLPredictionOutput) rcfSummarize.predict(predictionDataFrameInputDataSet, model);
         DataFrame predictions = output.getPredictionResult();
         Assert.assertEquals(predictionSize, predictions.size());
         predictions.forEach(row -> Assert.assertTrue(row.getValue(0).intValue() == 0 || row.getValue(0).intValue() == 1));
@@ -62,20 +65,20 @@ public void trainAndPredictWithRegularInputExpectNotNullOutput() {
                 .maxK(2).initialK(10)
                 .build();
         RCFSummarize rcfSummarize = new RCFSummarize(parameters);
-        MLPredictionOutput output = (MLPredictionOutput) rcfSummarize.trainAndPredict(trainDataFrame);
+        MLPredictionOutput output = (MLPredictionOutput) rcfSummarize.trainAndPredict(trainDataFrameInputDataSet);
         DataFrame predictions = output.getPredictionResult();
         Assert.assertEquals(trainSize, predictions.size());
         predictions.forEach(row -> Assert.assertTrue(row.getValue(0).intValue() == 0 || row.getValue(0).intValue() == 1));
 
         parameters = parameters.toBuilder().distanceType(RCFSummarizeParams.DistanceType.L2).build();
         rcfSummarize = new RCFSummarize(parameters);
-        output = (MLPredictionOutput) rcfSummarize.trainAndPredict(trainDataFrame);
+        output = (MLPredictionOutput) rcfSummarize.trainAndPredict(trainDataFrameInputDataSet);
         predictions = output.getPredictionResult();
         Assert.assertEquals(trainSize, predictions.size());
 
         parameters = parameters.toBuilder().distanceType(RCFSummarizeParams.DistanceType.LInfinity).build();
         rcfSummarize = new RCFSummarize(parameters);
-        output = (MLPredictionOutput) rcfSummarize.trainAndPredict(trainDataFrame);
+        output = (MLPredictionOutput) rcfSummarize.trainAndPredict(trainDataFrameInputDataSet);
         predictions = output.getPredictionResult();
         Assert.assertEquals(trainSize, predictions.size());
     }
@@ -98,22 +101,24 @@ public void constructorWithNegtiveInitialK() {
     public void predictWithNullModel() {
         exceptionRule.expect(IllegalArgumentException.class);
         exceptionRule.expectMessage("No model found for RCFSummarize prediction.");
-        rcfSummarize.predict(predictionDataFrame, null);
+        rcfSummarize.predict(predictionDataFrameInputDataSet, null);
     }
 
     @Test
     public void trainWithRegularInputExpectNotNullOutput() {
-        Model model = rcfSummarize.train(trainDataFrame);
+        MLModel model = rcfSummarize.train(trainDataFrameInputDataSet);
         Assert.assertEquals(FunctionName.RCF_SUMMARIZE.name(), model.getName());
-        Assert.assertEquals(1, model.getVersion());
+        Assert.assertEquals(1, model.getVersion().intValue());
         Assert.assertNotNull(model.getContent());
     }
 
     private void constructRCFSummarizePredictionDataFrame() {
         predictionDataFrame = constructTestDataFrame(predictionSize);
+        predictionDataFrameInputDataSet = new DataFrameInputDataset(predictionDataFrame);
     }
 
     private void constructRCFSummarizeTrainDataFrame() {
         trainDataFrame = constructTestDataFrame(trainSize);
+        trainDataFrameInputDataSet = new DataFrameInputDataset(trainDataFrame);
     }
 }
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/BatchRandomCutForestTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/BatchRandomCutForestTest.java
index 5c7e45e011..df68c19316 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/BatchRandomCutForestTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/BatchRandomCutForestTest.java
@@ -10,15 +10,16 @@
 import org.junit.Rule;
 import org.junit.Test;
 import org.junit.rules.ExpectedException;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.ColumnMeta;
 import org.opensearch.ml.common.dataframe.ColumnType;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DefaultDataFrame;
 import org.opensearch.ml.common.dataframe.Row;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.input.parameter.rcf.BatchRCFParams;
 import org.opensearch.ml.common.FunctionName;
 import org.opensearch.ml.common.output.MLPredictionOutput;
-import org.opensearch.ml.common.Model;
 
 import java.util.concurrent.ThreadLocalRandom;
 
@@ -29,7 +30,9 @@ public class BatchRandomCutForestTest {
     private BatchRCFParams parameters;
     private BatchRandomCutForest forest;
     private DataFrame trainDataFrame;
+    private DataFrameInputDataset trainDataFrameInputDataSet;
     private DataFrame predictionDataFrame;
+    private DataFrameInputDataset predictionDataFrameInputDataSet;
     private int dataSize = 500;
 
     @Before
@@ -44,7 +47,9 @@ public void setUp() {
                 .build();
         forest = new BatchRandomCutForest(parameters);
         trainDataFrame = constructRCFDataFrame(false);
+        trainDataFrameInputDataSet = new DataFrameInputDataset(trainDataFrame);
         predictionDataFrame = constructRCFDataFrame(true);
+        predictionDataFrameInputDataSet = new DataFrameInputDataset(predictionDataFrame);
     }
 
     @Test
@@ -55,8 +60,8 @@ public void constructorWithNullParams() {
 
     @Test
     public void predict() {
-        Model model = forest.train(trainDataFrame);
-        MLPredictionOutput output = (MLPredictionOutput) forest.predict(predictionDataFrame, model);
+        MLModel model = forest.train(trainDataFrameInputDataSet);
+        MLPredictionOutput output = (MLPredictionOutput) forest.predict(predictionDataFrameInputDataSet, model);
         verifyPredictionResult(output);
     }
 
@@ -64,21 +69,21 @@ public void predict() {
     public void predictWithNullModel() {
         exceptionRule.expect(IllegalArgumentException.class);
         exceptionRule.expectMessage("No model found for batch RCF prediction");
-        MLPredictionOutput output = (MLPredictionOutput) forest.predict(predictionDataFrame, null);
+        MLPredictionOutput output = (MLPredictionOutput) forest.predict(predictionDataFrameInputDataSet, null);
         verifyPredictionResult(output);
     }
 
     @Test
     public void train() {
-        Model model = forest.train(trainDataFrame);
+        MLModel model = forest.train(trainDataFrameInputDataSet);
         Assert.assertEquals(FunctionName.BATCH_RCF.name(), model.getName());
-        Assert.assertEquals(1, model.getVersion());
+        Assert.assertEquals(1, model.getVersion().intValue());
         Assert.assertNotNull(model.getContent());
     }
 
     @Test
     public void trainAndPredict() {
-        MLPredictionOutput output = (MLPredictionOutput) forest.trainAndPredict(trainDataFrame);
+        MLPredictionOutput output = (MLPredictionOutput) forest.trainAndPredict(trainDataFrameInputDataSet);
         verifyPredictionResult(output);
     }
 
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/FixedInTimeRandomCutForestTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/FixedInTimeRandomCutForestTest.java
index 6ebcfd26d2..706e8ce20f 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/FixedInTimeRandomCutForestTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/FixedInTimeRandomCutForestTest.java
@@ -8,13 +8,14 @@
 import org.junit.Assert;
 import org.junit.Before;
 import org.junit.Test;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.ColumnMeta;
 import org.opensearch.ml.common.dataframe.ColumnType;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DefaultDataFrame;
 import org.opensearch.ml.common.FunctionName;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.output.MLPredictionOutput;
-import org.opensearch.ml.common.Model;
 import org.opensearch.ml.common.input.parameter.rcf.FitRCFParams;
 
 import java.util.concurrent.ThreadLocalRandom;
@@ -24,7 +25,9 @@ public class FixedInTimeRandomCutForestTest {
     private FitRCFParams parameters;
     private FixedInTimeRandomCutForest forest;
     private DataFrame trainDataFrame;
+    private DataFrameInputDataset trainDataFrameInputDataSet;
     private DataFrame predictionDataFrame;
+    private DataFrameInputDataset predictionDataFrameInputDataSet;
     private int dataSize = 500;
 
     @Before
@@ -38,13 +41,15 @@ public void setUp() {
 
         forest = new FixedInTimeRandomCutForest(parameters);
         trainDataFrame = constructRCFDataFrame(false);
+        trainDataFrameInputDataSet = new DataFrameInputDataset(trainDataFrame);
         predictionDataFrame = constructRCFDataFrame(true);
+        predictionDataFrameInputDataSet = new DataFrameInputDataset(predictionDataFrame);
     }
 
     @Test
     public void predict() {
-        Model model = forest.train(trainDataFrame);
-        MLPredictionOutput output = (MLPredictionOutput) forest.predict(predictionDataFrame, model);
+        MLModel model = forest.train(trainDataFrameInputDataSet);
+        MLPredictionOutput output = (MLPredictionOutput) forest.predict(predictionDataFrameInputDataSet, model);
         DataFrame predictions = output.getPredictionResult();
         Assert.assertEquals(dataSize, predictions.size());
         int anomalyCount = 0;
@@ -60,9 +65,9 @@ public void predict() {
 
     @Test
     public void train() {
-        Model model = forest.train(trainDataFrame);
+        MLModel model = forest.train(trainDataFrameInputDataSet);
         Assert.assertEquals(FunctionName.FIT_RCF.name(), model.getName());
-        Assert.assertEquals(1, model.getVersion());
+        Assert.assertEquals(1, model.getVersion().intValue());
         Assert.assertNotNull(model.getContent());
     }
 
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/RCFModelSerDeSerTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/RCFModelSerDeSerTest.java
index 9690009505..1c6bc17747 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/RCFModelSerDeSerTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/rcf/RCFModelSerDeSerTest.java
@@ -14,9 +14,11 @@
 import org.junit.Rule;
 import org.junit.Test;
 import org.junit.rules.ExpectedException;
-import org.opensearch.ml.common.Model;
+import org.opensearch.ml.common.MLModel;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.input.parameter.rcf.BatchRCFParams;
 import org.opensearch.ml.common.input.parameter.rcf.FitRCFParams;
+import org.opensearch.ml.engine.utils.ModelSerDeSer;
 
 import java.util.Arrays;
 
@@ -36,26 +38,26 @@ public class RCFModelSerDeSerTest {
     public void testModelSerDeSerBatchRCF() {
         BatchRCFParams params = BatchRCFParams.builder().build();
         BatchRandomCutForest batchRCF = new BatchRandomCutForest(params);
-        Model model = batchRCF.train(constructTestDataFrame(500));
+        MLModel model = batchRCF.train(new DataFrameInputDataset(constructTestDataFrame(500)));
 
-        RandomCutForestState deserializedState = RCFModelSerDeSer.deserializeRCF(model.getContent());
+        RandomCutForestState deserializedState = RCFModelSerDeSer.deserializeRCF(model);
         RandomCutForest forest = rcfMapper.toModel(deserializedState);
         assertNotNull(forest);
         byte[] serializedModel = RCFModelSerDeSer.serializeRCF(deserializedState);
-        assertTrue(Arrays.equals(serializedModel, model.getContent()));
+        assertTrue(Arrays.equals(serializedModel, ModelSerDeSer.decodeBase64(model.getContent())));
     }
 
     @Test
     public void testModelSerDeSerFitRCF() {
         FitRCFParams params = FitRCFParams.builder().timeField(TIME_FIELD).build();
         FixedInTimeRandomCutForest fitRCF = new FixedInTimeRandomCutForest(params);
-        Model model = fitRCF.train(constructTestDataFrame(500, true));
+        MLModel model = fitRCF.train(new DataFrameInputDataset(constructTestDataFrame(500, true)));
 
-        ThresholdedRandomCutForestState deserializedState = RCFModelSerDeSer.deserializeTRCF(model.getContent());
+        ThresholdedRandomCutForestState deserializedState = RCFModelSerDeSer.deserializeTRCF(model);
         ThresholdedRandomCutForest forest = trcfMapper.toModel(deserializedState);
         assertNotNull(forest);
         byte[] serializedModel = RCFModelSerDeSer.serializeTRCF(deserializedState);
-        assertTrue(Arrays.equals(serializedModel, model.getContent()));
+        assertTrue(Arrays.equals(serializedModel, ModelSerDeSer.decodeBase64(model.getContent())));
     }
 
 }
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LinearRegressionTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LinearRegressionTest.java
index a90f1f10bb..1dbed55521 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LinearRegressionTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LinearRegressionTest.java
@@ -10,11 +10,12 @@
 import org.junit.Rule;
 import org.junit.Test;
 import org.junit.rules.ExpectedException;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.FunctionName;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.input.parameter.regression.LinearRegressionParams;
 import org.opensearch.ml.common.output.MLPredictionOutput;
-import org.opensearch.ml.common.Model;
 
 import static org.opensearch.ml.engine.helper.LinearRegressionHelper.constructLinearRegressionPredictionDataFrame;
 import static org.opensearch.ml.engine.helper.LinearRegressionHelper.constructLinearRegressionTrainDataFrame;
@@ -26,7 +27,9 @@ public class LinearRegressionTest {
 
     private LinearRegressionParams parameters;
     private DataFrame trainDataFrame;
+    private DataFrameInputDataset trainDataFrameInputDataSet;
     private DataFrame predictionDataFrame;
+    private DataFrameInputDataset predictionDataFrameInputDataSet;
 
     @Before
     public void setUp() {
@@ -40,14 +43,16 @@ public void setUp() {
                 .target("price")
                 .build();
         trainDataFrame = constructLinearRegressionTrainDataFrame();
+        trainDataFrameInputDataSet = new DataFrameInputDataset(trainDataFrame);
         predictionDataFrame = constructLinearRegressionPredictionDataFrame();
+        predictionDataFrameInputDataSet = new DataFrameInputDataset(predictionDataFrame);
     }
 
     @Test
     public void predict() {
         LinearRegression regression = new LinearRegression(parameters);
-        Model model = regression.train(trainDataFrame);
-        MLPredictionOutput output = (MLPredictionOutput)regression.predict(predictionDataFrame, model);
+        MLModel model = regression.train(trainDataFrameInputDataSet);
+        MLPredictionOutput output = (MLPredictionOutput)regression.predict(predictionDataFrameInputDataSet, model);
         DataFrame predictions = output.getPredictionResult();
         Assert.assertEquals(2, predictions.size());
     }
@@ -57,7 +62,7 @@ public void predictWithoutModel() {
         exceptionRule.expect(IllegalArgumentException.class);
         exceptionRule.expectMessage("No model found for linear regression prediction.");
         LinearRegression regression = new LinearRegression(parameters);
-        regression.predict(predictionDataFrame, null);
+        regression.predict(predictionDataFrameInputDataSet, null);
     }
 
     @Test
@@ -106,9 +111,9 @@ public void trainWithRmsProp() {
 
     private void trainAndVerify(LinearRegressionParams params) {
         LinearRegression regression = new LinearRegression(params);
-        Model model = regression.train(trainDataFrame);
+        MLModel model = regression.train(trainDataFrameInputDataSet);
         Assert.assertEquals(FunctionName.LINEAR_REGRESSION.name(), model.getName());
-        Assert.assertEquals(1, model.getVersion());
+        Assert.assertEquals(1, model.getVersion().intValue());
         Assert.assertNotNull(model.getContent());
     }
 
@@ -118,7 +123,7 @@ public void trainExceptionWithoutTarget() {
         exceptionRule.expectMessage("Empty target when generating dataset from data frame.");
         parameters.setTarget(null);
         LinearRegression regression = new LinearRegression(parameters);
-        Model model = regression.train(trainDataFrame);
+        MLModel model = regression.train(trainDataFrameInputDataSet);
     }
 
     @Test
@@ -127,7 +132,7 @@ public void trainExceptionUnmatchedTarget() {
         exceptionRule.expectMessage("No matched target when generating dataset from data frame.");
         parameters.setTarget("not found");
         LinearRegression regression = new LinearRegression(parameters);
-        Model model = regression.train(trainDataFrame);
+        MLModel model = regression.train(trainDataFrameInputDataSet);
     }
 
     @Test
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java
index 28e02c4416..31d2b850db 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java
@@ -11,8 +11,9 @@
 import org.junit.Test;
 import org.junit.rules.ExpectedException;
 import org.opensearch.ml.common.FunctionName;
-import org.opensearch.ml.common.Model;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.DataFrame;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.input.parameter.regression.LogisticRegressionParams;
 import org.opensearch.ml.common.output.MLPredictionOutput;
 
@@ -25,7 +26,9 @@ public class LogisticRegressionTest {
 
     private LogisticRegressionParams parameters;
     private DataFrame trainDataFrame;
+    private DataFrameInputDataset trainDataFrameInputDataSet;
     private DataFrame predictionDataFrame;
+    private DataFrameInputDataset predictionDataFrameInputDataSet;
 
     @Before
     public void setUp() {
@@ -37,7 +40,9 @@ public void setUp() {
                 .target("class")
                 .build();
         trainDataFrame = constructLogisticRegressionTrainDataFrame();
+        trainDataFrameInputDataSet = new DataFrameInputDataset(trainDataFrame);
         predictionDataFrame = constructLogisticRegressionPredictionDataFrame();
+        predictionDataFrameInputDataSet = new DataFrameInputDataset(predictionDataFrame);
     }
 
     @Test
@@ -87,14 +92,14 @@ public void trainExceptionWithoutTarget() {
         exceptionRule.expectMessage("Empty target when generating dataset from data frame.");
         parameters.setTarget(null);
         LogisticRegression classification = new LogisticRegression(parameters);
-        Model model = classification.train(trainDataFrame);
+        MLModel model = classification.train(trainDataFrameInputDataSet);
     }
 
     @Test
     public void predict() {
         LogisticRegression classification = new LogisticRegression(parameters);
-        Model model = classification.train(trainDataFrame);
-        MLPredictionOutput output = (MLPredictionOutput)classification.predict(predictionDataFrame, model);
+        MLModel model = classification.train(trainDataFrameInputDataSet);
+        MLPredictionOutput output = (MLPredictionOutput)classification.predict(predictionDataFrameInputDataSet, model);
         DataFrame predictions = output.getPredictionResult();
         Assert.assertEquals(2, predictions.size());
     }
@@ -104,7 +109,7 @@ public void predictWithoutModel() {
         exceptionRule.expect(IllegalArgumentException.class);
         exceptionRule.expectMessage("No model found for logistic regression prediction.");
         LogisticRegression classification = new LogisticRegression(parameters);
-        classification.predict(predictionDataFrame, null);
+        classification.predict(predictionDataFrameInputDataSet, null);
     }
 
     @Test
@@ -137,9 +142,9 @@ public void constructorNegativeBatchSize() {
 
     private void trainAndVerify(LogisticRegressionParams params) {
         LogisticRegression classification = new LogisticRegression(params);
-        Model model = classification.train(trainDataFrame);
+        MLModel model = classification.train(trainDataFrameInputDataSet);
         Assert.assertEquals(FunctionName.LOGISTIC_REGRESSION.name(), model.getName());
-        Assert.assertEquals(1, model.getVersion());
+        Assert.assertEquals(1, model.getVersion().intValue());
         Assert.assertNotNull(model.getContent());
     }
 }
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/sample/SampleAlgoTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/sample/SampleAlgoTest.java
index f23e0ed386..c99e3f674f 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/sample/SampleAlgoTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/sample/SampleAlgoTest.java
@@ -10,12 +10,13 @@
 import org.junit.Rule;
 import org.junit.Test;
 import org.junit.rules.ExpectedException;
+import org.opensearch.ml.common.MLModel;
 import org.opensearch.ml.common.dataframe.ColumnMeta;
 import org.opensearch.ml.common.dataframe.ColumnType;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DefaultDataFrame;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.input.parameter.MLAlgoParams;
-import org.opensearch.ml.common.Model;
 import org.opensearch.ml.common.output.sample.SampleAlgoOutput;
 import org.opensearch.ml.common.input.parameter.sample.SampleAlgoParams;
 
@@ -26,20 +27,24 @@ public class SampleAlgoTest {
     private MLAlgoParams parameters;
     private SampleAlgo sampleAlgo;
     private DataFrame trainDataFrame;
+    private DataFrameInputDataset trainDataFrameInputDataSet;
     private DataFrame predictionDataFrame;
+    private DataFrameInputDataset predictionDataFrameInputDataSet;
 
     @Before
     public void setUp() {
         parameters = SampleAlgoParams.builder().sampleParam(2).build();
         sampleAlgo = new SampleAlgo(parameters);
         trainDataFrame = constructDataFrame(10);
+        trainDataFrameInputDataSet = new DataFrameInputDataset(trainDataFrame);
         predictionDataFrame = constructDataFrame(3);
+        predictionDataFrameInputDataSet = new DataFrameInputDataset(predictionDataFrame);
     }
 
     @Test
     public void predict() {
-        Model model = sampleAlgo.train(trainDataFrame);
-        SampleAlgoOutput output = (SampleAlgoOutput)sampleAlgo.predict(predictionDataFrame, model);
+        MLModel model = sampleAlgo.train(trainDataFrameInputDataSet);
+        SampleAlgoOutput output = (SampleAlgoOutput)sampleAlgo.predict(predictionDataFrameInputDataSet, model);
         Assert.assertEquals(3.0, output.getSampleResult().doubleValue(), 1e-5);
     }
 
@@ -47,7 +52,7 @@ public void predict() {
     public void predictWithNullModel() {
         exceptionRule.expect(IllegalArgumentException.class);
         exceptionRule.expectMessage("No model found for sample algo");
-        sampleAlgo.predict(predictionDataFrame, null);
+        sampleAlgo.predict(predictionDataFrameInputDataSet, null);
     }
 
     private DataFrame constructDataFrame(int dataSize) {
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/helper/MLTestHelper.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/helper/MLTestHelper.java
index c98d2a0f3e..4eccdcdb4c 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/helper/MLTestHelper.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/helper/MLTestHelper.java
@@ -12,6 +12,7 @@
 import org.opensearch.ml.common.dataframe.ColumnType;
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DataFrameBuilder;
+import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 
 import java.util.ArrayList;
 import java.util.Arrays;
@@ -22,6 +23,11 @@
 public class MLTestHelper {
 
     public static final String TIME_FIELD = "timestamp";
+
+    public static DataFrameInputDataset concstructDataFrameInputDataSet(int size) {
+        return new DataFrameInputDataset(constructTestDataFrame(size));
+    }
+
     public static DataFrame constructTestDataFrame(int size) {
         return constructTestDataFrame(size, false);
     }
diff --git a/plugin/src/main/java/org/opensearch/ml/indices/MLInputDatasetHandler.java b/plugin/src/main/java/org/opensearch/ml/indices/MLInputDatasetHandler.java
index e4156ce683..03a2f60d27 100644
--- a/plugin/src/main/java/org/opensearch/ml/indices/MLInputDatasetHandler.java
+++ b/plugin/src/main/java/org/opensearch/ml/indices/MLInputDatasetHandler.java
@@ -53,7 +53,7 @@ public DataFrame parseDataFrameInput(MLInputDataset mlInputDataset) {
      * @param mlInputDataset MLInputDataset
      * @param listener ActionListener
      */
-    public void parseSearchQueryInput(MLInputDataset mlInputDataset, ActionListener<DataFrame> listener) {
+    public void parseSearchQueryInput(MLInputDataset mlInputDataset, ActionListener<MLInputDataset> listener) {
         if (!mlInputDataset.getInputDataType().equals(MLInputDataType.SEARCH_QUERY)) {
             throw new IllegalArgumentException("Input dataset is not SEARCH_QUERY type.");
         }
@@ -77,7 +77,8 @@ public void parseSearchQueryInput(MLInputDataset mlInputDataset, ActionListener<
                 input.add(hit.getSourceAsMap());
             }
             DataFrame dataFrame = DataFrameBuilder.load(input);
-            listener.onResponse(dataFrame);
+            MLInputDataset dfInputDataset = new DataFrameInputDataset(dataFrame);
+            listener.onResponse(dfInputDataset);
             return;
         }, e -> {
             log.error("Failed to search" + e);
diff --git a/plugin/src/main/java/org/opensearch/ml/task/MLPredictTaskRunner.java b/plugin/src/main/java/org/opensearch/ml/task/MLPredictTaskRunner.java
index b64fb3fa2a..585f42f163 100644
--- a/plugin/src/main/java/org/opensearch/ml/task/MLPredictTaskRunner.java
+++ b/plugin/src/main/java/org/opensearch/ml/task/MLPredictTaskRunner.java
@@ -12,7 +12,6 @@
 import static org.opensearch.ml.plugin.MachineLearningPlugin.TASK_THREAD_POOL;
 
 import java.time.Instant;
-import java.util.Base64;
 import java.util.UUID;
 
 import lombok.extern.log4j.Log4j2;
@@ -36,11 +35,9 @@
 import org.opensearch.ml.common.MLTask;
 import org.opensearch.ml.common.MLTaskState;
 import org.opensearch.ml.common.MLTaskType;
-import org.opensearch.ml.common.Model;
 import org.opensearch.ml.common.breaker.MLCircuitBreakerService;
-import org.opensearch.ml.common.dataframe.DataFrame;
-import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.dataset.MLInputDataType;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.input.MLInput;
 import org.opensearch.ml.common.output.MLOutput;
 import org.opensearch.ml.common.output.MLPredictionOutput;
@@ -105,9 +102,11 @@ protected TransportResponseHandler<MLTaskResponse> getResponseHandler(ActionList
     protected void executeTask(MLPredictionTaskRequest request, ActionListener<MLTaskResponse> listener) {
         MLInputDataType inputDataType = request.getMlInput().getInputDataset().getInputDataType();
         Instant now = Instant.now();
+        String modelId = request.getModelId();
         MLTask mlTask = MLTask
             .builder()
             .taskId(UUID.randomUUID().toString())
+            .modelId(modelId)
             .modelId(request.getModelId())
             .taskType(MLTaskType.PREDICTION)
             .inputType(inputDataType)
@@ -119,30 +118,31 @@ protected void executeTask(MLPredictionTaskRequest request, ActionListener<MLTas
             .async(false)
             .build();
         MLInput mlInput = request.getMlInput();
-        if (mlInput.getInputDataset().getInputDataType().equals(MLInputDataType.SEARCH_QUERY)) {
-            ActionListener<DataFrame> dataFrameActionListener = ActionListener
-                .wrap(dataFrame -> { predict(mlTask, dataFrame, request, listener); }, e -> {
+        switch (inputDataType) {
+            case SEARCH_QUERY:
+                ActionListener<MLInputDataset> dataFrameActionListener = ActionListener.wrap(dataSet -> {
+                    MLInput newInput = mlInput.toBuilder().inputDataset(dataSet).build();
+                    predict(modelId, mlTask, newInput, listener);
+                }, e -> {
                     log.error("Failed to generate DataFrame from search query", e);
                     handleAsyncMLTaskFailure(mlTask, e);
                     listener.onFailure(e);
                 });
-            mlInputDatasetHandler
-                .parseSearchQueryInput(
-                    mlInput.getInputDataset(),
-                    new ThreadedActionListener<>(log, threadPool, TASK_THREAD_POOL, dataFrameActionListener, false)
-                );
-        } else {
-            DataFrame inputDataFrame = mlInputDatasetHandler.parseDataFrameInput(mlInput.getInputDataset());
-            threadPool.executor(TASK_THREAD_POOL).execute(() -> { predict(mlTask, inputDataFrame, request, listener); });
+                mlInputDatasetHandler
+                    .parseSearchQueryInput(
+                        mlInput.getInputDataset(),
+                        new ThreadedActionListener<>(log, threadPool, TASK_THREAD_POOL, dataFrameActionListener, false)
+                    );
+                break;
+            case DATA_FRAME:
+            case TEXT_DOCS:
+            default:
+                threadPool.executor(TASK_THREAD_POOL).execute(() -> { predict(modelId, mlTask, mlInput, listener); });
+                break;
         }
     }
 
-    private void predict(
-        MLTask mlTask,
-        DataFrame inputDataFrame,
-        MLPredictionTaskRequest request,
-        ActionListener<MLTaskResponse> listener
-    ) {
+    private void predict(String modelId, MLTask mlTask, MLInput mlInput, ActionListener<MLTaskResponse> listener) {
         ActionListener<MLTaskResponse> internalListener = wrappedCleanupListener(listener, mlTask.getTaskId());
         // track ML task count and add ML task into cache
         mlStats.getStat(MLNodeLevelStat.ML_NODE_EXECUTING_TASK_COUNT).increment();
@@ -153,10 +153,9 @@ private void predict(
         mlTaskManager.add(mlTask);
 
         // run predict
-        if (request.getModelId() != null) {
+        if (modelId != null) {
             // search model by model id.
             try (ThreadContext.StoredContext context = threadPool.getThreadContext().stashContext()) {
-                MLInput mlInput = request.getMlInput();
                 ActionListener<GetResponse> getResponseListener = ActionListener.wrap(r -> {
                     if (r == null || !r.isExists()) {
                         internalListener.onFailure(new ResourceNotFoundException("No model found, please check the modelId."));
@@ -171,27 +170,18 @@ private void predict(
                         MLModel mlModel = MLModel.parse(xContentParser);
                         User resourceUser = mlModel.getUser();
                         User requestUser = getUserContext(client);
-                        if (!checkUserPermissions(requestUser, resourceUser, request.getModelId())) {
+                        if (!checkUserPermissions(requestUser, resourceUser, modelId)) {
                             // The backend roles of request user and resource user doesn't have intersection
                             OpenSearchException e = new OpenSearchException(
-                                "User: "
-                                    + requestUser.getName()
-                                    + " does not have permissions to run predict by model: "
-                                    + request.getModelId()
+                                "User: " + requestUser.getName() + " does not have permissions to run predict by model: " + modelId
                             );
                             handlePredictFailure(mlTask, internalListener, e, false);
                             return;
                         }
-                        Model model = new Model();
-                        model.setName(mlModel.getName());
-                        model.setVersion(mlModel.getVersion());
-                        byte[] decoded = Base64.getDecoder().decode(mlModel.getContent());
-                        model.setContent(decoded);
 
                         // run predict
                         mlTaskManager.updateTaskState(mlTask.getTaskId(), MLTaskState.RUNNING, mlTask.isAsync());
-                        MLOutput output = MLEngine
-                            .predict(mlInput.toBuilder().inputDataset(new DataFrameInputDataset(inputDataFrame)).build(), model);
+                        MLOutput output = MLEngine.predict(mlInput, mlModel);
                         if (output instanceof MLPredictionOutput) {
                             ((MLPredictionOutput) output).setStatus(MLTaskState.COMPLETED.name());
                         }
@@ -201,7 +191,7 @@ private void predict(
                         MLTaskResponse response = MLTaskResponse.builder().output(output).build();
                         internalListener.onResponse(response);
                     } catch (Exception e) {
-                        log.error("Failed to predict model " + request.getModelId(), e);
+                        log.error("Failed to predict model " + modelId, e);
                         internalListener.onFailure(e);
                     }
 
diff --git a/plugin/src/main/java/org/opensearch/ml/task/MLTrainAndPredictTaskRunner.java b/plugin/src/main/java/org/opensearch/ml/task/MLTrainAndPredictTaskRunner.java
index 457e3e67ae..eb59b03c98 100644
--- a/plugin/src/main/java/org/opensearch/ml/task/MLTrainAndPredictTaskRunner.java
+++ b/plugin/src/main/java/org/opensearch/ml/task/MLTrainAndPredictTaskRunner.java
@@ -21,9 +21,8 @@
 import org.opensearch.ml.common.MLTaskState;
 import org.opensearch.ml.common.MLTaskType;
 import org.opensearch.ml.common.breaker.MLCircuitBreakerService;
-import org.opensearch.ml.common.dataframe.DataFrame;
-import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.dataset.MLInputDataType;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.input.MLInput;
 import org.opensearch.ml.common.output.MLOutput;
 import org.opensearch.ml.common.output.MLPredictionOutput;
@@ -98,30 +97,26 @@ protected void executeTask(MLTrainingTaskRequest request, ActionListener<MLTaskR
             .async(false)
             .build();
         MLInput mlInput = request.getMlInput();
-
+        MLInputDataset inputDataset = mlInput.getInputDataset();
         if (mlInput.getInputDataset().getInputDataType().equals(MLInputDataType.SEARCH_QUERY)) {
-            ActionListener<DataFrame> dataFrameActionListener = ActionListener
-                .wrap(dataFrame -> { trainAndPredict(mlTask, dataFrame, request, listener); }, e -> {
-                    log.error("Failed to generate DataFrame from search query", e);
-                    handlePredictFailure(mlTask, listener, e, false);
-                });
+            ActionListener<MLInputDataset> dataFrameActionListener = ActionListener.wrap(dataSet -> {
+                MLInput newInput = mlInput.toBuilder().inputDataset(dataSet).build();
+                trainAndPredict(mlTask, newInput, listener);
+            }, e -> {
+                log.error("Failed to generate DataFrame from search query", e);
+                handlePredictFailure(mlTask, listener, e, false);
+            });
             mlInputDatasetHandler
                 .parseSearchQueryInput(
-                    mlInput.getInputDataset(),
+                    inputDataset,
                     new ThreadedActionListener<>(log, threadPool, TASK_THREAD_POOL, dataFrameActionListener, false)
                 );
         } else {
-            DataFrame inputDataFrame = mlInputDatasetHandler.parseDataFrameInput(mlInput.getInputDataset());
-            threadPool.executor(TASK_THREAD_POOL).execute(() -> { trainAndPredict(mlTask, inputDataFrame, request, listener); });
+            threadPool.executor(TASK_THREAD_POOL).execute(() -> { trainAndPredict(mlTask, mlInput, listener); });
         }
     }
 
-    private void trainAndPredict(
-        MLTask mlTask,
-        DataFrame inputDataFrame,
-        MLTrainingTaskRequest request,
-        ActionListener<MLTaskResponse> listener
-    ) {
+    private void trainAndPredict(MLTask mlTask, MLInput mlInput, ActionListener<MLTaskResponse> listener) {
         ActionListener<MLTaskResponse> internalListener = wrappedCleanupListener(listener, mlTask.getTaskId());
         // track ML task count and add ML task into cache
         mlStats.getStat(MLNodeLevelStat.ML_NODE_EXECUTING_TASK_COUNT).increment();
@@ -130,12 +125,11 @@ private void trainAndPredict(
             .createCounterStatIfAbsent(mlTask.getFunctionName(), ActionName.TRAIN_PREDICT, MLActionLevelStat.ML_ACTION_REQUEST_COUNT)
             .increment();
         mlTaskManager.add(mlTask);
-        MLInput mlInput = request.getMlInput();
 
         // run train and predict
         try {
             mlTaskManager.updateTaskState(mlTask.getTaskId(), MLTaskState.RUNNING, mlTask.isAsync());
-            MLOutput output = MLEngine.trainAndPredict(mlInput.toBuilder().inputDataset(new DataFrameInputDataset(inputDataFrame)).build());
+            MLOutput output = MLEngine.trainAndPredict(mlInput);
             handleAsyncMLTaskComplete(mlTask);
             if (output instanceof MLPredictionOutput) {
                 ((MLPredictionOutput) output).setStatus(MLTaskState.COMPLETED.name());
diff --git a/plugin/src/main/java/org/opensearch/ml/task/MLTrainingTaskRunner.java b/plugin/src/main/java/org/opensearch/ml/task/MLTrainingTaskRunner.java
index 2295e58303..928de2be3e 100644
--- a/plugin/src/main/java/org/opensearch/ml/task/MLTrainingTaskRunner.java
+++ b/plugin/src/main/java/org/opensearch/ml/task/MLTrainingTaskRunner.java
@@ -29,11 +29,9 @@
 import org.opensearch.ml.common.MLTask;
 import org.opensearch.ml.common.MLTaskState;
 import org.opensearch.ml.common.MLTaskType;
-import org.opensearch.ml.common.Model;
 import org.opensearch.ml.common.breaker.MLCircuitBreakerService;
-import org.opensearch.ml.common.dataframe.DataFrame;
-import org.opensearch.ml.common.dataset.DataFrameInputDataset;
 import org.opensearch.ml.common.dataset.MLInputDataType;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.input.MLInput;
 import org.opensearch.ml.common.output.MLTrainingOutput;
 import org.opensearch.ml.common.transport.MLTaskResponse;
@@ -147,16 +145,11 @@ private void startTrainingTask(MLTask mlTask, MLInput mlInput, ActionListener<ML
         mlTaskManager.add(mlTask);
         try {
             if (mlInput.getInputDataset().getInputDataType().equals(MLInputDataType.SEARCH_QUERY)) {
-                ActionListener<DataFrame> dataFrameActionListener = ActionListener
-                    .wrap(
-                        dataFrame -> {
-                            train(mlTask, mlInput.toBuilder().inputDataset(new DataFrameInputDataset(dataFrame)).build(), internalListener);
-                        },
-                        e -> {
-                            log.error("Failed to generate DataFrame from search query", e);
-                            internalListener.onFailure(e);
-                        }
-                    );
+                ActionListener<MLInputDataset> dataFrameActionListener = ActionListener
+                    .wrap(dataSet -> { train(mlTask, mlInput.toBuilder().inputDataset(dataSet).build(), internalListener); }, e -> {
+                        log.error("Failed to generate DataFrame from search query", e);
+                        internalListener.onFailure(e);
+                    });
                 mlInputDatasetHandler
                     .parseSearchQueryInput(
                         mlInput.getInputDataset(),
@@ -182,18 +175,16 @@ private void train(MLTask mlTask, MLInput mlInput, ActionListener<MLTaskResponse
         try {
             // run training
             mlTaskManager.updateTaskState(mlTask.getTaskId(), MLTaskState.RUNNING, mlTask.isAsync());
-            Model model = MLEngine.train(mlInput);
+            MLModel mlModel = MLEngine.train(mlInput);
             mlIndicesHandler.initModelIndexIfAbsent(ActionListener.wrap(indexCreated -> {
                 if (!indexCreated) {
                     listener.onFailure(new RuntimeException("No response to create ML task index"));
                     return;
                 }
                 // TODO: put the user into model for backend role based access control.
-                MLModel mlModel = new MLModel(mlInput.getAlgorithm(), model);
                 try (ThreadContext.StoredContext context = client.threadPool().getThreadContext().stashContext()) {
                     ActionListener<IndexResponse> indexResponseListener = ActionListener.wrap(r -> {
                         log.info("Model data indexing done, result:{}, model id: {}", r.getResult(), r.getId());
-                        mlStats.getStat(MLNodeLevelStat.ML_NODE_TOTAL_MODEL_COUNT).increment();
                         String returnedTaskId = mlTask.isAsync() ? mlTask.getTaskId() : null;
                         MLTrainingOutput output = new MLTrainingOutput(r.getId(), returnedTaskId, MLTaskState.COMPLETED.name());
                         listener.onResponse(MLTaskResponse.builder().output(output).build());
diff --git a/plugin/src/test/java/org/opensearch/ml/indices/MLInputDatasetHandlerTests.java b/plugin/src/test/java/org/opensearch/ml/indices/MLInputDatasetHandlerTests.java
index 627d922f65..8569f12e3f 100644
--- a/plugin/src/test/java/org/opensearch/ml/indices/MLInputDatasetHandlerTests.java
+++ b/plugin/src/test/java/org/opensearch/ml/indices/MLInputDatasetHandlerTests.java
@@ -34,6 +34,7 @@
 import org.opensearch.ml.common.dataframe.DataFrame;
 import org.opensearch.ml.common.dataframe.DataFrameBuilder;
 import org.opensearch.ml.common.dataset.DataFrameInputDataset;
+import org.opensearch.ml.common.dataset.MLInputDataset;
 import org.opensearch.ml.common.dataset.SearchQueryInputDataset;
 import org.opensearch.search.SearchHit;
 import org.opensearch.search.SearchHits;
@@ -43,7 +44,7 @@
 public class MLInputDatasetHandlerTests extends OpenSearchTestCase {
     Client client;
     MLInputDatasetHandler mlInputDatasetHandler;
-    ActionListener<DataFrame> listener;
+    ActionListener<MLInputDataset> listener;
     DataFrame dataFrame;
     SearchResponse searchResponse;
 
@@ -59,9 +60,9 @@ public void setup() {
         dataFrame = DataFrameBuilder.load(mapList);
         client = mock(Client.class);
         mlInputDatasetHandler = new MLInputDatasetHandler(client);
-        listener = spy(new ActionListener<DataFrame>() {
+        listener = spy(new ActionListener<MLInputDataset>() {
             @Override
-            public void onResponse(DataFrame dataFrame) {}
+            public void onResponse(MLInputDataset inputDataset) {}
 
             @Override
             public void onFailure(Exception e) {}
@@ -111,7 +112,7 @@ public void testSearchQueryInputDatasetWithHits() {
             .searchSourceBuilder(new SearchSourceBuilder().query(QueryBuilders.matchAllQuery()))
             .build();
         mlInputDatasetHandler.parseSearchQueryInput(searchQueryInputDataset, listener);
-        ArgumentCaptor<DataFrame> captor = ArgumentCaptor.forClass(DataFrame.class);
+        ArgumentCaptor<MLInputDataset> captor = ArgumentCaptor.forClass(MLInputDataset.class);
         verify(listener, times(1)).onResponse(captor.capture());
         Assert.assertEquals(captor.getAllValues().size(), 1);
     }
diff --git a/plugin/src/test/java/org/opensearch/ml/task/MLPredictTaskRunnerTests.java b/plugin/src/test/java/org/opensearch/ml/task/MLPredictTaskRunnerTests.java
index 00236c5ee1..058127fa1c 100644
--- a/plugin/src/test/java/org/opensearch/ml/task/MLPredictTaskRunnerTests.java
+++ b/plugin/src/test/java/org/opensearch/ml/task/MLPredictTaskRunnerTests.java
@@ -50,6 +50,7 @@
 import org.opensearch.ml.common.transport.MLTaskResponse;
 import org.opensearch.ml.common.transport.prediction.MLPredictionTaskAction;
 import org.opensearch.ml.common.transport.prediction.MLPredictionTaskRequest;
+import org.opensearch.ml.engine.algorithms.rcf.BatchRandomCutForest;
 import org.opensearch.ml.indices.MLInputDatasetHandler;
 import org.opensearch.ml.stats.MLNodeLevelStat;
 import org.opensearch.ml.stats.MLStat;
@@ -98,6 +99,7 @@ public class MLPredictTaskRunnerTests extends OpenSearchTestCase {
 
     MLStats mlStats;
     DataFrame dataFrame;
+    DataFrameInputDataset dataFrameInputDataSet;
     DiscoveryNode localNode;
     DiscoveryNode remoteNode;
     MLInputDatasetHandler mlInputDatasetHandler;
@@ -109,6 +111,7 @@ public class MLPredictTaskRunnerTests extends OpenSearchTestCase {
     String errorMessage = "test error";
     GetResponse getResponse;
     MLInput mlInputWithDataFrame;
+    String modelId = "test_modelId";
 
     @Before
     public void setup() throws IOException {
@@ -145,7 +148,8 @@ public void setup() throws IOException {
             )
         );
 
-        dataFrame = TestData.constructTestDataFrame(100);
+        dataFrame = TestData.constructTestDataFrame(300);
+        dataFrameInputDataSet = new DataFrameInputDataset(dataFrame);
 
         MLInputDataset dataFrameInputDataSet = new DataFrameInputDataset(dataFrame);
         BatchRCFParams batchRCFParams = BatchRCFParams.builder().build();
@@ -175,13 +179,15 @@ public void setup() throws IOException {
         when(client.threadPool()).thenReturn(threadPool);
         when(threadPool.getThreadContext()).thenReturn(threadContext);
 
+        BatchRandomCutForest batchRCF = new BatchRandomCutForest();
+        MLModel trainedModel = batchRCF.train(dataFrameInputDataSet);
         MLModel mlModel = MLModel
             .builder()
             .user(User.parse(USER_STRING))
             .version(111)
             .name("test")
             .algorithm(FunctionName.BATCH_RCF)
-            .content("content")
+            .content(trainedModel.getContent())
             .build();
         XContentBuilder content = mlModel.toXContent(XContentFactory.jsonBuilder(), ToXContent.EMPTY_PARAMS);
         BytesReference bytesReference = BytesReference.bytes(content);
@@ -195,7 +201,6 @@ public void testExecuteTask_OnLocalNode() {
 
         taskRunner.dispatchTask(requestWithDataFrame, transportService, listener);
         verify(mlInputDatasetHandler, never()).parseSearchQueryInput(any(), any());
-        verify(mlInputDatasetHandler).parseDataFrameInput(requestWithDataFrame.getMlInput().getInputDataset());
         verify(mlTaskManager).add(any(MLTask.class));
         verify(client).get(any(), any());
         verify(mlTaskManager).remove(anyString());
@@ -206,7 +211,6 @@ public void testExecuteTask_OnLocalNode_QueryInput() {
 
         taskRunner.dispatchTask(requestWithQuery, transportService, listener);
         verify(mlInputDatasetHandler).parseSearchQueryInput(any(), any());
-        verify(mlInputDatasetHandler, never()).parseDataFrameInput(requestWithDataFrame.getMlInput().getInputDataset());
         verify(mlTaskManager).add(any(MLTask.class));
         verify(client).get(any(), any());
         verify(mlTaskManager).remove(anyString());
@@ -246,7 +250,6 @@ public void testExecuteTask_OnLocalNode_GetModelFail() {
 
         taskRunner.dispatchTask(requestWithDataFrame, transportService, listener);
         verify(mlInputDatasetHandler, never()).parseSearchQueryInput(any(), any());
-        verify(mlInputDatasetHandler).parseDataFrameInput(requestWithDataFrame.getMlInput().getInputDataset());
         verify(mlTaskManager).add(any(MLTask.class));
         verify(client).get(any(), any());
         ArgumentCaptor<Exception> argumentCaptor = ArgumentCaptor.forClass(Exception.class);
@@ -260,7 +263,6 @@ public void testExecuteTask_OnLocalNode_NullModelIdException() {
 
         taskRunner.dispatchTask(requestWithDataFrame, transportService, listener);
         verify(mlInputDatasetHandler, never()).parseSearchQueryInput(any(), any());
-        verify(mlInputDatasetHandler).parseDataFrameInput(requestWithDataFrame.getMlInput().getInputDataset());
         verify(mlTaskManager).add(any(MLTask.class));
         verify(client, never()).get(any(), any());
         verify(mlTaskManager).remove(anyString());
@@ -274,7 +276,6 @@ public void testExecuteTask_OnLocalNode_NullGetResponse() {
 
         taskRunner.dispatchTask(requestWithDataFrame, transportService, listener);
         verify(mlInputDatasetHandler, never()).parseSearchQueryInput(any(), any());
-        verify(mlInputDatasetHandler).parseDataFrameInput(requestWithDataFrame.getMlInput().getInputDataset());
         verify(mlTaskManager).add(any(MLTask.class));
         verify(client).get(any(), any());
         verify(mlTaskManager).remove(anyString());
@@ -296,14 +297,14 @@ private void setupMocks(boolean runOnLocalNode, boolean failedToParseQueryInput,
 
         if (failedToParseQueryInput) {
             doAnswer(invocation -> {
-                ActionListener<DataFrame> actionListener = invocation.getArgument(1);
+                ActionListener<MLInputDataset> actionListener = invocation.getArgument(1);
                 actionListener.onFailure(new RuntimeException(errorMessage));
                 return null;
             }).when(mlInputDatasetHandler).parseSearchQueryInput(any(), any());
         } else {
             doAnswer(invocation -> {
-                ActionListener<DataFrame> actionListener = invocation.getArgument(1);
-                actionListener.onResponse(dataFrame);
+                ActionListener<MLInputDataset> actionListener = invocation.getArgument(1);
+                actionListener.onResponse(dataFrameInputDataSet);
                 return null;
             }).when(mlInputDatasetHandler).parseSearchQueryInput(any(), any());
         }
diff --git a/plugin/src/test/java/org/opensearch/ml/task/MLTrainAndPredictTaskRunnerTests.java b/plugin/src/test/java/org/opensearch/ml/task/MLTrainAndPredictTaskRunnerTests.java
index a1c16ae7d3..fe12fd4622 100644
--- a/plugin/src/test/java/org/opensearch/ml/task/MLTrainAndPredictTaskRunnerTests.java
+++ b/plugin/src/test/java/org/opensearch/ml/task/MLTrainAndPredictTaskRunnerTests.java
@@ -165,8 +165,8 @@ public void testExecuteTask_OnLocalNode_QueryInput() {
         }).when(mlTaskDispatcher).dispatchTask(any());
 
         doAnswer(invocation -> {
-            ActionListener<DataFrame> actionListener = invocation.getArgument(1);
-            actionListener.onResponse(dataFrame);
+            ActionListener<MLInputDataset> actionListener = invocation.getArgument(1);
+            actionListener.onResponse(new DataFrameInputDataset(dataFrame));
             return null;
         }).when(mlInputDatasetHandler).parseSearchQueryInput(any(), any());
 
diff --git a/plugin/src/test/java/org/opensearch/ml/task/MLTrainingTaskRunnerTests.java b/plugin/src/test/java/org/opensearch/ml/task/MLTrainingTaskRunnerTests.java
index 92ac981c85..237d7c4973 100644
--- a/plugin/src/test/java/org/opensearch/ml/task/MLTrainingTaskRunnerTests.java
+++ b/plugin/src/test/java/org/opensearch/ml/task/MLTrainingTaskRunnerTests.java
@@ -321,14 +321,14 @@ private void setupMocks(
 
         if (failedToParseQueryInput) {
             doAnswer(invocation -> {
-                ActionListener<DataFrame> actionListener = invocation.getArgument(1);
+                ActionListener<MLInputDataset> actionListener = invocation.getArgument(1);
                 actionListener.onFailure(new RuntimeException(errorMessage));
                 return null;
             }).when(mlInputDatasetHandler).parseSearchQueryInput(any(), any());
         } else {
             doAnswer(invocation -> {
-                ActionListener<DataFrame> actionListener = invocation.getArgument(1);
-                actionListener.onResponse(dataFrame);
+                ActionListener<MLInputDataset> actionListener = invocation.getArgument(1);
+                actionListener.onResponse(new DataFrameInputDataset(dataFrame));
                 return null;
             }).when(mlInputDatasetHandler).parseSearchQueryInput(any(), any());
         }