From 18b1d82073557d1ebe9f2c6761dfcf5d9ed9081e Mon Sep 17 00:00:00 2001
From: Xun Zhang <xunzh@amazon.com>
Date: Thu, 7 Jul 2022 17:10:51 -0700
Subject: [PATCH 1/4] Add Logistic Regression algorithm

Signed-off-by: Xun Zhang <xunzh@amazon.com>
---
 .../opensearch/ml/common/FunctionName.java    |   3 +-
 .../ml/common/dataframe/DataFrame.java        |   6 +
 .../ml/common/dataframe/DefaultDataFrame.java |  18 ++
 .../regression/LogisticRegressionParams.java  | 231 ++++++++++++++++++
 ml-algorithms/build.gradle                    |   1 +
 .../regression/LogisticRegression.java        | 145 +++++++++++
 .../ml/engine/contants/TribuoOutputType.java  |   4 +-
 .../ml/engine/utils/TribuoUtil.java           | 113 +++++++--
 .../regression/LogisticRegressionTest.java    | 109 +++++++++
 .../helper/LogisticRegressionHelper.java      |  55 +++++
 .../ml/action/MLCommonsIntegTestCase.java     |  33 +++
 .../action/prediction/PredictionITTests.java  |  10 +
 .../ml/action/training/TrainingITTests.java   |  24 +-
 13 files changed, 726 insertions(+), 26 deletions(-)
 create mode 100644 common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java
 create mode 100644 ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
 create mode 100644 ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java
 create mode 100644 ml-algorithms/src/test/java/org/opensearch/ml/engine/helper/LogisticRegressionHelper.java
diff --git a/common/src/main/java/org/opensearch/ml/common/FunctionName.java b/common/src/main/java/org/opensearch/ml/common/FunctionName.java
index 44f9eff7e1..697c9b68f8 100644
--- a/common/src/main/java/org/opensearch/ml/common/FunctionName.java
+++ b/common/src/main/java/org/opensearch/ml/common/FunctionName.java
@@ -14,7 +14,8 @@ public enum FunctionName {
     FIT_RCF,
     BATCH_RCF,
     ANOMALY_LOCALIZATION,
-    RCF_SUMMARIZE;
+    RCF_SUMMARIZE,
+    LOGISTIC_REGRESSION;
 
     public static FunctionName from(String value) {
         try {
diff --git a/common/src/main/java/org/opensearch/ml/common/dataframe/DataFrame.java b/common/src/main/java/org/opensearch/ml/common/dataframe/DataFrame.java
index 7f0daa5d4e..f7675a07e4 100644
--- a/common/src/main/java/org/opensearch/ml/common/dataframe/DataFrame.java
+++ b/common/src/main/java/org/opensearch/ml/common/dataframe/DataFrame.java
@@ -58,4 +58,10 @@ public interface DataFrame extends Iterable<Row>, Writeable, ToXContentObject {
      */
     DataFrame select(int[] columns);
 
+    /**
+     * Find the index of the target in columnMetas
+     * @param target the string value of the target
+     * @return column index of the target in the list of columnMetas
+     */
+    int getColumnIndex(String target);
 }
diff --git a/common/src/main/java/org/opensearch/ml/common/dataframe/DefaultDataFrame.java b/common/src/main/java/org/opensearch/ml/common/dataframe/DefaultDataFrame.java
index ccb7aa6097..228dd40157 100644
--- a/common/src/main/java/org/opensearch/ml/common/dataframe/DefaultDataFrame.java
+++ b/common/src/main/java/org/opensearch/ml/common/dataframe/DefaultDataFrame.java
@@ -131,6 +131,24 @@ public DataFrame select(int[] columns) {
         return new DefaultDataFrame(newColumnMetas, rows.stream().map(row-> row.select(columns)).collect(Collectors.toList()));
     }
 
+    /**
+     * Looks up the position of the column whose name equals {@code target}.
+     * @param target column name to search for
+     * @return zero-based index of the first column carrying that name
+     * @throws IllegalArgumentException if no column carries that name
+     */
+    @Override
+    public int getColumnIndex(String target) {
+        String[] names = Arrays.stream(this.columnMetas()).map(ColumnMeta::getName).toArray(String[]::new);
+        // Linear scan; the first column with a matching name wins.
+        for (int position = 0; position < names.length; position++) {
+            if (names[position].equals(target)) {
+                return position;
+            }
+        }
+        throw new IllegalArgumentException("No matched target when generating dataset from data frame.");
+    }
+
     @Override
     public Iterator<Row> iterator() {
         return rows.iterator();
diff --git a/common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java b/common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java
new file mode 100644
index 0000000000..506a5289ea
--- /dev/null
+++ b/common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java
@@ -0,0 +1,231 @@
+/*
+ * Copyright OpenSearch Contributors
+ * SPDX-License-Identifier: Apache-2.0
+ */
+
+package org.opensearch.ml.common.input.parameter.regression;
+
+import lombok.Builder;
+import lombok.Data;
+import org.opensearch.common.ParseField;
+import org.opensearch.common.io.stream.StreamInput;
+import org.opensearch.common.io.stream.StreamOutput;
+import org.opensearch.common.xcontent.NamedXContentRegistry;
+import org.opensearch.common.xcontent.XContentBuilder;
+import org.opensearch.common.xcontent.XContentParser;
+import org.opensearch.ml.common.FunctionName;
+import org.opensearch.ml.common.annotation.MLAlgoParameter;
+import org.opensearch.ml.common.input.parameter.MLAlgoParams;
+
+import java.io.IOException;
+import java.util.Locale;
+
+import static org.opensearch.common.xcontent.XContentParserUtils.ensureExpectedToken;
+
+@Data
+@MLAlgoParameter(algorithms={FunctionName.LOGISTIC_REGRESSION})
+public class LogisticRegressionParams implements MLAlgoParams {
+
+    public static final String PARSE_FIELD_NAME = FunctionName.LOGISTIC_REGRESSION.name();
+    public static final NamedXContentRegistry.Entry XCONTENT_REGISTRY = new NamedXContentRegistry.Entry(
+            MLAlgoParams.class,
+            new ParseField(PARSE_FIELD_NAME),
+            it -> parse(it)
+    );
+
+    public static final String OBJECTIVE_FIELD = "objective";
+    public static final String OPTIMISER_FIELD = "optimiser";
+    public static final String LEARNING_RATE_FIELD = "learning_rate";
+    public static final String EPSILON_FIELD = "epsilon";
+    public static final String EPOCHS_FIELD = "epochs";
+    public static final String BATCH_SIZE_FIELD = "batch_size";
+    public static final String SEED_FIELD = "seed";
+    public static final String TARGET_FIELD = "target";
+
+    private LogisticRegressionParams.ObjectiveType objectiveType;
+    private LogisticRegressionParams.OptimizerType optimizerType;
+    private Double learningRate;
+    private Double epsilon;
+    private Integer epochs;
+    private Integer batchSize;
+    private Long seed;
+    private String target;
+
+    @Builder(toBuilder = true)
+    public LogisticRegressionParams(
+        ObjectiveType objectiveType,
+        OptimizerType optimizerType,
+        Double learningRate,
+        Double epsilon,
+        Integer epochs,
+        Integer batchSize,
+        Long seed,
+        String target
+    ) {
+        this.objectiveType = objectiveType;
+        this.optimizerType = optimizerType;
+        this.learningRate = learningRate;
+        this.epsilon = epsilon;
+        this.epochs = epochs;
+        this.batchSize = batchSize;
+        this.seed = seed;
+        this.target = target;
+    }
+
+    public LogisticRegressionParams(StreamInput in) throws IOException {
+        if (in.readBoolean()) {
+            this.objectiveType = in.readEnum(ObjectiveType.class);
+        }
+        if (in.readBoolean()) {
+            this.optimizerType = in.readEnum(OptimizerType.class);
+        }
+        this.learningRate = in.readOptionalDouble();
+
+        this.epsilon = in.readOptionalDouble();
+        this.epochs = in.readOptionalInt();
+        this.batchSize = in.readOptionalInt();
+        this.seed = in.readOptionalLong();
+        this.target = in.readOptionalString();
+    }
+
+    public static MLAlgoParams parse(XContentParser parser) throws IOException {
+        ObjectiveType objective = null;
+        OptimizerType optimizerType = null;
+        Double learningRate = null;
+        Double epsilon = null;
+        Integer epochs = null;
+        Integer batchSize = null;
+        Long seed = null;
+        String target = null;
+
+        ensureExpectedToken(XContentParser.Token.START_OBJECT, parser.currentToken(), parser);
+        while (parser.nextToken() != XContentParser.Token.END_OBJECT) {
+            String fieldName = parser.currentName();
+            parser.nextToken();
+
+            switch (fieldName) {
+                case OBJECTIVE_FIELD:
+                    objective = ObjectiveType.valueOf(parser.text().toUpperCase(Locale.ROOT));
+                    break;
+                case OPTIMISER_FIELD:
+                    optimizerType = OptimizerType.valueOf(parser.text().toUpperCase(Locale.ROOT));
+                    break;
+                case LEARNING_RATE_FIELD:
+                    learningRate = parser.doubleValue(false);
+                    break;
+                case EPSILON_FIELD:
+                    epsilon = parser.doubleValue(false);
+                    break;
+                case EPOCHS_FIELD:
+                    epochs = parser.intValue(false);
+                    break;
+                case BATCH_SIZE_FIELD:
+                    batchSize = parser.intValue(false);
+                    break;
+                case SEED_FIELD:
+                    seed = parser.longValue(false);
+                    break;
+                case TARGET_FIELD:
+                    target = parser.text();
+                    break;
+                default:
+                    parser.skipChildren();
+                    break;
+            }
+        }
+        return new LogisticRegressionParams(objective,  optimizerType,  learningRate, epsilon, epochs, batchSize, seed, target);
+    }
+
+    @Override
+    public void writeTo(StreamOutput out) throws IOException {
+        if (objectiveType != null) {
+            out.writeBoolean(true);
+            out.writeEnum(objectiveType);
+        } else {
+            out.writeBoolean(false);
+        }
+        if (optimizerType != null) {
+            out.writeBoolean(true);
+            out.writeEnum(optimizerType);
+        } else {
+            out.writeBoolean(false);
+        }
+        out.writeOptionalDouble(learningRate);
+        out.writeOptionalDouble(epsilon);
+        out.writeOptionalInt(epochs);
+        out.writeOptionalInt(batchSize);
+        out.writeOptionalLong(seed);
+        out.writeOptionalString(target);
+    }
+
+    @Override
+    public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException {
+        builder.startObject();
+        if (objectiveType != null) {
+            builder.field(OBJECTIVE_FIELD, objectiveType);
+        }
+        if (optimizerType != null) {
+            builder.field(OPTIMISER_FIELD, optimizerType);
+        }
+        if (learningRate != null) {
+            builder.field(LEARNING_RATE_FIELD, learningRate);
+        }
+        if (epsilon != null) {
+            builder.field(EPSILON_FIELD, epsilon);
+        }
+        if (epochs != null) {
+            builder.field(EPOCHS_FIELD, epochs);
+        }
+        if (batchSize != null) {
+            builder.field(BATCH_SIZE_FIELD, batchSize);
+        }
+        if (seed != null) {
+            builder.field(SEED_FIELD, seed);
+        }
+        if (target != null) {
+            builder.field(TARGET_FIELD, target);
+        }
+        builder.endObject();
+        return builder;
+    }
+
+    @Override
+    public String getWriteableName() {
+        return PARSE_FIELD_NAME;
+    }
+
+    @Override
+    public int getVersion() {
+        return 1;
+    }
+
+    public enum ObjectiveType {
+        HINGE, LOGMULTICLASS;
+        /** Resolves a name case-insensitively, as parse does; null or unknown names raise IllegalArgumentException. */
+        public static ObjectiveType from(String value) {
+            try {
+                return ObjectiveType.valueOf(value.toUpperCase(Locale.ROOT));
+            } catch (IllegalArgumentException | NullPointerException e) {
+                throw new IllegalArgumentException("Wrong objective type", e); // keep the cause for diagnosis
+            }
+        }
+    }
+
+    public enum OptimizerType {
+        SIMPLE_SGD,
+        LINEAR_DECAY_SGD,
+        SQRT_DECAY_SGD,
+        ADA_GRAD,
+        ADA_DELTA,
+        ADAM,
+        RMS_PROP;
+        /** Resolves a name case-insensitively, as parse does; null or unknown names raise IllegalArgumentException. */
+        public static OptimizerType from(String value) {
+            try {
+                return OptimizerType.valueOf(value.toUpperCase(Locale.ROOT));
+            } catch (IllegalArgumentException | NullPointerException e) {
+                throw new IllegalArgumentException("Wrong optimizer type", e); // keep the cause for diagnosis
+            }
+        }
+    }
+}
diff --git a/ml-algorithms/build.gradle b/ml-algorithms/build.gradle
index 4e766e9279..889cfa76e2 100644
--- a/ml-algorithms/build.gradle
+++ b/ml-algorithms/build.gradle
@@ -20,6 +20,7 @@ dependencies {
     implementation group: 'org.tribuo', name: 'tribuo-clustering-kmeans', version: '4.2.1'
     implementation group: 'org.tribuo', name: 'tribuo-regression-sgd', version: '4.2.1'
     implementation group: 'org.tribuo', name: 'tribuo-anomaly-libsvm', version: '4.2.1'
+    implementation group: 'org.tribuo', name: 'tribuo-classification-sgd', version: '4.2.1'
     implementation group: 'commons-io', name: 'commons-io', version: '2.11.0'
     implementation 'software.amazon.randomcutforest:randomcutforest-parkservices:3.0-rc3'
     implementation 'software.amazon.randomcutforest:randomcutforest-core:3.0-rc3'
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
new file mode 100644
index 0000000000..54086db8e4
--- /dev/null
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
@@ -0,0 +1,145 @@
+/*
+ * Copyright OpenSearch Contributors
+ * SPDX-License-Identifier: Apache-2.0
+ */
+
+package org.opensearch.ml.engine.algorithms.regression;
+
+import org.opensearch.ml.common.Model;
+import org.opensearch.ml.common.FunctionName;
+import org.opensearch.ml.common.dataframe.DataFrame;
+import org.opensearch.ml.common.dataframe.DataFrameBuilder;
+import org.opensearch.ml.common.input.parameter.MLAlgoParams;
+import org.opensearch.ml.common.input.parameter.regression.LogisticRegressionParams;
+import org.opensearch.ml.common.output.MLOutput;
+import org.opensearch.ml.common.output.MLPredictionOutput;
+import org.opensearch.ml.engine.Predictable;
+import org.opensearch.ml.engine.Trainable;
+import org.opensearch.ml.engine.annotation.Function;
+import org.opensearch.ml.engine.contants.TribuoOutputType;
+import org.opensearch.ml.engine.utils.ModelSerDeSer;
+import org.opensearch.ml.engine.utils.TribuoUtil;
+import org.tribuo.MutableDataset;
+import org.tribuo.Prediction;
+import org.tribuo.Trainer;
+import org.tribuo.classification.Label;
+import org.tribuo.classification.LabelFactory;
+import org.tribuo.classification.sgd.LabelObjective;
+import org.tribuo.classification.sgd.linear.LogisticRegressionTrainer;
+import org.tribuo.classification.sgd.objectives.Hinge;
+import org.tribuo.classification.sgd.objectives.LogMulticlass;
+import org.tribuo.math.StochasticGradientOptimiser;
+import org.tribuo.math.optimisers.AdaGrad;
+
+import java.util.ArrayList;
+import java.util.Collections;
+import java.util.List;
+import java.util.Map;
+import java.util.Optional;
+
+@Function(FunctionName.LOGISTIC_REGRESSION)
+public class LogisticRegression implements Trainable, Predictable {
+
+    private static final LogisticRegressionParams.ObjectiveType DEFAULT_OBJECTIVE_TYPE = LogisticRegressionParams.ObjectiveType.LOGMULTICLASS;
+    private static final LogisticRegressionParams.OptimizerType DEFAULT_OPTIMIZER_TYPE = LogisticRegressionParams.OptimizerType.ADA_GRAD;
+    private static final double DEFAULT_LEARNING_RATE = 0.01;
+
+    //AdaGrad, AdaDelta, AdaGradRDA, Adam, RMSProp
+    private static final double DEFAULT_EPSILON = 1e-6;
+
+    private static final int DEFAULT_EPOCHS = 10;
+
+    private LogisticRegressionParams parameters;
+    private StochasticGradientOptimiser optimiser;
+    private LabelObjective objective;
+    /**
+     * Initialize a logistic regression algorithm.
+     * @param parameters the parameters for logistic regression algorithm
+     */
+    public LogisticRegression(MLAlgoParams parameters) {
+        this.parameters = parameters == null ? LogisticRegressionParams.builder().build() : (LogisticRegressionParams)parameters;
+        validateParameters();
+        createObjective();
+        createOptimiser();
+    }
+
+    private void validateParameters() {
+        if (parameters.getLearningRate() != null && parameters.getLearningRate() < 0) {
+            throw new IllegalArgumentException("Learning rate should not be negative.");
+        }
+
+        if (parameters.getEpsilon() != null && parameters.getEpsilon() < 0) {
+            throw new IllegalArgumentException("Epsilon should not be negative.");
+        }
+
+        if (parameters.getEpochs() != null && parameters.getEpochs() < 0) {
+            throw new IllegalArgumentException("Epochs should not be negative.");
+        }
+
+        if (parameters.getBatchSize() != null && parameters.getBatchSize() < 0) {
+            throw new IllegalArgumentException("MiniBatchSize should not be negative.");
+        }
+    }
+
+    private void createObjective() {
+        LogisticRegressionParams.ObjectiveType objectiveType = Optional.ofNullable(parameters.getObjectiveType()).orElse(DEFAULT_OBJECTIVE_TYPE);
+        switch (objectiveType) {
+            case HINGE:
+                objective = new Hinge();
+                break;
+            default:
+                objective = new LogMulticlass();
+                break;
+        }
+    }
+
+    private void createOptimiser() {
+        LogisticRegressionParams.OptimizerType optimizerType = Optional.ofNullable(parameters.getOptimizerType()).orElse(DEFAULT_OPTIMIZER_TYPE);
+        Double learningRate = Optional.ofNullable(parameters.getLearningRate()).orElse(DEFAULT_LEARNING_RATE);
+        Double epsilon = Optional.ofNullable(parameters.getEpsilon()).orElse(DEFAULT_EPSILON);
+
+        switch (optimizerType) {
+            // ToDo: Add more possible optimizer. Tribuo only provides AdaGrad for logistic regression.
+            case ADA_GRAD:
+                optimiser = new AdaGrad(learningRate, epsilon);
+                break;
+            default:
+                //Other optimizer types are not supported yet, so fall back to AdaGrad.
+                optimiser = new AdaGrad(learningRate, epsilon);
+                break;
+        }
+    }
+
+    /** Trains a Tribuo linear SGD classifier with the configured objective, optimiser, epochs, batch size and seed. */
+    @Override
+    public Model train(DataFrame dataFrame) {
+        MutableDataset<Label> trainDataset = TribuoUtil.generateDatasetWithTarget(dataFrame, new LabelFactory(),
+                "Logistic regression training data from OpenSearch", TribuoOutputType.LABEL, parameters.getTarget());
+        int epochs = Optional.ofNullable(parameters.getEpochs()).orElse(DEFAULT_EPOCHS);
+        int batchSize = Math.max(1, Optional.ofNullable(parameters.getBatchSize()).orElse(1)); // 0 passes validateParameters, so clamp to 1
+        long seed = Optional.ofNullable(parameters.getSeed()).orElse(Trainer.DEFAULT_SEED);
+        Trainer<Label> trainer = new org.tribuo.classification.sgd.linear.LinearSGDTrainer(objective, optimiser, epochs, 1000, batchSize, seed); // 1000 = loggingInterval
+        Model model = new Model();
+        model.setName(FunctionName.LOGISTIC_REGRESSION.name());
+        model.setVersion(1);
+        model.setContent(ModelSerDeSer.serialize(trainer.train(trainDataset)));
+        return model;
+    }
+
+    @Override
+    public MLOutput predict(DataFrame dataFrame, Model model) {
+        if (model == null) {
+            throw new IllegalArgumentException("No model found for logistic regression prediction.");
+        }
+
+        org.tribuo.Model<Label> classificationModel = (org.tribuo.Model<Label>)ModelSerDeSer.deserialize(model.getContent());
+        MutableDataset<Label> predictionDataset = TribuoUtil.generateDataset(dataFrame, new LabelFactory(),
+                "Logistic regression prediction data from OpenSearch", TribuoOutputType.LABEL);
+
+        List<Prediction<Label>> predictions = classificationModel.predict(predictionDataset);
+        List<Map<String, Object>> listPrediction = new ArrayList<>();
+        predictions.forEach(e -> listPrediction.add(Collections.singletonMap("result", e.getOutput().getLabel())));
+
+        return MLPredictionOutput.builder().predictionResult(DataFrameBuilder.load(listPrediction)).build();
+    }
+}
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/contants/TribuoOutputType.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/contants/TribuoOutputType.java
index b6f01e4727..81d2f15f1f 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/contants/TribuoOutputType.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/contants/TribuoOutputType.java
@@ -11,5 +11,7 @@ public enum TribuoOutputType {
     //for tribuo regression
     REGRESSOR,
     //for anomaly detection based on libSVM
-    ANOMALY_DETECTION_LIBSVM;
+    ANOMALY_DETECTION_LIBSVM,
+    //for tribuo classification
+    LABEL;
 }
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/TribuoUtil.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/TribuoUtil.java
index 19cc3a3778..40cf7718a6 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/TribuoUtil.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/TribuoUtil.java
@@ -18,6 +18,7 @@
 import org.tribuo.Output;
 import org.tribuo.OutputFactory;
 import org.tribuo.anomaly.Event;
+import org.tribuo.classification.Label;
 import org.tribuo.clustering.ClusterID;
 import org.tribuo.datasource.ListDataSource;
 import org.tribuo.impl.ArrayExample;
@@ -28,6 +29,7 @@
 import java.util.Arrays;
 import java.util.Iterator;
 import java.util.List;
+import java.util.stream.Collectors;
 import java.util.stream.IntStream;
 import java.util.stream.StreamSupport;
 
@@ -56,7 +58,7 @@ public static Tuple<String[], float[][]> transformDataFrameFloat(DataFrame dataF
             Row row = itr.next();
             float[] v = new float[row.size()];
             for (int ii = 0; ii < row.size(); ii++) {
-                v[ii] = (float)row.getValue(ii).doubleValue();
+                v[ii] = (float) row.getValue(ii).doubleValue();
             }
 
             featureValues[i] = v;
@@ -66,6 +68,43 @@ public static Tuple<String[], float[][]> transformDataFrameFloat(DataFrame dataF
         return new Tuple<>(featureNames, featureValues);
     }
 
+    /**
+     * Splits a data frame into feature names and per-row feature values, leaving out the target column.
+     * Every non-target cell is read via doubleValue(); the target column is located with getColumnIndex.
+     */
+    public static Tuple<String[], double[][]> transformClassificationDataFrame(DataFrame dataFrame, String target) {
+        List<String> columnNames = Arrays.stream(dataFrame.columnMetas()).map(ColumnMeta::getName).collect(Collectors.toList());
+        int labelColumn = dataFrame.getColumnIndex(target);
+        double[][] values = new double[dataFrame.size()][columnNames.size() - 1];
+        int rowIndex = 0;
+        for (Row row : dataFrame) {
+            int out = 0;
+            for (int j = 0; j < columnNames.size(); j++) {
+                if (j != labelColumn) {
+                    values[rowIndex][out++] = row.getValue(j).doubleValue();
+                }
+            }
+            rowIndex++;
+        }
+        columnNames.remove(target);
+        return new Tuple<>(columnNames.toArray(new String[columnNames.size()]), values);
+    }
+
+    /** Reads the target column of every row as a string, in iteration order. */
+    public static String[] transformTargetValuesDataFrames(DataFrame dataFrame, String target) {
+        int labelColumn = dataFrame.getColumnIndex(target);
+        String[] labels = new String[dataFrame.size()];
+
+        int rowIndex = 0;
+        for (Row row : dataFrame) {
+            // Read as a string: generateDatasetWithTarget passes these values to new Label(...).
+            labels[rowIndex] = row.getValue(labelColumn).stringValue();
+            rowIndex++;
+        }
+
+        return labels;
+    }
+
     /**
      * Generate tribuo dataset from data frame.
      * @param dataFrame features data
@@ -95,6 +134,9 @@ public static <T extends Output<T>> MutableDataset<T> generateDataset(DataFrame
                     // TODO: support anomaly labels to evaluate prediction result
                     example = new ArrayExample<>((T) new Event(defaultEventType), featureNamesValues.v1(), featureNamesValues.v2()[i]);
                     break;
+                case LABEL:
+                    example = new ArrayExample<>((T) new Label(""), featureNamesValues.v1(), featureNamesValues.v2()[i]);
+                    break;
                 default:
                     throw new IllegalArgumentException("unknown type:" + outputType);
             }
@@ -119,37 +161,35 @@ public static <T extends Output<T>> MutableDataset<T> generateDatasetWithTarget(
         }
 
         List<Example<T>> dataset = new ArrayList<>();
-        Tuple<String[], double[][]> featureNamesValues = transformDataFrame(dataFrame);
-
-        int targetIndex = -1;
-        for (int i = 0; i < featureNamesValues.v1().length; ++i) {
-            if (featureNamesValues.v1()[i].equals(target)) {
-                targetIndex = i;
-                break;
-            }
-        }
-        if (targetIndex == -1) {
-            throw new IllegalArgumentException("No matched target when generating dataset from data frame.");
-        }
-
         ArrayExample<T> example;
-        final int finalTargetIndex = targetIndex;
-        String[] featureNames = IntStream.range(0, featureNamesValues.v1().length).
-                filter(e -> e != finalTargetIndex).
-                mapToObj(e -> featureNamesValues.v1()[e]).
-                toArray(String[]::new);
 
         for (int i=0; i<dataFrame.size(); ++i) {
+            final int finalI = i;
+            double[] featureValues;
+            Tuple<String[], double[][]> featureNamesValues;
+            String[] featureNames;
+            int finalTargetIndex;
             switch (outputType) {
                 case REGRESSOR:
-                    final int finalI = i;
+                    featureNamesValues = transformDataFrame(dataFrame);
+                    finalTargetIndex = findFinalTargetIndex(featureNamesValues, target);
+                    featureNames = createFeatureNames(featureNamesValues, finalTargetIndex);
                     double targetValue = featureNamesValues.v2()[finalI][finalTargetIndex];
-                    double[] featureValues = IntStream.range(0, featureNamesValues.v2()[i].length).
+                    featureValues = IntStream.range(0, featureNamesValues.v2()[i].length).
                             filter(e -> e != finalTargetIndex).
                             mapToDouble(e -> featureNamesValues.v2()[finalI][e]).
                             toArray();
                     example = new ArrayExample<>((T) new Regressor(target, targetValue), featureNames, featureValues);
                     break;
+                case LABEL:
+                    featureNamesValues = transformClassificationDataFrame(dataFrame, target);
+                    featureNames = createFeatureNames(featureNamesValues);
+                    String[] targetValues = transformTargetValuesDataFrames(dataFrame, target);
+                    featureValues = IntStream.range(0, featureNamesValues.v2()[i].length).
+                            mapToDouble(e -> featureNamesValues.v2()[finalI][e]).
+                            toArray();
+                    example = new ArrayExample<>((T) new Label(targetValues[i]), featureNames, featureValues);
+                    break;
                 default:
                     throw new IllegalArgumentException("unknown type:" + outputType);
             }
@@ -159,4 +199,35 @@ public static <T extends Output<T>> MutableDataset<T> generateDatasetWithTarget(
         return new MutableDataset<>(new ListDataSource<>(dataset, outputFactory, provenance));
     }
 
+    /**
+     * Finds the position of {@code target} among the column names held in {@code featureNamesValues.v1()}.
+     * Declared static like the other helpers here, because its caller generateDatasetWithTarget is static.
+     * @throws IllegalArgumentException if no column name equals target
+     */
+    private static int findFinalTargetIndex(Tuple<String[], double[][]> featureNamesValues, String target) {
+        String[] names = featureNamesValues.v1();
+        for (int i = 0; i < names.length; ++i) {
+            if (names[i].equals(target)) {
+                return i;
+            }
+        }
+        throw new IllegalArgumentException("No matched target when generating dataset from data frame.");
+    }
+
+    /** Returns the feature names from the tuple with the entry at {@code finalTargetIndex} left out. */
+    private static String[] createFeatureNames(Tuple<String[], double[][]> featureNamesValues, int finalTargetIndex) {
+        // Declared static like the other helpers here, because the caller generateDatasetWithTarget is static.
+        return IntStream.range(0, featureNamesValues.v1().length).
+                filter(e -> e != finalTargetIndex).
+                mapToObj(e -> featureNamesValues.v1()[e]).
+                toArray(String[]::new);
+    }
+
+    /** Returns a fresh copy of every feature name in the tuple; nothing is filtered out. */
+    private static String[] createFeatureNames(Tuple<String[], double[][]> featureNamesValues) {
+        // Declared static like the other helpers here, because the caller generateDatasetWithTarget is static.
+        String[] names = featureNamesValues.v1();
+
+        return Arrays.copyOf(names, names.length);
+    }
 }
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java
new file mode 100644
index 0000000000..a03e93afc6
--- /dev/null
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java
@@ -0,0 +1,109 @@
+/*
+ * Copyright OpenSearch Contributors
+ * SPDX-License-Identifier: Apache-2.0
+ */
+
+package org.opensearch.ml.engine.algorithms.regression;
+
+import org.junit.Assert;
+import org.junit.Before;
+import org.junit.Rule;
+import org.junit.Test;
+import org.junit.rules.ExpectedException;
+import org.opensearch.ml.common.FunctionName;
+import org.opensearch.ml.common.Model;
+import org.opensearch.ml.common.dataframe.DataFrame;
+import org.opensearch.ml.common.input.parameter.regression.LogisticRegressionParams;
+import org.opensearch.ml.common.output.MLPredictionOutput;
+
+import static org.opensearch.ml.engine.helper.LogisticRegressionHelper.constructLogisticRegressionPredictionDataFrame;
+import static org.opensearch.ml.engine.helper.LogisticRegressionHelper.constructLogisticRegressionTrainDataFrame;
+
+public class LogisticRegressionTest {
+    @Rule
+    public ExpectedException exceptionRule = ExpectedException.none();
+
+    private LogisticRegressionParams parameters;
+    private DataFrame trainDataFrame;
+    private DataFrame predictionDataFrame;
+
+    @Before
+    public void setUp() {
+        parameters = LogisticRegressionParams.builder()
+                .objectiveType(LogisticRegressionParams.ObjectiveType.LOGMULTICLASS)
+                .optimizerType(LogisticRegressionParams.OptimizerType.ADA_GRAD)
+                .learningRate(0.9)
+                .epsilon(1e-6)
+                .target("class")
+                .build();
+        trainDataFrame = constructLogisticRegressionTrainDataFrame();
+        predictionDataFrame = constructLogisticRegressionPredictionDataFrame();
+    }
+
+    @Test
+    public void train() {
+        trainAndVerify(parameters);
+    }
+
+    @Test
+    public void trainExceptionWithoutTarget() {
+        exceptionRule.expect(RuntimeException.class);
+        exceptionRule.expectMessage("Empty target when generating dataset from data frame.");
+        parameters.setTarget(null);
+        LogisticRegression classification = new LogisticRegression(parameters);
+        Model model = classification.train(trainDataFrame);
+    }
+
+    @Test
+    public void predict() {
+        LogisticRegression classification = new LogisticRegression(parameters);
+        Model model = classification.train(trainDataFrame);
+        MLPredictionOutput output = (MLPredictionOutput)classification.predict(predictionDataFrame, model);
+        DataFrame predictions = output.getPredictionResult();
+        Assert.assertEquals(2, predictions.size());
+    }
+
+    @Test
+    public void predictWithoutModel() {
+        exceptionRule.expect(IllegalArgumentException.class);
+        exceptionRule.expectMessage("No model found for logistic regression prediction.");
+        LogisticRegression classification = new LogisticRegression(parameters);
+        classification.predict(predictionDataFrame, null);
+    }
+
+    @Test
+    public void constructorNegativeLearnRate() {
+        exceptionRule.expect(RuntimeException.class);
+        exceptionRule.expectMessage("Learning rate should not be negative");
+        new LogisticRegression(parameters.toBuilder().learningRate(-0.1).build());
+    }
+
+    @Test
+    public void constructorNegativeEpsilon() {
+        exceptionRule.expect(RuntimeException.class);
+        exceptionRule.expectMessage("Epsilon should not be negative");
+        new LogisticRegression(parameters.toBuilder().epsilon(-1.0).build());
+    }
+
+    @Test
+    public void constructorNegativeEpochs() {
+        exceptionRule.expect(RuntimeException.class);
+        exceptionRule.expectMessage("Epochs should not be negative");
+        new LogisticRegression(parameters.toBuilder().epochs(-1).build());
+    }
+
+    @Test
+    public void constructorNegativeBatchSize() {
+        exceptionRule.expect(RuntimeException.class);
+        exceptionRule.expectMessage("MiniBatchSize should not be negative");
+        new LogisticRegression(parameters.toBuilder().batchSize(-1).build());
+    }
+
+    private void trainAndVerify(LogisticRegressionParams params) {
+        LogisticRegression classification = new LogisticRegression(params);
+        Model model = classification.train(trainDataFrame);
+        Assert.assertEquals(FunctionName.LOGISTIC_REGRESSION.name(), model.getName());
+        Assert.assertEquals(1, model.getVersion());
+        Assert.assertNotNull(model.getContent());
+    }
+}
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/helper/LogisticRegressionHelper.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/helper/LogisticRegressionHelper.java
new file mode 100644
index 0000000000..59b4726555
--- /dev/null
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/helper/LogisticRegressionHelper.java
@@ -0,0 +1,55 @@
+/*
+ * Copyright OpenSearch Contributors
+ * SPDX-License-Identifier: Apache-2.0
+ */
+
+package org.opensearch.ml.engine.helper;
+
+import lombok.experimental.UtilityClass;
+import org.opensearch.ml.common.dataframe.ColumnMeta;
+import org.opensearch.ml.common.dataframe.ColumnType;
+import org.opensearch.ml.common.dataframe.DataFrame;
+import org.opensearch.ml.common.dataframe.DataFrameBuilder;
+
+import java.util.ArrayList;
+import java.util.Arrays;
+import java.util.HashMap;
+import java.util.List;
+import java.util.Map;
+
+/** Test fixtures: small in-memory data frames for the logistic regression unit tests. */
+@UtilityClass
+public class LogisticRegressionHelper {
+    /** Builds nine labelled rows with a DOUBLE "height" column and a STRING "class" column. */
+    public static DataFrame constructLogisticRegressionTrainDataFrame() {
+        double[] heights = {175.0, 172.0, 180.0, 165.0, 160.0, 163.0, 182.0, 190.0, 170.0};
+        String[] classes = {"medium", "medium", "tall", "short", "short", "short", "tall", "tall", "medium"};
+        ColumnMeta[] columnMetas = {new ColumnMeta("height", ColumnType.DOUBLE), new ColumnMeta("class", ColumnType.STRING)};
+        List<Map<String, Object>> rows = new ArrayList<>();
+        for (int i = 0; i < heights.length; i++) {
+            Map<String, Object> row = heightRow(heights[i]);
+            row.put("class", classes[i]);
+            rows.add(row);
+        }
+
+        return DataFrameBuilder.load(columnMetas, rows);
+    }
+
+    /** Builds two unlabelled rows that carry only the DOUBLE "height" column. */
+    public static DataFrame constructLogisticRegressionPredictionDataFrame() {
+        ColumnMeta[] columnMetas = {new ColumnMeta("height", ColumnType.DOUBLE)};
+        List<Map<String, Object>> rows = new ArrayList<>();
+        for (double height : new double[]{181, 171}) {
+            rows.add(heightRow(height));
+        }
+
+        return DataFrameBuilder.load(columnMetas, rows);
+    }
+
+    /** Creates a mutable row that holds just the boxed "height" value. */
+    private static Map<String, Object> heightRow(double height) {
+        Map<String, Object> row = new HashMap<>();
+        row.put("height", height);
+        return row;
+    }
+}
diff --git a/plugin/src/test/java/org/opensearch/ml/action/MLCommonsIntegTestCase.java b/plugin/src/test/java/org/opensearch/ml/action/MLCommonsIntegTestCase.java
index d6f9628579..b9b75e96d6 100644
--- a/plugin/src/test/java/org/opensearch/ml/action/MLCommonsIntegTestCase.java
+++ b/plugin/src/test/java/org/opensearch/ml/action/MLCommonsIntegTestCase.java
@@ -5,6 +5,7 @@
 
 package org.opensearch.ml.action;
 
+import static org.opensearch.ml.common.input.parameter.regression.LogisticRegressionParams.ObjectiveType.LOGMULTICLASS;
 import static org.opensearch.ml.utils.TestData.TARGET_FIELD;
 import static org.opensearch.ml.utils.TestData.TIME_FIELD;
 
@@ -34,6 +35,7 @@
 import org.opensearch.ml.common.input.parameter.rcf.BatchRCFParams;
 import org.opensearch.ml.common.input.parameter.rcf.FitRCFParams;
 import org.opensearch.ml.common.input.parameter.regression.LinearRegressionParams;
+import org.opensearch.ml.common.input.parameter.regression.LogisticRegressionParams;
 import org.opensearch.ml.common.output.MLPredictionOutput;
 import org.opensearch.ml.common.output.MLTrainingOutput;
 import org.opensearch.ml.common.transport.MLTaskResponse;
@@ -103,6 +105,27 @@ public SearchSourceBuilder irisDataQuery() {
         return searchSourceBuilder;
     }
 
+    /**
+     * Builds a match-all search source (size 1000) that fetches the four iris measurement fields plus
+     * the "class" field.
+     */
+    public SearchSourceBuilder irisDataQueryTrainLogisticRegression() {
+        String[] trainingFields = { "sepal_length_in_cm", "sepal_width_in_cm", "petal_length_in_cm", "petal_width_in_cm", "class" };
+        SearchSourceBuilder sourceBuilder = new SearchSourceBuilder();
+        sourceBuilder.size(1000);
+        sourceBuilder.fetchSource(trainingFields, null);
+        return sourceBuilder.query(QueryBuilders.matchAllQuery());
+    }
+
+    // Builds a match-all search source (size 1000) that fetches only the four iris measurement fields, without "class".
+    public SearchSourceBuilder irisDataQueryPredictLogisticRegression() {
+        String[] featureFields = { "sepal_length_in_cm", "sepal_width_in_cm", "petal_length_in_cm", "petal_width_in_cm" };
+        SearchSourceBuilder sourceBuilder = new SearchSourceBuilder();
+        sourceBuilder.size(1000);
+        sourceBuilder.fetchSource(featureFields, null);
+        return sourceBuilder.query(QueryBuilders.matchAllQuery());
+    }
+
     public MLInputDataset emptyQueryInputDataSet(String indexName) {
         SearchSourceBuilder searchSourceBuilder = irisDataQuery();
         searchSourceBuilder.query(QueryBuilders.matchQuery("class", "wrong_value"));
@@ -135,6 +158,16 @@ public String trainKmeansWithIrisData(String irisIndexName, boolean async) {
         return trainModel(FunctionName.KMEANS, KMeansParams.builder().centroids(3).build(), inputDataset, async);
     }
 
+    /**
+     * Trains a LOGISTIC_REGRESSION model (LOGMULTICLASS objective, target field "class") from a search over
+     * the given index and returns the id produced by trainModel for the requested sync/async mode.
+     */
+    public String trainLogisticRegressionWithIrisData(String irisIndexName, boolean async) {
+        MLInputDataset inputDataset = new SearchQueryInputDataset(ImmutableList.of(irisIndexName), irisDataQueryTrainLogisticRegression());
+        LogisticRegressionParams params = LogisticRegressionParams.builder().objectiveType(LOGMULTICLASS).target("class").build();
+        return trainModel(FunctionName.LOGISTIC_REGRESSION, params, inputDataset, async);
+    }
+
     public String trainBatchRCFWithDataFrame(int dataSize, boolean async) {
         MLInputDataset inputDataset = new DataFrameInputDataset(TestData.constructTestDataFrame(dataSize));
         return trainModel(FunctionName.BATCH_RCF, BatchRCFParams.builder().build(), inputDataset, async);
diff --git a/plugin/src/test/java/org/opensearch/ml/action/prediction/PredictionITTests.java b/plugin/src/test/java/org/opensearch/ml/action/prediction/PredictionITTests.java
index 704bae9fbd..ba8b313a6a 100644
--- a/plugin/src/test/java/org/opensearch/ml/action/prediction/PredictionITTests.java
+++ b/plugin/src/test/java/org/opensearch/ml/action/prediction/PredictionITTests.java
@@ -47,6 +47,7 @@ public class PredictionITTests extends MLCommonsIntegTestCase {
     private String batchRcfModelId;
     private String fitRcfModelId;
     private String linearRegressionModelId;
+    private String logisticRegressionModelId;
     private int batchRcfDataSize = 100;
 
     @Rule
@@ -66,6 +67,7 @@ public void setUp() throws Exception {
         batchRcfModelId = trainBatchRCFWithDataFrame(500, false);
         fitRcfModelId = trainFitRCFWithDataFrame(500, false);
         linearRegressionModelId = trainLinearRegressionWithDataFrame(100, false);
+        logisticRegressionModelId = trainLogisticRegressionWithIrisData(irisIndexName, false);
         MLModel batchRcfModel = getModel(batchRcfModelId);
         assertNotNull(batchRcfModel);
     }
@@ -103,6 +105,14 @@ public void testPredictionWithEmptyDataset_KMeans() {
         predictionFuture.actionGet();
     }
 
+    // Runs prediction with the logistic regression model trained in setUp, using a search over the iris
+    // index that fetches only the feature fields, and verifies the result via predictAndVerify.
+    public void testPredictionWithSearchInput_LogisticRegression() {
+        ImmutableList<String> indices = ImmutableList.of(irisIndexName);
+        MLInputDataset inputDataset = new SearchQueryInputDataset(indices, irisDataQueryPredictLogisticRegression());
+        predictAndVerify(logisticRegressionModelId, inputDataset, FunctionName.LOGISTIC_REGRESSION, null, IRIS_DATA_SIZE);
+    }
+
     public void testPredictionWithDataFrame_BatchRCF() {
         MLInputDataset inputDataset = new DataFrameInputDataset(TestData.constructTestDataFrame(batchRcfDataSize));
         predictAndVerify(batchRcfModelId, inputDataset, FunctionName.BATCH_RCF, null, batchRcfDataSize);
diff --git a/plugin/src/test/java/org/opensearch/ml/action/training/TrainingITTests.java b/plugin/src/test/java/org/opensearch/ml/action/training/TrainingITTests.java
index af2947da2f..7ee2378cf9 100644
--- a/plugin/src/test/java/org/opensearch/ml/action/training/TrainingITTests.java
+++ b/plugin/src/test/java/org/opensearch/ml/action/training/TrainingITTests.java
@@ -8,7 +8,6 @@
 import java.util.concurrent.TimeUnit;
 import java.util.concurrent.atomic.AtomicReference;
 
-import org.apache.lucene.tests.util.LuceneTestCase;
 import org.junit.Before;
 import org.junit.Rule;
 import org.junit.rules.ExpectedException;
@@ -34,7 +33,6 @@ public void setUp() throws Exception {
         loadIrisData(irisIndexName);
     }
 
-    @LuceneTestCase.AwaitsFix(bugUrl = "https://github.com/oracle/tribuo/issues/223")
     public void testTrainingWithSearchInput_Async_KMenas() throws InterruptedException {
         String taskId = trainKmeansWithIrisData(irisIndexName, true);
         assertNotNull(taskId);
@@ -49,7 +47,6 @@ public void testTrainingWithSearchInput_Async_KMenas() throws InterruptedExcepti
         assertNotNull(model);
     }
 
-    @LuceneTestCase.AwaitsFix(bugUrl = "https://github.com/oracle/tribuo/issues/223")
     public void testTrainingWithSearchInput_Sync_KMenas() {
         String modelId = trainKmeansWithIrisData(irisIndexName, false);
         assertNotNull(modelId);
@@ -57,6 +54,27 @@ public void testTrainingWithSearchInput_Sync_KMenas() {
         assertNotNull(model);
     }
 
+    // Synchronous training: the returned id is used as the model id, and that model must be retrievable.
+    public void testTrainingWithSearchInput_Sync_LogisticRegression() {
+        String trainedModelId = trainLogisticRegressionWithIrisData(irisIndexName, false);
+        assertNotNull(trainedModelId);
+        assertNotNull(getModel(trainedModelId));
+    }
+
+    // Asynchronous training: the returned id is used as a task id. The task is polled (waitUntil with a
+    // 10 second limit) until it exposes a model id, and the model is then fetched by that id.
+    // The last id seen is kept in an AtomicReference so it can be read after the polling lambda.
+    public void testTrainingWithSearchInput_Async_LogisticRegression() throws InterruptedException {
+        String asyncTaskId = trainLogisticRegressionWithIrisData(irisIndexName, true);
+        assertNotNull(asyncTaskId);
+        AtomicReference<String> trainedModelId = new AtomicReference<>();
+        waitUntil(() -> {
+            trainedModelId.set(getTask(asyncTaskId).getModelId());
+            return trainedModelId.get() != null;
+        }, 10, TimeUnit.SECONDS);
+        assertNotNull(getModel(trainedModelId.get()));
+    }
+
     public void testTrainingWithDataFrame_Async_BatchRCF() throws InterruptedException {
         String taskId = trainBatchRCFWithDataFrame(500, true);
         assertNotNull(taskId);

From 0a3b6df271dcb550d52225dfe18fa45956cb66a8 Mon Sep 17 00:00:00 2001
From: Xun Zhang <xunzh@amazon.com>
Date: Tue, 2 Aug 2022 16:34:04 -0700
Subject: [PATCH 2/4] register logistic regression param and use
 LinearSGDTrainer

Signed-off-by: Xun Zhang <xunzh@amazon.com>
---
 .../ml/engine/algorithms/regression/LogisticRegression.java  | 5 ++---
 .../main/java/org/opensearch/ml/engine/utils/TribuoUtil.java | 2 +-
 .../java/org/opensearch/ml/plugin/MachineLearningPlugin.java | 4 +++-
 3 files changed, 6 insertions(+), 5 deletions(-)

diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
index 54086db8e4..ab15a92c18 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
@@ -25,7 +25,7 @@
 import org.tribuo.classification.Label;
 import org.tribuo.classification.LabelFactory;
 import org.tribuo.classification.sgd.LabelObjective;
-import org.tribuo.classification.sgd.linear.LogisticRegressionTrainer;
+import org.tribuo.classification.sgd.linear.LinearSGDTrainer;
 import org.tribuo.classification.sgd.objectives.Hinge;
 import org.tribuo.classification.sgd.objectives.LogMulticlass;
 import org.tribuo.math.StochasticGradientOptimiser;
@@ -114,9 +114,8 @@ private void createOptimiser() {
     public Model train(DataFrame dataFrame) {
         MutableDataset<Label> trainDataset = TribuoUtil.generateDatasetWithTarget(dataFrame, new LabelFactory(),
                 "Logistic regression training data from OpenSearch", TribuoOutputType.LABEL, parameters.getTarget());
-        // Integer epochs = Optional.ofNullable(parameters.getEpochs()).orElse(DEFAULT_EPOCHS);
         // LinearSGDTrainer(objective=LogMulticlass,optimiser=AdaGrad(initialLearningRate=1.0,epsilon=0.1,initialValue=0.0),epochs=5,minibatchSize=1,seed=12345)
-        Trainer<Label> logisticRegressionTrainer = new LogisticRegressionTrainer();
+        Trainer<Label> logisticRegressionTrainer = new LinearSGDTrainer(new LogMulticlass(), new AdaGrad(1.0, 0.1), 5, Trainer.DEFAULT_SEED);
         org.tribuo.Model<Label> classificationModel = logisticRegressionTrainer.train(trainDataset);
         Model model = new Model();
         model.setName(FunctionName.LOGISTIC_REGRESSION.name());
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/TribuoUtil.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/TribuoUtil.java
index 40cf7718a6..5805a0c1da 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/TribuoUtil.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/utils/TribuoUtil.java
@@ -135,7 +135,7 @@ public static <T extends Output<T>> MutableDataset<T> generateDataset(DataFrame
                     example = new ArrayExample<>((T) new Event(defaultEventType), featureNamesValues.v1(), featureNamesValues.v2()[i]);
                     break;
                 case LABEL:
-                    example = new ArrayExample<>((T) new Label(""), featureNamesValues.v1(), featureNamesValues.v2()[i]);
+                    example = new ArrayExample<>((T) outputFactory.getUnknownOutput(), featureNamesValues.v1(), featureNamesValues.v2()[i]);
                     break;
                 default:
                     throw new IllegalArgumentException("unknown type:" + outputType);
diff --git a/plugin/src/main/java/org/opensearch/ml/plugin/MachineLearningPlugin.java b/plugin/src/main/java/org/opensearch/ml/plugin/MachineLearningPlugin.java
index 3976883753..e2cc1e8383 100644
--- a/plugin/src/main/java/org/opensearch/ml/plugin/MachineLearningPlugin.java
+++ b/plugin/src/main/java/org/opensearch/ml/plugin/MachineLearningPlugin.java
@@ -52,6 +52,7 @@
 import org.opensearch.ml.common.input.parameter.rcf.BatchRCFParams;
 import org.opensearch.ml.common.input.parameter.rcf.FitRCFParams;
 import org.opensearch.ml.common.input.parameter.regression.LinearRegressionParams;
+import org.opensearch.ml.common.input.parameter.regression.LogisticRegressionParams;
 import org.opensearch.ml.common.input.parameter.sample.SampleAlgoParams;
 import org.opensearch.ml.common.transport.execute.MLExecuteTaskAction;
 import org.opensearch.ml.common.transport.model.MLModelDeleteAction;
@@ -298,7 +299,8 @@ public List<NamedXContentRegistry.Entry> getNamedXContent() {
                 BatchRCFParams.XCONTENT_REGISTRY,
                 LocalSampleCalculatorInput.XCONTENT_REGISTRY,
                 AnomalyLocalizationInput.XCONTENT_REGISTRY_ENTRY,
-                RCFSummarizeParams.XCONTENT_REGISTRY
+                RCFSummarizeParams.XCONTENT_REGISTRY,
+                LogisticRegressionParams.XCONTENT_REGISTRY
             );
     }
 }

From cca73b5bee3fda519cd2927835c8af7bce97e5c7 Mon Sep 17 00:00:00 2001
From: Xun Zhang <xunzh@amazon.com>
Date: Wed, 3 Aug 2022 16:39:13 -0700
Subject: [PATCH 3/4] make all logistic regression params configurable

Signed-off-by: Xun Zhang <xunzh@amazon.com>
---
 .../regression/LogisticRegressionParams.java  | 15 +++++++++++-
 .../regression/LogisticRegression.java        | 24 +++++++++++++++----
 2 files changed, 34 insertions(+), 5 deletions(-)

diff --git a/common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java b/common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java
index 506a5289ea..f1f1c0a712 100644
--- a/common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java
+++ b/common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java
@@ -39,6 +39,7 @@ public class LogisticRegressionParams implements MLAlgoParams {
     public static final String EPSILON_FIELD = "epsilon";
     public static final String EPOCHS_FIELD = "epochs";
     public static final String BATCH_SIZE_FIELD = "batch_size";
+    public static final String LOGGING_INTERVAL_FIELD = "logging_interval";
     public static final String SEED_FIELD = "seed";
     public static final String TARGET_FIELD = "target";
 
@@ -48,6 +49,7 @@ public class LogisticRegressionParams implements MLAlgoParams {
     private Double epsilon;
     private Integer epochs;
     private Integer batchSize;
+    private Integer loggingInterval;
     private Long seed;
     private String target;
 
@@ -59,6 +61,7 @@ public LogisticRegressionParams(
         Double epsilon,
         Integer epochs,
         Integer batchSize,
+        Integer loggingInterval,
         Long seed,
         String target
     ) {
@@ -68,6 +71,7 @@ public LogisticRegressionParams(
         this.epsilon = epsilon;
         this.epochs = epochs;
         this.batchSize = batchSize;
+        this.loggingInterval = loggingInterval;
         this.seed = seed;
         this.target = target;
     }
@@ -84,6 +88,7 @@ public LogisticRegressionParams(StreamInput in) throws IOException {
         this.epsilon = in.readOptionalDouble();
         this.epochs = in.readOptionalInt();
         this.batchSize = in.readOptionalInt();
+        this.loggingInterval = in.readOptionalInt();
         this.seed = in.readOptionalLong();
         this.target = in.readOptionalString();
     }
@@ -95,6 +100,7 @@ public static MLAlgoParams parse(XContentParser parser) throws IOException {
         Double epsilon = null;
         Integer epochs = null;
         Integer batchSize = null;
+        Integer loggingInterval = null;
         Long seed = null;
         String target = null;
 
@@ -122,6 +128,9 @@ public static MLAlgoParams parse(XContentParser parser) throws IOException {
                 case BATCH_SIZE_FIELD:
                     batchSize = parser.intValue(false);
                     break;
+                case LOGGING_INTERVAL_FIELD:
+                    loggingInterval = parser.intValue(false);
+                    break;
                 case SEED_FIELD:
                     seed = parser.longValue(false);
                     break;
@@ -133,7 +142,7 @@ public static MLAlgoParams parse(XContentParser parser) throws IOException {
                     break;
             }
         }
-        return new LogisticRegressionParams(objective,  optimizerType,  learningRate, epsilon, epochs, batchSize, seed, target);
+        return new LogisticRegressionParams(objective,  optimizerType,  learningRate, epsilon, epochs, batchSize, loggingInterval, seed, target);
     }
 
     @Override
@@ -154,6 +163,7 @@ public void writeTo(StreamOutput out) throws IOException {
         out.writeOptionalDouble(epsilon);
         out.writeOptionalInt(epochs);
         out.writeOptionalInt(batchSize);
+        out.writeOptionalInt(loggingInterval);
         out.writeOptionalLong(seed);
         out.writeOptionalString(target);
     }
@@ -179,6 +189,9 @@ public XContentBuilder toXContent(XContentBuilder builder, Params params) throws
         if (batchSize != null) {
             builder.field(BATCH_SIZE_FIELD, batchSize);
         }
+        if (loggingInterval != null) {
+            builder.field(LOGGING_INTERVAL_FIELD, loggingInterval);
+        }
         if (seed != null) {
             builder.field(SEED_FIELD, seed);
         }
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
index ab15a92c18..5aae1d469b 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
@@ -42,12 +42,19 @@ public class LogisticRegression implements Trainable, Predictable {
 
     private static final LogisticRegressionParams.ObjectiveType DEFAULT_OBJECTIVE_TYPE = LogisticRegressionParams.ObjectiveType.LOGMULTICLASS;
     private static final LogisticRegressionParams.OptimizerType DEFAULT_OPTIMIZER_TYPE = LogisticRegressionParams.OptimizerType.ADA_GRAD;
-    private static final double DEFAULT_LEARNING_RATE = 0.01;
+    private static final double DEFAULT_LEARNING_RATE = 1.0;
 
     //AdaGrad, AdaDelta, AdaGradRDA, Adam, RMSProp
-    private static final double DEFAULT_EPSILON = 1e-6;
+    private static final double DEFAULT_EPSILON = 0.1;
+    private static final int DEFAULT_EPOCHS = 5;
+    private static final int DEFAULT_LOGGING_INTERVAL = 1000;
+    private static final int DEFAULT_BATCH_SIZE = 1;
+    private static final Long DEFAULT_SEED = Trainer.DEFAULT_SEED;
 
-    private static final int DEFAULT_EPOCHS = 10;
+    private int epochs;
+    private int loggingInterval;
+    private int minibatchSize;
+    private long seed;
 
     private LogisticRegressionParams parameters;
     private StochasticGradientOptimiser optimiser;
@@ -79,6 +86,15 @@ private void validateParameters() {
         if (parameters.getBatchSize() != null && parameters.getBatchSize() < 0) {
             throw new IllegalArgumentException("MiniBatchSize should not be negative.");
         }
+
+        if (parameters.getLoggingInterval() != null && parameters.getLoggingInterval() < 0) {
+            throw new IllegalArgumentException("Logging intervals should not be negative.");
+        }
+
+        epochs = Optional.ofNullable(parameters.getEpochs()).orElse(DEFAULT_EPOCHS);
+        loggingInterval = Optional.ofNullable(parameters.getLoggingInterval()).orElse(DEFAULT_LOGGING_INTERVAL);
+        minibatchSize = Optional.ofNullable(parameters.getBatchSize()).orElse(DEFAULT_BATCH_SIZE);
+        seed = Optional.ofNullable(parameters.getSeed()).orElse(DEFAULT_SEED);
     }
 
     private void createObjective() {
@@ -115,7 +131,7 @@ public Model train(DataFrame dataFrame) {
         MutableDataset<Label> trainDataset = TribuoUtil.generateDatasetWithTarget(dataFrame, new LabelFactory(),
                 "Logistic regression training data from OpenSearch", TribuoOutputType.LABEL, parameters.getTarget());
         // LinearSGDTrainer(objective=LogMulticlass,optimiser=AdaGrad(initialLearningRate=1.0,epsilon=0.1,initialValue=0.0),epochs=5,minibatchSize=1,seed=12345)
-        Trainer<Label> logisticRegressionTrainer = new LinearSGDTrainer(new LogMulticlass(), new AdaGrad(1.0, 0.1), 5, Trainer.DEFAULT_SEED);
+        Trainer<Label> logisticRegressionTrainer = new LinearSGDTrainer(objective, optimiser, epochs, loggingInterval, minibatchSize, seed);
         org.tribuo.Model<Label> classificationModel = logisticRegressionTrainer.train(trainDataset);
         Model model = new Model();
         model.setName(FunctionName.LOGISTIC_REGRESSION.name());

From 6e0f349f8ad9a5a664f842e0e7216de3433a74bd Mon Sep 17 00:00:00 2001
From: Xun Zhang <xunzh@amazon.com>
Date: Thu, 4 Aug 2022 13:59:43 -0700
Subject: [PATCH 4/4] add more optimizerTypes and momentumTypes

Signed-off-by: Xun Zhang <xunzh@amazon.com>
---
 .../ml/common/dataframe/DefaultDataFrame.java |  6 +-
 .../regression/LogisticRegressionParams.java  | 92 ++++++++++++++++++-
 .../regression/LogisticRegression.java        | 51 ++++++++--
 .../regression/LogisticRegressionTest.java    | 36 ++++++++
 4 files changed, 172 insertions(+), 13 deletions(-)

diff --git a/common/src/main/java/org/opensearch/ml/common/dataframe/DefaultDataFrame.java b/common/src/main/java/org/opensearch/ml/common/dataframe/DefaultDataFrame.java
index 228dd40157..2f5daed23b 100644
--- a/common/src/main/java/org/opensearch/ml/common/dataframe/DefaultDataFrame.java
+++ b/common/src/main/java/org/opensearch/ml/common/dataframe/DefaultDataFrame.java
@@ -133,11 +133,11 @@ public DataFrame select(int[] columns) {
 
     @Override
     public int getColumnIndex(String target) {
-        List<String> featureNames = Arrays.stream(this.columnMetas()).map(ColumnMeta::getName).collect(Collectors.toList());
+        List<String> columnNames = Arrays.stream(this.columnMetas()).map(ColumnMeta::getName).collect(Collectors.toList());
 
         int targetIndex = -1;
-        for (int i = 0; i < featureNames.size(); ++i) {
-            if (featureNames.get(i).equals(target)) {
+        for (int i = 0; i < columnNames.size(); ++i) {
+            if (columnNames.get(i).equals(target)) {
                 targetIndex = i;
                 break;
             }
diff --git a/common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java b/common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java
index f1f1c0a712..992dad68cf 100644
--- a/common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java
+++ b/common/src/main/java/org/opensearch/ml/common/input/parameter/regression/LogisticRegressionParams.java
@@ -35,18 +35,28 @@ public class LogisticRegressionParams implements MLAlgoParams {
 
     public static final String OBJECTIVE_FIELD = "objective";
     public static final String OPTIMISER_FIELD = "optimiser";
+    public static final String MOMENTUM_TYPE_FIELD = "momentum_type";
     public static final String LEARNING_RATE_FIELD = "learning_rate";
     public static final String EPSILON_FIELD = "epsilon";
+    public static final String MOMENTUM_FACTOR_FIELD = "momentum_factor";
+    public static final String BETA1_FIELD = "beta1";
+    public static final String BETA2_FIELD = "beta2";
+    public static final String DECAY_RATE_FIELD = "decay_rate";
     public static final String EPOCHS_FIELD = "epochs";
     public static final String BATCH_SIZE_FIELD = "batch_size";
     public static final String LOGGING_INTERVAL_FIELD = "logging_interval";
     public static final String SEED_FIELD = "seed";
     public static final String TARGET_FIELD = "target";
 
-    private LogisticRegressionParams.ObjectiveType objectiveType;
-    private LogisticRegressionParams.OptimizerType optimizerType;
+    private ObjectiveType objectiveType;
+    private OptimizerType optimizerType;
+    private MomentumType momentumType;
     private Double learningRate;
     private Double epsilon;
+    private Double momentumFactor;
+    private Double beta1;
+    private Double beta2;
+    private Double decayRate;
     private Integer epochs;
     private Integer batchSize;
     private Integer loggingInterval;
@@ -57,8 +67,13 @@ public class LogisticRegressionParams implements MLAlgoParams {
     public LogisticRegressionParams(
         ObjectiveType objectiveType,
         OptimizerType optimizerType,
+        MomentumType momentumType,
         Double learningRate,
         Double epsilon,
+        Double momentumFactor,
+        Double beta1,
+        Double beta2,
+        Double decayRate,
         Integer epochs,
         Integer batchSize,
         Integer loggingInterval,
@@ -67,8 +82,13 @@ public LogisticRegressionParams(
     ) {
         this.objectiveType = objectiveType;
         this.optimizerType = optimizerType;
+        this.momentumType = momentumType;
         this.learningRate = learningRate;
         this.epsilon = epsilon;
+        this.momentumFactor = momentumFactor;
+        this.beta1 = beta1;
+        this.beta2 = beta2;
+        this.decayRate = decayRate;
         this.epochs = epochs;
         this.batchSize = batchSize;
         this.loggingInterval = loggingInterval;
@@ -83,9 +103,15 @@ public LogisticRegressionParams(StreamInput in) throws IOException {
         if (in.readBoolean()) {
             this.optimizerType = in.readEnum(OptimizerType.class);
         }
+        if (in.readBoolean()) {
+            this.momentumType = in.readEnum(MomentumType.class);
+        }
         this.learningRate = in.readOptionalDouble();
-
         this.epsilon = in.readOptionalDouble();
+        this.momentumFactor = in.readOptionalDouble();
+        this.beta1 = in.readOptionalDouble();
+        this.beta2 = in.readOptionalDouble();
+        this.decayRate = in.readOptionalDouble();
         this.epochs = in.readOptionalInt();
         this.batchSize = in.readOptionalInt();
         this.loggingInterval = in.readOptionalInt();
@@ -96,8 +122,13 @@ public LogisticRegressionParams(StreamInput in) throws IOException {
     public static MLAlgoParams parse(XContentParser parser) throws IOException {
         ObjectiveType objective = null;
         OptimizerType optimizerType = null;
+        MomentumType momentumType = null;
         Double learningRate = null;
         Double epsilon = null;
+        Double momentumFactor = null;
+        Double beta1 = null;
+        Double beta2 = null;
+        Double decayRate = null;
         Integer epochs = null;
         Integer batchSize = null;
         Integer loggingInterval = null;
@@ -116,12 +147,27 @@ public static MLAlgoParams parse(XContentParser parser) throws IOException {
                 case OPTIMISER_FIELD:
                     optimizerType = OptimizerType.valueOf(parser.text().toUpperCase(Locale.ROOT));
                     break;
+                case MOMENTUM_TYPE_FIELD:
+                    momentumType = MomentumType.valueOf(parser.text().toUpperCase(Locale.ROOT));
+                    break;
                 case LEARNING_RATE_FIELD:
                     learningRate = parser.doubleValue(false);
                     break;
                 case EPSILON_FIELD:
                     epsilon = parser.doubleValue(false);
                     break;
+                case MOMENTUM_FACTOR_FIELD:
+                    momentumFactor = parser.doubleValue(false);
+                    break;
+                case BETA1_FIELD:
+                    beta1 = parser.doubleValue(false);
+                    break;
+                case BETA2_FIELD:
+                    beta2 = parser.doubleValue(false);
+                    break;
+                case DECAY_RATE_FIELD:
+                    decayRate = parser.doubleValue(false);
+                    break;
                 case EPOCHS_FIELD:
                     epochs = parser.intValue(false);
                     break;
@@ -142,7 +188,7 @@ public static MLAlgoParams parse(XContentParser parser) throws IOException {
                     break;
             }
         }
-        return new LogisticRegressionParams(objective,  optimizerType,  learningRate, epsilon, epochs, batchSize, loggingInterval, seed, target);
+        return new LogisticRegressionParams(objective, optimizerType, momentumType, learningRate, epsilon, momentumFactor, beta1, beta2, decayRate, epochs, batchSize, loggingInterval, seed, target);
     }
 
     @Override
@@ -159,8 +205,18 @@ public void writeTo(StreamOutput out) throws IOException {
         } else {
             out.writeBoolean(false);
         }
+        if (momentumType != null) {
+            out.writeBoolean(true);
+            out.writeEnum(momentumType);
+        } else {
+            out.writeBoolean(false);
+        }
         out.writeOptionalDouble(learningRate);
         out.writeOptionalDouble(epsilon);
+        out.writeOptionalDouble(momentumFactor);
+        out.writeOptionalDouble(beta1);
+        out.writeOptionalDouble(beta2);
+        out.writeOptionalDouble(decayRate);
         out.writeOptionalInt(epochs);
         out.writeOptionalInt(batchSize);
         out.writeOptionalInt(loggingInterval);
@@ -177,12 +233,27 @@ public XContentBuilder toXContent(XContentBuilder builder, Params params) throws
         if (optimizerType != null) {
             builder.field(OPTIMISER_FIELD, optimizerType);
         }
+        if (momentumType != null) {
+            builder.field(MOMENTUM_TYPE_FIELD, momentumType);
+        }
         if (learningRate != null) {
             builder.field(LEARNING_RATE_FIELD, learningRate);
         }
         if (epsilon != null) {
             builder.field(EPSILON_FIELD, epsilon);
         }
+        if (momentumFactor != null) { // each optional knob is emitted only when it is set
+            builder.field(MOMENTUM_FACTOR_FIELD, momentumFactor);
+        }
+        if (beta1 != null) {
+            builder.field(BETA1_FIELD, beta1);
+        }
+        if (beta2 != null) {
+            builder.field(BETA2_FIELD, beta2); // own key: parse() reads BETA2_FIELD into beta2, so this must not reuse the beta1 key
+        }
+        if (decayRate != null) {
+            builder.field(DECAY_RATE_FIELD, decayRate);
+        }
         if (epochs != null) {
             builder.field(EPOCHS_FIELD, epochs);
         }
@@ -224,6 +295,30 @@ public static ObjectiveType from(String value) {
         }
     }
 
+    /**
+     * Momentum variants a request may select; {@code LogisticRegression} maps them onto Tribuo's {@code SGD.Momentum}.
+     */
+    public enum MomentumType {
+        STANDARD,
+        NESTEROV;
+
+        /**
+         * Resolves a momentum type from its exact constant name.
+         *
+         * @param value constant name, matched case-sensitively by {@link Enum#valueOf}
+         * @return the matching constant
+         * @throws IllegalArgumentException if {@code value} is null or names no constant; the original failure is kept as the cause
+         */
+        public static MomentumType from(String value) {
+            try {
+                return MomentumType.valueOf(value);
+            } catch (IllegalArgumentException | NullPointerException e) {
+                // valueOf only fails with these two; chaining the cause keeps the rejected name visible in the stack trace.
+                throw new IllegalArgumentException("Wrong momentum type", e);
+            }
+        }
+    }
+
     public enum OptimizerType {
         SIMPLE_SGD,
         LINEAR_DECAY_SGD,
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
index 5aae1d469b..de6faed9c0 100644
--- a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
+++ b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegression.java
@@ -29,7 +29,11 @@
 import org.tribuo.classification.sgd.objectives.Hinge;
 import org.tribuo.classification.sgd.objectives.LogMulticlass;
 import org.tribuo.math.StochasticGradientOptimiser;
+import org.tribuo.math.optimisers.AdaDelta;
 import org.tribuo.math.optimisers.AdaGrad;
+import org.tribuo.math.optimisers.Adam;
+import org.tribuo.math.optimisers.RMSProp;
+import org.tribuo.math.optimisers.SGD;
 
 import java.util.ArrayList;
 import java.util.Collections;
@@ -42,6 +46,7 @@ public class LogisticRegression implements Trainable, Predictable {
 
     private static final LogisticRegressionParams.ObjectiveType DEFAULT_OBJECTIVE_TYPE = LogisticRegressionParams.ObjectiveType.LOGMULTICLASS;
     private static final LogisticRegressionParams.OptimizerType DEFAULT_OPTIMIZER_TYPE = LogisticRegressionParams.OptimizerType.ADA_GRAD;
+    private static final LogisticRegressionParams.MomentumType DEFAULT_MOMENTUM_TYPE = LogisticRegressionParams.MomentumType.STANDARD; // fallback in createOptimiser when parameters.getMomentumType() is null
     private static final double DEFAULT_LEARNING_RATE = 1.0;
 
     //AdaGrad, AdaDelta, AdaGradRDA, Adam, RMSProp
@@ -50,6 +55,11 @@ public class LogisticRegression implements Trainable, Predictable {
     private static final int DEFAULT_LOGGING_INTERVAL = 1000;
     private static final int DEFAULT_BATCH_SIZE = 1;
     private static final Long DEFAULT_SEED = Trainer.DEFAULT_SEED;
+    private static final double DEFAULT_MOMENTUM_FACTOR = 0; // fallback when parameters.getMomentumFactor() is null
+    private static final double DEFAULT_BETA1 = 0.9; // fallback for the beta1 argument passed to Adam
+    private static final double DEFAULT_BETA2 = 0.99; // fallback for the beta2 argument passed to Adam. NOTE(review): Adam's beta2 is commonly 0.999 — confirm 0.99 is intended
+    // Fallback for the decayRate argument passed to RMSProp.
+    private static final double DEFAULT_DECAY_RATE = 0.9;
 
     private int epochs;
     private int loggingInterval;
@@ -87,8 +97,9 @@ private void validateParameters() {
             throw new IllegalArgumentException("MiniBatchSize should not be negative.");
         }
 
-        if (parameters.getLoggingInterval() != null && parameters.getLoggingInterval() < 0) {
-            throw new IllegalArgumentException("Logging intervals should not be negative.");
+        // loggingInterval: log the loss after this many iterations; -1 means log nothing, so only values below -1 are rejected.
+        if (parameters.getLoggingInterval() != null && parameters.getLoggingInterval() < -1) {
+            throw new IllegalArgumentException("Invalid Logging intervals");
         }
 
         epochs = Optional.ofNullable(parameters.getEpochs()).orElse(DEFAULT_EPOCHS);
@@ -113,11 +124,46 @@ private void createOptimiser() {
         LogisticRegressionParams.OptimizerType optimizerType = Optional.ofNullable(parameters.getOptimizerType()).orElse(DEFAULT_OPTIMIZER_TYPE);
         Double learningRate = Optional.ofNullable(parameters.getLearningRate()).orElse(DEFAULT_LEARNING_RATE);
         Double epsilon = Optional.ofNullable(parameters.getEpsilon()).orElse(DEFAULT_EPSILON);
-
+        // Each tuning knob falls back to its class-level default when the request leaves it unset.
+        Double momentumFactor = Optional.ofNullable(parameters.getMomentumFactor()).orElse(DEFAULT_MOMENTUM_FACTOR);
+        LogisticRegressionParams.MomentumType momentumType = Optional.ofNullable(parameters.getMomentumType()).orElse(DEFAULT_MOMENTUM_TYPE);
+        Double beta1 = Optional.ofNullable(parameters.getBeta1()).orElse(DEFAULT_BETA1);
+        Double beta2 = Optional.ofNullable(parameters.getBeta2()).orElse(DEFAULT_BETA2);
+        Double decayRate = Optional.ofNullable(parameters.getDecayRate()).orElse(DEFAULT_DECAY_RATE);
+
+        // Translate the request-level momentum enum into Tribuo's SGD.Momentum; anything but NESTEROV becomes STANDARD.
+        SGD.Momentum momentum;
+        switch (momentumType) {
+            case NESTEROV:
+                momentum = SGD.Momentum.NESTEROV;
+                break;
+            default:
+                momentum = SGD.Momentum.STANDARD;
+                break;
+        }
         switch (optimizerType) {
-            // ToDo: Add more possible optimizer. Tribuo only provides AdaGrad for logistic regression.
             case ADA_GRAD:
+                // Kept explicit: ADA_GRAD is DEFAULT_OPTIMIZER_TYPE, so it must not depend on what the default branch builds.
                 optimiser = new AdaGrad(learningRate, epsilon);
+                break;
+            case LINEAR_DECAY_SGD:
+                optimiser = SGD.getLinearDecaySGD(learningRate, momentumFactor, momentum);
+                break;
+            case SQRT_DECAY_SGD:
+                optimiser = SGD.getSqrtDecaySGD(learningRate, momentumFactor, momentum);
+                break;
+            case ADA_DELTA:
+                // NOTE(review): AdaDelta receives momentumFactor (default 0) as its first argument — confirm that is the intended knob.
+                optimiser = new AdaDelta(momentumFactor, epsilon);
+                break;
+            case ADAM:
+                optimiser = new Adam(learningRate, beta1, beta2, epsilon);
+                break;
+            case RMS_PROP:
+                optimiser = new RMSProp(learningRate, momentumFactor, epsilon, decayRate);
+                break;
+            case SIMPLE_SGD:
+                optimiser = SGD.getSimpleSGD(learningRate, momentumFactor, momentum);
                 break;
             default:
                 //Use default SGD with a constant learning rate.
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java
index a03e93afc6..28e02c4416 100644
--- a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java
+++ b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/regression/LogisticRegressionTest.java
@@ -45,6 +45,42 @@ public void train() {
         trainAndVerify(parameters);
     }
 
+    @Test
+    public void train_linear_decay_sgd() {
+        parameters.setOptimizerType(LogisticRegressionParams.OptimizerType.LINEAR_DECAY_SGD);
+        trainAndVerify(parameters);
+    }
+
+    @Test
+    public void train_sqrt_decay_sgd() {
+        parameters.setOptimizerType(LogisticRegressionParams.OptimizerType.SQRT_DECAY_SGD);
+        trainAndVerify(parameters);
+    }
+
+    @Test
+    public void train_sqrt_ada_delta() { // NOTE(review): "sqrt" in the name looks copied from the test above; this case selects ADA_DELTA
+        parameters.setOptimizerType(LogisticRegressionParams.OptimizerType.ADA_DELTA);
+        trainAndVerify(parameters);
+    }
+
+    @Test
+    public void train_adam() {
+        parameters.setOptimizerType(LogisticRegressionParams.OptimizerType.ADAM);
+        trainAndVerify(parameters);
+    }
+
+    @Test
+    public void train_rms_prop() {
+        parameters.setOptimizerType(LogisticRegressionParams.OptimizerType.RMS_PROP); // selected optimizer must match the test name
+        trainAndVerify(parameters);
+    }
+
+    @Test
+    public void train_simple_sgd() {
+        parameters.setOptimizerType(LogisticRegressionParams.OptimizerType.SIMPLE_SGD); // selected optimizer must match the test name
+        trainAndVerify(parameters);
+    }
+
     @Test
     public void trainExceptionWithoutTarget() {
         exceptionRule.expect(RuntimeException.class);