Async query get result bug fix (opensearch-project#2443)
* Add IT to reproduce the bug first

Signed-off-by: Chen Dai <daichen@amazon.com>

* Modify IT as temporary reproduce commit

Signed-off-by: Chen Dai <daichen@amazon.com>

* Fix issue by preferred option and modify IT

Signed-off-by: Chen Dai <daichen@amazon.com>

* Refactor IT with fluent assertion

Signed-off-by: Chen Dai <daichen@amazon.com>

* Add IT for batch query handler

Signed-off-by: Chen Dai <daichen@amazon.com>

* Add IT for streaming query handler

Signed-off-by: Chen Dai <daichen@amazon.com>

* Add more IT for normal case

Signed-off-by: Chen Dai <daichen@amazon.com>

* Add IT for drop index

Signed-off-by: Chen Dai <daichen@amazon.com>

* Consider drop statement running if result doc unavailable

Signed-off-by: Chen Dai <daichen@amazon.com>

* Fix broken UT

Signed-off-by: Chen Dai <daichen@amazon.com>

* Address PR comments

Signed-off-by: Chen Dai <daichen@amazon.com>

* Address PR comments

Signed-off-by: Chen Dai <daichen@amazon.com>

---------

Signed-off-by: Chen Dai <daichen@amazon.com>
dai-chen authored Dec 1, 2023
1 parent 2c230be commit 60058ce
Showing 6 changed files with 471 additions and 124 deletions.
spark/src/main/java/org/opensearch/sql/spark/dispatcher/AsyncQueryHandler.java
@@ -15,6 +15,7 @@
 import org.opensearch.sql.spark.dispatcher.model.DispatchQueryContext;
 import org.opensearch.sql.spark.dispatcher.model.DispatchQueryRequest;
 import org.opensearch.sql.spark.dispatcher.model.DispatchQueryResponse;
+import org.opensearch.sql.spark.execution.statement.StatementState;
 
 /** Process async query request. */
 public abstract class AsyncQueryHandler {
@@ -33,10 +34,20 @@ public JSONObject getQueryResponse(AsyncQueryJobMetadata asyncQueryJobMetadata)
       result.put(ERROR_FIELD, error);
       return result;
     } else {
-      return getResponseFromExecutor(asyncQueryJobMetadata);
+      JSONObject statement = getResponseFromExecutor(asyncQueryJobMetadata);
+
+      // Consider statement still running if state is success but query result unavailable
+      if (isSuccessState(statement)) {
+        statement.put(STATUS_FIELD, StatementState.RUNNING.getState());
+      }
+      return statement;
     }
   }
 
+  private boolean isSuccessState(JSONObject statement) {
+    return StatementState.SUCCESS.getState().equalsIgnoreCase(statement.optString(STATUS_FIELD));
+  }
+
   protected abstract JSONObject getResponseFromResultIndex(
       AsyncQueryJobMetadata asyncQueryJobMetadata);
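Note on the hunk above: the statement doc can flip to SUCCESS before the result doc written by the Spark job is searchable in the result index, so a caller polling in that window used to see a successful status with no rows. Masking the window as RUNNING restores a simple polling contract. A minimal sketch of that contract, assuming the `AsyncQueryExecutorService` facade and `AsyncQueryExecutionResponse` model from this module; the helper name and back-off are illustrative, not plugin code:

```java
import org.opensearch.sql.spark.asyncquery.AsyncQueryExecutorService;
import org.opensearch.sql.spark.asyncquery.model.AsyncQueryExecutionResponse;

public final class PollSketch {

  // Hypothetical helper, not part of the plugin: poll until the reported status
  // leaves RUNNING. With the guard above, a terminal SUCCESS implies the result
  // doc exists, so callers never observe SUCCESS with empty results.
  static AsyncQueryExecutionResponse pollUntilDone(
      AsyncQueryExecutorService service, String queryId) throws InterruptedException {
    AsyncQueryExecutionResponse response = service.getAsyncQueryResults(queryId);
    while ("running".equalsIgnoreCase(response.getStatus())) {
      Thread.sleep(1000L); // arbitrary back-off chosen for the sketch
      response = service.getAsyncQueryResults(queryId);
    }
    return response;
  }
}
```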
spark/src/main/java/org/opensearch/sql/spark/dispatcher/IndexDMLHandler.java
@@ -5,6 +5,8 @@
 
 package org.opensearch.sql.spark.dispatcher;
 
+import static org.opensearch.sql.spark.data.constants.SparkConstants.ERROR_FIELD;
+import static org.opensearch.sql.spark.data.constants.SparkConstants.STATUS_FIELD;
 import static org.opensearch.sql.spark.execution.statestore.StateStore.createIndexDMLResult;
 
 import com.amazonaws.services.emrserverless.model.JobRunState;
@@ -24,6 +26,7 @@
 import org.opensearch.sql.spark.dispatcher.model.DispatchQueryResponse;
 import org.opensearch.sql.spark.dispatcher.model.IndexDMLResult;
 import org.opensearch.sql.spark.dispatcher.model.IndexQueryDetails;
+import org.opensearch.sql.spark.execution.statement.StatementState;
 import org.opensearch.sql.spark.execution.statestore.StateStore;
 import org.opensearch.sql.spark.flint.FlintIndexMetadata;
 import org.opensearch.sql.spark.flint.FlintIndexMetadataReader;
@@ -106,7 +109,11 @@ protected JSONObject getResponseFromResultIndex(AsyncQueryJobMetadata asyncQueryJobMetadata)
 
   @Override
   protected JSONObject getResponseFromExecutor(AsyncQueryJobMetadata asyncQueryJobMetadata) {
-    throw new IllegalStateException("[BUG] can't fetch result of index DML query form server");
+    // Consider statement still running if result doc created in submit() is not available yet
+    JSONObject result = new JSONObject();
+    result.put(STATUS_FIELD, StatementState.RUNNING.getState());
+    result.put(ERROR_FIELD, "");
+    return result;
   }
 
   @Override
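Context for this hunk: index DML statements such as DROP INDEX never run as an EMR-S job; `submit()` executes them inline and writes the result doc itself. If `getQueryResponse` falls through to the executor path because that doc is not yet searchable, the handler now reports a synthetic RUNNING state instead of throwing. A standalone sketch of the placeholder response, mirroring the change above and assuming `STATUS_FIELD`/`ERROR_FIELD` resolve to the literal keys "status" and "error":

```java
import org.json.JSONObject;

public final class DmlFallbackSketch {

  // Mirrors the new getResponseFromExecutor(): a synthetic RUNNING response
  // with an empty error, returned until the result doc becomes searchable.
  static JSONObject runningPlaceholder() {
    JSONObject result = new JSONObject();
    result.put("status", "running"); // assumed value of StatementState.RUNNING.getState()
    result.put("error", "");
    return result;
  }

  public static void main(String[] args) {
    // A poller that sees this response simply retries until the result doc
    // written by submit() lands in the result index.
    System.out.println(runningPlaceholder()); // prints the two-field placeholder
  }
}
```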
spark/src/test/java/org/opensearch/sql/spark/asyncquery/AsyncQueryExecutorServiceSpec.java
@@ -15,6 +15,7 @@
 import com.amazonaws.services.emrserverless.model.CancelJobRunResult;
 import com.amazonaws.services.emrserverless.model.GetJobRunResult;
 import com.amazonaws.services.emrserverless.model.JobRun;
+import com.amazonaws.services.emrserverless.model.JobRunState;
 import com.google.common.base.Charsets;
 import com.google.common.collect.ImmutableList;
 import com.google.common.collect.ImmutableMap;
@@ -27,11 +28,13 @@
 import java.util.List;
 import java.util.Optional;
 import lombok.Getter;
+import lombok.RequiredArgsConstructor;
 import lombok.SneakyThrows;
 import org.apache.commons.lang3.StringUtils;
 import org.junit.After;
 import org.junit.Before;
 import org.opensearch.action.admin.indices.create.CreateIndexRequest;
+import org.opensearch.action.admin.indices.delete.DeleteIndexRequest;
 import org.opensearch.action.search.SearchRequest;
 import org.opensearch.action.search.SearchResponse;
 import org.opensearch.client.node.NodeClient;
@@ -41,6 +44,7 @@
 import org.opensearch.common.settings.Settings;
 import org.opensearch.common.xcontent.XContentType;
 import org.opensearch.index.query.QueryBuilder;
+import org.opensearch.index.seqno.SequenceNumbers;
 import org.opensearch.plugins.Plugin;
 import org.opensearch.search.builder.SearchSourceBuilder;
 import org.opensearch.sql.datasource.model.DataSourceMetadata;
@@ -63,6 +67,9 @@
 import org.opensearch.sql.spark.execution.session.SessionState;
 import org.opensearch.sql.spark.execution.statestore.StateStore;
 import org.opensearch.sql.spark.flint.FlintIndexMetadataReaderImpl;
+import org.opensearch.sql.spark.flint.FlintIndexState;
+import org.opensearch.sql.spark.flint.FlintIndexStateModel;
+import org.opensearch.sql.spark.flint.FlintIndexType;
 import org.opensearch.sql.spark.leasemanager.DefaultLeaseManager;
 import org.opensearch.sql.spark.response.JobExecutionResponseReader;
 import org.opensearch.sql.storage.DataSourceFactory;
@@ -189,10 +196,17 @@ private DataSourceServiceImpl createDataSourceService() {
 
   protected AsyncQueryExecutorService createAsyncQueryExecutorService(
       EMRServerlessClient emrServerlessClient) {
+    return createAsyncQueryExecutorService(
+        emrServerlessClient, new JobExecutionResponseReader(client));
+  }
+
+  /** Pass a custom response reader which can mock interaction between PPL plugin and EMR-S job. */
+  protected AsyncQueryExecutorService createAsyncQueryExecutorService(
+      EMRServerlessClient emrServerlessClient,
+      JobExecutionResponseReader jobExecutionResponseReader) {
     StateStore stateStore = new StateStore(client, clusterService);
     AsyncQueryJobMetadataStorageService asyncQueryJobMetadataStorageService =
         new OpensearchAsyncQueryJobMetadataStorageService(stateStore);
-    JobExecutionResponseReader jobExecutionResponseReader = new JobExecutionResponseReader(client);
     SparkQueryDispatcher sparkQueryDispatcher =
         new SparkQueryDispatcher(
             emrServerlessClient,
@@ -215,6 +229,7 @@ public static class LocalEMRSClient implements EMRServerlessClient {
     private int startJobRunCalled = 0;
     private int cancelJobRunCalled = 0;
     private int getJobResult = 0;
+    private JobRunState jobState = JobRunState.RUNNING;
 
     @Getter private StartJobRequest jobRequest;
@@ -229,7 +244,7 @@ public String startJobRun(StartJobRequest startJobRequest) {
     public GetJobRunResult getJobRunResult(String applicationId, String jobId) {
       getJobResult++;
       JobRun jobRun = new JobRun();
-      jobRun.setState("RUNNING");
+      jobRun.setState(jobState.toString());
       return new GetJobRunResult().withJobRun(jobRun);
     }
@@ -250,6 +265,10 @@ public void cancelJobRunCalled(int expectedTimes) {
     public void getJobRunResultCalled(int expectedTimes) {
       assertEquals(expectedTimes, getJobResult);
     }
+
+    public void setJobState(JobRunState jobState) {
+      this.jobState = jobState;
+    }
   }
 
   public SparkExecutionEngineConfig sparkExecutionEngineConfig() {
@@ -306,6 +325,111 @@ public String loadResultIndexMappings() {
     return Resources.toString(url, Charsets.UTF_8);
   }
 
+  public class MockFlintSparkJob {
+
+    private FlintIndexStateModel stateModel;
+
+    public MockFlintSparkJob(String latestId) {
+      assertNotNull(latestId);
+      stateModel =
+          new FlintIndexStateModel(
+              FlintIndexState.EMPTY,
+              "mockAppId",
+              "mockJobId",
+              latestId,
+              DATASOURCE,
+              System.currentTimeMillis(),
+              "",
+              SequenceNumbers.UNASSIGNED_SEQ_NO,
+              SequenceNumbers.UNASSIGNED_PRIMARY_TERM);
+      stateModel = StateStore.createFlintIndexState(stateStore, DATASOURCE).apply(stateModel);
+    }
+
+    public void refreshing() {
+      stateModel =
+          StateStore.updateFlintIndexState(stateStore, DATASOURCE)
+              .apply(stateModel, FlintIndexState.REFRESHING);
+    }
+
+    public void cancelling() {
+      stateModel =
+          StateStore.updateFlintIndexState(stateStore, DATASOURCE)
+              .apply(stateModel, FlintIndexState.CANCELLING);
+    }
+
+    public void active() {
+      stateModel =
+          StateStore.updateFlintIndexState(stateStore, DATASOURCE)
+              .apply(stateModel, FlintIndexState.ACTIVE);
+    }
+
+    public void deleting() {
+      stateModel =
+          StateStore.updateFlintIndexState(stateStore, DATASOURCE)
+              .apply(stateModel, FlintIndexState.DELETING);
+    }
+
+    public void deleted() {
+      stateModel =
+          StateStore.updateFlintIndexState(stateStore, DATASOURCE)
+              .apply(stateModel, FlintIndexState.DELETED);
+    }
+
+    void assertState(FlintIndexState expected) {
+      Optional<FlintIndexStateModel> stateModelOpt =
+          StateStore.getFlintIndexState(stateStore, DATASOURCE).apply(stateModel.getId());
+      assertTrue((stateModelOpt.isPresent()));
+      assertEquals(expected, stateModelOpt.get().getIndexState());
+    }
+  }
+
+  @RequiredArgsConstructor
+  public class FlintDatasetMock {
+    final String query;
+    final FlintIndexType indexType;
+    final String indexName;
+    boolean isLegacy = false;
+    String latestId;
+
+    FlintDatasetMock isLegacy(boolean isLegacy) {
+      this.isLegacy = isLegacy;
+      return this;
+    }
+
+    FlintDatasetMock latestId(String latestId) {
+      this.latestId = latestId;
+      return this;
+    }
+
+    public void createIndex() {
+      String pathPrefix = isLegacy ? "flint-index-mappings" : "flint-index-mappings/0.1.1";
+      switch (indexType) {
+        case SKIPPING:
+          createIndexWithMappings(
+              indexName, loadMappings(pathPrefix + "/" + "flint_skipping_index.json"));
+          break;
+        case COVERING:
+          createIndexWithMappings(
+              indexName, loadMappings(pathPrefix + "/" + "flint_covering_index.json"));
+          break;
+        case MATERIALIZED_VIEW:
+          createIndexWithMappings(indexName, loadMappings(pathPrefix + "/" + "flint_mv.json"));
+          break;
+      }
+    }
+
+    @SneakyThrows
+    public void deleteIndex() {
+      client().admin().indices().delete(new DeleteIndexRequest().indices(indexName)).get();
+    }
+  }
+
+  @SneakyThrows
+  public static String loadMappings(String path) {
+    URL url = Resources.getResource(path);
+    return Resources.toString(url, Charsets.UTF_8);
+  }
+
   public void createIndexWithMappings(String indexName, String metadata) {
     CreateIndexRequest request = new CreateIndexRequest(indexName);
     request.mapping(metadata, XContentType.JSON);
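Taken together, the additions above let an integration test script the whole lifecycle without a real EMR-S cluster: `LocalEMRSClient.setJobState` fakes the job's terminal state, `MockFlintSparkJob` drives the Flint index state machine, and `FlintDatasetMock` installs index mapping fixtures. A sketch of how a drop-index IT might wire them up, assumed to run inside a subclass of this spec so the inner classes and `createAsyncQueryExecutorService` are in scope; the query string, index name, and latest id are illustrative:

```java
// Hypothetical IT body built on the helpers above; not the commit's actual tests.
LocalEMRSClient emrsClient = new LocalEMRSClient();
emrsClient.setJobState(JobRunState.CANCELLED); // pretend the streaming job was cancelled

FlintDatasetMock dataset =
    new FlintDatasetMock(
            "DROP SKIPPING INDEX ON mys3.default.http_logs", // illustrative query
            FlintIndexType.SKIPPING,
            "flint_mys3_default_http_logs_skipping_index")
        .latestId("skippingIndexId");
dataset.createIndex(); // install the Flint index mapping fixture

MockFlintSparkJob indexJob = new MockFlintSparkJob(dataset.latestId);
indexJob.refreshing(); // put the index state machine into REFRESHING

AsyncQueryExecutorService service = createAsyncQueryExecutorService(emrsClient);
// ... submit the DROP query via service, poll getAsyncQueryResults() until it
// leaves RUNNING, then verify where the handler left the state machine:
indexJob.assertState(FlintIndexState.DELETED);
```

Making the response reader injectable via the new `createAsyncQueryExecutorService` overload is what lets a test stub the EMR-S result-doc interaction instead of standing up Spark.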
(Diff of the remaining three changed files not rendered here.)
