From bb68daa64d75be111bc6fcd5c08eb4c97abe92f6 Mon Sep 17 00:00:00 2001 From: Sean Kao Date: Mon, 25 Mar 2024 10:49:45 -0700 Subject: [PATCH] Bug Fix: Escape query in spark submit parameter (#2587) * escape query in spark submit parameter Signed-off-by: Sean Kao * spotless Signed-off-by: Sean Kao * test case for special character Signed-off-by: Sean Kao --------- Signed-off-by: Sean Kao (cherry picked from commit 2bcf0b8b3371558a60200c8b994ee6de64ddcf6e) --- common/build.gradle | 1 + core/build.gradle | 1 + legacy/build.gradle | 1 + .../model/SparkSubmitParameters.java | 8 ++++++- .../model/SparkSubmitParametersTest.java | 23 ++++++++++++++++--- 5 files changed, 30 insertions(+), 4 deletions(-) diff --git a/common/build.gradle b/common/build.gradle index 799e07dd08..5e1759fc64 100644 --- a/common/build.gradle +++ b/common/build.gradle @@ -38,6 +38,7 @@ dependencies { api group: 'org.apache.logging.log4j', name: 'log4j-core', version:"${versions.log4j}" api group: 'org.apache.commons', name: 'commons-lang3', version: '3.12.0' api group: 'com.squareup.okhttp3', name: 'okhttp', version: '4.9.3' + api group: 'org.apache.commons', name: 'commons-text', version: '1.10.0' implementation 'com.github.babbel:okhttp-aws-signer:1.0.2' api group: 'com.amazonaws', name: 'aws-java-sdk-core', version: "${aws_java_sdk_version}" api group: 'com.amazonaws', name: 'aws-java-sdk-sts', version: "${aws_java_sdk_version}" diff --git a/core/build.gradle b/core/build.gradle index fcf25f4983..1c3b467bb9 100644 --- a/core/build.gradle +++ b/core/build.gradle @@ -37,6 +37,7 @@ repositories { dependencies { api group: 'com.google.guava', name: 'guava', version: '32.0.1-jre' api group: 'org.apache.commons', name: 'commons-lang3', version: '3.12.0' + api group: 'org.apache.commons', name: 'commons-text', version: '1.10.0' api group: 'com.facebook.presto', name: 'presto-matching', version: '0.240' api group: 'org.apache.commons', name: 'commons-math3', version: '3.6.1' api "com.fasterxml.jackson.core:jackson-core:${versions.jackson}" diff --git a/legacy/build.gradle b/legacy/build.gradle index db4f930a96..677ca560cb 100644 --- a/legacy/build.gradle +++ b/legacy/build.gradle @@ -92,6 +92,7 @@ dependencies { implementation group: 'com.google.guava', name: 'guava', version: '32.0.1-jre' implementation group: 'org.json', name: 'json', version:'20231013' implementation group: 'org.apache.commons', name: 'commons-lang3', version: '3.12.0' + implementation group: 'org.apache.commons', name: 'commons-text', version: '1.10.0' implementation group: 'org.opensearch', name: 'opensearch', version: "${opensearch_version}" // add geo module as dependency. https://github.com/opensearch-project/OpenSearch/pull/4180/. implementation group: 'org.opensearch.plugin', name: 'geo', version: "${opensearch_version}" diff --git a/spark/src/main/java/org/opensearch/sql/spark/asyncquery/model/SparkSubmitParameters.java b/spark/src/main/java/org/opensearch/sql/spark/asyncquery/model/SparkSubmitParameters.java index e6d1dcd8c8..11e418f42f 100644 --- a/spark/src/main/java/org/opensearch/sql/spark/asyncquery/model/SparkSubmitParameters.java +++ b/spark/src/main/java/org/opensearch/sql/spark/asyncquery/model/SparkSubmitParameters.java @@ -21,6 +21,7 @@ import java.util.function.Supplier; import lombok.AllArgsConstructor; import lombok.RequiredArgsConstructor; +import org.apache.commons.text.StringEscapeUtils; import org.opensearch.sql.datasource.model.DataSourceMetadata; import org.opensearch.sql.datasource.model.DataSourceType; import org.opensearch.sql.datasources.auth.AuthenticationType; @@ -85,8 +86,13 @@ public Builder clusterName(String clusterName) { return this; } + /** + * For query in spark submit parameters to be parsed correctly, escape the characters in the + * query, then wrap the query with double quotes. + */ public Builder query(String query) { - String wrappedQuery = "\"" + query + "\""; // Wrap the query with double quotes + String escapedQuery = StringEscapeUtils.escapeJava(query); + String wrappedQuery = "\"" + escapedQuery + "\""; config.put(FLINT_JOB_QUERY, wrappedQuery); return this; } diff --git a/spark/src/test/java/org/opensearch/sql/spark/asyncquery/model/SparkSubmitParametersTest.java b/spark/src/test/java/org/opensearch/sql/spark/asyncquery/model/SparkSubmitParametersTest.java index 9b47cfc43a..e732cf698c 100644 --- a/spark/src/test/java/org/opensearch/sql/spark/asyncquery/model/SparkSubmitParametersTest.java +++ b/spark/src/test/java/org/opensearch/sql/spark/asyncquery/model/SparkSubmitParametersTest.java @@ -30,8 +30,25 @@ public void testBuildWithExtraParameters() { @Test public void testBuildQueryString() { - String query = "SHOW tables LIKE \"%\";"; - String params = SparkSubmitParameters.Builder.builder().query(query).build().toString(); - assertTrue(params.contains(query)); + String rawQuery = "SHOW tables LIKE \"%\";"; + String expectedQueryInParams = "\"SHOW tables LIKE \\\"%\\\";\""; + String params = SparkSubmitParameters.Builder.builder().query(rawQuery).build().toString(); + assertTrue(params.contains(expectedQueryInParams)); + } + + @Test + public void testBuildQueryStringNestedQuote() { + String rawQuery = "SELECT '\"1\"'"; + String expectedQueryInParams = "\"SELECT '\\\"1\\\"'\""; + String params = SparkSubmitParameters.Builder.builder().query(rawQuery).build().toString(); + assertTrue(params.contains(expectedQueryInParams)); + } + + @Test + public void testBuildQueryStringSpecialCharacter() { + String rawQuery = "SELECT '{\"test ,:+\\\"inner\\\"/\\|?#><\"}'"; + String expectedQueryInParams = "SELECT '{\\\"test ,:+\\\\\\\"inner\\\\\\\"/\\\\|?#><\\\"}'"; + String params = SparkSubmitParameters.Builder.builder().query(rawQuery).build().toString(); + assertTrue(params.contains(expectedQueryInParams)); } }