From 21fb34b564159bc5d39f10dc58f845f85e21c0f9 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Wed, 13 Nov 2024 17:56:09 -0500 Subject: [PATCH 01/26] Initial checkin for type mapping removal transformer and experimenting w/ Jinjava. Major things to figure out: 1) how to deal with compositing parts of jinja templates (maybe it's just snippets vended as resources and a user writes their own top-level template) and 2) how to suppress reading any part of the json body when only the headers need to be transformed to prevent parsing the json/ndjson for every request through the system (probably minor though since most setups will probably be doing full-transforms on the vast majority of data flowing). Signed-off-by: Greg Schohn --- .../jsonJinjavaTransformer/README.md | 124 ++++++++++++++++++ .../jsonJinjavaTransformer/build.gradle | 19 +++ .../transform/JinjavaTransformer.java | 43 ++++++ ...rations.transform.IJsonTransformerProvider | 1 + .../transform/JinjavaTransformerTest.java | 85 ++++++++++++ .../transform/ITextTransformer.java | 12 ++ ...rations.transform.ITextTransformerProvider | 0 .../README.md | 124 ++++++++++++++++++ .../build.gradle | 19 +++ .../TypeMappingSanitizerTransformer.java | 60 +++++++++ ...rations.transform.IJsonTransformerProvider | 1 + .../TypeMappingSanitizerTransformerTest.java | 44 +++++++ 12 files changed, 532 insertions(+) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/README.md create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/ITextTransformer.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/resources/META-INF/services/org.opensearch.migrations.transform.ITextTransformerProvider create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/README.md create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/build.gradle create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformer.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformerTest.java diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/README.md b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/README.md new file mode 100644 index 000000000..abb81c5e2 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/README.md @@ -0,0 +1,124 @@ +This transformer converts routes for various requests (see below) to indices that used +[multi-type mappings](https://www.elastic.co/guide/en/elasticsearch/reference/5.6/mapping.html) (configured from ES 5.x +and earlier clusters) to work with newer versions of Elasticsearch and OpenSearch. + +## Usage Prior to Elasticsearch 6 + +Let's start with a sample index definition (adapted from the Elasticsearch documentation) with two type mappings and +documents for each of them. +``` +PUT activity +{ + "mappings": { + "user": { + "properties": { + "name": { "type": "text" }, + "user_name": { "type": "keyword" }, + "email": { "type": "keyword" } + } + }, + "post": { + "properties": { + "content": { "type": "text" }, + "user_name": { "type": "keyword" }, + "post_at": { "type": "date" } + } + } + } +} + +PUT activity/user/someuser +{ + "name": "Some User", + "user_name": "user", + "email": "user@example.com" +} + +PUT activity/post/1 +{ + "user_name": "user", + "tweeted_at": "2024-11-13T00:00:00Z", + "content": "change is inevitable" +} + +GET activity/post/_search +{ + "query": { + "match": { + "user_name": "user" + } + } +} +``` + +## Routing data to new indices + +The structure of the documents will need to change. Some options are to use separate indices, drop some of the types +to make an index single-purpose, or to create an index that's the union of all the types' fields. + +With a simple mapping directive, we can define each of these three behaviors. The following yaml shows how to map +documents into two different indices named users and posts: +``` +activity: + user: new_users + post: new_posts +``` + +To drop one, just leave it out: +``` +activity: + user: only_users +``` + +To merge them together, use the same value: +``` +activity: + user: any_activity + post: any_activity +``` + +Any indices that are NOT specified won't be modified - all additions, changes, and queries on those other indices not +specified at the root level will remain untouched. To remove ALL the activity for a given index, specify and empty +index at the top level +``` +activity: {} +``` + +## Final Results + +``` +PUT any_activity +{ + "mappings": { + "properties": { + "type": { + "type": "keyword" + }, + "name": { + "type": "text" + }, + "user_name": { + "type": "keyword" + }, + "email": { + "type": "keyword" + }, + "content": { + "type": "text" + }, + "tweeted_at": { + "type": "date" + } + } + } +} + +PUT any_activity/_doc/someuser +{ + "name": "Some User", + "user_name": "user", + "email": "user@example.com" +} + + +``` \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle new file mode 100644 index 000000000..22dd99683 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle @@ -0,0 +1,19 @@ +plugins { + id 'io.freefair.lombok' +} + +dependencies { + implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') + + implementation group: 'com.hubspot.jinjava', name: 'jinjava', version: "2.7.3" + + testImplementation project(':TrafficCapture:trafficReplayer') + testImplementation testFixtures(project(path: ':testHelperFixtures')) + testImplementation testFixtures(project(path: ':TrafficCapture:trafficReplayer')) + + testImplementation group: 'com.google.guava', name: 'guava' + testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-api' + testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-params' + testImplementation group: 'org.slf4j', name: 'slf4j-api' + testRuntimeOnly group:'org.junit.jupiter', name:'junit-jupiter-engine' +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java new file mode 100644 index 000000000..f01b4d4ab --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -0,0 +1,43 @@ +package org.opensearch.migrations.transform; + +import java.io.File; +import java.io.Reader; +import java.util.HashMap; +import java.util.Map; +import java.util.function.Function; + +import com.fasterxml.jackson.databind.ObjectMapper; +import com.hubspot.jinjava.Jinjava; +import com.hubspot.jinjava.loader.FileLocator; +import lombok.SneakyThrows; + +public class JinjavaTransformer implements IJsonTransformer { + + protected final static ObjectMapper objectMapper = new ObjectMapper(); + protected final String templateString; + protected final Jinjava jinjava; + protected final Function, Map> wrapSourceAsContextConverter; + + public JinjavaTransformer(String templateString, + Function, Map> wrapSourceAsContextConverter) { + this(templateString, wrapSourceAsContextConverter, null); + } + + public JinjavaTransformer(String templateString, + Function, Map> wrapSourceAsContextConverter, + FileLocator fileLocator) + { + this.templateString = templateString; + this.wrapSourceAsContextConverter = wrapSourceAsContextConverter; + this.jinjava = new Jinjava(); + this.jinjava.setResourceLocator(fileLocator); + + } + + @SneakyThrows + @Override + public Map transformJson(Map incomingJson) { + String resultStr = jinjava.render(templateString, wrapSourceAsContextConverter.apply(incomingJson)); + return objectMapper.readValue(resultStr, Map.class); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider new file mode 100644 index 000000000..86105dbfd --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider @@ -0,0 +1 @@ +org.opensearch.migrations.transform.JinJavaTransformer \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java new file mode 100644 index 000000000..20cbf75fc --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java @@ -0,0 +1,85 @@ +package org.opensearch.migrations.transform; + +import java.util.Map; + +import org.junit.jupiter.api.BeforeAll; +import org.junit.jupiter.api.Test; +import org.testcontainers.shaded.com.fasterxml.jackson.databind.ObjectMapper; + +class JinjavaTransformerTest { + + private final static String template = "" + + "{# First, parse the URI to check if it matches the pattern we want to transform #}\n" + + "{% set uri_parts = request.uri.split('/') %}\n" + + "{% set is_type_request = uri_parts | length == 2 %}\n" + + "{% set is_doc_request = uri_parts | length == 3 %}\n" + + "\n" + + "{# If this is a document request, check if we need to transform it based on mapping #}\n" + + "{% if is_doc_request and uri_parts[0] in index_mappings and uri_parts[1] in index_mappings[uri_parts[0]] %}\n" + + " {# This is a document request that needs transformation #}\n" + + " {\n" + + " \"verb\": \"{{ request.verb }}\",\n" + + " \"uri\": \"{{ index_mappings[uri_parts[0]][uri_parts[1]] }}/_doc/{{ uri_parts[2] }}\",\n" + + " \"body\": {{ request.body | tojson }}\n" + + " }\n" + + "{% elif is_type_request and uri_parts[0] in index_mappings %}\n" + + " {# This is an index creation request that needs transformation #}\n" + + " {\n" + + " \"verb\": \"{{ request.verb }}\",\n" + + " \"uri\": \"{{ index_mappings[uri_parts[0]][uri_parts[1]] }}\",\n" + + " \"body\": {\n" + + " \"mappings\": {\n" + + " \"properties\": {\n" + + " \"type\": {\n" + + " \"type\": \"keyword\"\n" + + " }\n" + + " {%- for type_name, type_props in request.body.mappings.items() %}\n" + + " {%- for prop_name, prop_def in type_props.properties.items() %}\n" + + " ,\n" + + " \"{{ prop_name }}\": {{ prop_def | tojson }}\n" + + " {%- endfor %}\n" + + " {%- endfor %}\n" + + " }\n" + + " }\n" + + " }\n" + + " }\n" + + "{% else %}\n" + + " {# Pass through any requests that don't match our transformation patterns #}\n" + + " {{ request | tojson }}\n" + + "{% endif %}"; + + private static JinjavaTransformer indexTypeMappingRewriter; + @BeforeAll + static void initialize() { + var indexMappings = Map.of( + "indexA", Map.of( + "type1", "indexA_1", + "type2", "indexA_2"), + "indexB", Map.of( + "type1", "indexB", + "type2", "indexB"), + "indexC", Map.of( + "type2", "indexC")); + indexTypeMappingRewriter = new JinjavaTransformer(template, request -> + Map.of("index_mappings", indexMappings, + "request", request)); + } + + @Test + public void test() throws Exception { + var testString = + "{\n" + + " \"verb\": \"PUT\",\n" + + " \"uri\": \"indexA/type2/someuser\",\n" + + " \"body\": {\n" + + " \"name\": \"Some User\",\n" + + " \"user_name\": \"user\",\n" + + " \"email\": \"user@example.com\"\n" + + " }\n" + + "}"; + var objMapper = new ObjectMapper(); + var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, Map.class)); + var resultStr = objMapper.writeValueAsString(resultObj); + System.out.println("resultStr = " + resultStr); + } +} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/ITextTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/ITextTransformer.java new file mode 100644 index 000000000..e4da4b051 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/ITextTransformer.java @@ -0,0 +1,12 @@ +package org.opensearch.migrations.transform; + +import java.io.Reader; +import java.util.Map; + +/** + * This is a simple interface to convert a JSON object (String, Map, or Array) into another + * JSON object. Any changes to datastructures, nesting, order, etc should be intentional. + */ +public interface ITextTransformer { + Reader transformJson(Reader incomingText); +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/resources/META-INF/services/org.opensearch.migrations.transform.ITextTransformerProvider b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/resources/META-INF/services/org.opensearch.migrations.transform.ITextTransformerProvider new file mode 100644 index 000000000..e69de29bb diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/README.md b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/README.md new file mode 100644 index 000000000..abb81c5e2 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/README.md @@ -0,0 +1,124 @@ +This transformer converts routes for various requests (see below) to indices that used +[multi-type mappings](https://www.elastic.co/guide/en/elasticsearch/reference/5.6/mapping.html) (configured from ES 5.x +and earlier clusters) to work with newer versions of Elasticsearch and OpenSearch. + +## Usage Prior to Elasticsearch 6 + +Let's start with a sample index definition (adapted from the Elasticsearch documentation) with two type mappings and +documents for each of them. +``` +PUT activity +{ + "mappings": { + "user": { + "properties": { + "name": { "type": "text" }, + "user_name": { "type": "keyword" }, + "email": { "type": "keyword" } + } + }, + "post": { + "properties": { + "content": { "type": "text" }, + "user_name": { "type": "keyword" }, + "post_at": { "type": "date" } + } + } + } +} + +PUT activity/user/someuser +{ + "name": "Some User", + "user_name": "user", + "email": "user@example.com" +} + +PUT activity/post/1 +{ + "user_name": "user", + "tweeted_at": "2024-11-13T00:00:00Z", + "content": "change is inevitable" +} + +GET activity/post/_search +{ + "query": { + "match": { + "user_name": "user" + } + } +} +``` + +## Routing data to new indices + +The structure of the documents will need to change. Some options are to use separate indices, drop some of the types +to make an index single-purpose, or to create an index that's the union of all the types' fields. + +With a simple mapping directive, we can define each of these three behaviors. The following yaml shows how to map +documents into two different indices named users and posts: +``` +activity: + user: new_users + post: new_posts +``` + +To drop one, just leave it out: +``` +activity: + user: only_users +``` + +To merge them together, use the same value: +``` +activity: + user: any_activity + post: any_activity +``` + +Any indices that are NOT specified won't be modified - all additions, changes, and queries on those other indices not +specified at the root level will remain untouched. To remove ALL the activity for a given index, specify and empty +index at the top level +``` +activity: {} +``` + +## Final Results + +``` +PUT any_activity +{ + "mappings": { + "properties": { + "type": { + "type": "keyword" + }, + "name": { + "type": "text" + }, + "user_name": { + "type": "keyword" + }, + "email": { + "type": "keyword" + }, + "content": { + "type": "text" + }, + "tweeted_at": { + "type": "date" + } + } + } +} + +PUT any_activity/_doc/someuser +{ + "name": "Some User", + "user_name": "user", + "email": "user@example.com" +} + + +``` \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/build.gradle new file mode 100644 index 000000000..2bf74f89a --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/build.gradle @@ -0,0 +1,19 @@ +plugins { + id 'io.freefair.lombok' +} + +dependencies { + implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') + + implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJinjavaTransformer') + + testImplementation project(':TrafficCapture:trafficReplayer') + testImplementation testFixtures(project(path: ':testHelperFixtures')) + testImplementation testFixtures(project(path: ':TrafficCapture:trafficReplayer')) + + testImplementation group: 'com.google.guava', name: 'guava' + testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-api' + testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-params' + testImplementation group: 'org.slf4j', name: 'slf4j-api' + testRuntimeOnly group:'org.junit.jupiter', name:'junit-jupiter-engine' +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformer.java new file mode 100644 index 000000000..cbe79b4ec --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformer.java @@ -0,0 +1,60 @@ +package org.opensearch.migrations.transform; + +import java.util.HashMap; +import java.util.Map; +import java.util.function.Function; + +public class TypeMappingSanitizerTransformer extends JinjavaTransformer { + + private final static String template = "" + + // First, parse the URI to check if it matches the pattern we want to transform + "{% set uri_parts = request.uri.split('/') %}\n" + + "{% set is_type_request = uri_parts | length == 2 %}\n" + + "{% set is_doc_request = uri_parts | length == 3 %}\n" + + "\n" + + // If this is a document request, check if we need to transform it based on mapping + "{% if is_doc_request and uri_parts[0] in index_mappings and uri_parts[1] in index_mappings[uri_parts[0]] %}\n" + + // This is a document request that needs transformation + " {\n" + + " \"verb\": \"{{ request.verb }}\",\n" + + " \"uri\": \"{{ index_mappings[uri_parts[0]][uri_parts[1]] }}/_doc/{{ uri_parts[2] }}\",\n" + + " \"body\": {{ request.body | tojson }}\n" + + " }\n" + + "{% elif is_type_request and uri_parts[0] in index_mappings %}\n" + + // This is an index creation request that needs transformation + " {\n" + + " \"verb\": \"{{ request.verb }}\",\n" + + " \"uri\": \"{{ index_mappings[uri_parts[0]][uri_parts[1]] }}\",\n" + + " \"body\": {\n" + + " \"mappings\": {\n" + + " \"properties\": {\n" + + " \"type\": {\n" + + " \"type\": \"keyword\"\n" + + " }\n" + + " {%- for type_name, type_props in request.body.mappings.items() %}\n" + + " {%- for prop_name, prop_def in type_props.properties.items() %}\n" + + " ,\n" + + " \"{{ prop_name }}\": {{ prop_def | tojson }}\n" + + " {%- endfor %}\n" + + " {%- endfor %}\n" + + " }\n" + + " }\n" + + " }\n" + + " }\n" + + "{% else %}\n" + + // Pass through + " {{ request | tojson }}\n" + + "{% endif %}"; + + public TypeMappingSanitizerTransformer(Map> indexMappings) { + super(template, getContextWrapper(indexMappings)); + } + + private static Function, Map> + getContextWrapper(Map> indexMappings) + { + return incomingJson -> Map.of( + "index_mappings", indexMappings, + "request", incomingJson); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider new file mode 100644 index 000000000..5beb0df6a --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider @@ -0,0 +1 @@ +org.opensearch.migrations.transform.TypeMappingSanitizerTransformer \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformerTest.java new file mode 100644 index 000000000..0d0e3e409 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformerTest.java @@ -0,0 +1,44 @@ +package org.opensearch.migrations.transform; + +import java.util.Map; + +import org.junit.jupiter.api.BeforeAll; +import org.junit.jupiter.api.Test; +import org.testcontainers.shaded.com.fasterxml.jackson.databind.ObjectMapper; + +class TypeMappingSanitizerTransformerTest { + + + private static TypeMappingSanitizerTransformer indexTypeMappingRewriter; + @BeforeAll + static void initialize() { + var indexMappings = Map.of( + "indexA", Map.of( + "type1", "indexA_1", + "type2", "indexA_2"), + "indexB", Map.of( + "type1", "indexB", + "type2", "indexB"), + "indexC", Map.of( + "type2", "indexC")); + indexTypeMappingRewriter = new TypeMappingSanitizerTransformer(indexMappings); + } + + @Test + public void test() throws Exception { + var testString = + "{\n" + + " \"verb\": \"PUT\",\n" + + " \"uri\": \"indexA/type2/someuser\",\n" + + " \"body\": {\n" + + " \"name\": \"Some User\",\n" + + " \"user_name\": \"user\",\n" + + " \"email\": \"user@example.com\"\n" + + " }\n" + + "}"; + var objMapper = new ObjectMapper(); + var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, Map.class)); + var resultStr = objMapper.writeValueAsString(resultObj); + System.out.println("resultStr = " + resultStr); + } +} \ No newline at end of file From 926e6e8cbb3b865c2e037a43c5b54105e1eb6e3e Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Mon, 18 Nov 2024 13:00:44 -0500 Subject: [PATCH 02/26] Further building out the jinjava and index type mappings transformers so that they can fit w/in the transformation ecosystems. Signed-off-by: Greg Schohn --- ... JsonJMESPathTransformerProviderTest.java} | 10 +- .../transform/JinjavaTransformer.java | 10 +- .../transform/JinjavaTransformerTest.java | 2 +- .../build.gradle | 31 +++++ .../JsonJinjavaTransformerProvider.java | 46 ++++++++ ...rations.transform.IJsonTransformerProvider | 1 + .../JinjavaTransformerProviderTest.java | 107 ++++++++++++++++++ .../src/test/resources/log4j2.properties | 18 +++ .../transform/ITextTransformer.java | 12 -- .../README.md | 0 .../build.gradle | 3 +- .../TypeMappingsSanitizationTransformer.java | 61 ++++++++++ ...rations.transform.IJsonTransformerProvider | 1 + .../src/main/resources/v1/template.jinja | 33 ++++++ ...eMappingsSanitizationTransformerTest.java} | 11 +- .../build.gradle | 32 ++++++ ...appingSanitizationTransformerProvider.java | 28 +++++ ...rations.transform.IJsonTransformerProvider | 1 + .../replay/TypeMappingsSanitizationTest.java | 80 +++++++++++++ .../src/test/resources/log4j2.properties | 18 +++ .../TypeMappingSanitizerTransformer.java | 60 ---------- ...rations.transform.IJsonTransformerProvider | 1 - 22 files changed, 475 insertions(+), 91 deletions(-) rename transformation/transformationPlugins/jsonMessageTransformers/jsonJMESPathMessageTransformerProvider/src/test/java/org/opensearch/migrations/replay/{JsonTransformerTest.java => JsonJMESPathTransformerProviderTest.java} (93%) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/build.gradle create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonJinjavaTransformerProvider.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/resources/log4j2.properties delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/ITextTransformer.java rename transformation/transformationPlugins/jsonMessageTransformers/{jsonTypeMappingsSanitizerTransformer => jsonTypeMappingsSanitizationTransformer}/README.md (100%) rename transformation/transformationPlugins/jsonMessageTransformers/{jsonTypeMappingsSanitizerTransformer => jsonTypeMappingsSanitizationTransformer}/build.gradle (85%) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/v1/template.jinja rename transformation/transformationPlugins/jsonMessageTransformers/{jsonTypeMappingsSanitizerTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformerTest.java => jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java} (81%) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationTest.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/resources/log4j2.properties delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformer.java delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJMESPathMessageTransformerProvider/src/test/java/org/opensearch/migrations/replay/JsonTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJMESPathMessageTransformerProvider/src/test/java/org/opensearch/migrations/replay/JsonJMESPathTransformerProviderTest.java similarity index 93% rename from transformation/transformationPlugins/jsonMessageTransformers/jsonJMESPathMessageTransformerProvider/src/test/java/org/opensearch/migrations/replay/JsonTransformerTest.java rename to transformation/transformationPlugins/jsonMessageTransformers/jsonJMESPathMessageTransformerProvider/src/test/java/org/opensearch/migrations/replay/JsonJMESPathTransformerProviderTest.java index 2885678ab..912fd3c9e 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJMESPathMessageTransformerProvider/src/test/java/org/opensearch/migrations/replay/JsonTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJMESPathMessageTransformerProvider/src/test/java/org/opensearch/migrations/replay/JsonJMESPathTransformerProviderTest.java @@ -4,19 +4,18 @@ import java.util.Map; import org.opensearch.migrations.testutils.WrapWithNettyLeakDetection; -import org.opensearch.migrations.transform.JsonJMESPathTransformer; +import org.opensearch.migrations.transform.JsonJMESPathTransformerProvider; import com.fasterxml.jackson.core.JsonProcessingException; import com.fasterxml.jackson.core.type.TypeReference; import com.fasterxml.jackson.databind.ObjectMapper; -import io.burt.jmespath.jcf.JcfRuntime; import lombok.extern.slf4j.Slf4j; import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.Test; @Slf4j @WrapWithNettyLeakDetection(disableLeakChecks = true) -class JsonTransformerTest { +class JsonJMESPathTransformerProviderTest { static final String TEST_INPUT_REQUEST = "{\n" + " \"method\": \"PUT\",\n" + " \"URI\": \"/oldStyleIndex\",\n" @@ -56,7 +55,7 @@ class JsonTransformerTest { static final TypeReference> TYPE_REFERENCE_FOR_MAP_TYPE = new TypeReference<>() { }; - public JsonTransformerTest() { + public JsonJMESPathTransformerProviderTest() { mapper.configure(com.fasterxml.jackson.core.JsonParser.Feature.ALLOW_COMMENTS, true); } @@ -76,7 +75,8 @@ static String emitJson(ObjectMapper mapper, Object transformedDocument) throws J @Test public void testSimpleTransform() throws JsonProcessingException { var documentJson = parseStringAsJson(mapper, TEST_INPUT_REQUEST); - var transformer = new JsonJMESPathTransformer(new JcfRuntime(), EXCISE_TYPE_EXPRESSION_STRING); + var transformer = new JsonJMESPathTransformerProvider().createTransformer(Map.of( + "script", EXCISE_TYPE_EXPRESSION_STRING)); var transformedDocument = transformer.transformJson(documentJson); var outputStr = emitJson(mapper, transformedDocument); diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index f01b4d4ab..f6704b4c7 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -1,8 +1,5 @@ package org.opensearch.migrations.transform; -import java.io.File; -import java.io.Reader; -import java.util.HashMap; import java.util.Map; import java.util.function.Function; @@ -10,7 +7,9 @@ import com.hubspot.jinjava.Jinjava; import com.hubspot.jinjava.loader.FileLocator; import lombok.SneakyThrows; +import lombok.extern.slf4j.Slf4j; +@Slf4j public class JinjavaTransformer implements IJsonTransformer { protected final static ObjectMapper objectMapper = new ObjectMapper(); @@ -19,8 +18,8 @@ public class JinjavaTransformer implements IJsonTransformer { protected final Function, Map> wrapSourceAsContextConverter; public JinjavaTransformer(String templateString, - Function, Map> wrapSourceAsContextConverter) { - this(templateString, wrapSourceAsContextConverter, null); + Function, Map> contextProviderFromSource) { + this(templateString, contextProviderFromSource, null); } public JinjavaTransformer(String templateString, @@ -38,6 +37,7 @@ public JinjavaTransformer(String templateString, @Override public Map transformJson(Map incomingJson) { String resultStr = jinjava.render(templateString, wrapSourceAsContextConverter.apply(incomingJson)); + log.atInfo().setMessage("output = {}").addArgument(resultStr).log(); return objectMapper.readValue(resultStr, Map.class); } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java index 20cbf75fc..3a3b1abd7 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java @@ -82,4 +82,4 @@ public void test() throws Exception { var resultStr = objMapper.writeValueAsString(resultObj); System.out.println("resultStr = " + resultStr); } -} \ No newline at end of file +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/build.gradle new file mode 100644 index 000000000..3e02184bb --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/build.gradle @@ -0,0 +1,31 @@ +buildscript { + dependencies { + classpath 'org.junit.platform:junit-platform-gradle-plugin:1.0.1' + } +} + +plugins { + id 'io.freefair.lombok' +} + +dependencies { + implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') + implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJinjavaTransformer') + + implementation group: 'org.apache.commons', name: 'commons-collections4', version: '4.4' + + testImplementation project(':TrafficCapture:trafficReplayer') + testImplementation testFixtures(project(path: ':testHelperFixtures')) + testImplementation testFixtures(project(path: ':TrafficCapture:trafficReplayer')) + + testImplementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' + testImplementation group: 'io.netty', name: 'netty-all' + testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-api' + testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-params' + testImplementation group: 'org.slf4j', name: 'slf4j-api' + testRuntimeOnly group:'org.junit.jupiter', name:'junit-jupiter-engine' +} + +tasks.named('test') { + useJUnitPlatform() +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonJinjavaTransformerProvider.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonJinjavaTransformerProvider.java new file mode 100644 index 000000000..b8cc45eca --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonJinjavaTransformerProvider.java @@ -0,0 +1,46 @@ +package org.opensearch.migrations.transform; + +import java.util.Collections; +import java.util.Map; + +import org.apache.commons.collections4.map.CompositeMap; + + +public class JsonJinjavaTransformerProvider implements IJsonTransformerProvider { + + public static final String REQUEST_KEY = "request"; + public static final String TEMPLATE_KEY = "template"; + + @Override + public IJsonTransformer createTransformer(Object jsonConfig) { + if (!(jsonConfig instanceof Map)) { + throw new IllegalArgumentException(getConfigUsageStr()); + } + var config = (Map) jsonConfig; + if (config.containsKey(REQUEST_KEY)) { + throw new IllegalArgumentException(REQUEST_KEY + " was already present in the incoming configuration. " + + getConfigUsageStr()); + } + if (!config.containsKey(TEMPLATE_KEY)) { + throw new IllegalArgumentException(TEMPLATE_KEY + " was not present in the incoming configuration. " + + getConfigUsageStr()); + } + + var immutableBaseConfig = Collections.unmodifiableMap(config); + try { + var templateString = (String) config.get(TEMPLATE_KEY); + return new JinjavaTransformer(templateString, + source -> new CompositeMap<>(Map.of(REQUEST_KEY, source), immutableBaseConfig)); + } catch (ClassCastException e) { + throw new IllegalArgumentException(getConfigUsageStr(), e); + } + } + + private String getConfigUsageStr() { + return this.getClass().getName() + " expects the incoming configuration to be a Map " + + "with a '" + TEMPLATE_KEY + "' key that specifies the Jinjava template. " + + "The key '" + REQUEST_KEY + "' must not be specified so that it can be used to pass the source document " + + "into the template. " + + "The other top-level keys will be passed directly to the template."; + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider new file mode 100644 index 000000000..8d65ec87b --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider @@ -0,0 +1 @@ +org.opensearch.migrations.transform.JsonJinjavaTransformerProvider \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java new file mode 100644 index 000000000..ca5ae3657 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java @@ -0,0 +1,107 @@ +package org.opensearch.migrations.replay; + +import java.util.LinkedHashMap; +import java.util.Map; + +import org.opensearch.migrations.testutils.WrapWithNettyLeakDetection; +import org.opensearch.migrations.transform.JsonJinjavaTransformerProvider; + +import com.fasterxml.jackson.core.JsonProcessingException; +import com.fasterxml.jackson.core.type.TypeReference; +import com.fasterxml.jackson.databind.ObjectMapper; +import lombok.extern.slf4j.Slf4j; +import org.junit.jupiter.api.Assertions; +import org.junit.jupiter.api.Test; + +@Slf4j +@WrapWithNettyLeakDetection(disableLeakChecks = true) +class JinjavaTransformerProviderTest { + static final String TEST_INPUT_REQUEST = "{\n" + + " \"method\": \"PUT\",\n" + + " \"URI\": \"/oldStyleIndex\",\n" + + " \"headers\": {\n" + + " \"host\": \"127.0.0.1\"\n" + + " },\n" + + " \"payload\": {\n" + + " \"inlinedJsonBody\": {\n" + + " \"mappings\": {\n" + + " \"oldType\": {\n" + + " \"properties\": {\n" + + " \"field1\": {\n" + + " \"type\": \"text\"\n" + + " },\n" + + " \"field2\": {\n" + + " \"type\": \"keyword\"\n" + + " }\n" + + " }\n" + + " }\n" + + " }\n" + + " }\n" + + " }\n" + + "}\n"; + + static final String EXCISE_TYPE_EXPRESSION_STRING = "{\n" + + " \"method\": method,\n" + + " \"URI\": URI,\n" + + " \"headers\": headers,\n" + + " \"payload\": {\n" + + " \"inlinedJsonBody\": {\n" + + " \"mappings\": payload.inlinedJsonBody.mappings.oldType\n" + + " }\n" + + " }\n" + + "}"; + + ObjectMapper mapper = new ObjectMapper(); + static final TypeReference> TYPE_REFERENCE_FOR_MAP_TYPE = new TypeReference<>() { + }; + + public JinjavaTransformerProviderTest() { + mapper.configure(com.fasterxml.jackson.core.JsonParser.Feature.ALLOW_COMMENTS, true); + } + + static Map parseStringAsJson(ObjectMapper mapper, String jsonStr) throws JsonProcessingException { + return mapper.readValue(jsonStr, TYPE_REFERENCE_FOR_MAP_TYPE); + } + + static String normalize(ObjectMapper mapper, String input) throws JsonProcessingException { + return mapper.writeValueAsString(mapper.readTree(input)); + } + + static String emitJson(ObjectMapper mapper, Object transformedDocument) throws JsonProcessingException { + mapper.configure(com.fasterxml.jackson.core.JsonParser.Feature.ALLOW_COMMENTS, true); // optional + return mapper.writeValueAsString(transformedDocument); + } + + @Test + public void testSimpleTransform() throws JsonProcessingException { + var documentJson = parseStringAsJson(mapper, TEST_INPUT_REQUEST); + var transformer = new JsonJinjavaTransformerProvider().createTransformer(Map.of( + "script", EXCISE_TYPE_EXPRESSION_STRING)); + var transformedDocument = transformer.transformJson(documentJson); + var outputStr = emitJson(mapper, transformedDocument); + + final String TEST_OUTPUT_REQUEST = "{\n" + + " \"method\": \"PUT\",\n" + + " \"URI\": \"/oldStyleIndex\",\n" + + " \"headers\": {\n" + + " \"host\": \"127.0.0.1\"\n" + + " },\n" + + " \"payload\": {\n" + + " \"inlinedJsonBody\": {\n" + + " \"mappings\": {\n" + + " \"properties\": {\n" + + " \"field1\": {\n" + + " \"type\": \"text\"\n" + + " },\n" + + " \"field2\": {\n" + + " \"type\": \"keyword\"\n" + + " }\n" + + " }\n" + + " }\n" + + " }\n" + + " }\n" + + "}"; + + Assertions.assertEquals(normalize(mapper, TEST_OUTPUT_REQUEST), normalize(mapper, outputStr)); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/resources/log4j2.properties b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/resources/log4j2.properties new file mode 100644 index 000000000..6adca47b5 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/resources/log4j2.properties @@ -0,0 +1,18 @@ +status = WARN + +property.ownedPackagesLogLevel=${sys:migrationLogLevel:-INFO} + +appender.console.type = Console +appender.console.name = Console +appender.console.target = SYSTEM_OUT +appender.console.layout.type = PatternLayout +appender.console.layout.pattern = %d{yyyy-MM-dd HH:mm:ss,SSS}{UTC} %p %c{1.} [%t] %m%n + +rootLogger.level = info +rootLogger.appenderRef.console.ref = Console + +# Allow customization of owned package logs +logger.rfs.name = org.opensearch.migrations.bulkload +logger.rfs.level = ${ownedPackagesLogLevel} +logger.migration.name = org.opensearch.migrations +logger.migration.level = ${ownedPackagesLogLevel} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/ITextTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/ITextTransformer.java deleted file mode 100644 index e4da4b051..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/ITextTransformer.java +++ /dev/null @@ -1,12 +0,0 @@ -package org.opensearch.migrations.transform; - -import java.io.Reader; -import java.util.Map; - -/** - * This is a simple interface to convert a JSON object (String, Map, or Array) into another - * JSON object. Any changes to datastructures, nesting, order, etc should be intentional. - */ -public interface ITextTransformer { - Reader transformJson(Reader incomingText); -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/README.md b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md similarity index 100% rename from transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/README.md rename to transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle similarity index 85% rename from transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/build.gradle rename to transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle index 2bf74f89a..f48b1c329 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle @@ -1,11 +1,12 @@ plugins { id 'io.freefair.lombok' + id 'java-library' } dependencies { implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') - implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJinjavaTransformer') + api project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJinjavaTransformer') testImplementation project(':TrafficCapture:trafficReplayer') testImplementation testFixtures(project(path: ':testHelperFixtures')) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java new file mode 100644 index 000000000..507c9191d --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java @@ -0,0 +1,61 @@ +package org.opensearch.migrations.transform; + +import java.util.Map; +import java.util.function.Function; + +public class TypeMappingsSanitizationTransformer extends JinjavaTransformer { + + private final static String template = "" + + // First, parse the URI to check if it matches the pattern we want to transform + "{% set uri_parts = request.URI.split('/') | reject('equalto', '') | list %}\n" + + "\n" + + // If this is a document request, check if we need to transform it based on mapping + "{% if uri_parts | length == 3 and uri_parts[0] in index_mappings and uri_parts[1] in index_mappings[uri_parts[0]] %}\n" + + // This is a document request that needs transformation + " {\n" + + " \"method\": \"{{ request.method }}\",\n" + + " \"URI\": \"/{{ index_mappings[uri_parts[0]][uri_parts[1]] }}/_doc/{{ uri_parts[2] }}\",\n" + + " \"headers\": {{ request.headers | tojson }},\n" + + " \"payload\": {{ request.payload | tojson }}\n" + + " }\n" + + "{% elif uri_parts | length == 2 and uri_parts[0] in index_mappings %}\n" + + // This is an index creation request that needs transformation + " {\n" + + " \"method\": \"{{ request.method }}\",\n" + + " \"URI\": \"{{ index_mappings[uri_parts[0]][uri_parts[1]] }}\",\n" + + " \"payload\": {\n" + + " \"inlinedJsonBody\": {\n" + + " \"mappings\": {\n" + + " \"properties\": {\n" + + " \"type\": {\n" + + " \"type\": \"keyword\"\n" + + " }\n" + + " {%- for type_name, type_props in request.body.mappings.items() %}\n" + + " {%- for prop_name, prop_def in type_props.properties.items() %}\n" + + " ,\n" + + " \"{{ prop_name }}\": {{ prop_def | tojson }}\n" + + " {%- endfor %}\n" + + " {%- endfor %}\n" + + " }\n" + + " }\n" + + " }\n" + + " }\n" + + " }\n" + + "{% else %}\n" + + // Pass through + " { \"urilen\": {{uri_parts | length}} }" + + //" {{ request | tojson }}\n" + + "{% endif %}"; + + public TypeMappingsSanitizationTransformer(Map> indexMappings) { + super(template, getContextWrapper(indexMappings)); + } + + private static Function, Map> + getContextWrapper(Map> indexMappings) + { + return incomingJson -> Map.of( + "index_mappings", indexMappings, + "request", incomingJson); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider new file mode 100644 index 000000000..dac77603a --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider @@ -0,0 +1 @@ +org.opensearch.migrations.transform.TypeMappingsSanitizationTransformer \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/v1/template.jinja b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/v1/template.jinja new file mode 100644 index 000000000..e9222e483 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/v1/template.jinja @@ -0,0 +1,33 @@ +{% set uri_parts = request.URI.split('/') | reject('equalto', '') | list %} + +{% if uri_parts | length == 3 and uri_parts[0] in index_mappings and uri_parts[1] in index_mappings[uri_parts[0]] %} + { + "method": "{{ request.method }}", + "URI": "/{{ index_mappings[uri_parts[0]][uri_parts[1]] }}/_doc/{{ uri_parts[2] }}", + "headers": {{ request.headers | tojson }}, + "payload": {{ request.payload | tojson }} + } +{% elif uri_parts | length == 2 and uri_parts[0] in index_mappings %} + { + "method": "{{ request.method }}", + "URI": "{{ index_mappings[uri_parts[0]][uri_parts[1]] }}", + "payload": { + "inlinedJsonBody": { + "mappings": { + "properties": { + "type": { + "type": "keyword" + } + {%- for type_name, type_props in request.body.mappings.items() %} + {%- for prop_name, prop_def in type_props.properties.items() %} + , + "{{ prop_name }}": {{ prop_def | tojson }} + {%- endfor %} + {%- endfor %} + } + } + } + } + } +{% else %} + { "urilen": {{uri_parts | length}} }{% endif %} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java similarity index 81% rename from transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformerTest.java rename to transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java index 0d0e3e409..603f4e5d0 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java @@ -6,10 +6,9 @@ import org.junit.jupiter.api.Test; import org.testcontainers.shaded.com.fasterxml.jackson.databind.ObjectMapper; -class TypeMappingSanitizerTransformerTest { +class TypeMappingsSanitizationTransformerTest { - - private static TypeMappingSanitizerTransformer indexTypeMappingRewriter; + private static TypeMappingsSanitizationTransformer indexTypeMappingRewriter; @BeforeAll static void initialize() { var indexMappings = Map.of( @@ -21,7 +20,7 @@ static void initialize() { "type2", "indexB"), "indexC", Map.of( "type2", "indexC")); - indexTypeMappingRewriter = new TypeMappingSanitizerTransformer(indexMappings); + indexTypeMappingRewriter = new TypeMappingsSanitizationTransformer(indexMappings); } @Test @@ -29,7 +28,7 @@ public void test() throws Exception { var testString = "{\n" + " \"verb\": \"PUT\",\n" + - " \"uri\": \"indexA/type2/someuser\",\n" + + " \"uri\": \"/indexA/type2/someuser\",\n" + " \"body\": {\n" + " \"name\": \"Some User\",\n" + " \"user_name\": \"user\",\n" + @@ -41,4 +40,4 @@ public void test() throws Exception { var resultStr = objMapper.writeValueAsString(resultObj); System.out.println("resultStr = " + resultStr); } -} \ No newline at end of file +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle new file mode 100644 index 000000000..128adb34c --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle @@ -0,0 +1,32 @@ +buildscript { + dependencies { + classpath 'org.junit.platform:junit-platform-gradle-plugin:1.0.1' + } +} + +plugins { + id 'io.freefair.lombok' +} + +dependencies { + implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') + implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformer') + + testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformer') + testImplementation project(':coreUtilities') + testImplementation project(':TrafficCapture:trafficReplayer') + testImplementation testFixtures(project(path: ':coreUtilities')) + testImplementation testFixtures(project(path: ':testHelperFixtures')) + testImplementation testFixtures(project(path: ':TrafficCapture:trafficReplayer')) + + testImplementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' + testImplementation group: 'io.netty', name: 'netty-all' + testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-api' + testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-params' + testImplementation group: 'org.slf4j', name: 'slf4j-api' + testRuntimeOnly group:'org.junit.jupiter', name:'junit-jupiter-engine' +} + +tasks.named('test') { + useJUnitPlatform() +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java new file mode 100644 index 000000000..fe64452c9 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java @@ -0,0 +1,28 @@ +package org.opensearch.migrations.transform; + +import java.util.Map; + +public class TypeMappingSanitizationTransformerProvider implements IJsonTransformerProvider { + + @Override + public IJsonTransformer createTransformer(Object jsonConfig) { + try { + if (jsonConfig instanceof Map) { + return new TypeMappingsSanitizationTransformer((Map>) jsonConfig); + } else { + throw new IllegalArgumentException(getConfigUsageStr()); + } + } catch (ClassCastException e) { + throw new IllegalArgumentException(getConfigUsageStr(), e); + } + } + + private String getConfigUsageStr() { + return this.getClass().getName() + + " expects the incoming configuration " + + "to be a Map>. " + + "The top-level key is a source index name, that key's children values are the index's type mappings. " + + "The value for the inner keys is the target index name that the " + + "source type's documents should be written to."; + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider new file mode 100644 index 000000000..fb490338a --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider @@ -0,0 +1 @@ +org.opensearch.migrations.transform.TypeMappingSanitizationTransformerProvider \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationTest.java new file mode 100644 index 000000000..18056ca7d --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationTest.java @@ -0,0 +1,80 @@ +package org.opensearch.migrations.replay; + +import java.util.Map; + +import org.opensearch.migrations.testutils.WrapWithNettyLeakDetection; +import org.opensearch.migrations.transform.TypeMappingSanitizationTransformerProvider; + +import com.fasterxml.jackson.core.JsonProcessingException; +import com.fasterxml.jackson.core.type.TypeReference; +import com.fasterxml.jackson.databind.ObjectMapper; +import lombok.extern.slf4j.Slf4j; +import org.junit.jupiter.api.Assertions; +import org.junit.jupiter.api.Test; + +@Slf4j +@WrapWithNettyLeakDetection(disableLeakChecks = true) +public class TypeMappingsSanitizationTest { + + static final String TEST_INPUT_REQUEST = "{\n" + + " \"method\": \"PUT\",\n" + + " \"URI\": \"/indexA/type2/someuser\",\n" + + " \"headers\": {\n" + + " \"host\": \"127.0.0.1\"\n" + + " },\n" + + " \"payload\": {\n" + + " \"inlinedJsonBody\": {\n" + + " \"name\": \"Some User\",\n" + + " \"user_name\": \"user\",\n" + + " \"email\": \"user@example.com\"\n" + + " }\n" + + " }\n" + + "}\n"; + + + ObjectMapper mapper = new ObjectMapper(); + + static String normalize(ObjectMapper mapper, String input) throws JsonProcessingException { + return mapper.writeValueAsString(mapper.readTree(input)); + } + + static String emitJson(ObjectMapper mapper, Object transformedDocument) throws JsonProcessingException { + mapper.configure(com.fasterxml.jackson.core.JsonParser.Feature.ALLOW_COMMENTS, true); // optional + return mapper.writeValueAsString(transformedDocument); + } + + @Test + public void testSimpleTransform() throws JsonProcessingException { + var config = Map.of( + "indexA", Map.of( + "type1", "indexA_1", + "type2", "indexA_2"), + "indexB", Map.of( + "type1", "indexB", + "type2", "indexB"), + "indexC", Map.of( + "type2", "indexC"));; + var transformer = new TypeMappingSanitizationTransformerProvider().createTransformer(config); + var transformedDocument = + transformer.transformJson(mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>(){})); + var outputStr = emitJson(mapper, transformedDocument); + + log.atInfo().setMessage("output={}").addArgument(outputStr).log(); + final String TEST_OUTPUT_REQUEST = "{\n" + + " \"method\": \"PUT\",\n" + + " \"URI\": \"/indexA_2/_doc/someuser\",\n" + + " \"headers\": {\n" + + " \"host\": \"127.0.0.1\"\n" + + " },\n" + + " \"payload\": {\n" + + " \"inlinedJsonBody\": {\n" + + " \"name\": \"Some User\",\n" + + " \"user_name\": \"user\",\n" + + " \"email\": \"user@example.com\"\n" + + " }\n" + + " }\n" + + "}\n"; + + Assertions.assertEquals(normalize(mapper, TEST_OUTPUT_REQUEST), normalize(mapper, outputStr)); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/resources/log4j2.properties b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/resources/log4j2.properties new file mode 100644 index 000000000..6adca47b5 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/resources/log4j2.properties @@ -0,0 +1,18 @@ +status = WARN + +property.ownedPackagesLogLevel=${sys:migrationLogLevel:-INFO} + +appender.console.type = Console +appender.console.name = Console +appender.console.target = SYSTEM_OUT +appender.console.layout.type = PatternLayout +appender.console.layout.pattern = %d{yyyy-MM-dd HH:mm:ss,SSS}{UTC} %p %c{1.} [%t] %m%n + +rootLogger.level = info +rootLogger.appenderRef.console.ref = Console + +# Allow customization of owned package logs +logger.rfs.name = org.opensearch.migrations.bulkload +logger.rfs.level = ${ownedPackagesLogLevel} +logger.migration.name = org.opensearch.migrations +logger.migration.level = ${ownedPackagesLogLevel} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformer.java deleted file mode 100644 index cbe79b4ec..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizerTransformer.java +++ /dev/null @@ -1,60 +0,0 @@ -package org.opensearch.migrations.transform; - -import java.util.HashMap; -import java.util.Map; -import java.util.function.Function; - -public class TypeMappingSanitizerTransformer extends JinjavaTransformer { - - private final static String template = "" + - // First, parse the URI to check if it matches the pattern we want to transform - "{% set uri_parts = request.uri.split('/') %}\n" + - "{% set is_type_request = uri_parts | length == 2 %}\n" + - "{% set is_doc_request = uri_parts | length == 3 %}\n" + - "\n" + - // If this is a document request, check if we need to transform it based on mapping - "{% if is_doc_request and uri_parts[0] in index_mappings and uri_parts[1] in index_mappings[uri_parts[0]] %}\n" + - // This is a document request that needs transformation - " {\n" + - " \"verb\": \"{{ request.verb }}\",\n" + - " \"uri\": \"{{ index_mappings[uri_parts[0]][uri_parts[1]] }}/_doc/{{ uri_parts[2] }}\",\n" + - " \"body\": {{ request.body | tojson }}\n" + - " }\n" + - "{% elif is_type_request and uri_parts[0] in index_mappings %}\n" + - // This is an index creation request that needs transformation - " {\n" + - " \"verb\": \"{{ request.verb }}\",\n" + - " \"uri\": \"{{ index_mappings[uri_parts[0]][uri_parts[1]] }}\",\n" + - " \"body\": {\n" + - " \"mappings\": {\n" + - " \"properties\": {\n" + - " \"type\": {\n" + - " \"type\": \"keyword\"\n" + - " }\n" + - " {%- for type_name, type_props in request.body.mappings.items() %}\n" + - " {%- for prop_name, prop_def in type_props.properties.items() %}\n" + - " ,\n" + - " \"{{ prop_name }}\": {{ prop_def | tojson }}\n" + - " {%- endfor %}\n" + - " {%- endfor %}\n" + - " }\n" + - " }\n" + - " }\n" + - " }\n" + - "{% else %}\n" + - // Pass through - " {{ request | tojson }}\n" + - "{% endif %}"; - - public TypeMappingSanitizerTransformer(Map> indexMappings) { - super(template, getContextWrapper(indexMappings)); - } - - private static Function, Map> - getContextWrapper(Map> indexMappings) - { - return incomingJson -> Map.of( - "index_mappings", indexMappings, - "request", incomingJson); - } -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider deleted file mode 100644 index 5beb0df6a..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizerTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider +++ /dev/null @@ -1 +0,0 @@ -org.opensearch.migrations.transform.TypeMappingSanitizerTransformer \ No newline at end of file From 9bd5c60ba9d9ce1cf54f3018b0a89959c74bc63c Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Tue, 19 Nov 2024 13:46:56 -0500 Subject: [PATCH 03/26] Checkpoint on jinjava and loading template transformations. This supports preparsing templates and loading default or specific versions. Those features are likely now in flux to be replaced with a better UX. Signed-off-by: Greg Schohn --- .../transform/JinjavaTransformer.java | 47 ++++++++++++--- .../InlineTemplateResourceLocator.java | 26 ++++++++ .../NameMappingClasspathResourceLocator.java | 37 ++++++++++++ .../JinjavaTransformerProviderTest.java | 2 +- .../TypeMappingsSanitizationTransformer.java | 60 ++++--------------- .../typeMappings/replayer.j2} | 0 6 files changed, 112 insertions(+), 60 deletions(-) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/InlineTemplateResourceLocator.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java rename transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/{v1/template.jinja => jinjava/typeMappings/replayer.j2} (100%) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index f6704b4c7..79ab2a13c 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -3,9 +3,17 @@ import java.util.Map; import java.util.function.Function; +import org.opensearch.migrations.transform.jinjava.InlineTemplateResourceLocator; +import org.opensearch.migrations.transform.jinjava.NameMappingClasspathResourceLocator; + import com.fasterxml.jackson.databind.ObjectMapper; import com.hubspot.jinjava.Jinjava; -import com.hubspot.jinjava.loader.FileLocator; +import com.hubspot.jinjava.interpret.Context; +import com.hubspot.jinjava.interpret.JinjavaInterpreter; +import com.hubspot.jinjava.loader.CascadingResourceLocator; +import com.hubspot.jinjava.loader.ResourceLocator; +import com.hubspot.jinjava.tree.Node; +import lombok.NonNull; import lombok.SneakyThrows; import lombok.extern.slf4j.Slf4j; @@ -13,30 +21,51 @@ public class JinjavaTransformer implements IJsonTransformer { protected final static ObjectMapper objectMapper = new ObjectMapper(); - protected final String templateString; + protected final Jinjava jinjava; + protected final ThreadLocal threadLocalInterpreter; + protected final Node template; protected final Function, Map> wrapSourceAsContextConverter; public JinjavaTransformer(String templateString, + Map baseImmutableBindings, Function, Map> contextProviderFromSource) { - this(templateString, contextProviderFromSource, null); + this(templateString, baseImmutableBindings, contextProviderFromSource, new NameMappingClasspathResourceLocator()); + } + + public JinjavaTransformer(String templateString, + Map baseImmutableBindings, + Function, Map> contextProviderFromSource, + @NonNull Map inlineTemplates) { + this(templateString, baseImmutableBindings, contextProviderFromSource, new CascadingResourceLocator( + new NameMappingClasspathResourceLocator(), + new InlineTemplateResourceLocator(inlineTemplates))); } public JinjavaTransformer(String templateString, + Map baseImmutableBindings, Function, Map> wrapSourceAsContextConverter, - FileLocator fileLocator) + ResourceLocator resourceLocator) { - this.templateString = templateString; + jinjava = new Jinjava(); this.wrapSourceAsContextConverter = wrapSourceAsContextConverter; - this.jinjava = new Jinjava(); - this.jinjava.setResourceLocator(fileLocator); - + jinjava.setResourceLocator(resourceLocator); + threadLocalInterpreter = ThreadLocal.withInitial(() -> { + var context = new Context(null, baseImmutableBindings); + return jinjava.getGlobalConfig().getInterpreterFactory().newInstance(jinjava, context, jinjava.getGlobalConfig()); + }); + var interpreter = threadLocalInterpreter.get(); + this.template = interpreter.parse(templateString); } @SneakyThrows @Override public Map transformJson(Map incomingJson) { - String resultStr = jinjava.render(templateString, wrapSourceAsContextConverter.apply(incomingJson)); + var sourceBindings = wrapSourceAsContextConverter.apply(incomingJson); + JinjavaInterpreter parentInterpreter = threadLocalInterpreter.get(); + Context childContext = new Context(parentInterpreter.getContext(), sourceBindings); + JinjavaInterpreter interpreter = new JinjavaInterpreter(jinjava, childContext, parentInterpreter.getConfig()); + String resultStr = interpreter.render(template); log.atInfo().setMessage("output = {}").addArgument(resultStr).log(); return objectMapper.readValue(resultStr, Map.class); } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/InlineTemplateResourceLocator.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/InlineTemplateResourceLocator.java new file mode 100644 index 000000000..d6629946e --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/InlineTemplateResourceLocator.java @@ -0,0 +1,26 @@ +package org.opensearch.migrations.transform.jinjava; + +import java.nio.charset.Charset; +import java.util.Map; + +import com.hubspot.jinjava.interpret.JinjavaInterpreter; +import com.hubspot.jinjava.loader.ResourceLocator; +import com.hubspot.jinjava.loader.ResourceNotFoundException; + +public class InlineTemplateResourceLocator implements ResourceLocator { + + private final Map templates; + + public InlineTemplateResourceLocator(Map templates) { + this.templates = templates; + } + + @Override + public String getString(String fullName, Charset encoding, JinjavaInterpreter interpreter) + throws ResourceNotFoundException { + if (templates.containsKey(fullName)) { + return templates.get(fullName); + } + throw new ResourceNotFoundException("Template not found: " + fullName); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java new file mode 100644 index 000000000..d3ea1a0d4 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java @@ -0,0 +1,37 @@ +package org.opensearch.migrations.transform.jinjava; + +import java.io.IOException; +import java.nio.charset.Charset; +import java.nio.charset.StandardCharsets; +import java.util.stream.Collectors; + +import com.google.common.io.Resources; +import com.hubspot.jinjava.interpret.JinjavaInterpreter; +import com.hubspot.jinjava.loader.ClasspathResourceLocator; +import com.hubspot.jinjava.loader.ResourceNotFoundException; +import lombok.extern.slf4j.Slf4j; + +@Slf4j +public class NameMappingClasspathResourceLocator extends ClasspathResourceLocator { + + private String getDefaultVersion(final String fullName) throws IOException { + try { + var versionFile = fullName + "/defaultVersion"; + var versionLines = Resources.readLines(Resources.getResource(versionFile), StandardCharsets.UTF_8).stream() + .filter(s->!s.isEmpty()) + .collect(Collectors.toList()); + if (versionLines.size() == 1) { + return fullName + "/" + versionLines.get(0).trim(); + } + throw new IllegalStateException("Expected defaultVersion resource to contain a single line with a name"); + } catch (ResourceNotFoundException e) { + log.atTrace().setCause(e).setMessage("Caught ResourceNotFoundException, but this is expected").log(); + } + return fullName; + } + + @Override + public String getString(String fullName, Charset encoding, JinjavaInterpreter interpreter) throws IOException { + return super.getString(getDefaultVersion("jinjava/" + fullName), encoding, interpreter); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java index ca5ae3657..eb78010a7 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java @@ -76,7 +76,7 @@ static String emitJson(ObjectMapper mapper, Object transformedDocument) throws J public void testSimpleTransform() throws JsonProcessingException { var documentJson = parseStringAsJson(mapper, TEST_INPUT_REQUEST); var transformer = new JsonJinjavaTransformerProvider().createTransformer(Map.of( - "script", EXCISE_TYPE_EXPRESSION_STRING)); + "template", EXCISE_TYPE_EXPRESSION_STRING)); var transformedDocument = transformer.transformJson(documentJson); var outputStr = emitJson(mapper, transformedDocument); diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java index 507c9191d..a3d778276 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java @@ -1,61 +1,21 @@ package org.opensearch.migrations.transform; import java.util.Map; -import java.util.function.Function; public class TypeMappingsSanitizationTransformer extends JinjavaTransformer { - private final static String template = "" + - // First, parse the URI to check if it matches the pattern we want to transform - "{% set uri_parts = request.URI.split('/') | reject('equalto', '') | list %}\n" + - "\n" + - // If this is a document request, check if we need to transform it based on mapping - "{% if uri_parts | length == 3 and uri_parts[0] in index_mappings and uri_parts[1] in index_mappings[uri_parts[0]] %}\n" + - // This is a document request that needs transformation - " {\n" + - " \"method\": \"{{ request.method }}\",\n" + - " \"URI\": \"/{{ index_mappings[uri_parts[0]][uri_parts[1]] }}/_doc/{{ uri_parts[2] }}\",\n" + - " \"headers\": {{ request.headers | tojson }},\n" + - " \"payload\": {{ request.payload | tojson }}\n" + - " }\n" + - "{% elif uri_parts | length == 2 and uri_parts[0] in index_mappings %}\n" + - // This is an index creation request that needs transformation - " {\n" + - " \"method\": \"{{ request.method }}\",\n" + - " \"URI\": \"{{ index_mappings[uri_parts[0]][uri_parts[1]] }}\",\n" + - " \"payload\": {\n" + - " \"inlinedJsonBody\": {\n" + - " \"mappings\": {\n" + - " \"properties\": {\n" + - " \"type\": {\n" + - " \"type\": \"keyword\"\n" + - " }\n" + - " {%- for type_name, type_props in request.body.mappings.items() %}\n" + - " {%- for prop_name, prop_def in type_props.properties.items() %}\n" + - " ,\n" + - " \"{{ prop_name }}\": {{ prop_def | tojson }}\n" + - " {%- endfor %}\n" + - " {%- endfor %}\n" + - " }\n" + - " }\n" + - " }\n" + - " }\n" + - " }\n" + - "{% else %}\n" + - // Pass through - " { \"urilen\": {{uri_parts | length}} }" + - //" {{ request | tojson }}\n" + - "{% endif %}"; - public TypeMappingsSanitizationTransformer(Map> indexMappings) { - super(template, getContextWrapper(indexMappings)); + this("typeMappings/replayerreplayer", indexMappings); + } + + public TypeMappingsSanitizationTransformer(String variantName, Map> indexMappings) { + super( + makeTemplate(variantName), + Map.of("index_mappings", indexMappings), + incomingJson -> Map.of("request", incomingJson)); } - private static Function, Map> - getContextWrapper(Map> indexMappings) - { - return incomingJson -> Map.of( - "index_mappings", indexMappings, - "request", incomingJson); + private static String makeTemplate(String variantName) { + return "{% include \"" + variantName+ "\" %}"; } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/v1/template.jinja b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 similarity index 100% rename from transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/v1/template.jinja rename to transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 From f1e1d509381959c0a37ebc870b1c4087137c0a1c Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Wed, 20 Nov 2024 15:57:09 -0500 Subject: [PATCH 04/26] Checkpoint add support for macros and feature flags for different parts of jinjava transforms (see 'is_enabled'). These changes will reduce the efficiency of this type of transform, but w/out it, it isn't clear how we'll utilize dynamic typing. My hope is that template logic is small relative to documents - and compute is cheap, so these are good tradeoffs to make. Signed-off-by: Greg Schohn --- .../build.gradle | 2 + .../jsonJinjavaTransformer/build.gradle | 1 + .../transform/JinjavaTransformer.java | 43 ++-------- .../NameMappingClasspathResourceLocator.java | 6 +- .../jinjava/common/featureEnabled.j2 | 27 ++++++ .../transform/FeatureMaskingTest.java | 82 +++++++++++++++++++ .../transform/JinjavaTransformerTest.java | 5 +- .../JinjavaTransformerProviderTest.java | 8 +- .../build.gradle | 1 + .../transform/flags/FeatureFlags.java | 48 +++++++++++ .../flags/FeatureFlagsDeserializer.java | 51 ++++++++++++ .../flags/FeatureFlagsSerializer.java | 33 ++++++++ .../build.gradle | 5 +- .../TypeMappingsSanitizationTransformer.java | 21 +++-- .../jinjava/typeMappings/replayer.j2 | 77 +++++++++++------ ...peMappingsSanitizationTransformerTest.java | 3 +- ...appingSanitizationTransformerProvider.java | 3 + 17 files changed, 335 insertions(+), 81 deletions(-) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlags.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsDeserializer.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsSerializer.java diff --git a/commonDependencyVersionConstraints/build.gradle b/commonDependencyVersionConstraints/build.gradle index f785f7e23..2bfc4a187 100644 --- a/commonDependencyVersionConstraints/build.gradle +++ b/commonDependencyVersionConstraints/build.gradle @@ -55,6 +55,8 @@ dependencies { def jackson = '2.16.2' api group: 'com.fasterxml.jackson.core', name: 'jackson-databind', version: jackson + api group: 'com.fasterxml.jackson.core', name: 'jackson-dataformat-yaml', version: jackson + api group: 'com.fasterxml.jackson.dataformat', name: 'jackson-dataformat-yaml', version: jackson api group: 'com.fasterxml.jackson.dataformat', name: 'jackson-dataformat-smile', version: jackson def jupiter = '5.10.2' diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle index 22dd99683..448b9e529 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle @@ -8,6 +8,7 @@ dependencies { implementation group: 'com.hubspot.jinjava', name: 'jinjava', version: "2.7.3" testImplementation project(':TrafficCapture:trafficReplayer') + testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerLoaders') testImplementation testFixtures(project(path: ':testHelperFixtures')) testImplementation testFixtures(project(path: ':TrafficCapture:trafficReplayer')) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index 79ab2a13c..d2a2d8a72 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -3,17 +3,11 @@ import java.util.Map; import java.util.function.Function; -import org.opensearch.migrations.transform.jinjava.InlineTemplateResourceLocator; import org.opensearch.migrations.transform.jinjava.NameMappingClasspathResourceLocator; import com.fasterxml.jackson.databind.ObjectMapper; import com.hubspot.jinjava.Jinjava; -import com.hubspot.jinjava.interpret.Context; -import com.hubspot.jinjava.interpret.JinjavaInterpreter; -import com.hubspot.jinjava.loader.CascadingResourceLocator; import com.hubspot.jinjava.loader.ResourceLocator; -import com.hubspot.jinjava.tree.Node; -import lombok.NonNull; import lombok.SneakyThrows; import lombok.extern.slf4j.Slf4j; @@ -23,50 +17,29 @@ public class JinjavaTransformer implements IJsonTransformer { protected final static ObjectMapper objectMapper = new ObjectMapper(); protected final Jinjava jinjava; - protected final ThreadLocal threadLocalInterpreter; - protected final Node template; - protected final Function, Map> wrapSourceAsContextConverter; + protected final Function, Map> createContextWithSourceFunction; + private final String templateStr; public JinjavaTransformer(String templateString, - Map baseImmutableBindings, Function, Map> contextProviderFromSource) { - this(templateString, baseImmutableBindings, contextProviderFromSource, new NameMappingClasspathResourceLocator()); + this(templateString, contextProviderFromSource, new NameMappingClasspathResourceLocator()); } public JinjavaTransformer(String templateString, - Map baseImmutableBindings, - Function, Map> contextProviderFromSource, - @NonNull Map inlineTemplates) { - this(templateString, baseImmutableBindings, contextProviderFromSource, new CascadingResourceLocator( - new NameMappingClasspathResourceLocator(), - new InlineTemplateResourceLocator(inlineTemplates))); - } - - public JinjavaTransformer(String templateString, - Map baseImmutableBindings, - Function, Map> wrapSourceAsContextConverter, + Function, Map> createContextWithSource, ResourceLocator resourceLocator) { jinjava = new Jinjava(); - this.wrapSourceAsContextConverter = wrapSourceAsContextConverter; + this.createContextWithSourceFunction = createContextWithSource; jinjava.setResourceLocator(resourceLocator); - threadLocalInterpreter = ThreadLocal.withInitial(() -> { - var context = new Context(null, baseImmutableBindings); - return jinjava.getGlobalConfig().getInterpreterFactory().newInstance(jinjava, context, jinjava.getGlobalConfig()); - }); - var interpreter = threadLocalInterpreter.get(); - this.template = interpreter.parse(templateString); + this.templateStr = templateString; } @SneakyThrows @Override public Map transformJson(Map incomingJson) { - var sourceBindings = wrapSourceAsContextConverter.apply(incomingJson); - JinjavaInterpreter parentInterpreter = threadLocalInterpreter.get(); - Context childContext = new Context(parentInterpreter.getContext(), sourceBindings); - JinjavaInterpreter interpreter = new JinjavaInterpreter(jinjava, childContext, parentInterpreter.getConfig()); - String resultStr = interpreter.render(template); - log.atInfo().setMessage("output = {}").addArgument(resultStr).log(); + var resultStr = jinjava.render(templateStr, createContextWithSourceFunction.apply(incomingJson)); + log.atInfo().setMessage("output from jinjava... {}").addArgument(resultStr).log(); return objectMapper.readValue(resultStr, Map.class); } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java index d3ea1a0d4..d73bf07e2 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java @@ -8,7 +8,6 @@ import com.google.common.io.Resources; import com.hubspot.jinjava.interpret.JinjavaInterpreter; import com.hubspot.jinjava.loader.ClasspathResourceLocator; -import com.hubspot.jinjava.loader.ResourceNotFoundException; import lombok.extern.slf4j.Slf4j; @Slf4j @@ -24,7 +23,7 @@ private String getDefaultVersion(final String fullName) throws IOException { return fullName + "/" + versionLines.get(0).trim(); } throw new IllegalStateException("Expected defaultVersion resource to contain a single line with a name"); - } catch (ResourceNotFoundException e) { + } catch (IllegalArgumentException e) { log.atTrace().setCause(e).setMessage("Caught ResourceNotFoundException, but this is expected").log(); } return fullName; @@ -32,6 +31,7 @@ private String getDefaultVersion(final String fullName) throws IOException { @Override public String getString(String fullName, Charset encoding, JinjavaInterpreter interpreter) throws IOException { - return super.getString(getDefaultVersion("jinjava/" + fullName), encoding, interpreter); + var rval = super.getString(getDefaultVersion("jinjava/" + fullName), encoding, interpreter); + return rval; } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 new file mode 100644 index 000000000..2d44f468c --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 @@ -0,0 +1,27 @@ +{%- macro is_enabled(features, path) -%} + {%- if features == None -%} + true + {%- else -%} + {%- set ns = namespace(value=features) -%} + {%- set debug = namespace(log=[]) -%} + {%- for key in (path | split('.')) -%} + {% set debug.log = debug.log + ["k:"+key] -%} + {% set debug.log = debug.log + ["ismapping?:"+(ns.value is mapping)] -%} + {%- if ns.value is mapping and key in ns.value -%} + {%- set ns.value = ns.value[key] -%} + {%- else -%} + {%- set ns.value = None -%} + {%- endif -%} + {%- endfor -%} + {%- set debug.log = debug.log + ["val=" + (ns.value)] -%} + {%- set debug.log = debug.log + ["is map?=" + (ns.value is map)] -%} + {%- set debug.log = debug.log + ["enabled val=" + (ns.value.enabled)] -%} + {%- if ns.value is boolean and ns.value -%} + true + {%- elif ns.value is mapping and ns.value.get('enabled') is boolean -%} + {{- ns.value.get('enabled') -}} + {%- else -%} + false + {%- endif -%} + {%- endif -%} +{%- endmacro -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java new file mode 100644 index 000000000..7c58cbb04 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java @@ -0,0 +1,82 @@ +package org.opensearch.migrations.transform; + +import java.io.IOException; +import java.util.Map; + +import org.opensearch.migrations.transform.flags.FeatureFlags; + +import lombok.extern.slf4j.Slf4j; +import org.junit.jupiter.api.Assertions; +import org.junit.jupiter.api.Test; +import org.testcontainers.shaded.com.fasterxml.jackson.databind.ObjectMapper; + +@Slf4j +public class FeatureMaskingTest { + private static final ObjectMapper objectMapper = new ObjectMapper(); + public Map transformForMask(Map incomingFlags) throws IOException { + var incomingFlagStr = objectMapper.writeValueAsString(incomingFlags); + log.atInfo().setMessage("incoming map as string: {}").addArgument(incomingFlagStr).log(); + var flags = FeatureFlags.parseJson(incomingFlagStr); + log.atInfo().setMessage("parsed flags: {}").addArgument(flags == null ? "[NULL]" : flags.writeJson()).log(); + final var template = "" + + "{%- include \"common/featureEnabled.j2\" -%}" + + " { " + + "{%- set ns = namespace(debug_info=['list: ']) -%}" + + "{%- set ns.debug_info = ['list: '] -%}" + + "\"enabledFlags\": \"" + + "{{- is_enabled(features,'testFlag') -}}," + + "{{- is_enabled(features,'testFlag.t1') -}}," + + "{{- is_enabled(features,'testFlag.t2') -}}," + + "{{- is_enabled(features,'nextTestFlag.n1') -}}" + + "\"" + + "}"; + var sanitization = new JinjavaTransformer(template, + src -> flags == null ? Map.of() : Map.of("features", flags)); + return sanitization.transformJson(Map.of()); + } + + @Test + public void testFalseFlag() throws Exception { + Assertions.assertEquals( + "false,false,false,false", + transformForMask(Map.of("testFlag", false)).get("enabledFlags")); + } + + @Test + public void testTrueFlag() throws Exception { + Assertions.assertEquals( + "true,false,false,false", + transformForMask(Map.of("testFlag", true)).get("enabledFlags")); + } + + @Test + public void testLongerFalseFlag() throws Exception { + Assertions.assertEquals( + "false,false,false,false", + transformForMask(Map.of("testFlag", false)).get("enabledFlags")); + } + + @Test + public void testLongerTrueFlag() throws Exception { + Assertions.assertEquals( + "true,false,false,false", + transformForMask(Map.of( + "testFlag", Map.of("notPresent", false)) + ).get("enabledFlags")); + } + + @Test + public void testImplicitTrueFlag() throws Exception { + Assertions.assertEquals( + "true,true,false,false", + transformForMask(Map.of( + "testFlag", Map.of("t1", true)) + ).get("enabledFlags")); + } + + @Test + public void testNullFeatures() throws Exception { + Assertions.assertEquals( + "true,true,true,true", transformForMask(null).get("enabledFlags")); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java index 3a3b1abd7..2bec339ae 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java @@ -60,8 +60,9 @@ static void initialize() { "type2", "indexB"), "indexC", Map.of( "type2", "indexC")); - indexTypeMappingRewriter = new JinjavaTransformer(template, request -> - Map.of("index_mappings", indexMappings, + indexTypeMappingRewriter = new JinjavaTransformer(template, + request -> Map.of( + "index_mappings", indexMappings, "request", request)); } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java index eb78010a7..8687bf75d 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/test/java/org/opensearch/migrations/replay/JinjavaTransformerProviderTest.java @@ -41,12 +41,12 @@ class JinjavaTransformerProviderTest { + "}\n"; static final String EXCISE_TYPE_EXPRESSION_STRING = "{\n" - + " \"method\": method,\n" - + " \"URI\": URI,\n" - + " \"headers\": headers,\n" + + " \"method\": \"{{ request.method }}\",\n" + + " \"URI\": \"{{ request.URI }}\",\n" + + " \"headers\": {{ request.headers | tojson }},\n" + " \"payload\": {\n" + " \"inlinedJsonBody\": {\n" - + " \"mappings\": payload.inlinedJsonBody.mappings.oldType\n" + + " \"mappings\": {{ request.payload.inlinedJsonBody.mappings.oldType | tojson }}\n" + " }\n" + " }\n" + "}"; diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle index 86f260503..2da9c9c85 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle @@ -25,6 +25,7 @@ plugins { dependencies { implementation group: 'org.slf4j', name: 'slf4j-api' implementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' + implementation group: 'com.fasterxml.jackson.dataformat', name: 'jackson-dataformat-yaml' api project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlags.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlags.java new file mode 100644 index 000000000..c3b14a3cd --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlags.java @@ -0,0 +1,48 @@ +package org.opensearch.migrations.transform.flags; + +import java.io.IOException; +import java.util.HashMap; + +import com.fasterxml.jackson.databind.ObjectMapper; +import com.fasterxml.jackson.databind.annotation.JsonDeserialize; +import com.fasterxml.jackson.dataformat.yaml.YAMLFactory; +import lombok.Getter; +import lombok.Setter; + +@Getter +@Setter +@JsonDeserialize(using = FeatureFlagsDeserializer.class) +public class FeatureFlags extends HashMap { + + public static final String ENABLED_KEY = "enabled"; + + // Static ObjectMappers for JSON and YAML + private static final ObjectMapper jsonMapper = new ObjectMapper(); + private static final ObjectMapper yamlMapper = new ObjectMapper(new YAMLFactory()); + + + // Parsing methods + public static FeatureFlags parseJson(String contents) throws IOException { + return jsonMapper.readValue(contents, FeatureFlags.class); + } + + public static FeatureFlags parseYaml(String contents) throws IOException { + return yamlMapper.readValue(contents, FeatureFlags.class); + } + + public String writeJson() throws IOException { + return jsonMapper.writeValueAsString(this); + } + + public String writeYaml() throws IOException { + return yamlMapper.writeValueAsString(this); + } + + @Override + public String toString() { + return "FeatureFlags{" + + "enabled=" + get(ENABLED_KEY) + + ", features=" + super.toString() + + '}'; + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsDeserializer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsDeserializer.java new file mode 100644 index 000000000..4c5514f8f --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsDeserializer.java @@ -0,0 +1,51 @@ +package org.opensearch.migrations.transform.flags; + +import java.io.IOException; +import java.util.Iterator; +import java.util.Map; + +import com.fasterxml.jackson.core.JsonParser; +import com.fasterxml.jackson.databind.*; +import com.fasterxml.jackson.databind.DeserializationContext; +import com.fasterxml.jackson.databind.JsonNode; +import com.fasterxml.jackson.databind.deser.std.StdDeserializer; +import lombok.extern.slf4j.Slf4j; + +@Slf4j +public class FeatureFlagsDeserializer extends StdDeserializer { + + public FeatureFlagsDeserializer() { + this(null); + } + + public FeatureFlagsDeserializer(Class vc) { + super(vc); + } + + @Override + public FeatureFlags deserialize(JsonParser p, DeserializationContext ctx) throws IOException { + FeatureFlags featureFlags = new FeatureFlags(); + JsonNode node = p.getCodec().readTree(p); + + Iterator> fields = node.fields(); + while (fields.hasNext()) { + Map.Entry entry = fields.next(); + final var key = entry.getKey(); + final var value = entry.getValue(); + if (value.isObject()) { + JsonParser valueParser = value.traverse(); + valueParser.setCodec(p.getCodec()); + featureFlags.put(key, ctx.readValue(valueParser, FeatureFlags.class)); + } else { + featureFlags.put(key, Map.of(FeatureFlags.ENABLED_KEY, value.booleanValue())); + } + } + // If 'enabled' is not explicitly set, default to true + if (!featureFlags.containsKey(FeatureFlags.ENABLED_KEY)) { + featureFlags.put(FeatureFlags.ENABLED_KEY, true); + } else if (!(featureFlags.get(FeatureFlags.ENABLED_KEY) instanceof Boolean)) { + throw new IllegalArgumentException("enabled key must map to a boolean value"); + } + return featureFlags; + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsSerializer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsSerializer.java new file mode 100644 index 000000000..4e482b226 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsSerializer.java @@ -0,0 +1,33 @@ +//package org.opensearch.migrations.transform.flags; +// +//import java.io.IOException; +//import java.util.Map; +// +//import com.fasterxml.jackson.core.JsonGenerator; +//import com.fasterxml.jackson.databind.SerializerProvider; +//import com.fasterxml.jackson.databind.ser.std.StdSerializer; +// +//public class FeatureFlagsSerializer extends StdSerializer { +// +// public FeatureFlagsSerializer() { +// this(null); +// } +// +// public FeatureFlagsSerializer(Class t) { +// super(t); +// } +// +// @Override +// public void serialize(FeatureFlags value, JsonGenerator gen, SerializerProvider provider) throws IOException { +// gen.writeStartObject(); +// // Serialize the 'enabled' field +// gen.writeBooleanField("enabled", value.isEnabled()); +// +// // Serialize all map entries +// for (Map.Entry entry : value.entrySet()) { +// gen.writeObjectField(entry.getKey(), entry.getValue()); +// } +// +// gen.writeEndObject(); +// } +//} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle index f48b1c329..05540ced8 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle @@ -4,10 +4,11 @@ plugins { } dependencies { - implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') - api project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJinjavaTransformer') + implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') + implementation group: 'com.google.guava', name: 'guava' + testImplementation project(':TrafficCapture:trafficReplayer') testImplementation testFixtures(project(path: ':testHelperFixtures')) testImplementation testFixtures(project(path: ':TrafficCapture:trafficReplayer')) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java index a3d778276..e76ea8357 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java @@ -1,21 +1,28 @@ package org.opensearch.migrations.transform; +import java.io.IOException; +import java.nio.charset.StandardCharsets; import java.util.Map; +import com.google.common.io.Resources; + public class TypeMappingsSanitizationTransformer extends JinjavaTransformer { - public TypeMappingsSanitizationTransformer(Map> indexMappings) { - this("typeMappings/replayerreplayer", indexMappings); + public TypeMappingsSanitizationTransformer(Map> indexMappings) throws IOException { + this("jinjava/typeMappings/replayer.j2", null, indexMappings); } - public TypeMappingsSanitizationTransformer(String variantName, Map> indexMappings) { + public TypeMappingsSanitizationTransformer(String variantName, + Map featureFlags, + Map> indexMappings) throws IOException { super( makeTemplate(variantName), - Map.of("index_mappings", indexMappings), - incomingJson -> Map.of("request", incomingJson)); + incomingJson -> Map.of("request", incomingJson, + "index_mappings", indexMappings, + "featureFlags", featureFlags == null ? Map.of() : featureFlags)); } - private static String makeTemplate(String variantName) { - return "{% include \"" + variantName+ "\" %}"; + private static String makeTemplate(String variantName) throws IOException { + return Resources.toString(Resources.getResource(variantName), StandardCharsets.UTF_8); } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 index e9222e483..68ef8a387 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 @@ -1,33 +1,56 @@ -{% set uri_parts = request.URI.split('/') | reject('equalto', '') | list %} +{%- include "common/featureEnabled.j2" -%} -{% if uri_parts | length == 3 and uri_parts[0] in index_mappings and uri_parts[1] in index_mappings[uri_parts[0]] %} - { - "method": "{{ request.method }}", - "URI": "/{{ index_mappings[uri_parts[0]][uri_parts[1]] }}/_doc/{{ uri_parts[2] }}", - "headers": {{ request.headers | tojson }}, - "payload": {{ request.payload | tojson }} - } -{% elif uri_parts | length == 2 and uri_parts[0] in index_mappings %} - { - "method": "{{ request.method }}", - "URI": "{{ index_mappings[uri_parts[0]][uri_parts[1]] }}", - "payload": { - "inlinedJsonBody": { - "mappings": { - "properties": { - "type": { - "type": "keyword" - } - {%- for type_name, type_props in request.body.mappings.items() %} - {%- for prop_name, prop_def in type_props.properties.items() %} - , - "{{ prop_name }}": {{ prop_def | tojson }} - {%- endfor %} - {%- endfor %} +{%- macro handle_else(uri_parts) -%} + {{- request | tojson }} +{%- endmacro -%} + +{%- macro rewrite_uri_to_strip_types(uri_parts, index_mappings, request) -%} +{ + "method": "{{ request.method }}", + "URI": "/{{ index_mappings[uri_parts[0]][uri_parts[1]] }}/_doc/{{ uri_parts[2] }}", + "headers": {{ request.headers | tojson }}, + "payload": {{ request.payload | tojson }} +} +{%- endmacro -%} + + +{% macro rewrite_typemapping_to_target_index(uri_parts, index_mappings, request) -%} +{ + "method": "{{ request.method }}", + "URI": "{{ index_mappings[uri_parts[0]][uri_parts[1]] }}", + "payload": { + "inlinedJsonBody": { + "mappings": { + "properties": { + "type": { + "type": "keyword" } + {%- for type_name, type_props in request.body.mappings.items() -%} + {%- for prop_name, prop_def in type_props.properties.items() -%} + , + "{{- prop_name -}}": {{- prop_def | tojson -}} + {%- endfor -%} + {%- endfor -%} } } } } -{% else %} - { "urilen": {{uri_parts | length}} }{% endif %} \ No newline at end of file +} +{%- endmacro -%} + + +{%- set uri_parts = request.URI.split('/') | reject('equalto', '') | list -%} + +{%- if uri_parts | length == 3 and uri_parts[0] in index_mappings and uri_parts[1] in index_mappings[uri_parts[0]] -%} + {%- if is_enabled(features, 'rewrite_uri_to_strip_types') -%} + {{ rewrite_uri_to_strip_types(uri_parts, index_mappings, request) -}} + {%- endif -%} +{%- elif uri_parts | length == 2 and uri_parts[0] in index_mappings -%} + {%- if is_enabled(features, 'rewrite_typemapping_to_target_index') -%} + {{ rewrite_typemapping_to_target_index(uri_parts, index_mappings, request) -}} + {%- endif -%} +{%- else -%} + {%- if is_enabled(features, 'handle_else') -%} + {{- handle_else(uri_parts) -}} + {%- endif -%} +{%- endif -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java index 603f4e5d0..3105eb9c6 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java @@ -1,5 +1,6 @@ package org.opensearch.migrations.transform; +import java.io.IOException; import java.util.Map; import org.junit.jupiter.api.BeforeAll; @@ -10,7 +11,7 @@ class TypeMappingsSanitizationTransformerTest { private static TypeMappingsSanitizationTransformer indexTypeMappingRewriter; @BeforeAll - static void initialize() { + static void initialize() throws IOException { var indexMappings = Map.of( "indexA", Map.of( "type1", "indexA_1", diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java index fe64452c9..3fd154b8f 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java @@ -2,8 +2,11 @@ import java.util.Map; +import lombok.SneakyThrows; + public class TypeMappingSanitizationTransformerProvider implements IJsonTransformerProvider { + @SneakyThrows @Override public IJsonTransformer createTransformer(Object jsonConfig) { try { From dd983770c71f38b1330e36da18d7416f47c894cf Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Thu, 21 Nov 2024 08:16:28 -0500 Subject: [PATCH 05/26] Cleanup + added a "preserve" flag to let templates inline source nodes after the templating... That preserve splicing not only improves efficiency, it also lets us pass messages through a template that might have non-textual data, like the ByteBufs, etc. Signed-off-by: Greg Schohn --- TrafficCapture/trafficReplayer/build.gradle | 2 +- ...ttpRequestPreliminaryTransformHandler.java | 60 ++++++++----------- .../transform/JinjavaTransformer.java | 28 ++++++++- ...rations.transform.IJsonTransformerProvider | 1 - .../transform/JsonKeysForHttpMessage.java | 21 ++++++- ...rations.transform.IJsonTransformerProvider | 1 - .../jinjava/typeMappings/replayer.j2 | 7 ++- 7 files changed, 76 insertions(+), 44 deletions(-) delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider diff --git a/TrafficCapture/trafficReplayer/build.gradle b/TrafficCapture/trafficReplayer/build.gradle index 39d2a59ee..ac04a2582 100644 --- a/TrafficCapture/trafficReplayer/build.gradle +++ b/TrafficCapture/trafficReplayer/build.gradle @@ -23,7 +23,7 @@ dependencies { implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJMESPathMessageTransformerProvider') runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJoltMessageTransformerProvider') - runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:openSearch23PlusTargetTransformerProvider') + runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformerProvider') implementation group: 'org.jcommander', name: 'jcommander' implementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java index 3d74c42ca..f467383c4 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java @@ -75,10 +75,8 @@ public void channelRead(@NonNull ChannelHandlerContext ctx, @NonNull Object msg) authTransformer ); } catch (PayloadNotLoadedException pnle) { - log.debug( - "The transforms for this message require payload manipulation, " - + "all content handlers are being loaded." - ); + log.atDebug().setMessage("The transforms for this message require payload manipulation, " + + "all content handlers are being loaded.").log(); // make a fresh message and its headers requestPipelineOrchestrator.addJsonParsingHandlers( ctx, @@ -131,43 +129,35 @@ private void handlePayloadNeutralTransformationOrThrow( var pipeline = ctx.pipeline(); if (streamingAuthTransformer != null) { - log.info( - diagnosticLabel - + "An Authorization Transformation is required for this message. " - + "The headers and payload will be parsed and reformatted." - ); + log.atInfo().setMessage("{} An Authorization Transformation is required for this message. " + + "The headers and payload will be parsed and reformatted.") + .addArgument(diagnosticLabel).log(); requestPipelineOrchestrator.addContentRepackingHandlers(ctx, streamingAuthTransformer); ctx.fireChannelRead(httpJsonMessage); } else if (headerFieldsAreIdentical(originalRequest, httpJsonMessage)) { - log.info( - diagnosticLabel - + "Transformation isn't necessary. " - + "Resetting the processing pipeline to let the caller send the original network bytes as-is." - ); + log.atInfo().setMessage("{} Transformation isn't necessary. " + + "Resetting the processing pipeline to let the caller send the original network bytes as-is.") + .addArgument(diagnosticLabel) + .log(); RequestPipelineOrchestrator.removeAllHandlers(pipeline); - } else if (headerFieldIsIdentical("content-encoding", originalRequest, httpJsonMessage) && headerFieldIsIdentical("transfer-encoding", originalRequest, httpJsonMessage)) { - log.info( - diagnosticLabel - + "There were changes to the headers that require the message to be reformatted " - + "but the payload doesn't need to be transformed." - ); - // By adding the baseline handlers and removing this and previous handlers in reverse order, - // we will cause the upstream handlers to flush their in-progress accumulated ByteBufs downstream - // to be processed accordingly - requestPipelineOrchestrator.addBaselineHandlers(pipeline); - ctx.fireChannelRead(httpJsonMessage); - RequestPipelineOrchestrator.removeThisAndPreviousHandlers(pipeline, this); - } else { - log.info( - diagnosticLabel - + "New headers have been specified that require the payload stream to be " - + "reformatted. Setting up the processing pipeline to parse and reformat the request payload." - ); - requestPipelineOrchestrator.addContentRepackingHandlers(ctx, streamingAuthTransformer); - ctx.fireChannelRead(httpJsonMessage); - } + log.atInfo().setMessage("{} There were changes to the headers that require the message to be reformatted " + + "but the payload doesn't need to be transformed.") + .addArgument(diagnosticLabel).log(); + // By adding the baseline handlers and removing this and previous handlers in reverse order, + // we will cause the upstream handlers to flush their in-progress accumulated ByteBufs downstream + // to be processed accordingly + requestPipelineOrchestrator.addBaselineHandlers(pipeline); + ctx.fireChannelRead(httpJsonMessage); + RequestPipelineOrchestrator.removeThisAndPreviousHandlers(pipeline, this); + } else { + log.atInfo().setMessage("{} New headers have been specified that require the payload stream to be " + + "reformatted. Setting up the processing pipeline to parse and reformat the request payload.") + .addArgument(diagnosticLabel).log(); + requestPipelineOrchestrator.addContentRepackingHandlers(ctx, streamingAuthTransformer); + ctx.fireChannelRead(httpJsonMessage); + } } private static HttpJsonRequestWithFaultingPayload handleAuthHeaders( diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index d2a2d8a72..a151fb9b0 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -1,6 +1,8 @@ package org.opensearch.migrations.transform; +import java.util.List; import java.util.Map; +import java.util.Optional; import java.util.function.Function; import org.opensearch.migrations.transform.jinjava.NameMappingClasspathResourceLocator; @@ -40,6 +42,30 @@ public JinjavaTransformer(String templateString, public Map transformJson(Map incomingJson) { var resultStr = jinjava.render(templateStr, createContextWithSourceFunction.apply(incomingJson)); log.atInfo().setMessage("output from jinjava... {}").addArgument(resultStr).log(); - return objectMapper.readValue(resultStr, Map.class); + var parsedObj = (Map) objectMapper.readValue(resultStr, Map.class); + return doFinalSubstitutions(incomingJson, parsedObj); + } + + private Map doFinalSubstitutions(Map incomingJson, Map parsedObj) { + return Optional.ofNullable(parsedObj.get(JsonKeysForHttpMessage.PRESERVE_KEY)).filter(v->v.equals("*")) + .map(star -> incomingJson) + .orElseGet(() -> { + findAndReplacePreserves(incomingJson, parsedObj); + findAndReplacePreserves((Map) incomingJson.get(JsonKeysForHttpMessage.PAYLOAD_KEY), + (Map) parsedObj.get(JsonKeysForHttpMessage.PAYLOAD_KEY)); + return parsedObj; + }); + } + + private void findAndReplacePreserves(Map incomingRoot, Map parsedRoot) { + if (parsedRoot == null || incomingRoot == null) { + return; + } + var preserveKeys = (List) parsedRoot.get(JsonKeysForHttpMessage.PRESERVE_KEY); + if (preserveKeys != null) { + preserveKeys.forEach(preservedKey -> + parsedRoot.put(preservedKey, incomingRoot.get(preservedKey))); + parsedRoot.remove(JsonKeysForHttpMessage.PRESERVE_KEY); + } } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider deleted file mode 100644 index 86105dbfd..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider +++ /dev/null @@ -1 +0,0 @@ -org.opensearch.migrations.transform.JinJavaTransformer \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/JsonKeysForHttpMessage.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/JsonKeysForHttpMessage.java index 65f0a5894..3ab644e30 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/JsonKeysForHttpMessage.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/JsonKeysForHttpMessage.java @@ -12,6 +12,21 @@ private JsonKeysForHttpMessage() {} public static final String PROTOCOL_KEY = "protocol"; public static final String HEADERS_KEY = "headers"; public static final String PAYLOAD_KEY = "payload"; + + /** + *

This key is valid at the top level and as a direct within a "payload" value. + * After a transformation has completed, these objects will be excised and replaced with + * the original nodes from the original document.

+ * + *

For example. the following will cause the original payload to be preserved.

+ * `"preserve": [ "payload" ]` + *

The following will cause the original headers and payload to be preserved.

+ * `"preserve": [ "headers", "payload" ]` + * + *

Notice that any already existing items will be replaced.

+ */ + public static final String PRESERVE_KEY = "preserve"; + /** * This is the key under the 'payload' object whose value is the parsed json from the HTTP message payload. * Notice that there aren't yet other ways to access the payload contents. If the content-type was not json, @@ -19,11 +34,13 @@ private JsonKeysForHttpMessage() {} */ public static final String INLINED_JSON_BODY_DOCUMENT_KEY = "inlinedJsonBody"; /** - * for the type application + * Like INLINED_JSON_BODY_DOCUMENT_KEY, this key is used directly under the 'payload' object. Its value + * will be a list of json documents that represent the lines of the original ndjson payload, when present. */ public static final String INLINED_NDJSON_BODIES_DOCUMENT_KEY = "inlinedJsonSequenceBodies"; /** - * This maps to a ByteBuf that is owned by the caller. + * Like INLINED_JSON_BODY_DOCUMENT_KEY, this key is used directly under the 'payload' object. Its value + * maps to a ByteBuf that is owned by the caller. * Any consumers should retain if they need to access it later. This may be UTF8, UTF16 encoded, or something else. */ public static final String INLINED_BINARY_BODY_DOCUMENT_KEY = "inlinedBinaryBody"; diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider deleted file mode 100644 index dac77603a..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider +++ /dev/null @@ -1 +0,0 @@ -org.opensearch.migrations.transform.TypeMappingsSanitizationTransformer \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 index 68ef8a387..48dc9f28b 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 @@ -1,15 +1,16 @@ {%- include "common/featureEnabled.j2" -%} {%- macro handle_else(uri_parts) -%} - {{- request | tojson }} +{ + "preserve": "*" +} {%- endmacro -%} {%- macro rewrite_uri_to_strip_types(uri_parts, index_mappings, request) -%} { "method": "{{ request.method }}", "URI": "/{{ index_mappings[uri_parts[0]][uri_parts[1]] }}/_doc/{{ uri_parts[2] }}", - "headers": {{ request.headers | tojson }}, - "payload": {{ request.payload | tojson }} + "preserve": ["headers","payload"] } {%- endmacro -%} From 357a6a658dc3383d2a6bb96088345e498c0a9d2d Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Fri, 22 Nov 2024 10:29:54 -0500 Subject: [PATCH 06/26] Add jinja-style regex matching to jinjava transformations. Signed-off-by: Greg Schohn --- .../jsonJinjavaTransformer/build.gradle | 1 + .../transform/JinjavaTransformer.java | 2 + .../transform/jinjava/RegexCaptureFilter.java | 39 +++++++++++++++++++ ...TypeMappingsSanitizationProviderTest.java} | 0 4 files changed, 42 insertions(+) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java rename transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/{TypeMappingsSanitizationTest.java => TypeMappingsSanitizationProviderTest.java} (100%) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle index 448b9e529..f4b05736e 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle @@ -6,6 +6,7 @@ dependencies { implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') implementation group: 'com.hubspot.jinjava', name: 'jinjava', version: "2.7.3" + implementation group: 'com.google.re2j', name: 're2j', version: "1.7" testImplementation project(':TrafficCapture:trafficReplayer') testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerLoaders') diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index a151fb9b0..b67713129 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -6,6 +6,7 @@ import java.util.function.Function; import org.opensearch.migrations.transform.jinjava.NameMappingClasspathResourceLocator; +import org.opensearch.migrations.transform.jinjava.RegexCaptureFilter; import com.fasterxml.jackson.databind.ObjectMapper; import com.hubspot.jinjava.Jinjava; @@ -34,6 +35,7 @@ public JinjavaTransformer(String templateString, jinjava = new Jinjava(); this.createContextWithSourceFunction = createContextWithSource; jinjava.setResourceLocator(resourceLocator); + jinjava.getGlobalContext().registerFilter(new RegexCaptureFilter()); this.templateStr = templateString; } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java new file mode 100644 index 000000000..7fce682c9 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java @@ -0,0 +1,39 @@ +package org.opensearch.migrations.transform.jinjava; + +import java.util.HashMap; + +import com.google.re2j.Pattern; +import com.google.re2j.Matcher; +import com.hubspot.jinjava.interpret.JinjavaInterpreter; +import com.hubspot.jinjava.lib.filter.Filter; + +public class RegexCaptureFilter implements Filter { + @Override + public String getName() { + return "regex_capture"; + } + + @Override + public Object filter(Object var, JinjavaInterpreter interpreter, String... args) { + if (var == null || args.length < 1) { + return null; + } + + String input = var.toString(); + String pattern = args[0]; + + try { + Matcher matcher = Pattern.compile(pattern).matcher(input); + if (matcher.find()) { + var groups = new HashMap<>(); + for (int i = 0; i <= matcher.groupCount(); i++) { + groups.put("group" + i, matcher.group(i)); + } + return groups; + } + } catch (Exception e) { + return null; + } + return null; + } +} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java similarity index 100% rename from transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationTest.java rename to transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java From 12c0cfae3e839772f9aa53ee72d0c9bf95153eb9 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Sat, 23 Nov 2024 18:13:21 -0500 Subject: [PATCH 07/26] Checkpoint - I've added a new invoke_macro java function to lookup a macro by name and invoke it since jinjava can't deal with invoking macros with dynamic names. There are some rough tests in place that don't fully work. The original ambition was to allow a user to specify both a route and an action for a given map in a macro but since macros only output rendered content, they're not well-suited to chain complex data (like regex matches) between macros. As such, there will be significant design changes to the jinja routing mechanisms. Signed-off-by: Greg Schohn --- .../transform/JinjavaTransformer.java | 12 +++ .../jinjava/DynamicMacroFunction.java | 60 ++++++++++++ .../resources/jinjava/common/route-bkp.j2 | 25 +++++ .../main/resources/jinjava/common/route.j2 | 22 +++++ .../resources/jinjava/common/testAndAction.j2 | 0 .../transform/FeatureMaskingTest.java | 14 +-- .../migrations/transform/RouteTest.java | 96 +++++++++++++++++++ .../TypeMappingsSanitizationProviderTest.java | 6 +- 8 files changed, 226 insertions(+), 9 deletions(-) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route-bkp.j2 create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/testAndAction.j2 create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index b67713129..ff4354713 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -5,11 +5,13 @@ import java.util.Optional; import java.util.function.Function; +import org.opensearch.migrations.transform.jinjava.DynamicMacroFunction; import org.opensearch.migrations.transform.jinjava.NameMappingClasspathResourceLocator; import org.opensearch.migrations.transform.jinjava.RegexCaptureFilter; import com.fasterxml.jackson.databind.ObjectMapper; import com.hubspot.jinjava.Jinjava; +import com.hubspot.jinjava.lib.fn.ELFunctionDefinition; import com.hubspot.jinjava.loader.ResourceLocator; import lombok.SneakyThrows; import lombok.extern.slf4j.Slf4j; @@ -36,6 +38,16 @@ public JinjavaTransformer(String templateString, this.createContextWithSourceFunction = createContextWithSource; jinjava.setResourceLocator(resourceLocator); jinjava.getGlobalContext().registerFilter(new RegexCaptureFilter()); + var dynamicMacroFunction = new ELFunctionDefinition( + "", + "invoke_macro", + DynamicMacroFunction.class, + "invokeMacro", + String.class, + Object[].class + ); + + jinjava.getGlobalContext().registerFunction(dynamicMacroFunction); this.templateStr = templateString; } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java new file mode 100644 index 000000000..c785a3f9b --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java @@ -0,0 +1,60 @@ +package org.opensearch.migrations.transform.jinjava; + +import java.util.HashMap; +import java.util.List; +import java.util.Map; +import java.util.Optional; + +import com.hubspot.jinjava.interpret.Context; +import com.hubspot.jinjava.interpret.JinjavaInterpreter; +import com.hubspot.jinjava.lib.fn.ELFunctionDefinition; +import com.hubspot.jinjava.lib.fn.Functions; +import com.hubspot.jinjava.objects.collections.PyList; +import com.hubspot.jinjava.lib.fn.MacroFunction; + +public class DynamicMacroFunction { + + /** + * Called from templates through the registration in the JinjavaTransformer class + */ + public static Object invokeMacro(String macroName, Object... args) { + JinjavaInterpreter interpreter = JinjavaInterpreter.getCurrent(); + + MacroFunction macro = getMacroFromContext(interpreter.getContext(), macroName); + + Context macroContext = new Context(interpreter.getContext()); + int argCount = Math.min(args.length, macro.getArguments().size()); + + for (int i = 0; i < argCount; i++) { + String argName = macro.getArguments().get(i); + macroContext.put(argName, args[i]); + } + + var argsMap = new HashMap(); + + var paramNames = macro.getArguments(); + Map defaults = macro.getDefaults(); + + for (int i = 0; i < paramNames.size(); i++) { + String paramName = paramNames.get(i); + if (i < args.length) { + argsMap.put(paramName, args[i]); + } else if (defaults.containsKey(paramName)) { + argsMap.put(paramName, defaults.get(paramName)); + } else { + throw new RuntimeException("Missing argument for macro: " + paramName); + } + } + + return macro.doEvaluate(argsMap, Map.of(), List.of()); + } + + private static MacroFunction getMacroFromContext(Context context, String macroName) { + if (context == null) { + return null; + } + return context.getLocalMacro(macroName) + .or(() -> Optional.ofNullable(context.getGlobalMacro(macroName))) + .orElseGet(() -> getMacroFromContext(context.getParent(), macroName)); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route-bkp.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route-bkp.j2 new file mode 100644 index 000000000..9e7792f94 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route-bkp.j2 @@ -0,0 +1,25 @@ +{% import "common/featureEnabled.j2" as flags %} +{% macro route(input, feature_flags, default_action, routes) %} + {%- set ns = namespace(result=none, matched=false) -%} + {%- for feature_name, pattern, action in routes if not ns.matched -%} + {%- if not ns.matched -%} {# we haven't found a match yet, otherwise skip the rest #} + checking {{ feature_name }}... + {%- set match = none -%} + {%- call pattern(input) -%}{% endcall %} + match {{ match }}... + {%- if match is not none -%} + in a non-null match {{ match }} + in a match! + {%- set ns.matched = true -%} + {%- if flags.is_enabled(feature_flags, feature_name) -%} + {%- set ns.result = action | call(match) -%} + {%- endif -%} + {%- endif -%} + {%- endif -%} + {%- endfor -%} + {%- if ns.result is none -%} + default answer: {{- default_action | call(input) -}} + {%- else -%} + result: {{- ns.result -}} + {%- endif -%} +{% endmacro %} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 new file mode 100644 index 000000000..a436fa431 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 @@ -0,0 +1,22 @@ +{% import "common/featureEnabled.j2" as flags %} +within import {{ __macros__ | pprint }} +{% macro route(input, feature_flags, default_action, routes) %} + {%- set ns = namespace(result=none, matched=false) -%} + {%- for feature_name, pattern_fn, action_fn in routes if not ns.matched -%} + {%- if not ns.matched -%} {# we haven't found a match yet, otherwise skip the rest #} + {%- set match = invoke_macro(pattern_fn, input) -%} + {%- if match is not none -%} + {%- set ns.matched = true -%} + {%- if flags.is_enabled(feature_flags, feature_name) -%} + {%- set ns.result = invoke_macro(action_fn, match) -%} + {%- endif -%} + {%- endif -%} + {%- endif -%} + {%- endfor -%} + {%- if ns.result is none -%} + default answer: + {{- invoke_macro(default_action, input) -}} + {%- else -%} + result: {{- ns.result -}} + {%- endif -%} +{% endmacro %} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/testAndAction.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/testAndAction.j2 new file mode 100644 index 000000000..e69de29bb diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java index 7c58cbb04..961855bb9 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java @@ -19,20 +19,20 @@ public Map transformForMask(Map incomingFlags) t var flags = FeatureFlags.parseJson(incomingFlagStr); log.atInfo().setMessage("parsed flags: {}").addArgument(flags == null ? "[NULL]" : flags.writeJson()).log(); final var template = "" + - "{%- include \"common/featureEnabled.j2\" -%}" + + "{%- import \"common/featureEnabled.j2\" as features -%}" + " { " + "{%- set ns = namespace(debug_info=['list: ']) -%}" + "{%- set ns.debug_info = ['list: '] -%}" + "\"enabledFlags\": \"" + - "{{- is_enabled(features,'testFlag') -}}," + - "{{- is_enabled(features,'testFlag.t1') -}}," + - "{{- is_enabled(features,'testFlag.t2') -}}," + - "{{- is_enabled(features,'nextTestFlag.n1') -}}" + + "{{- features.is_enabled(features,'testFlag') -}}," + + "{{- features.is_enabled(features,'testFlag.t1') -}}," + + "{{- features.is_enabled(features,'testFlag.t2') -}}," + + "{{- features.is_enabled(features,'nextTestFlag.n1') -}}" + "\"" + "}"; - var sanitization = new JinjavaTransformer(template, + var transformed = new JinjavaTransformer(template, src -> flags == null ? Map.of() : Map.of("features", flags)); - return sanitization.transformJson(Map.of()); + return transformed.transformJson(Map.of()); } @Test diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java new file mode 100644 index 000000000..36bbb44a0 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java @@ -0,0 +1,96 @@ +package org.opensearch.migrations.transform; + +import java.io.IOException; +import java.util.Map; + +import org.opensearch.migrations.transform.flags.FeatureFlags; + +import com.fasterxml.jackson.databind.ObjectMapper; +import lombok.extern.slf4j.Slf4j; +import org.junit.jupiter.api.Assertions; +import org.junit.jupiter.api.Test; + +@Slf4j +public class RouteTest { + private static final ObjectMapper objectMapper = new ObjectMapper(); + + private final static String DEFAULT_RESPONSE = "{ \"default\": {}}"; + + public Map doRouting(Map flags, Map inputDoc) { + log.atInfo().setMessage("parsed flags: {}").addArgument(flags).log(); + final var template = "" + + "{%- macro doDefault() -%}" + + " {}" + + "{%- endmacro -%}\n" + + + "{%- macro matchIt(doc) -%}" + + " {{ doc.label | regex_capture('Thing_A(.*)') }}" + + "{%- endmacro -%}\n" + + "{% macro handleIt(matches) %}\n" + + "{% for key, value in matches.items() %}\n" + // TODO - this is a string, not an object! + +// " {{ key }}: {{ value }}
\n" + + "{% endfor %}" + +// " - {{ matches['group'] }} - " + +// " { \"matchedVal\": \"{{ matches['group1'] }}\"}" + + "{% endmacro %}" + + + " {% call doDefault() %}" + + " {{input}}" + + " {% endcall %}" + + + "\n" + + "{%- import \"common/route.j2\" as router -%}" + + "{{- router.route(source, flags, doDefault," + + " [" + + " ('labelMatches', 'matchIt', 'handleIt')" + + " ])" + + "-}}"; + + var transformed = new JinjavaTransformer(template, + src -> flags == null ? Map.of("source", inputDoc) : Map.of("source", inputDoc, "flags", flags)); + return transformed.transformJson(inputDoc); + } + + + @Test + public void test() { + var flags = Map.of( + "first", false, + "second", (Object) true); + var inputDoc = Map.of( + "label", "Thing_A_and more!", + "stuff", Map.of( + "inner1", "data1", + "inner2", "data2" + ) + ); + + log.atInfo().setMessage("parsed flags: {}").addArgument(flags).log(); + final var template = "" + + "{% macro table(predicate_output) %}\n" + + " {{Content of Macro 1\n}}" + + "{% endmacro %}\n" + + "\n"; + var transformed = new JinjavaTransformer(template, + src -> flags == null ? Map.of("source", inputDoc) : Map.of("source", inputDoc, "flags", flags)); + var result = transformed.transformJson(inputDoc); + System.out.println(result); + } + + @Test + public void testA() { + var flagAOff = Map.of( + "first", false, + "second", (Object) true); + var doc = Map.of( + "label", "Thing_A_and more!", + "stuff", Map.of( + "inner1", "data1", + "inner2", "data2" + ) + ); + Assertions.assertEquals("_and more!", doRouting(null, doc).get("matchedVal")); + Assertions.assertTrue(doRouting(flagAOff, doc).isEmpty()); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java index 18056ca7d..67fd561db 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java @@ -14,7 +14,7 @@ @Slf4j @WrapWithNettyLeakDetection(disableLeakChecks = true) -public class TypeMappingsSanitizationTest { +public class TypeMappingsSanitizationProviderTest { static final String TEST_INPUT_REQUEST = "{\n" + " \"method\": \"PUT\",\n" @@ -53,7 +53,9 @@ public void testSimpleTransform() throws JsonProcessingException { "type1", "indexB", "type2", "indexB"), "indexC", Map.of( - "type2", "indexC"));; + "type2", "indexC"), + "(time*)", Map.of( + "(type*)", "\\1_And_\\2"));; var transformer = new TypeMappingSanitizationTransformerProvider().createTransformer(config); var transformedDocument = transformer.transformJson(mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>(){})); From e8dfb3f056549904bf1261e3bffb9e99349d21f1 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Sat, 23 Nov 2024 19:58:33 -0500 Subject: [PATCH 08/26] Get a test that changes some contents via the route macro to pass. Signed-off-by: Greg Schohn --- .../transform/JinjavaTransformer.java | 3 +- .../jinjava/DynamicMacroFunction.java | 3 - .../transform/jinjava/RegexCaptureFilter.java | 4 +- .../main/resources/jinjava/common/route.j2 | 16 ++-- .../transform/FeatureMaskingTest.java | 10 +- .../migrations/transform/RouteTest.java | 92 +++++++++---------- 6 files changed, 57 insertions(+), 71 deletions(-) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index ff4354713..3d5c45057 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -1,5 +1,6 @@ package org.opensearch.migrations.transform; +import java.util.LinkedHashMap; import java.util.List; import java.util.Map; import java.util.Optional; @@ -56,7 +57,7 @@ public JinjavaTransformer(String templateString, public Map transformJson(Map incomingJson) { var resultStr = jinjava.render(templateStr, createContextWithSourceFunction.apply(incomingJson)); log.atInfo().setMessage("output from jinjava... {}").addArgument(resultStr).log(); - var parsedObj = (Map) objectMapper.readValue(resultStr, Map.class); + var parsedObj = (Map) objectMapper.readValue(resultStr, LinkedHashMap.class); return doFinalSubstitutions(incomingJson, parsedObj); } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java index c785a3f9b..685713fca 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java @@ -7,9 +7,6 @@ import com.hubspot.jinjava.interpret.Context; import com.hubspot.jinjava.interpret.JinjavaInterpreter; -import com.hubspot.jinjava.lib.fn.ELFunctionDefinition; -import com.hubspot.jinjava.lib.fn.Functions; -import com.hubspot.jinjava.objects.collections.PyList; import com.hubspot.jinjava.lib.fn.MacroFunction; public class DynamicMacroFunction { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java index 7fce682c9..3612b164b 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java @@ -2,8 +2,8 @@ import java.util.HashMap; -import com.google.re2j.Pattern; import com.google.re2j.Matcher; +import com.google.re2j.Pattern; import com.hubspot.jinjava.interpret.JinjavaInterpreter; import com.hubspot.jinjava.lib.filter.Filter; @@ -36,4 +36,4 @@ public Object filter(Object var, JinjavaInterpreter interpreter, String... args) } return null; } -} \ No newline at end of file +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 index a436fa431..1fa9aef94 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 @@ -1,22 +1,20 @@ -{% import "common/featureEnabled.j2" as flags %} -within import {{ __macros__ | pprint }} -{% macro route(input, feature_flags, default_action, routes) %} +{% import "common/featureEnabled.j2" as fscope %} +{% macro route(input, field_to_match, feature_flags, default_action, routes) %} {%- set ns = namespace(result=none, matched=false) -%} - {%- for feature_name, pattern_fn, action_fn in routes if not ns.matched -%} + {%- for feature_name, pattern, action_fn in routes if not ns.matched -%} {%- if not ns.matched -%} {# we haven't found a match yet, otherwise skip the rest #} - {%- set match = invoke_macro(pattern_fn, input) -%} + {%- set match = field_to_match | regex_capture(pattern) -%} {%- if match is not none -%} {%- set ns.matched = true -%} - {%- if flags.is_enabled(feature_flags, feature_name) -%} - {%- set ns.result = invoke_macro(action_fn, match) -%} + {%- if fscope.is_enabled(feature_flags, feature_name) -%} + {%- set ns.result = invoke_macro(action_fn, match, input) -%} {%- endif -%} {%- endif -%} {%- endif -%} {%- endfor -%} {%- if ns.result is none -%} - default answer: {{- invoke_macro(default_action, input) -}} {%- else -%} - result: {{- ns.result -}} + {{- ns.result -}} {%- endif -%} {% endmacro %} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java index 961855bb9..80a01b102 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/FeatureMaskingTest.java @@ -19,15 +19,15 @@ public Map transformForMask(Map incomingFlags) t var flags = FeatureFlags.parseJson(incomingFlagStr); log.atInfo().setMessage("parsed flags: {}").addArgument(flags == null ? "[NULL]" : flags.writeJson()).log(); final var template = "" + - "{%- import \"common/featureEnabled.j2\" as features -%}" + + "{%- import \"common/featureEnabled.j2\" as fscope -%}" + " { " + "{%- set ns = namespace(debug_info=['list: ']) -%}" + "{%- set ns.debug_info = ['list: '] -%}" + "\"enabledFlags\": \"" + - "{{- features.is_enabled(features,'testFlag') -}}," + - "{{- features.is_enabled(features,'testFlag.t1') -}}," + - "{{- features.is_enabled(features,'testFlag.t2') -}}," + - "{{- features.is_enabled(features,'nextTestFlag.n1') -}}" + + "{{- fscope.is_enabled(features,'testFlag') -}}," + + "{{- fscope.is_enabled(features,'testFlag.t1') -}}," + + "{{- fscope.is_enabled(features,'testFlag.t2') -}}," + + "{{- fscope.is_enabled(features,'nextTestFlag.n1') -}}" + "\"" + "}"; var transformed = new JinjavaTransformer(template, diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java index 36bbb44a0..d0281963d 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java @@ -1,9 +1,9 @@ package org.opensearch.migrations.transform; import java.io.IOException; +import java.util.List; import java.util.Map; - -import org.opensearch.migrations.transform.flags.FeatureFlags; +import java.util.TreeMap; import com.fasterxml.jackson.databind.ObjectMapper; import lombok.extern.slf4j.Slf4j; @@ -23,27 +23,24 @@ public Map doRouting(Map flags, Map\n" + - "{% endfor %}" + -// " - {{ matches['group'] }} - " + -// " { \"matchedVal\": \"{{ matches['group1'] }}\"}" + + "{% macro echoFirstMatch(matches, input) %}\n" + + " { \"matchedVal\": \"{{ matches['group1'] }}\"}" + + "{% endmacro %}" + + "{% macro echoFirstMatchAgain(matches, input) %}\n" + + " { \"again\": \"{{ matches['group1'] }}\"}" + + "{% endmacro %}" + + "{% macro switchStuff(matches, input) %}\n" + + " {% set swapped_list = [input.stuff[1], input.stuff[0]] %}" + + " {% set input = input + {'stuff': swapped_list} %}" + + " {{ input | tojson }} " + "{% endmacro %}" + - " {% call doDefault() %}" + - " {{input}}" + - " {% endcall %}" + - - "\n" + - "{%- import \"common/route.j2\" as router -%}" + - "{{- router.route(source, flags, doDefault," + + "{%- import \"common/route.j2\" as rscope -%}" + + "{{- rscope.route(source, source.label, flags, 'doDefault'," + " [" + - " ('labelMatches', 'matchIt', 'handleIt')" + + " ('matchA', 'Thing_A(.*)', 'echoFirstMatch')," + + " ('matchA', 'Thing_A(.*)', 'echoFirstMatchAgain')," + // make sure that we don't get duplicate results + " ('matchB', 'B(.*)', 'switchStuff')" + " ])" + "-}}"; @@ -52,45 +49,38 @@ public Map doRouting(Map flags, Map flags == null ? Map.of("source", inputDoc) : Map.of("source", inputDoc, "flags", flags)); - var result = transformed.transformJson(inputDoc); - System.out.println(result); - } - - @Test - public void testA() { - var flagAOff = Map.of( - "first", false, - "second", (Object) true); - var doc = Map.of( - "label", "Thing_A_and more!", - "stuff", Map.of( - "inner1", "data1", - "inner2", "data2" + var docB = Map.of( + "label", "B-hive", + "stuff", List.of( + "data1", + "data2" ) ); - Assertions.assertEquals("_and more!", doRouting(null, doc).get("matchedVal")); - Assertions.assertTrue(doRouting(flagAOff, doc).isEmpty()); + { + var resultMap = doRouting(null, docA); + Assertions.assertEquals(1, resultMap.size()); + Assertions.assertEquals("_and more!", resultMap.get("matchedVal")); + } + { + var resultMap = doRouting(flagAOff, docA); + Assertions.assertTrue(resultMap.isEmpty()); + } + { + var resultMap = doRouting(flagAOff, docB); + Assertions.assertEquals("{\"label\":\"B-hive\",\"stuff\":[\"data2\",\"data1\"]}", + objectMapper.writeValueAsString(new TreeMap<>(resultMap))); + } } } From 93dc5c89d5c8154954fd87606b18a11e6743df24 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Sun, 24 Nov 2024 15:46:22 -0500 Subject: [PATCH 09/26] Assorted jinjava template changes for replayer... Switched out Google's re2j for Java's implementation. I didn't realize that the java implementation is closer to python regexes and that re2j (which I had thought was closer to python). Minor tweaks to the route jinja template to make it easier to read when it's invoked. Switched the replayer template to use the route functionality, which is considerably easier to get one's head around. TODO - * I'd like to make the feature flag names the same as the macro name for the route when the feature flag name is omitted. * The test cases for the type mappings sanitization need a lot of work. * When indices are created that DO NOT use type mappings, we should handle those more gracefully. Signed-off-by: Greg Schohn --- .../jsonJinjavaTransformer/build.gradle | 1 - .../transform/jinjava/RegexCaptureFilter.java | 4 +- .../resources/jinjava/common/route-bkp.j2 | 25 -------- .../main/resources/jinjava/common/route.j2 | 3 +- .../resources/jinjava/common/testAndAction.j2 | 0 .../migrations/transform/RouteTest.java | 14 ++--- .../jinjava/typeMappings/replayer.j2 | 44 ++++++------- ...peMappingsSanitizationTransformerTest.java | 62 +++++++++++++++---- 8 files changed, 80 insertions(+), 73 deletions(-) delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route-bkp.j2 delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/testAndAction.j2 diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle index f4b05736e..448b9e529 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle @@ -6,7 +6,6 @@ dependencies { implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') implementation group: 'com.hubspot.jinjava', name: 'jinjava', version: "2.7.3" - implementation group: 'com.google.re2j', name: 're2j', version: "1.7" testImplementation project(':TrafficCapture:trafficReplayer') testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerLoaders') diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java index 3612b164b..ba10ead79 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java @@ -1,9 +1,9 @@ package org.opensearch.migrations.transform.jinjava; import java.util.HashMap; +import java.util.regex.Matcher; +import java.util.regex.Pattern; -import com.google.re2j.Matcher; -import com.google.re2j.Pattern; import com.hubspot.jinjava.interpret.JinjavaInterpreter; import com.hubspot.jinjava.lib.filter.Filter; diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route-bkp.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route-bkp.j2 deleted file mode 100644 index 9e7792f94..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route-bkp.j2 +++ /dev/null @@ -1,25 +0,0 @@ -{% import "common/featureEnabled.j2" as flags %} -{% macro route(input, feature_flags, default_action, routes) %} - {%- set ns = namespace(result=none, matched=false) -%} - {%- for feature_name, pattern, action in routes if not ns.matched -%} - {%- if not ns.matched -%} {# we haven't found a match yet, otherwise skip the rest #} - checking {{ feature_name }}... - {%- set match = none -%} - {%- call pattern(input) -%}{% endcall %} - match {{ match }}... - {%- if match is not none -%} - in a non-null match {{ match }} - in a match! - {%- set ns.matched = true -%} - {%- if flags.is_enabled(feature_flags, feature_name) -%} - {%- set ns.result = action | call(match) -%} - {%- endif -%} - {%- endif -%} - {%- endif -%} - {%- endfor -%} - {%- if ns.result is none -%} - default answer: {{- default_action | call(input) -}} - {%- else -%} - result: {{- ns.result -}} - {%- endif -%} -{% endmacro %} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 index 1fa9aef94..bc4793a4d 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 @@ -1,7 +1,8 @@ {% import "common/featureEnabled.j2" as fscope %} {% macro route(input, field_to_match, feature_flags, default_action, routes) %} {%- set ns = namespace(result=none, matched=false) -%} - {%- for feature_name, pattern, action_fn in routes if not ns.matched -%} + {%- for pattern, action_fn, feature_name_param in routes if not ns.matched -%} + {% set feature_name = feature_name_param | default(action_fn) %} {%- if not ns.matched -%} {# we haven't found a match yet, otherwise skip the rest #} {%- set match = field_to_match | regex_capture(pattern) -%} {%- if match is not none -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/testAndAction.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/testAndAction.j2 deleted file mode 100644 index e69de29bb..000000000 diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java index d0281963d..b5964e548 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java @@ -19,7 +19,7 @@ public class RouteTest { public Map doRouting(Map flags, Map inputDoc) { log.atInfo().setMessage("parsed flags: {}").addArgument(flags).log(); final var template = "" + - "{%- macro doDefault() -%}" + + "{%- macro doDefault(ignored_input) -%}" + " {}" + "{%- endmacro -%}\n" + @@ -38,9 +38,9 @@ public Map doRouting(Map flags, Map regexCache = + CacheBuilder.newBuilder().build(CacheLoader.from((Function)Pattern::compile)); + + @SneakyThrows + private static Pattern getCompiledPattern(String pattern) { + return regexCache.get(pattern); + } + @Override public String getName() { return "regex_capture"; @@ -23,7 +37,7 @@ public Object filter(Object var, JinjavaInterpreter interpreter, String... args) String pattern = args[0]; try { - Matcher matcher = Pattern.compile(pattern).matcher(input); + Matcher matcher = getCompiledPattern(pattern).matcher(input); if (matcher.find()) { var groups = new HashMap<>(); for (int i = 0; i <= matcher.groupCount(); i++) { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java index 2bec339ae..f215c809b 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java @@ -2,10 +2,12 @@ import java.util.Map; +import lombok.extern.slf4j.Slf4j; import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.api.Test; import org.testcontainers.shaded.com.fasterxml.jackson.databind.ObjectMapper; +@Slf4j class JinjavaTransformerTest { private final static String template = "" + @@ -81,6 +83,6 @@ public void test() throws Exception { var objMapper = new ObjectMapper(); var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, Map.class)); var resultStr = objMapper.writeValueAsString(resultObj); - System.out.println("resultStr = " + resultStr); + log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java index e76ea8357..224a4f619 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java @@ -2,24 +2,50 @@ import java.io.IOException; import java.nio.charset.StandardCharsets; +import java.util.List; import java.util.Map; +import java.util.function.Function; import com.google.common.io.Resources; public class TypeMappingsSanitizationTransformer extends JinjavaTransformer { - public TypeMappingsSanitizationTransformer(Map> indexMappings) throws IOException { - this("jinjava/typeMappings/replayer.j2", null, indexMappings); + public static final String REPLAYER_VARIANT = "jinjava/typeMappings/replayer.j2"; + + public TypeMappingsSanitizationTransformer() + throws IOException { + this(REPLAYER_VARIANT, null, null, null); + } + + public TypeMappingsSanitizationTransformer(Map> indexMappings, + List> regexIndexMappings) + throws IOException { + this(REPLAYER_VARIANT, null, indexMappings, regexIndexMappings); } public TypeMappingsSanitizationTransformer(String variantName, Map featureFlags, - Map> indexMappings) throws IOException { + Map> indexMappings, + List> regexIndexMappings) throws IOException { super( makeTemplate(variantName), - incomingJson -> Map.of("request", incomingJson, - "index_mappings", indexMappings, - "featureFlags", featureFlags == null ? Map.of() : featureFlags)); + makeSourceWrapperFunction(featureFlags, indexMappings, regexIndexMappings)); + } + + private static Function, Map> + makeSourceWrapperFunction(Map featureFlagsIncoming, + Map> indexMappingsIncoming, + List> regexIndexMappingsIncoming) + { + var featureFlags = featureFlagsIncoming != null ? featureFlagsIncoming : Map.of(); + var indexMappings = indexMappingsIncoming != null ? indexMappingsIncoming : Map.of(); + var regexIndexMappings = regexIndexMappingsIncoming != null ? regexIndexMappingsIncoming : + (indexMappingsIncoming == null ? List.of(List.of("(.*)", "(.*)", "\\1_\\2")) : List.of()); + + return incomingJson -> Map.of("request", incomingJson, + "index_mappings", indexMappings, + "regex_index_mappings", regexIndexMappings, + "featureFlags", featureFlags); } private static String makeTemplate(String variantName) throws IOException { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 index 70929af79..29910a959 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 @@ -1,27 +1,59 @@ {%- include "common/featureEnabled.j2" -%} -{%- macro default_action(source_and_mappings) -%} -{ - "diagPair": {{ source_and_mappings }}, - "preserve": "*" -} +{%- macro preserve_original(source_and_mappings) -%} + { "preserve": "*" } {%- endmacro -%} -{%- macro rewrite_uri_to_strip_types(match, input_map) -%} -{ - "method": "{{ input_map.request.method }}", - "URI": "/{{ input_map.index_mappings[match.group1][match.group2] }}/_doc/{{ match.group3 }}", - "preserve": ["headers","payload"] -} +{%- macro make_no_op() -%} + { "method": "GET", "URI": "/" } {%- endmacro -%} -{% macro rewrite_create_index(match, input_map) -%} -{# In reality, this is going to need to figure out if there are multiple type mappings and deal with them according.y #} +{%- macro rewrite_uri_to_strip_types(source_index, source_type, regex_index_mappings) -%} + {%- set ns = namespace(target_index=none) -%} + {%- for entry in regex_index_mappings -%} + {%- set idx_regex = entry.get(0) -%} + {%- set type_regex = entry[1] -%} + {%- set target_idx_pattern = entry[2] -%} + + {%- if ns.target_index is none -%} + {%- set conjoined_source = source_index + "/" + source_type -%} + {%- set conjoined_regex = idx_regex + "/" + type_regex -%} + {%- set didMatch = conjoined_source | regex_capture(conjoined_regex) -%} + {%- if didMatch is not none -%} + {%- set ns.target_index = conjoined_source | regex_replace(conjoined_regex, target_idx_pattern) -%} + {%- endif -%} + {%- endif -%} + {%- endfor -%} + {{- ns.target_index -}} +{%- endmacro -%} + +{%- macro rewrite_uri_for_types(match, input_map) -%} + {%- set target_index = (input_map.index_mappings[match.group1] | default({}))[match.group2] -%} + {%- if target_index is none %} {# not sure if default arguments would be eagerly evaluated #} + {%- set target_index = invoke_macro('rewrite_uri_to_strip_types', match.group1, match.group2, input_map.regex_index_mappings) -%} + {%- endif -%} + {%- if target_index is none -%} + {{ make_no_op() }} + {%- else -%} + { + "method": "{{ input_map.request.method }}", + "URI": "/{{ target_index }}/_doc/{{ match.group3 }}", + "preserve": ["headers","payload"] + } + {%- endif -%} +{%- endmacro -%} + +{% macro rewrite_create_index_excise(match, input_map) -%} { "method": "{{ input_map.request.method }}", "URI": "{{ input_map.index_mappings[match.group1] }}", "payload": { "inlinedJsonBody": { + {%- for key, value in input_map.request.body.items() -%} + {%- if key != "mappings" -%} + "{{ key }}": {{ value | tojson }}, + {%- endif -%} + {%- endfor -%} "mappings": { "properties": { "type": { @@ -40,12 +72,28 @@ } {%- endmacro -%} -{% set source_and_mappings = { 'request': request, 'index_mappings': index_mappings} %} +{% macro rewrite_create_index(match, input_map) -%} + {% set target_mappings = input_map.index_mappings[match.group1] | default({}) | length %} + {% if target_mappings == 0 %} + {{ make_no_op() }} + {% elif num_mappings == 1 %} + {{ rewrite_create_index_excise(match, input_map) }} + {% elif num_mappings > 1 %} + {% else %} + {{ preserve_original(input_mappings) }} + {% endif %} +{%- endmacro -%} + +{% set source_and_mappings = { + 'request': request, + 'index_mappings': index_mappings, + 'regex_index_mappings': regex_index_mappings} +%} {%- import "common/route.j2" as rscope -%} -{{- rscope.route(source_and_mappings, request.method + " " + request.URI, flags, 'default_action', +{{- rscope.route(source_and_mappings, request.method + " " + request.URI, flags, 'preserve_original', [ - ('(?:PUT|POST) /([^/]*)/([^/]*)/.*', 'rewrite_uri_to_strip_types', 'rewrite_add_request_to_strip_types'), - ( 'GET /([^/]*)/([^/]*)/.*', 'rewrite_uri_to_strip_types', 'rewrite_get_request_to_strip_types'), - ('(?:PUT|POST) /([^/]*)', 'rewrite_create_index', 'rewrite_create_index') + ('(?:PUT|POST) /([^/]*)/([^/]*)/(.*)', 'rewrite_uri_for_types', 'rewrite_add_request_to_strip_types'), + ( 'GET /([^/]*)/([^/]*)/.*', 'rewrite_uri_for_types', 'rewrite_get_request_to_strip_types'), + ('(?:PUT|POST) /([^/]*)', 'rewrite_create_index', 'rewrite_create_index') ]) -}} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java index e7249845c..bd57a153f 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java @@ -2,13 +2,15 @@ import java.io.IOException; import java.util.LinkedHashMap; +import java.util.List; import java.util.Map; -import java.util.regex.Pattern; +import lombok.extern.slf4j.Slf4j; import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.api.Test; import org.testcontainers.shaded.com.fasterxml.jackson.databind.ObjectMapper; +@Slf4j class TypeMappingsSanitizationTransformerTest { private static TypeMappingsSanitizationTransformer indexTypeMappingRewriter; @@ -23,8 +25,9 @@ static void initialize() throws IOException { "type2", "indexB"), "indexC", Map.of( "type2", "indexC")); - //"time-(*)", Map.of("(*)", "time-\\1-\\2")); - indexTypeMappingRewriter = new TypeMappingsSanitizationTransformer(indexMappings); + var regexIndexMappings = List.of( + List.of("time-(.*)", "(.*)", "time-\\1-\\2")); + indexTypeMappingRewriter = new TypeMappingsSanitizationTransformer(indexMappings, regexIndexMappings); } @Test @@ -44,7 +47,27 @@ public void testPutDoc() throws Exception { var objMapper = new ObjectMapper(); var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, LinkedHashMap.class)); var resultStr = objMapper.writeValueAsString(resultObj); - System.out.println("resultStr = " + resultStr); + log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); + } + + @Test + public void testPutDocRegex() throws Exception { + var testString = + "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/time-nov11/cpu/doc2\",\n" + + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + + " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\": {" + + " \"name\": \"Some User\",\n" + + " \"user_name\": \"user\",\n" + + " \"email\": \"user@example.com\"\n" + + " }\n" + + " }\n" + + "}"; + var objMapper = new ObjectMapper(); + var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, LinkedHashMap.class)); + var resultStr = objMapper.writeValueAsString(resultObj); + log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); } @Test @@ -56,6 +79,9 @@ public void testPutIndex() throws Exception { " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\": " + "{\n" + + " \"settings\" : {\n" + + " \"number_of_shards\" : 1\n" + + " }," + " \"mappings\": {\n" + " \"user\": {\n" + " \"properties\": {\n" + @@ -79,6 +105,6 @@ public void testPutIndex() throws Exception { var objMapper = new ObjectMapper(); var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, LinkedHashMap.class)); var resultStr = objMapper.writeValueAsString(resultObj); - System.out.println("resultStr = " + resultStr); + log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java index 3fd154b8f..89f99a02d 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java @@ -1,31 +1,50 @@ package org.opensearch.migrations.transform; +import java.util.List; import java.util.Map; import lombok.SneakyThrows; public class TypeMappingSanitizationTransformerProvider implements IJsonTransformerProvider { + public static final String FEATURE_FLAGS = "featureFlags"; + public static final String STATIC_MAPPINGS = "staticMappings"; + public static final String REGEX_MAPPINGS = "regexMappings"; + @SneakyThrows @Override public IJsonTransformer createTransformer(Object jsonConfig) { try { - if (jsonConfig instanceof Map) { - return new TypeMappingsSanitizationTransformer((Map>) jsonConfig); - } else { + if (jsonConfig == null) { + return new TypeMappingsSanitizationTransformer(TypeMappingsSanitizationTransformer.REPLAYER_VARIANT, + null, null, null); + } else if (!(jsonConfig instanceof Map)) { throw new IllegalArgumentException(getConfigUsageStr()); } + + var config = (Map) jsonConfig; + return new TypeMappingsSanitizationTransformer(TypeMappingsSanitizationTransformer.REPLAYER_VARIANT, + (Map) config.get(FEATURE_FLAGS), + (Map>) config.get(STATIC_MAPPINGS), + (List>) config.get(REGEX_MAPPINGS)); } catch (ClassCastException e) { throw new IllegalArgumentException(getConfigUsageStr(), e); } } private String getConfigUsageStr() { - return this.getClass().getName() - + " expects the incoming configuration " - + "to be a Map>. " + - "The top-level key is a source index name, that key's children values are the index's type mappings. " + - "The value for the inner keys is the target index name that the " + - "source type's documents should be written to."; + return this.getClass().getName() + " " + + "expects the incoming configuration to be a Map, " + + "with values '" + STATIC_MAPPINGS + "', '" + REGEX_MAPPINGS + "', and '" + FEATURE_FLAGS + "'. " + + "The value of " + STATIC_MAPPINGS + " should be a two-level map where the top-level key is the name " + + "of a source index and that key's dictionary maps each sub-type to a specific target index. " + + REGEX_MAPPINGS + " (List<[List>]) matches index names and sub-types to a target pattern. " + + "The patterns are matched in ascending order, finding the first match. " + + "The items within each top-level " + REGEX_MAPPINGS + " element are [indexRegex, typeRegex, targetPattern]." + + " The targetPattern can contain backreferences ('\\1'...) to refer to captured groups from the regex. " + + "Finally, the " + FEATURE_FLAGS + " is an arbitrarily deep map with boolean leaves. " + + "The " + FEATURE_FLAGS + " map is optional. " + + "When present, it can disable some types of transformations, " + + "such as when they may not be applicable for a given migration."; } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java index 67fd561db..fcc98c1f1 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java @@ -1,5 +1,6 @@ package org.opensearch.migrations.replay; +import java.util.List; import java.util.Map; import org.opensearch.migrations.testutils.WrapWithNettyLeakDetection; @@ -45,38 +46,49 @@ static String emitJson(ObjectMapper mapper, Object transformedDocument) throws J @Test public void testSimpleTransform() throws JsonProcessingException { - var config = Map.of( - "indexA", Map.of( - "type1", "indexA_1", - "type2", "indexA_2"), - "indexB", Map.of( - "type1", "indexB", - "type2", "indexB"), - "indexC", Map.of( - "type2", "indexC"), - "(time*)", Map.of( - "(type*)", "\\1_And_\\2"));; - var transformer = new TypeMappingSanitizationTransformerProvider().createTransformer(config); + var config = Map.of("staticMappings", + Map.of( + "indexA", Map.of( + "type1", "indexA_1", + "type2", "indexA_2"), + "indexB", Map.of( + "type1", "indexB", + "type2", "indexB"), + "indexC", Map.of( + "type2", "indexC")), + "regexMappings", List.of(List.of("(time*)", "(type*)", "\\1_And_\\2"))); + var provider = new TypeMappingSanitizationTransformerProvider(); + var transformer = provider.createTransformer(config); var transformedDocument = - transformer.transformJson(mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>(){})); + transformer.transformJson(mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>() { + })); var outputStr = emitJson(mapper, transformedDocument); log.atInfo().setMessage("output={}").addArgument(outputStr).log(); final String TEST_OUTPUT_REQUEST = "{\n" - + " \"method\": \"PUT\",\n" - + " \"URI\": \"/indexA_2/_doc/someuser\",\n" - + " \"headers\": {\n" - + " \"host\": \"127.0.0.1\"\n" - + " },\n" - + " \"payload\": {\n" - + " \"inlinedJsonBody\": {\n" - + " \"name\": \"Some User\",\n" - + " \"user_name\": \"user\",\n" - + " \"email\": \"user@example.com\"\n" - + " }\n" - + " }\n" - + "}\n"; + + " \"method\": \"PUT\",\n" + + " \"URI\": \"/indexA_2/_doc/someuser\",\n" + + " \"headers\": {\n" + + " \"host\": \"127.0.0.1\"\n" + + " },\n" + + " \"payload\": {\n" + + " \"inlinedJsonBody\": {\n" + + " \"name\": \"Some User\",\n" + + " \"user_name\": \"user\",\n" + + " \"email\": \"user@example.com\"\n" + + " }\n" + + " }\n" + + "}\n"; - Assertions.assertEquals(normalize(mapper, TEST_OUTPUT_REQUEST), normalize(mapper, outputStr)); + var normalizedOutput = normalize(mapper, TEST_OUTPUT_REQUEST); + Assertions.assertEquals(normalizedOutput, normalize(mapper, outputStr)); + { + var resultFromNullConfig = provider.createTransformer(null) + .transformJson(mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>() { + })); + Assertions.assertEquals(normalizedOutput + .replace("/indexA_2/_doc/someuser", "/1_2/_doc/someuser"), + normalize(mapper, emitJson(mapper, resultFromNullConfig))); + } } } From 0712eae349fd87a7271f14d8b1c5ee85cf61a376 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Mon, 2 Dec 2024 10:58:05 -0500 Subject: [PATCH 11/26] Further work to support bulk delete, index create with type mapping migration, and regex target index patterns. Fix regex replace to use java's regex classes instead of the builtin ones. The builtin filter uses Google's re2j library, which doesn't do backreferences. Now both capture and replace use custom filters that use the builtin java regex library. Tests are in place to do some index remapping w/ backreferenced captures. For bulk APIs, only the delete command is fully supported, but the structure for the others should be in place. I've also worked on improving the test for creating an index and fixed numerous issues there. It's also CRITICAL to note that constructing dictionaries in jinjava with keys that are defined via variables is NOT SUPPORTED. See https://github.com/HubSpot/jinjava/issues/379. The workaround that I'm currently using is to construct a map as a string in json and parse it into a map - or to construct maps dynamically. Also note that python dictionary operations like 'update' or 'delete' are NOT present since we don't have the luxury of overriding the dictionary implementation easily. This is also something that has a significant impact on the ease of use for jinjava and to maintain compatibility to the python implementation. Signed-off-by: Greg Schohn --- .../transform/JinjavaTransformer.java | 15 ++- ...ilter.java => JavaRegexCaptureFilter.java} | 2 +- .../jinjava/JavaRegexReplaceFilter.java | 50 ++++++++ .../transform/jinjava/ThrowTag.java | 46 +++++++ .../jinjava/common/featureEnabled.j2 | 4 +- .../main/resources/jinjava/common/route.j2 | 9 +- .../build.gradle | 2 + .../jinjava/typeMappings/makeNoop.j2 | 3 + .../jinjava/typeMappings/preserveAll.j2 | 3 + .../jinjava/typeMappings/replayer.j2 | 101 ++------------- .../typeMappings/rewriteBulkRequest.j2 | 76 ++++++++++++ .../typeMappings/rewriteCreateIndexRequest.j2 | 58 +++++++++ .../typeMappings/rewriteDocumentRequest.j2 | 15 +++ .../typeMappings/rewriteIndexForTarget.j2 | 24 ++++ ...ppingsSanitizationTransformerBulkTest.java | 98 +++++++++++++++ ...peMappingsSanitizationTransformerTest.java | 116 ++++++++++++------ 16 files changed, 479 insertions(+), 143 deletions(-) rename transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/{RegexCaptureFilter.java => JavaRegexCaptureFilter.java} (96%) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/ThrowTag.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/makeNoop.j2 create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/preserveAll.j2 create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index 3d5c45057..abfcccf5a 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -7,8 +7,10 @@ import java.util.function.Function; import org.opensearch.migrations.transform.jinjava.DynamicMacroFunction; +import org.opensearch.migrations.transform.jinjava.JavaRegexCaptureFilter; +import org.opensearch.migrations.transform.jinjava.JavaRegexReplaceFilter; import org.opensearch.migrations.transform.jinjava.NameMappingClasspathResourceLocator; -import org.opensearch.migrations.transform.jinjava.RegexCaptureFilter; +import org.opensearch.migrations.transform.jinjava.ThrowTag; import com.fasterxml.jackson.databind.ObjectMapper; import com.hubspot.jinjava.Jinjava; @@ -38,17 +40,18 @@ public JinjavaTransformer(String templateString, jinjava = new Jinjava(); this.createContextWithSourceFunction = createContextWithSource; jinjava.setResourceLocator(resourceLocator); - jinjava.getGlobalContext().registerFilter(new RegexCaptureFilter()); - var dynamicMacroFunction = new ELFunctionDefinition( + jinjava.getGlobalContext().registerFilter(new JavaRegexCaptureFilter()); + jinjava.getGlobalContext().registerFilter(new JavaRegexReplaceFilter()); + + jinjava.getGlobalContext().registerFunction(new ELFunctionDefinition( "", "invoke_macro", DynamicMacroFunction.class, "invokeMacro", String.class, Object[].class - ); - - jinjava.getGlobalContext().registerFunction(dynamicMacroFunction); + )); + jinjava.getGlobalContext().registerTag(new ThrowTag()); this.templateStr = templateString; } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexCaptureFilter.java similarity index 96% rename from transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java rename to transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexCaptureFilter.java index 7e1cbdd6b..5fbd6610d 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexCaptureFilter.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexCaptureFilter.java @@ -12,7 +12,7 @@ import com.hubspot.jinjava.lib.filter.Filter; import lombok.SneakyThrows; -public class RegexCaptureFilter implements Filter { +public class JavaRegexCaptureFilter implements Filter { private static LoadingCache regexCache = CacheBuilder.newBuilder().build(CacheLoader.from((Function)Pattern::compile)); diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java new file mode 100644 index 000000000..fe36364bf --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java @@ -0,0 +1,50 @@ +package org.opensearch.migrations.transform.jinjava; + +import java.util.regex.Matcher; +import java.util.regex.Pattern; + +import com.google.common.base.Function; +import com.google.common.cache.CacheBuilder; +import com.google.common.cache.CacheLoader; +import com.google.common.cache.LoadingCache; +import com.hubspot.jinjava.interpret.JinjavaInterpreter; +import com.hubspot.jinjava.lib.filter.Filter; +import lombok.SneakyThrows; +import lombok.extern.slf4j.Slf4j; + +@Slf4j +public class JavaRegexReplaceFilter implements Filter { + + private static LoadingCache regexCache = + CacheBuilder.newBuilder().build(CacheLoader.from((Function)Pattern::compile)); + + @SneakyThrows + private static Pattern getCompiledPattern(String pattern) { + return regexCache.get(pattern); + } + + @Override + public String getName() { + return "regex_replace"; + } + + @Override + public Object filter(Object var, JinjavaInterpreter interpreter, String... args) { + if (var == null || args.length < 2) { + return null; + } + + String input = var.toString(); + String pattern = args[0]; + String replacement = args[1]; + + try { + Matcher matcher = getCompiledPattern(pattern).matcher(input); + var rval = matcher.replaceAll(replacement); + log.atError().setMessage("replaced value {}").addArgument(rval).log(); + return rval; + } catch (Exception e) { + return null; + } + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/ThrowTag.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/ThrowTag.java new file mode 100644 index 000000000..b4e314181 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/ThrowTag.java @@ -0,0 +1,46 @@ +package org.opensearch.migrations.transform.jinjava; + +import com.hubspot.jinjava.doc.annotations.JinjavaDoc; +import com.hubspot.jinjava.doc.annotations.JinjavaParam; +import com.hubspot.jinjava.doc.annotations.JinjavaSnippet; +import com.hubspot.jinjava.interpret.JinjavaInterpreter; +import com.hubspot.jinjava.lib.tag.Tag; +import com.hubspot.jinjava.tree.TagNode; + +@JinjavaDoc( + value = "Throws a runtime exception with the specified message", + params = { + @JinjavaParam(value = "message", type = "string", desc = "The error message to throw") + }, + snippets = { + @JinjavaSnippet( + code = "{% throw 'Invalid input provided' %}" + ) + } +) + +public class ThrowTag implements Tag { + private static final String TAG_NAME = "throw"; + + @Override + public String getName() { + return TAG_NAME; + } + + @Override + public String interpret(TagNode tagNode, JinjavaInterpreter interpreter) { + String message = interpreter.render(tagNode.getHelpers().trim()); + throw new JinjavaThrowTagException(message); + } + + public static class JinjavaThrowTagException extends RuntimeException { + public JinjavaThrowTagException(String message) { + super(message); + } + } + + @Override + public String getEndTagName() { + return null; + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 index 2d44f468c..a7c2f6222 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 @@ -5,8 +5,8 @@ {%- set ns = namespace(value=features) -%} {%- set debug = namespace(log=[]) -%} {%- for key in (path | split('.')) -%} - {% set debug.log = debug.log + ["k:"+key] -%} - {% set debug.log = debug.log + ["ismapping?:"+(ns.value is mapping)] -%} + {%- set debug.log = debug.log + ["k:"+key] -%} + {%- set debug.log = debug.log + ["ismapping?:"+(ns.value is mapping)] -%} {%- if ns.value is mapping and key in ns.value -%} {%- set ns.value = ns.value[key] -%} {%- else -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 index bc4793a4d..47543b7ca 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 @@ -1,8 +1,9 @@ -{% import "common/featureEnabled.j2" as fscope %} -{% macro route(input, field_to_match, feature_flags, default_action, routes) %} +{%- import "common/featureEnabled.j2" as fscope -%} +{%- import "common/featureEnabled.j2" as fscope -%} +{%- macro route(input, field_to_match, feature_flags, default_action, routes) -%} {%- set ns = namespace(result=none, matched=false) -%} {%- for pattern, action_fn, feature_name_param in routes if not ns.matched -%} - {% set feature_name = feature_name_param | default(action_fn) %} + {%- set feature_name = feature_name_param | default(action_fn) -%} {%- if not ns.matched -%} {# we haven't found a match yet, otherwise skip the rest #} {%- set match = field_to_match | regex_capture(pattern) -%} {%- if match is not none -%} @@ -18,4 +19,4 @@ {%- else -%} {{- ns.result -}} {%- endif -%} -{% endmacro %} \ No newline at end of file +{%- endmacro -%} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle index 05540ced8..f0912fded 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle @@ -13,7 +13,9 @@ dependencies { testImplementation testFixtures(project(path: ':testHelperFixtures')) testImplementation testFixtures(project(path: ':TrafficCapture:trafficReplayer')) + testImplementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' testImplementation group: 'com.google.guava', name: 'guava' + testImplementation group: 'org.hamcrest', name: 'hamcrest' testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-api' testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-params' testImplementation group: 'org.slf4j', name: 'slf4j-api' diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/makeNoop.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/makeNoop.j2 new file mode 100644 index 000000000..e34232799 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/makeNoop.j2 @@ -0,0 +1,3 @@ +{%- macro make_request() -%} + { "method": "GET", "URI": "/" } +{%- endmacro -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/preserveAll.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/preserveAll.j2 new file mode 100644 index 000000000..009f4b094 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/preserveAll.j2 @@ -0,0 +1,3 @@ +{%- macro make_keep_json(source_and_mappings) -%} + { "preserve": "*" } +{%- endmacro -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 index 29910a959..f6cbdcdd2 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 @@ -1,99 +1,20 @@ -{%- include "common/featureEnabled.j2" -%} - -{%- macro preserve_original(source_and_mappings) -%} - { "preserve": "*" } -{%- endmacro -%} - -{%- macro make_no_op() -%} - { "method": "GET", "URI": "/" } -{%- endmacro -%} - -{%- macro rewrite_uri_to_strip_types(source_index, source_type, regex_index_mappings) -%} - {%- set ns = namespace(target_index=none) -%} - {%- for entry in regex_index_mappings -%} - {%- set idx_regex = entry.get(0) -%} - {%- set type_regex = entry[1] -%} - {%- set target_idx_pattern = entry[2] -%} - - {%- if ns.target_index is none -%} - {%- set conjoined_source = source_index + "/" + source_type -%} - {%- set conjoined_regex = idx_regex + "/" + type_regex -%} - {%- set didMatch = conjoined_source | regex_capture(conjoined_regex) -%} - {%- if didMatch is not none -%} - {%- set ns.target_index = conjoined_source | regex_replace(conjoined_regex, target_idx_pattern) -%} - {%- endif -%} - {%- endif -%} - {%- endfor -%} - {{- ns.target_index -}} -{%- endmacro -%} - -{%- macro rewrite_uri_for_types(match, input_map) -%} - {%- set target_index = (input_map.index_mappings[match.group1] | default({}))[match.group2] -%} - {%- if target_index is none %} {# not sure if default arguments would be eagerly evaluated #} - {%- set target_index = invoke_macro('rewrite_uri_to_strip_types', match.group1, match.group2, input_map.regex_index_mappings) -%} - {%- endif -%} - {%- if target_index is none -%} - {{ make_no_op() }} - {%- else -%} - { - "method": "{{ input_map.request.method }}", - "URI": "/{{ target_index }}/_doc/{{ match.group3 }}", - "preserve": ["headers","payload"] - } - {%- endif -%} -{%- endmacro -%} - -{% macro rewrite_create_index_excise(match, input_map) -%} -{ - "method": "{{ input_map.request.method }}", - "URI": "{{ input_map.index_mappings[match.group1] }}", - "payload": { - "inlinedJsonBody": { - {%- for key, value in input_map.request.body.items() -%} - {%- if key != "mappings" -%} - "{{ key }}": {{ value | tojson }}, - {%- endif -%} - {%- endfor -%} - "mappings": { - "properties": { - "type": { - "type": "keyword" - } - {%- for type_name, type_props in input_map.request.body.mappings.items() -%} - {%- for prop_name, prop_def in type_props.properties.items() -%} - , - "{{- prop_name -}}": {{- prop_def | tojson -}} - {%- endfor -%} - {%- endfor -%} - } - } - } - } -} -{%- endmacro -%} +{%- import "common/route.j2" as rscope -%} +{%- import "typeMappings/preserveAll.j2" as preserve -%} +{%- include "typeMappings/rewriteDocumentRequest.j2" -%} +{%- include "typeMappings/rewriteBulkRequest.j2" -%} +{%- include "typeMappings/rewriteCreateIndexRequest.j2" -%} -{% macro rewrite_create_index(match, input_map) -%} - {% set target_mappings = input_map.index_mappings[match.group1] | default({}) | length %} - {% if target_mappings == 0 %} - {{ make_no_op() }} - {% elif num_mappings == 1 %} - {{ rewrite_create_index_excise(match, input_map) }} - {% elif num_mappings > 1 %} - {% else %} - {{ preserve_original(input_mappings) }} - {% endif %} -{%- endmacro -%} -{% set source_and_mappings = { +{%- set source_and_mappings = { 'request': request, 'index_mappings': index_mappings, 'regex_index_mappings': regex_index_mappings} -%} -{%- import "common/route.j2" as rscope -%} -{{- rscope.route(source_and_mappings, request.method + " " + request.URI, flags, 'preserve_original', +-%} +{{- rscope.route(source_and_mappings, request.method + " " + request.URI, flags, 'make_keep_json', [ - ('(?:PUT|POST) /([^/]*)/([^/]*)/(.*)', 'rewrite_uri_for_types', 'rewrite_add_request_to_strip_types'), - ( 'GET /([^/]*)/([^/]*)/.*', 'rewrite_uri_for_types', 'rewrite_get_request_to_strip_types'), + ('(?:PUT|POST) /([^/]*)/([^/]*)/(.*)', 'rewrite_doc_request', 'rewrite_add_request_to_strip_types'), + ( 'GET /([^/]*)/([^/]*)/.*', 'rewrite_doc_request', 'rewrite_get_request_to_strip_types'), + ('(?:PUT|POST) /_bulk', 'rewrite_bulk', 'rewrite_bulk'), ('(?:PUT|POST) /([^/]*)', 'rewrite_create_index', 'rewrite_create_index') ]) -}} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 new file mode 100644 index 000000000..c611a3178 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 @@ -0,0 +1,76 @@ +{%- include "typeMappings/rewriteIndexForTarget.j2" -%} +{%- import "typeMappings/rewriteIndexForTarget.j2" as transidx -%} + +{%- macro run_create(command, target_index, doc) -%} +{%- endmacro -%} +{%- macro run_index(command, target_index, doc) -%} +{%- endmacro -%} + +{%- macro run_delete(command, target_index) -%} + {%- if target_index -%} + {%- set ns = namespace(delete_inner={}) -%} + {%- for key, value in command.items() -%} + {%- if key != '_type' and key != '_index' -%} + {%- set inner_json = value | tojson -%} + {%- set jsonblob = ("{\"" + key + "\":" + inner_json + "}") | fromjson -%} + {%- set ns.delete_inner = ns.delete_inner + jsonblob -%} + {%- endif -%} + {%- endfor -%} + {%- set index_json = target_index | tojson -%} + {%- set index_blob = ("{\"_index\":" + index_json + "}") | fromjson -%} + {%- set ns.delete_inner = ns.delete_inner + index_blob -%} + {%- set final_json = ("{\"delete\":" + (ns.delete_inner | tojson) + "}") | fromjson -%} + {{ final_json | tojson }} + {%- endif -%} +{%- endmacro -%} + +{%- macro run_update(command, target_index, doc) -%} +{%- endmacro -%} +{%- macro rewrite_bulk_for_default_source_index(uri_match, input_map, source_index) -%} +{ + "preserve": ["headers","method","URI","protocol"], + "payload": { + "inlinedJsonSequenceBodies": [ + {%- set operation_types = ['delete', 'update', 'index', 'create'] -%} + {%- for item in input_map.request.payload.inlinedJsonSequenceBodies -%} + {%- set operation = namespace(type=None) -%} + {%- for type in operation_types -%} + {%- if item is mapping and type in item -%} + {%- set operation.type = type -%} + {%- endif -%} + {%- endfor -%} + + {%- if operation.type is not none -%} + {%- set command = item[operation.type] -%} + {%- set target_index = transidx.convert_source_index_to_target(command['_index'], command['_type'], input_map.index_mappings, input_map.regex_index_mappings) -%} +{# command['_index'] {{ command['_index'] }}, command['_type'] = {{ command['_type'] }}, input_map.index_mappings = {{ input_map.index_mappings }}, input_map.regex_index_mappings = {{ input_map.regex_index_mappings }})#} + {%- if operation.type == 'delete' -%} + {{ run_delete(command, target_index) }} + {%- else -%} + {%- if loop.index < operations|length -%} + {%- set next_item = operations[loop.index] -%} + {%- if operation.type == 'create' -%} + {{ run_create(command, target_index, next_item) }} + {%- elif operation.type == 'update' -%} + {{ run_update(command, target_index, next_item) }} + {%- elif operation.type == 'index' -%} + {{ run_index(command, target_index, next_item) }} + {%- endif -%} + {%- set loop.index = loop.index + 1 -%} + {%- else -%} + Handle case where there's no next item but one was expected + {# {{ throw_error('Expected document after ' + operation.type + ' operation') }}#} + {%- endif -%} + {%- endif -%} + {%- else -%} + Handle case where no valid operation type was found + {# {{ throw_error('Invalid operation type in item: ' + item|string) }}#} + {%- endif -%} + {%- endfor -%} + ] + } +} +{%- endmacro -%} +{%- macro rewrite_bulk(match, input_map) -%} + {{ rewrite_bulk_for_default_source_index(match, input_map, none) }} +{%- endmacro -%} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 new file mode 100644 index 000000000..498454e57 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 @@ -0,0 +1,58 @@ +{%- import "typeMappings/makeNoop.j2" as noop -%} +{%- import "typeMappings/preserveAll.j2" as preserve -%} + +{%- macro rewrite_create_index_as_unioned_excise(source_index_name, target_index_name, input_map) -%} + {%- set source_input_types = input_map.index_mappings[source_index_name] -%} + {%- set source_type_name = source_input_types.keys() | first() -%} + { + "method": "{{ input_map.request.method }}", + "URI": "/{{ target_index_name }}", + "payload": { + "inlinedJsonBody": { + {%- for key, value in input_map.request.payload.inlinedJsonBody.items() -%} + {%- if key != "mappings" -%} + "{{ key }}": {{ value | tojson }}, + {%- endif -%} + {%- endfor -%} + "mappings": { + "properties": { + {%- set ns = namespace(combined_props={"type": "keyword"}) -%} + {%- for source_type_name in source_input_types.keys() -%} + {%- set type_props = input_map.request.payload.inlinedJsonBody.mappings.get(source_type_name) -%} + {%- for prop_name, prop_def in type_props.properties.items() -%} + {%- if prop_name in ns.combined_props -%} + {%- if ns.combined_props[prop_name] != prop_def -%} + {%- throw "Conflicting definitions for property {{ prop_name }} ({{ ns.combined_props[prop_name] }} and {{ prop_def }})" -%} + {%- endif -%} + {%- else -%} + {%- set body = prop_def | tojson -%} + {%- set jsonblob = ("{\"" + prop_name + "\":" + body + "}") | fromjson -%} + {%- set ns.combined_props = ns.combined_props + jsonblob -%} + {%- endif -%} + {%- endfor -%} + {%- endfor -%} + + {%- for prop_name, prop_def in ns.combined_props.items() -%} + "{{- prop_name -}}": {{- prop_def | tojson -}}, + {%- endfor -%} + + "type": { "type": "keyword" } + } + } + } + } + } +{%- endmacro -%} +{%- macro rewrite_create_index(match, input_map) -%} + {%- set source_index_name = match.group1 -%} + {%- set target_indices = (input_map.index_mappings[source_index_name] | default({})).values() | unique() -%} + {%- set num_mappings = target_indices | length -%} + {%- if num_mappings == 0 -%} + {{- noop.make_request() -}} + {%- elif num_mappings == 1 -%} + {{- rewrite_create_index_as_unioned_excise(source_index_name, (target_indices | first), input_map) -}} + {%- elif num_mappings > 1 -%} + {# Need to extend the replayer to allow multiple requests since this needs to become multiple requests #} + {{- preserve.make_keep_json(input_mappings) -}} + {%- endif -%} +{%- endmacro -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 new file mode 100644 index 000000000..f35fb3f0d --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 @@ -0,0 +1,15 @@ +{%- import "typeMappings/makeNoop.j2" as noop -%} +{%- import "typeMappings/rewriteIndexForTarget.j2" as transidx -%} + +{%- macro rewrite_doc_request(match, input_map) -%} + {%- set target_index = transidx.convert_source_index_to_target(match.group1, match.group2, input_map.index_mappings, input_map.regex_index_mappings) -%} + {%- if target_index is none -%} + {{- noop.make_request() -}} + {%- else -%} + { + "method": "{{ input_map.request.method }}", + "URI": "/{{ target_index }}/_doc/{{ match.group3 }}", + "preserve": ["headers","payload"] + } + {%- endif -%} +{%- endmacro -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 new file mode 100644 index 000000000..588d809ca --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 @@ -0,0 +1,24 @@ +{%- macro convert_source_index_to_target_via_regex(source_index, source_type, regex_index_mappings) -%} + {%- set ns = namespace(target_index=none) -%} + {%- for idx_regex, type_regex, target_idx_pattern in regex_index_mappings -%} + {%- if ns.target_index is none -%} + {%- set conjoined_source = source_index + "/" + source_type -%} + {%- set conjoined_regex = idx_regex + "/" + type_regex -%} + {%- set didMatch = conjoined_source | regex_capture(conjoined_regex) -%} + {%- if didMatch is not none -%} +{# conjoined_source = {{ conjoined_source }} conjoined_regex {{ conjoined_regex }} target_idx_pattern = {{ target_idx_pattern }}#} + {%- set ns.target_index = conjoined_source | regex_replace(conjoined_regex, target_idx_pattern) -%} + {%- endif -%} + {%- endif -%} + {%- endfor -%} + {{- ns.target_index -}} +{%- endmacro -%} + +{%- macro convert_source_index_to_target(source_index, source_type, index_mappings, regex_index_mappings) -%} + {%- set ns = namespace(target_index=none) -%} + {%- set ns.target_index2 = (index_mappings[source_index] | default({}))[source_type] -%} + {%- if ns.target_index2 is none -%} + {%- set ns.target_index2 = convert_source_index_to_target_via_regex(source_index, source_type, regex_index_mappings) -%} + {%- endif -%} + {{ ns.target_index2 }} +{%- endmacro -%} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java new file mode 100644 index 000000000..bb7215461 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java @@ -0,0 +1,98 @@ +package org.opensearch.migrations.transform; + +import java.io.IOException; +import java.util.LinkedHashMap; +import java.util.List; +import java.util.Map; + +import com.fasterxml.jackson.core.JsonProcessingException; +import com.fasterxml.jackson.databind.ObjectMapper; +import com.fasterxml.jackson.databind.SerializationFeature; +import lombok.extern.slf4j.Slf4j; +import org.junit.jupiter.api.Assertions; +import org.junit.jupiter.api.BeforeAll; +import org.junit.jupiter.api.Test; + +import static org.hamcrest.Matchers.*; + +@Slf4j +public class TypeMappingsSanitizationTransformerBulkTest { + + private final static ObjectMapper OBJECT_MAPPER = new ObjectMapper(); + private static TypeMappingsSanitizationTransformer indexTypeMappingRewriter; + @BeforeAll + static void initialize() throws IOException { + var indexMappings = Map.of( + "indexA", Map.of( + "type1", "indexA_1", + "type2", "indexA_2"), + "indexB", Map.of( + "type1", "indexB", + "type2", "indexB"), + "indexC", Map.of( + "type2", "indexC")); + var regexIndexMappings = List.of( + List.of("time-(.*)", "(.*)", "time-$1-$2")); + indexTypeMappingRewriter = new TypeMappingsSanitizationTransformer(indexMappings, regexIndexMappings); + } + + @Test + public void testBulk() throws Exception { + var testString = + "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.PROTOCOL_KEY + "\": \"HTTP/1.1\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/_bulk\",\n" + + " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {},\n" + + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + + " \"" + JsonKeysForHttpMessage.INLINED_NDJSON_BODIES_DOCUMENT_KEY + "\": [\n" + +// "{ \"index\" : { \"_index\" : \"test\", \"_type\" : \"type1\", \"_id\" : \"1\" } },\n" + +// "{ \"field1\" : \"value1\" },\n" + + "{ \"delete\" : { \"_index\" : \"test\", \"_type\" : \"type1\", \"_id\" : \"2\" } },\n" + + "{ \"delete\" : { \"_index\" : \"time-January_1970\", \"_type\" : \"cpu\", \"_id\" : \"8\" } }\n" + +// "{ \"create\" : { \"_index\" : \"test\", \"_type\" : \"type1\", \"_id\" : \"3\" } },\n" + +// "{ \"field1\" : \"value3\" },\n" + +// "{ \"update\" : {\"_id\" : \"1\", \"_type\" : \"type1\", \"_index\" : \"test\"} },\n" + +// "{ \"doc\" : {\"field2\" : \"value2\"} }\n" + + " ]\n" + + " }\n" + + "}"; + + var expectedString = + "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.PROTOCOL_KEY + "\": \"HTTP/1.1\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/_bulk\",\n" + + " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {},\n" + + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + + " \"" + JsonKeysForHttpMessage.INLINED_NDJSON_BODIES_DOCUMENT_KEY + "\": [\n" + +// "{ \"index\" : { \"_index\" : \"test\", \"_type\" : \"type1\", \"_id\" : \"1\" } },\n" + +// "{ \"field1\" : \"value1\" },\n" + + "{ \"delete\" : { \"_index\" : \"time-January_1970-cpu\", \"_id\" : \"8\" } }\n" + +// "{ \"create\" : { \"_index\" : \"test\", \"_type\" : \"type1\", \"_id\" : \"3\" } },\n" + +// "{ \"field1\" : \"value3\" },\n" + +// "{ \"update\" : {\"_id\" : \"1\", \"_type\" : \"type1\", \"_index\" : \"test\"} },\n" + +// "{ \"doc\" : {\"field2\" : \"value2\"} }\n" + + " ]\n" + + " }\n" + + "}"; + + + var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + log.atInfo().setMessage("resultStr = {}").addArgument(() -> { + try { + return OBJECT_MAPPER.writeValueAsString(resultObj); + } catch (JsonProcessingException e) { + throw new RuntimeException(e); + } + }).log(); + Assertions.assertEquals(normalize(OBJECT_MAPPER.readValue(expectedString, LinkedHashMap.class)), normalize(resultObj)); + } + + static String normalize(Object obj) throws Exception { + return new ObjectMapper() + .configure(SerializationFeature.ORDER_MAP_ENTRIES_BY_KEYS, true) + .configure(SerializationFeature.INDENT_OUTPUT, true) + .writeValueAsString(obj); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java index bd57a153f..216b69e94 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java @@ -1,17 +1,21 @@ package org.opensearch.migrations.transform; import java.io.IOException; +import java.util.HashMap; import java.util.LinkedHashMap; import java.util.List; import java.util.Map; +import com.fasterxml.jackson.databind.ObjectMapper; +import com.fasterxml.jackson.databind.node.ObjectNode; import lombok.extern.slf4j.Slf4j; +import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.api.Test; -import org.testcontainers.shaded.com.fasterxml.jackson.databind.ObjectMapper; @Slf4j class TypeMappingsSanitizationTransformerTest { + private final static ObjectMapper objMapper = new ObjectMapper(); private static TypeMappingsSanitizationTransformer indexTypeMappingRewriter; @BeforeAll @@ -23,8 +27,9 @@ static void initialize() throws IOException { "indexB", Map.of( "type1", "indexB", "type2", "indexB"), - "indexC", Map.of( - "type2", "indexC")); + "socialTypes", Map.of( + "tweet", "communal", + "user", "communal")); var regexIndexMappings = List.of( List.of("time-(.*)", "(.*)", "time-\\1-\\2")); indexTypeMappingRewriter = new TypeMappingsSanitizationTransformer(indexMappings, regexIndexMappings); @@ -44,7 +49,6 @@ public void testPutDoc() throws Exception { " }\n" + " }\n" + "}"; - var objMapper = new ObjectMapper(); var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, LinkedHashMap.class)); var resultStr = objMapper.writeValueAsString(resultObj); log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); @@ -64,47 +68,79 @@ public void testPutDocRegex() throws Exception { " }\n" + " }\n" + "}"; - var objMapper = new ObjectMapper(); var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, LinkedHashMap.class)); var resultStr = objMapper.writeValueAsString(resultObj); log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); } - @Test - public void testPutIndex() throws Exception { - var testString = + private static String makeMultiTypePutIndexRequest(String indexName) { + return "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/" + indexName + "\",\n" + + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + + " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\": " + "{\n" + - " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + - " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/indexA\",\n" + - " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + - " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\": " + - "{\n" + - " \"settings\" : {\n" + - " \"number_of_shards\" : 1\n" + - " }," + - " \"mappings\": {\n" + - " \"user\": {\n" + - " \"properties\": {\n" + - " \"name\": { \"type\": \"text\" },\n" + - " \"user_name\": { \"type\": \"keyword\" },\n" + - " \"email\": { \"type\": \"keyword\" }\n" + - " }\n" + - " },\n" + - " \"tweet\": {\n" + - " \"properties\": {\n" + - " \"content\": { \"type\": \"text\" },\n" + - " \"user_name\": { \"type\": \"keyword\" },\n" + - " \"tweeted_at\": { \"type\": \"date\" }\n" + - " }\n" + - " }\n" + - " }\n" + - "}" + - "\n" + - " }\n" + - "}"; - var objMapper = new ObjectMapper(); - var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, LinkedHashMap.class)); - var resultStr = objMapper.writeValueAsString(resultObj); - log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); + " \"settings\" : {\n" + + " \"number_of_shards\" : 1\n" + + " }," + + " \"mappings\": {\n" + + " \"user\": {\n" + + " \"properties\": {\n" + + " \"name\": { \"type\": \"text\" },\n" + + " \"user_name\": { \"type\": \"keyword\" },\n" + + " \"email\": { \"type\": \"keyword\" }\n" + + " }\n" + + " },\n" + + " \"tweet\": {\n" + + " \"properties\": {\n" + + " \"content\": { \"type\": \"text\" },\n" + + " \"user_name\": { \"type\": \"keyword\" },\n" + + " \"tweeted_at\": { \"type\": \"date\" }\n" + + " }\n" + + " },\n" + + " \"following\": {\n" + + " \"properties\": {\n" + + " \"count\": { \"type\": \"integer\" },\n" + + " \"followers\": { \"type\": \"string\" }\n" + + " }\n" + + " }\n" + + " }\n" + + "}" + + "\n" + + " }\n" + + "}"; + } + + Map doPutIndex(String indexName) throws Exception { + var testString = makeMultiTypePutIndexRequest(indexName); + return indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, LinkedHashMap.class)); + } + + @Test + public void testPutSingleTypeIndex() throws Exception { + final String index = "indexA"; + var result = doPutIndex(index); + Assertions.assertEquals(objMapper.readValue(makeMultiTypePutIndexRequest(index), LinkedHashMap.class), + result); + } + + @Test + public void testMultiTypeIndex() throws Exception { + final String index = "socialTypes"; + var result = doPutIndex(index); + var expected = objMapper.readTree(makeMultiTypePutIndexRequest(index)); + var mappings = ((ObjectNode) expected.path(JsonKeysForHttpMessage.PAYLOAD_KEY) + .path(JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY) + .path("mappings")); + mappings.remove("following"); + var newProperties = new HashMap(); + newProperties.put("type", Map.of("type", "keyword")); + var user = mappings.remove("user"); + user.path("properties").fields().forEachRemaining(e -> newProperties.put(e.getKey(), e.getValue())); + var tweet = mappings.remove("tweet"); + tweet.path("properties").fields().forEachRemaining(e -> newProperties.put(e.getKey(), e.getValue())); + var properties = mappings.put("properties", objMapper.valueToTree(newProperties)); + ((ObjectNode)expected).put(JsonKeysForHttpMessage.URI_KEY, "/communal"); + Assertions.assertEquals(expected, objMapper.readTree(objMapper.writeValueAsString(result))); } } From e6c02293e287971487b85ef29c6116c9688351ce Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Mon, 2 Dec 2024 21:59:53 -0500 Subject: [PATCH 12/26] Updated READMEs and finished implementing a basic version of bulk transformations. All unit tests pass. Signed-off-by: Greg Schohn --- .../flags/FeatureFlagsSerializer.java | 33 ------- .../README.md | 42 ++++++-- .../typeMappings/rewriteBulkRequest.j2 | 96 ++++++++++--------- ...ppingsSanitizationTransformerBulkTest.java | 57 +++++++---- .../README.md | 38 ++++++++ .../TypeMappingsSanitizationProviderTest.java | 2 +- 6 files changed, 167 insertions(+), 101 deletions(-) delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsSerializer.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/README.md diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsSerializer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsSerializer.java deleted file mode 100644 index 4e482b226..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsSerializer.java +++ /dev/null @@ -1,33 +0,0 @@ -//package org.opensearch.migrations.transform.flags; -// -//import java.io.IOException; -//import java.util.Map; -// -//import com.fasterxml.jackson.core.JsonGenerator; -//import com.fasterxml.jackson.databind.SerializerProvider; -//import com.fasterxml.jackson.databind.ser.std.StdSerializer; -// -//public class FeatureFlagsSerializer extends StdSerializer { -// -// public FeatureFlagsSerializer() { -// this(null); -// } -// -// public FeatureFlagsSerializer(Class t) { -// super(t); -// } -// -// @Override -// public void serialize(FeatureFlags value, JsonGenerator gen, SerializerProvider provider) throws IOException { -// gen.writeStartObject(); -// // Serialize the 'enabled' field -// gen.writeBooleanField("enabled", value.isEnabled()); -// -// // Serialize all map entries -// for (Map.Entry entry : value.entrySet()) { -// gen.writeObjectField(entry.getKey(), entry.getValue()); -// } -// -// gen.writeEndObject(); -// } -//} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md index abb81c5e2..2ff97492b 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md @@ -53,8 +53,8 @@ GET activity/post/_search ## Routing data to new indices -The structure of the documents will need to change. Some options are to use separate indices, drop some of the types -to make an index single-purpose, or to create an index that's the union of all the types' fields. +The structure of the documents and indices need to change. Some options are to use separate indices, drop some of +the types to make an index single-purpose, or to create an index that's the union of all the types' fields. With a simple mapping directive, we can define each of these three behaviors. The following yaml shows how to map documents into two different indices named users and posts: @@ -64,26 +64,54 @@ activity: post: new_posts ``` -To drop one, just leave it out: +To drop one type, just leave it out: ``` activity: user: only_users ``` -To merge them together, use the same value: +To merge types together, use the same value: ``` activity: user: any_activity post: any_activity ``` -Any indices that are NOT specified won't be modified - all additions, changes, and queries on those other indices not -specified at the root level will remain untouched. To remove ALL the activity for a given index, specify and empty -index at the top level +Any _indices_ that are NOT specified won't be modified - all additions, changes, and queries on those other indices not +specified at the root level will remain untouched by the static mapping rewriter. However, missing types from a +specified index _**will**_ be removed. To remove ALL the activity for a given index, specify an empty index with no +children types. ``` activity: {} ``` +In addition to static source/target mappings, users can specify source and type pairs as a regex and use any captured +groups in the target index name. Regex rules take precedent _after_ the static rules and are only applied when there +was no index match in the static mappings. + +Regex replacement is controlled via an ordered list of `[indexNamePattern, typeNamePattern, replacementString]`. +The transformer will use the replacement for the first matched item found. +If none are found, unlike missing indices for static mappings, the system presumes that the index and type are +**NOT** to be propagated to the target - any reference to those types and their corresponding data will be suppressed. +To preserve all items, a default rule will need to be included. + +The following sample shows how indices that start with 'time-' will be migrated and every other index and type not +already matched will be dropped. +``` +[ + ["time-(.*)", "(cpu)", "time-$1-$2"] +] +``` + +The following example preserves all other non-matched items, +merging all types into a single index with the same name as the source index. +``` +[ + ["time-(.*)", "(cpu)", "time-$1-$2"], + ["(.*)", ".*", "$1"] +] +``` + ## Final Results ``` diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 index c611a3178..8496ca7b8 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 @@ -1,70 +1,78 @@ {%- include "typeMappings/rewriteIndexForTarget.j2" -%} {%- import "typeMappings/rewriteIndexForTarget.j2" as transidx -%} -{%- macro run_create(command, target_index, doc) -%} -{%- endmacro -%} -{%- macro run_index(command, target_index, doc) -%} +{%- macro retarget_command_parameters(parameters, target_index) -%} + {%- set ns = namespace(new_params={}) -%} + {%- for key, value in parameters.items() -%} + {%- if key != '_type' and key != '_index' -%} + {%- set inner_json = value | tojson -%} + {%- set jsonblob = ("{\"" + key + "\":" + inner_json + "}") | fromjson -%} + {%- set ns.new_params = ns.new_params + jsonblob -%} + {%- endif -%} + {%- endfor -%} + {%- set index_json = target_index | tojson -%} + {%- set index_blob = ("{\"_index\":" + index_json + "}") | fromjson -%} + {{- (ns.new_params + index_blob) | tojson -}} {%- endmacro -%} -{%- macro run_delete(command, target_index) -%} +{%- macro get_create() -%}create{% endmacro %} +{%- macro get_index() -%}index{% endmacro %} +{%- macro get_update() -%}update{% endmacro %} + +{%- macro rewrite_command(command, parameters, target_index, doc) -%} {%- if target_index -%} - {%- set ns = namespace(delete_inner={}) -%} - {%- for key, value in command.items() -%} - {%- if key != '_type' and key != '_index' -%} - {%- set inner_json = value | tojson -%} - {%- set jsonblob = ("{\"" + key + "\":" + inner_json + "}") | fromjson -%} - {%- set ns.delete_inner = ns.delete_inner + jsonblob -%} - {%- endif -%} - {%- endfor -%} - {%- set index_json = target_index | tojson -%} - {%- set index_blob = ("{\"_index\":" + index_json + "}") | fromjson -%} - {%- set ns.delete_inner = ns.delete_inner + index_blob -%} - {%- set final_json = ("{\"delete\":" + (ns.delete_inner | tojson) + "}") | fromjson -%} - {{ final_json | tojson }} + { "{{ invoke_macro("get_"+command) }}": {{ retarget_command_parameters(parameters, target_index) }} }, + {{ doc | tojson }} {%- endif -%} {%- endmacro -%} -{%- macro run_update(command, target_index, doc) -%} +{%- macro run_delete(parameters, target_index) -%} + {%- if target_index -%} + { "delete": {{ retarget_command_parameters(parameters, target_index) }} } + {%- endif -%} {%- endmacro -%} + {%- macro rewrite_bulk_for_default_source_index(uri_match, input_map, source_index) -%} { "preserve": ["headers","method","URI","protocol"], "payload": { "inlinedJsonSequenceBodies": [ {%- set operation_types = ['delete', 'update', 'index', 'create'] -%} - {%- for item in input_map.request.payload.inlinedJsonSequenceBodies -%} - {%- set operation = namespace(type=None) -%} - {%- for type in operation_types -%} - {%- if item is mapping and type in item -%} - {%- set operation.type = type -%} - {%- endif -%} - {%- endfor -%} + {%- set operations = input_map.request.payload.inlinedJsonSequenceBodies -%} + {%- set loopcontrol = namespace(skipnext=false) -%} + {%- for item in operations -%} + {%- set operation = namespace(type=None, output=None, num_written=0) -%} + {%- if not loopcontrol.skipnext -%} + {%- for type in operation_types -%} + {%- if item is mapping and type in item -%} + {%- set operation.type = type -%} + {%- endif -%} + {%- endfor -%} + {%- if not operation -%} + {%- throw "No valid operation type was found for item {{ item }}" -%} + {% endif %} + {% else %} + {%- set loopcontrol.skipnext = false -%} + {%- endif -%} - {%- if operation.type is not none -%} - {%- set command = item[operation.type] -%} - {%- set target_index = transidx.convert_source_index_to_target(command['_index'], command['_type'], input_map.index_mappings, input_map.regex_index_mappings) -%} -{# command['_index'] {{ command['_index'] }}, command['_type'] = {{ command['_type'] }}, input_map.index_mappings = {{ input_map.index_mappings }}, input_map.regex_index_mappings = {{ input_map.regex_index_mappings }})#} + {%- if operation.type -%} + {%- set parameters = item[operation.type] -%} + {%- set target_index = transidx.convert_source_index_to_target(parameters['_index'], parameters['_type'], input_map.index_mappings, input_map.regex_index_mappings) -%} {%- if operation.type == 'delete' -%} - {{ run_delete(command, target_index) }} + {%- set operation.output = run_delete(parameters, target_index) -%} {%- else -%} {%- if loop.index < operations|length -%} - {%- set next_item = operations[loop.index] -%} - {%- if operation.type == 'create' -%} - {{ run_create(command, target_index, next_item) }} - {%- elif operation.type == 'update' -%} - {{ run_update(command, target_index, next_item) }} - {%- elif operation.type == 'index' -%} - {{ run_index(command, target_index, next_item) }} - {%- endif -%} - {%- set loop.index = loop.index + 1 -%} + {%- set operation.output = rewrite_command(operation.type, parameters, target_index, operations[loop.index]) -%} + {%- set loopcontrol.skipnext = true -%} {%- else -%} - Handle case where there's no next item but one was expected - {# {{ throw_error('Expected document after ' + operation.type + ' operation') }}#} + {%- throw "Handle case where there's no next item but one was expected for item {{ item }}" -%} {%- endif -%} {%- endif -%} - {%- else -%} - Handle case where no valid operation type was found - {# {{ throw_error('Invalid operation type in item: ' + item|string) }}#} + {% if (operation.output | string | trim | length) > 0 %} + {%- set loopcontrol.num_written = loopcontrol.num_written + 1 -%} + {{ "," if loopcontrol.num_written > 1 else "" }} + {{ operation.output }} + {% endif %} {%- endif -%} {%- endfor -%} ] diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java index bb7215461..c455601a0 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java @@ -46,14 +46,31 @@ public void testBulk() throws Exception { " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {},\n" + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + " \"" + JsonKeysForHttpMessage.INLINED_NDJSON_BODIES_DOCUMENT_KEY + "\": [\n" + -// "{ \"index\" : { \"_index\" : \"test\", \"_type\" : \"type1\", \"_id\" : \"1\" } },\n" + -// "{ \"field1\" : \"value1\" },\n" + - "{ \"delete\" : { \"_index\" : \"test\", \"_type\" : \"type1\", \"_id\" : \"2\" } },\n" + - "{ \"delete\" : { \"_index\" : \"time-January_1970\", \"_type\" : \"cpu\", \"_id\" : \"8\" } }\n" + -// "{ \"create\" : { \"_index\" : \"test\", \"_type\" : \"type1\", \"_id\" : \"3\" } },\n" + -// "{ \"field1\" : \"value3\" },\n" + -// "{ \"update\" : {\"_id\" : \"1\", \"_type\" : \"type1\", \"_index\" : \"test\"} },\n" + -// "{ \"doc\" : {\"field2\" : \"value2\"} }\n" + + "{ \"index\": { \"_index\": \"indexA\", \"_type\": \"type1\", \"_id\": \"1\" } },\n" + + "{ \"field1\": \"value1\" },\n" + + + "{ \"index\": { \"_index\": \"indexA\", \"_type\": \"typeDontMap\", \"_id\": \"1\" } },\n" + + "{ \"field1\": \"value9\" },\n" + + + "{ \"delete\": { \"_index\": \"test\", \"_type\": \"type1\", \"_id\": \"2\" } },\n" + + + "{ \"delete\": { \"_index\": \"time-January_1970\", \"_type\": \"cpu\", \"_id\": \"8\" } },\n" + + + "{ \"create\": { \"_index\": \"indexC\", \"_type\": \"type1\", \"_id\": \"3\" } },\n" + + "{ \"field1\": \"value3\" },\n" + + + "{ \"create\": { \"_index\": \"indexC\", \"_type\": \"type2\", \"_id\": \"14\" } },\n" + + "{ \"field14\": \"value14\" },\n" + + + "{ \"update\": {\"_id\": \"1\", \"_type\": \"type1\", \"_index\": \"indexB\"} },\n" + + "{ \"doc\": {\"field2\": \"value2\"} },\n" + + + "{ \"update\": {\"_id\": \"1\", \"_type\": \"type2\", \"_index\": \"indexB\"} },\n" + + "{ \"doc\": {\"field10\": \"value10\"} },\n" + + + "{ \"update\": {\"_id\": \"1\", \"_type\": \"type3\", \"_index\": \"indexB\"} },\n" + + "{ \"doc\": {\"field10\": \"value11\"} }\n" + + " ]\n" + " }\n" + "}"; @@ -66,13 +83,20 @@ public void testBulk() throws Exception { " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {},\n" + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + " \"" + JsonKeysForHttpMessage.INLINED_NDJSON_BODIES_DOCUMENT_KEY + "\": [\n" + -// "{ \"index\" : { \"_index\" : \"test\", \"_type\" : \"type1\", \"_id\" : \"1\" } },\n" + -// "{ \"field1\" : \"value1\" },\n" + - "{ \"delete\" : { \"_index\" : \"time-January_1970-cpu\", \"_id\" : \"8\" } }\n" + -// "{ \"create\" : { \"_index\" : \"test\", \"_type\" : \"type1\", \"_id\" : \"3\" } },\n" + -// "{ \"field1\" : \"value3\" },\n" + -// "{ \"update\" : {\"_id\" : \"1\", \"_type\" : \"type1\", \"_index\" : \"test\"} },\n" + -// "{ \"doc\" : {\"field2\" : \"value2\"} }\n" + + "{ \"index\": { \"_index\": \"indexA_1\", \"_id\": \"1\" } },\n" + + "{ \"field1\": \"value1\" },\n" + + + "{ \"delete\": { \"_index\": \"time-January_1970-cpu\", \"_id\": \"8\" } },\n" + + + "{ \"create\": { \"_index\": \"indexC\", \"_id\": \"14\" } },\n" + + "{ \"field14\": \"value14\" },\n" + + + "{ \"update\": {\"_id\": \"1\", \"_index\": \"indexB\"} },\n" + + "{ \"doc\": {\"field2\": \"value2\"} },\n" + + + "{ \"update\": {\"_id\": \"1\", \"_index\": \"indexB\"} },\n" + + "{ \"doc\": {\"field10\": \"value10\"} }\n" + + " ]\n" + " }\n" + "}"; @@ -86,7 +110,8 @@ public void testBulk() throws Exception { throw new RuntimeException(e); } }).log(); - Assertions.assertEquals(normalize(OBJECT_MAPPER.readValue(expectedString, LinkedHashMap.class)), normalize(resultObj)); + Assertions.assertEquals(normalize(OBJECT_MAPPER.readValue(expectedString, LinkedHashMap.class)), + normalize(resultObj)); } static String normalize(Object obj) throws Exception { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/README.md b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/README.md new file mode 100644 index 000000000..327343e76 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/README.md @@ -0,0 +1,38 @@ +# Configuration Routing + +See the [README for the Type Mappings Sanitization Transformer](../jsonTypeMappingsSanitizationTransformer/README.md) +for specifics of how rules are evaluated. + +This package loads a [Type Mappings Sanitization Transformer](../jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java) +for that appropriate application variant (currently only for the REPLAYER) along with the configuration passed into +the provider. This [Provider](./src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java) +pulls the values for keys `featureFlags`, `staticMappings`, and `regexMappings` from the incoming configuration map +object so that the Type Mappings Sanitization Transformer can adjust requests for specific type mappings into the +appropriate target index. + +The following example will load a Transformer to rewrite types as per the static mappings shown in the second key-value +(staticMappings), or if not present, will then default to the mappings in regexMappings. Note that regexMappings will +only be checked if there are no entries in staticMappings. +staticMappings index names (top-level key) and keys to their children maps will be evaluated literally, not as patterns. +Patterns are ONLY supported via regexMappings. + +``` +{ + "staticMappings": { + "indexA": { + "type2": "indexA_2", + "type1": "indexA_1" + }, + "indexB": { + "type2": "indexB", + "type1": "indexB" + }, + "indexC": { + "type2": "indexC" + } + }, + "regexMappings": [ + [ "(time*)", "(type*)", "$1_And_$2" ] + ] +} +``` \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java index fcc98c1f1..4050664c6 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java @@ -56,7 +56,7 @@ public void testSimpleTransform() throws JsonProcessingException { "type2", "indexB"), "indexC", Map.of( "type2", "indexC")), - "regexMappings", List.of(List.of("(time*)", "(type*)", "\\1_And_\\2"))); + "regexMappings", List.of(List.of("(time*)", "(type*)", "$1_And_$2"))); var provider = new TypeMappingSanitizationTransformerProvider(); var transformer = provider.createTransformer(config); var transformedDocument = From 071368a8201188815edbf084731bd5856f29ac6d Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Tue, 3 Dec 2024 00:10:07 -0500 Subject: [PATCH 13/26] Transformation cleanup in light of new type mappings transformation. Cleanup a number of linting issues, including removing the old openSearch23PlusTargetTransformer code. That was for example purposes, but the newer jinja versions are more complete and easier to express/understand. Removing the old transfomer required a couple other changes. 1) When the TypeMappingSanitizationTransformerProvider is invoked with an empty string, that will cause transformers to be created w/ null values for all of the parameters (which means that we'll default to stripping type mappings and sending all of the docs to the same index). 2) The new type mappings transformer doesn't throw an exception for the same types of errant input that the old opensearch23... implementation did. That caused a test to fall through the type mapping transformation with the same output as its input (missing a headers value), which in turn caused the host rewrite mapping to throw an exception. When such an occurrence happens later in the pipeline, a TransformationException will be thrown. However, in this test case, the exception was thrown in the preliminary handler which didn't translate exceptions during transformation into TransformationExceptions. As long as the exception isn't a PayloadNotLoadedException exception, the code now does that translation. Signed-off-by: Greg Schohn --- DocumentsFromSnapshotMigration/build.gradle | 2 +- RFS/build.gradle | 2 +- TrafficCapture/trafficReplayer/README.md | 4 +- TrafficCapture/trafficReplayer/build.gradle | 2 +- ...ttpRequestPreliminaryTransformHandler.java | 19 +++-- .../HttpJsonTransformingConsumerTest.java | 2 +- .../transform/JinjavaTransformer.java | 7 +- .../jinjava/DynamicMacroFunction.java | 9 ++- .../InlineTemplateResourceLocator.java | 26 ------ .../jinjava/JavaRegexCaptureFilter.java | 6 +- .../jinjava/JavaRegexReplaceFilter.java | 6 +- .../NameMappingClasspathResourceLocator.java | 3 +- .../transform/JinjavaTransformerTest.java | 4 +- .../migrations/transform/RouteTest.java | 2 - .../build.gradle | 2 +- .../JsonConditionalTransformerProvider.java | 3 - .../flags/FeatureFlagsDeserializer.java | 1 - .../transform/replay/JsonTransformerTest.java | 1 - .../replay/MultipleJMESPathScriptsTest.java | 7 -- .../replay/TransformationLoaderTest.java | 9 +-- .../TypeMappingsSanitizationTransformer.java | 9 ++- ...ppingsSanitizationTransformerBulkTest.java | 2 +- ...peMappingsSanitizationTransformerTest.java | 4 +- ...appingSanitizationTransformerProvider.java | 3 + .../build.gradle | 19 ----- ...Search23PlusTargetTransformerProvider.java | 8 -- .../transform/JsonTypeMappingTransformer.java | 81 ------------------- ...rations.transform.IJsonTransformerProvider | 1 - .../transform/TypeMappingsExcisionTest.java | 71 ---------------- .../src/test/resources/log4j2.properties | 18 ----- .../typeMappings/get_query_input.txt | 9 --- .../typeMappings/get_query_output.txt | 10 --- .../typeMappings/put_document_input.txt | 10 --- .../typeMappings/put_document_output.txt | 10 --- .../typeMappings/put_index_input.txt | 20 ----- .../typeMappings/put_index_output.txt | 18 ----- 36 files changed, 55 insertions(+), 355 deletions(-) delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/InlineTemplateResourceLocator.java delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/build.gradle delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonTransformerForOpenSearch23PlusTargetTransformerProvider.java delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonTypeMappingTransformer.java delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/java/org/opensearch/migrations/transform/TypeMappingsExcisionTest.java delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/log4j2.properties delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/get_query_input.txt delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/get_query_output.txt delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_document_input.txt delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_document_output.txt delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_index_input.txt delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_index_output.txt diff --git a/DocumentsFromSnapshotMigration/build.gradle b/DocumentsFromSnapshotMigration/build.gradle index f74fc5b62..c95c6362d 100644 --- a/DocumentsFromSnapshotMigration/build.gradle +++ b/DocumentsFromSnapshotMigration/build.gradle @@ -30,7 +30,7 @@ dependencies { implementation project(":RFS") implementation project(":transformation") implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerLoaders') - runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:openSearch23PlusTargetTransformerProvider') + runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformerProvider') implementation group: 'org.apache.logging.log4j', name: 'log4j-api' implementation group: 'org.apache.logging.log4j', name: 'log4j-core' diff --git a/RFS/build.gradle b/RFS/build.gradle index aa24dd409..57637bdad 100644 --- a/RFS/build.gradle +++ b/RFS/build.gradle @@ -62,7 +62,7 @@ dependencies { testImplementation group: 'org.mockito', name: 'mockito-junit-jupiter' testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerLoaders') - testRuntimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:openSearch23PlusTargetTransformerProvider') + testRuntimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformerProvider') testRuntimeOnly group: 'org.junit.jupiter', name: 'junit-jupiter-engine' diff --git a/TrafficCapture/trafficReplayer/README.md b/TrafficCapture/trafficReplayer/README.md index de789a3fd..0562844c1 100644 --- a/TrafficCapture/trafficReplayer/README.md +++ b/TrafficCapture/trafficReplayer/README.md @@ -145,7 +145,7 @@ transform to add GZIP encoding and another to apply a new header would be config ``` To run only one transformer without any configuration, the `--transformer-config` argument can simply -be set to the name of the transformer (e.g. 'JsonTransformerForOpenSearch23PlusTargetTransformerProvider', +be set to the name of the transformer (e.g. 'TypeMappingSanitizationTransformerProvider', without quotes or any json surrounding it). The user can also specify a file to read the transformations from using the `--transformer-config-file`. Users can @@ -153,7 +153,7 @@ also pass the script as an argument via `--transformer-config-base64`. Each of is mutually exclusive. Some simple transformations are included to change headers to add compression or to force an HTTP message payload to -be chunked. Another transformer, [JsonTypeMappingTransformer.java](../../transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonTypeMappingTransformer.java), +be chunked. Another transformer, [TypeMappingSanitizationTransformer.java](../../transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java), is a work-in-progress to excise type mapping references from URIs and message payloads since versions of OpenSource greater than 2.3 do not support them. diff --git a/TrafficCapture/trafficReplayer/build.gradle b/TrafficCapture/trafficReplayer/build.gradle index ac04a2582..cda888d16 100644 --- a/TrafficCapture/trafficReplayer/build.gradle +++ b/TrafficCapture/trafficReplayer/build.gradle @@ -59,7 +59,7 @@ dependencies { testImplementation testFixtures(project(path: ':coreUtilities')) testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJMESPathMessageTransformerProvider') testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJoltMessageTransformerProvider') - testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:openSearch23PlusTargetTransformerProvider') + testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformerProvider') testImplementation group: 'org.apache.httpcomponents.client5', name: 'httpclient5' testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-api' diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java index f467383c4..9c452ac52 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java @@ -67,13 +67,9 @@ public void channelRead(@NonNull ChannelHandlerContext ctx, @NonNull Object msg) IAuthTransformer authTransformer = requestPipelineOrchestrator.authTransfomerFactory.getAuthTransformer( httpJsonMessage ); + HttpJsonRequestWithFaultingPayload transformedMessage = null; try { - handlePayloadNeutralTransformationOrThrow( - ctx, - originalHttpJsonMessage, - transform(transformer, httpJsonMessage), - authTransformer - ); + transformedMessage = transform(transformer, httpJsonMessage); } catch (PayloadNotLoadedException pnle) { log.atDebug().setMessage("The transforms for this message require payload manipulation, " + "all content handlers are being loaded.").log(); @@ -84,6 +80,17 @@ public void channelRead(@NonNull ChannelHandlerContext ctx, @NonNull Object msg) getAuthTransformerAsStreamingTransformer(authTransformer) ); ctx.fireChannelRead(handleAuthHeaders(httpJsonMessage, authTransformer)); + } catch (Exception e) { + throw new TransformationException(e); + } + + if (transformedMessage != null) { + handlePayloadNeutralTransformationOrThrow( + ctx, + originalHttpJsonMessage, + transformedMessage, + authTransformer + ); } } else if (msg instanceof HttpContent) { ctx.fireChannelRead(msg); diff --git a/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/datahandlers/http/HttpJsonTransformingConsumerTest.java b/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/datahandlers/http/HttpJsonTransformingConsumerTest.java index 7e106b433..64d62631c 100644 --- a/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/datahandlers/http/HttpJsonTransformingConsumerTest.java +++ b/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/datahandlers/http/HttpJsonTransformingConsumerTest.java @@ -331,7 +331,7 @@ public void testMalformedPayload_andThrowingTransformation_IsPassedThrough() thr new TransformationLoader().getTransformerFactoryLoader( HOST_NAME, null, - "[{\"JsonTransformerForOpenSearch23PlusTargetTransformerProvider\":\"\"}]" + "[{\"TypeMappingSanitizationTransformerProvider\":\"\"}]" ), null, testPacketCapture, diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index abfcccf5a..af23be1cb 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -5,6 +5,7 @@ import java.util.Map; import java.util.Optional; import java.util.function.Function; +import java.util.function.UnaryOperator; import org.opensearch.migrations.transform.jinjava.DynamicMacroFunction; import org.opensearch.migrations.transform.jinjava.JavaRegexCaptureFilter; @@ -22,19 +23,19 @@ @Slf4j public class JinjavaTransformer implements IJsonTransformer { - protected final static ObjectMapper objectMapper = new ObjectMapper(); + protected static final ObjectMapper objectMapper = new ObjectMapper(); protected final Jinjava jinjava; protected final Function, Map> createContextWithSourceFunction; private final String templateStr; public JinjavaTransformer(String templateString, - Function, Map> contextProviderFromSource) { + UnaryOperator> contextProviderFromSource) { this(templateString, contextProviderFromSource, new NameMappingClasspathResourceLocator()); } public JinjavaTransformer(String templateString, - Function, Map> createContextWithSource, + UnaryOperator> createContextWithSource, ResourceLocator resourceLocator) { jinjava = new Jinjava(); diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java index 685713fca..e91e6d0b2 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/DynamicMacroFunction.java @@ -11,13 +11,18 @@ public class DynamicMacroFunction { + private DynamicMacroFunction() {} + /** * Called from templates through the registration in the JinjavaTransformer class */ public static Object invokeMacro(String macroName, Object... args) { JinjavaInterpreter interpreter = JinjavaInterpreter.getCurrent(); - MacroFunction macro = getMacroFromContext(interpreter.getContext(), macroName); + var macro = getMacroFromContext(interpreter.getContext(), macroName); + if (macro == null) { + throw new IllegalArgumentException("Could not find argument name " + macroName); + } Context macroContext = new Context(interpreter.getContext()); int argCount = Math.min(args.length, macro.getArguments().size()); @@ -39,7 +44,7 @@ public static Object invokeMacro(String macroName, Object... args) { } else if (defaults.containsKey(paramName)) { argsMap.put(paramName, defaults.get(paramName)); } else { - throw new RuntimeException("Missing argument for macro: " + paramName); + throw new IllegalArgumentException("Missing argument for macro: " + paramName); } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/InlineTemplateResourceLocator.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/InlineTemplateResourceLocator.java deleted file mode 100644 index d6629946e..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/InlineTemplateResourceLocator.java +++ /dev/null @@ -1,26 +0,0 @@ -package org.opensearch.migrations.transform.jinjava; - -import java.nio.charset.Charset; -import java.util.Map; - -import com.hubspot.jinjava.interpret.JinjavaInterpreter; -import com.hubspot.jinjava.loader.ResourceLocator; -import com.hubspot.jinjava.loader.ResourceNotFoundException; - -public class InlineTemplateResourceLocator implements ResourceLocator { - - private final Map templates; - - public InlineTemplateResourceLocator(Map templates) { - this.templates = templates; - } - - @Override - public String getString(String fullName, Charset encoding, JinjavaInterpreter interpreter) - throws ResourceNotFoundException { - if (templates.containsKey(fullName)) { - return templates.get(fullName); - } - throw new ResourceNotFoundException("Template not found: " + fullName); - } -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexCaptureFilter.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexCaptureFilter.java index 5fbd6610d..f48c9955d 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexCaptureFilter.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexCaptureFilter.java @@ -28,12 +28,12 @@ public String getName() { } @Override - public Object filter(Object var, JinjavaInterpreter interpreter, String... args) { - if (var == null || args.length < 1) { + public Object filter(Object inputObject, JinjavaInterpreter interpreter, String... args) { + if (inputObject == null || args.length < 1) { return null; } - String input = var.toString(); + String input = inputObject.toString(); String pattern = args[0]; try { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java index fe36364bf..537698de3 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java @@ -29,12 +29,12 @@ public String getName() { } @Override - public Object filter(Object var, JinjavaInterpreter interpreter, String... args) { - if (var == null || args.length < 2) { + public Object filter(Object inputObject, JinjavaInterpreter interpreter, String... args) { + if (inputObject == null || args.length < 2) { return null; } - String input = var.toString(); + String input = inputObject.toString(); String pattern = args[0]; String replacement = args[1]; diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java index d73bf07e2..24e6bb85f 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java @@ -31,7 +31,6 @@ private String getDefaultVersion(final String fullName) throws IOException { @Override public String getString(String fullName, Charset encoding, JinjavaInterpreter interpreter) throws IOException { - var rval = super.getString(getDefaultVersion("jinjava/" + fullName), encoding, interpreter); - return rval; + return super.getString(getDefaultVersion("jinjava/" + fullName), encoding, interpreter); } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java index f215c809b..85bfa2d53 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java @@ -10,7 +10,7 @@ @Slf4j class JinjavaTransformerTest { - private final static String template = "" + + private static final String TEMPLATE = "" + "{# First, parse the URI to check if it matches the pattern we want to transform #}\n" + "{% set uri_parts = request.uri.split('/') %}\n" + "{% set is_type_request = uri_parts | length == 2 %}\n" + @@ -62,7 +62,7 @@ static void initialize() { "type2", "indexB"), "indexC", Map.of( "type2", "indexC")); - indexTypeMappingRewriter = new JinjavaTransformer(template, + indexTypeMappingRewriter = new JinjavaTransformer(TEMPLATE, request -> Map.of( "index_mappings", indexMappings, "request", request)); diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java index b5964e548..e287bcbba 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/RouteTest.java @@ -14,8 +14,6 @@ public class RouteTest { private static final ObjectMapper objectMapper = new ObjectMapper(); - private final static String DEFAULT_RESPONSE = "{ \"default\": {}}"; - public Map doRouting(Map flags, Map inputDoc) { log.atInfo().setMessage("parsed flags: {}").addArgument(flags).log(); final var template = "" + diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle index 2da9c9c85..006dcdd34 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle @@ -32,7 +32,7 @@ dependencies { testImplementation testFixtures(project(path: ':testHelperFixtures')) testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJMESPathMessageTransformerProvider') testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJoltMessageTransformerProvider') - testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:openSearch23PlusTargetTransformerProvider') + testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformerProvider') testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJoltMessageTransformer') testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJMESPathMessageTransformer') diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/JsonConditionalTransformerProvider.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/JsonConditionalTransformerProvider.java index c410b9595..93d6c3d00 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/JsonConditionalTransformerProvider.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/JsonConditionalTransformerProvider.java @@ -9,9 +9,6 @@ @Slf4j public class JsonConditionalTransformerProvider implements IJsonTransformerProvider { - public JsonConditionalTransformerProvider() { - } - @Override @SneakyThrows public IJsonTransformer createTransformer(Object jsonConfig) { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsDeserializer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsDeserializer.java index 4c5514f8f..47220c1cb 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsDeserializer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlagsDeserializer.java @@ -5,7 +5,6 @@ import java.util.Map; import com.fasterxml.jackson.core.JsonParser; -import com.fasterxml.jackson.databind.*; import com.fasterxml.jackson.databind.DeserializationContext; import com.fasterxml.jackson.databind.JsonNode; import com.fasterxml.jackson.databind.deser.std.StdDeserializer; diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/JsonTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/JsonTransformerTest.java index 3434c31e8..5a894d4cb 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/JsonTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/JsonTransformerTest.java @@ -43,7 +43,6 @@ private Map parseSampleRequestFromResource(String path) { } private String emitJson(Object transformedDocument) throws JsonProcessingException { - ObjectMapper mapper = new ObjectMapper(); mapper.configure(com.fasterxml.jackson.core.JsonParser.Feature.ALLOW_COMMENTS, true); // optional return mapper.writeValueAsString(transformedDocument); } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/MultipleJMESPathScriptsTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/MultipleJMESPathScriptsTest.java index 088015583..fca6ecff8 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/MultipleJMESPathScriptsTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/MultipleJMESPathScriptsTest.java @@ -1,11 +1,9 @@ package org.opensearch.migrations.transform.replay; -import java.util.Map; import java.util.StringJoiner; import org.opensearch.migrations.transform.TransformationLoader; -import com.fasterxml.jackson.core.type.TypeReference; import com.fasterxml.jackson.databind.ObjectMapper; import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.Test; @@ -18,11 +16,6 @@ public class MultipleJMESPathScriptsTest { + "\\\"headers\\\": {\\\"host\\\": \\\"localhost\\\"},\\n \\\"payload\\\": payload\\n}"; private static final ObjectMapper mapper = new ObjectMapper(); - private static Map parseAsMap(String contents) throws Exception { - return mapper.readValue(contents.getBytes(), new TypeReference<>() { - }); - } - @Test public void testTwoScripts() throws Exception { var aggregateScriptJoiner = new StringJoiner(",\n", "[", "]"); diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/TransformationLoaderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/TransformationLoaderTest.java index 47e93b320..e0519de63 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/TransformationLoaderTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/test/java/org/opensearch/migrations/transform/replay/TransformationLoaderTest.java @@ -44,10 +44,11 @@ public void testThatSimpleNoopTransformerLoads() throws Exception { } @Test - public void testMisconfiguration() throws Exception { + public void testMisconfiguration() { + var transformLoader = new TransformationLoader(); Assertions.assertThrows( IllegalArgumentException.class, - () -> new TransformationLoader().getTransformerFactoryLoader("localhost", null, "Not right") + () -> transformLoader.getTransformerFactoryLoader("localhost", null, "Not right") ); } @@ -61,7 +62,7 @@ public void testThatNoConfigMeansNoThrow() throws Exception { Assertions.assertNotNull(transformer.transformJson(origDoc)); } - final String TEST_INPUT_REQUEST = "{\n" + static final String TEST_INPUT_REQUEST = "{\n" + " \"method\": \"PUT\",\n" + " \"URI\": \"/oldStyleIndex\",\n" + " \"headers\": {\n" @@ -75,9 +76,7 @@ public void testUserAgentAppends() throws Exception { var userAgentTransformer = new TransformationLoader().getTransformerFactoryLoader("localhost", "tester", null); var origDoc = parseAsMap(TEST_INPUT_REQUEST); - var origDocStr = mapper.writeValueAsString(origDoc); var pass1 = userAgentTransformer.transformJson(origDoc); - var pass1DocStr = mapper.writeValueAsString(origDoc); var pass2 = userAgentTransformer.transformJson(pass1); var finalUserAgentInHeaders = ((Map) pass2.get("headers")).get("user-agent"); Assertions.assertEquals("tester; tester", finalUserAgentInHeaders); diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java index 224a4f619..c6344b9c4 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java @@ -4,7 +4,8 @@ import java.nio.charset.StandardCharsets; import java.util.List; import java.util.Map; -import java.util.function.Function; +import java.util.Optional; +import java.util.function.UnaryOperator; import com.google.common.io.Resources; @@ -32,15 +33,15 @@ public TypeMappingsSanitizationTransformer(String variantName, makeSourceWrapperFunction(featureFlags, indexMappings, regexIndexMappings)); } - private static Function, Map> + private static UnaryOperator> makeSourceWrapperFunction(Map featureFlagsIncoming, Map> indexMappingsIncoming, List> regexIndexMappingsIncoming) { var featureFlags = featureFlagsIncoming != null ? featureFlagsIncoming : Map.of(); var indexMappings = indexMappingsIncoming != null ? indexMappingsIncoming : Map.of(); - var regexIndexMappings = regexIndexMappingsIncoming != null ? regexIndexMappingsIncoming : - (indexMappingsIncoming == null ? List.of(List.of("(.*)", "(.*)", "\\1_\\2")) : List.of()); + var regexIndexMappings = Optional.ofNullable(regexIndexMappingsIncoming) + .orElseGet(() -> (indexMappingsIncoming == null ? List.of(List.of("(.*)", "(.*)", "\\1_\\2")) : List.of())); return incomingJson -> Map.of("request", incomingJson, "index_mappings", indexMappings, diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java index c455601a0..dd057c6f6 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java @@ -18,7 +18,7 @@ @Slf4j public class TypeMappingsSanitizationTransformerBulkTest { - private final static ObjectMapper OBJECT_MAPPER = new ObjectMapper(); + private static final ObjectMapper OBJECT_MAPPER = new ObjectMapper(); private static TypeMappingsSanitizationTransformer indexTypeMappingRewriter; @BeforeAll static void initialize() throws IOException { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java index 216b69e94..d809eeaee 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java @@ -15,7 +15,7 @@ @Slf4j class TypeMappingsSanitizationTransformerTest { - private final static ObjectMapper objMapper = new ObjectMapper(); + private static final ObjectMapper objMapper = new ObjectMapper(); private static TypeMappingsSanitizationTransformer indexTypeMappingRewriter; @BeforeAll @@ -139,7 +139,7 @@ public void testMultiTypeIndex() throws Exception { user.path("properties").fields().forEachRemaining(e -> newProperties.put(e.getKey(), e.getValue())); var tweet = mappings.remove("tweet"); tweet.path("properties").fields().forEachRemaining(e -> newProperties.put(e.getKey(), e.getValue())); - var properties = mappings.put("properties", objMapper.valueToTree(newProperties)); + mappings.set("properties", objMapper.valueToTree(newProperties)); ((ObjectNode)expected).put(JsonKeysForHttpMessage.URI_KEY, "/communal"); Assertions.assertEquals(expected, objMapper.readTree(objMapper.writeValueAsString(result))); } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java index 89f99a02d..0b3405f89 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java @@ -18,6 +18,9 @@ public IJsonTransformer createTransformer(Object jsonConfig) { if (jsonConfig == null) { return new TypeMappingsSanitizationTransformer(TypeMappingsSanitizationTransformer.REPLAYER_VARIANT, null, null, null); + } else if (jsonConfig instanceof String && ((String) jsonConfig).isEmpty()) { + return new TypeMappingsSanitizationTransformer(TypeMappingsSanitizationTransformer.REPLAYER_VARIANT, + null, null, null); } else if (!(jsonConfig instanceof Map)) { throw new IllegalArgumentException(getConfigUsageStr()); } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/build.gradle deleted file mode 100644 index 4c9912f46..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/build.gradle +++ /dev/null @@ -1,19 +0,0 @@ -plugins { - id 'io.freefair.lombok' -} - -dependencies { - implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') - - testImplementation project(':TrafficCapture:trafficReplayer') - testImplementation testFixtures(project(path: ':testHelperFixtures')) - testImplementation testFixtures(project(path: ':TrafficCapture:trafficReplayer')) - - testImplementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' - testImplementation group: 'com.google.guava', name: 'guava' - testImplementation group: 'io.netty', name: 'netty-all' - testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-api' - testImplementation group: 'org.junit.jupiter', name:'junit-jupiter-params' - testImplementation group: 'org.slf4j', name: 'slf4j-api' - testRuntimeOnly group:'org.junit.jupiter', name:'junit-jupiter-engine' -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonTransformerForOpenSearch23PlusTargetTransformerProvider.java b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonTransformerForOpenSearch23PlusTargetTransformerProvider.java deleted file mode 100644 index 14f60b499..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonTransformerForOpenSearch23PlusTargetTransformerProvider.java +++ /dev/null @@ -1,8 +0,0 @@ -package org.opensearch.migrations.transform; - -public class JsonTransformerForOpenSearch23PlusTargetTransformerProvider implements IJsonTransformerProvider { - @Override - public IJsonTransformer createTransformer(Object jsonConfig) { - return new JsonTypeMappingTransformer(); - } -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonTypeMappingTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonTypeMappingTransformer.java deleted file mode 100644 index b141b5045..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonTypeMappingTransformer.java +++ /dev/null @@ -1,81 +0,0 @@ -package org.opensearch.migrations.transform; - -import java.util.Map; -import java.util.regex.Pattern; - -/** - * This is an experimental JsonTransformer that is meant to perform basic URI and payload transformations - * to excise index type mappings for relevant operations. - */ -public class JsonTypeMappingTransformer implements IJsonTransformer { - /** - * This is used to match a URI of the form /INDEX/TYPE/foo... so that it can be - * transformed into /INDEX/foo... - */ - static final Pattern TYPED_OPERATION_URI_PATTERN_WITH_SIDE_CAPTURES = Pattern.compile( - "^(\\/[^\\/]*)\\/[^\\/]*(\\/[^\\/]*)$" - ); - - /** - * This is used to match a URI of the form /foo... - */ - static final Pattern SINGLE_LEVEL_OPERATION_PATTERN_WITH_CAPTURE = Pattern.compile("^(\\/[^\\/]*)$"); - public static final String SEARCH_URI_COMPONENT = "/_search"; - public static final String DOC_URI_COMPONENT = "/_doc"; - public static final String MAPPINGS_KEYNAME = "mappings"; - - @Override - public Map transformJson(Map incomingJson) { - return transformHttpMessage(incomingJson); - } - - private Map transformHttpMessage(Map httpMsg) { - var incomingMethod = httpMsg.get(JsonKeysForHttpMessage.METHOD_KEY); - if ("GET".equals(incomingMethod)) { - processGet(httpMsg); - } else if ("PUT".equals(incomingMethod)) { - processPut(httpMsg); - } - return httpMsg; - } - - private void processGet(Map httpMsg) { - var incomingUri = (String) httpMsg.get(JsonKeysForHttpMessage.URI_KEY); - var matchedUri = TYPED_OPERATION_URI_PATTERN_WITH_SIDE_CAPTURES.matcher(incomingUri); - if (matchedUri.matches()) { - var operationStr = matchedUri.group(2); - if (operationStr.equals(SEARCH_URI_COMPONENT)) { - httpMsg.put(JsonKeysForHttpMessage.URI_KEY, matchedUri.group(1) + operationStr); - } - } - } - - private void processPut(Map httpMsg) { - final var uriStr = (String) httpMsg.get(JsonKeysForHttpMessage.URI_KEY); - var matchedTriple = TYPED_OPERATION_URI_PATTERN_WITH_SIDE_CAPTURES.matcher(uriStr); - if (matchedTriple.matches()) { - // TODO: Add support for multiple type mappings per index (something possible with - // versions before ES7) - httpMsg.put( - JsonKeysForHttpMessage.URI_KEY, - matchedTriple.group(1) + DOC_URI_COMPONENT + matchedTriple.group(2) - ); - return; - } - var matchedSingle = SINGLE_LEVEL_OPERATION_PATTERN_WITH_CAPTURE.matcher(uriStr); - if (matchedSingle.matches()) { - var topPayloadElement = (Map) ((Map) httpMsg.get( - JsonKeysForHttpMessage.PAYLOAD_KEY - )).get(JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY); - var mappingsValue = (Map) topPayloadElement.get(MAPPINGS_KEYNAME); - if (mappingsValue != null) { - exciseMappingsType(topPayloadElement, mappingsValue); - } - } - } - - private void exciseMappingsType(Map mappingsParent, Map mappingsValue) { - var firstMappingOp = mappingsValue.entrySet().stream().findFirst(); - firstMappingOp.ifPresent(firstMapping -> mappingsParent.put(MAPPINGS_KEYNAME, firstMapping.getValue())); - } -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider deleted file mode 100644 index 34d314de6..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/main/resources/META-INF/services/org.opensearch.migrations.transform.IJsonTransformerProvider +++ /dev/null @@ -1 +0,0 @@ -org.opensearch.migrations.transform.JsonTransformerForOpenSearch23PlusTargetTransformerProvider \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/java/org/opensearch/migrations/transform/TypeMappingsExcisionTest.java b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/java/org/opensearch/migrations/transform/TypeMappingsExcisionTest.java deleted file mode 100644 index d732b031f..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/java/org/opensearch/migrations/transform/TypeMappingsExcisionTest.java +++ /dev/null @@ -1,71 +0,0 @@ -package org.opensearch.migrations.transform; - -import java.io.InputStream; -import java.io.InputStreamReader; -import java.nio.ByteBuffer; -import java.nio.charset.StandardCharsets; -import java.util.LinkedHashMap; -import java.util.Map; - -import org.opensearch.migrations.replay.datahandlers.JsonAccumulator; - -import com.fasterxml.jackson.core.type.TypeReference; -import com.fasterxml.jackson.databind.ObjectMapper; -import com.google.common.io.CharStreams; -import org.junit.jupiter.api.Assertions; -import org.junit.jupiter.api.Test; - -public class TypeMappingsExcisionTest { - - static final TypeReference> TYPE_REFERENCE_FOR_MAP_TYPE = new TypeReference<>() { - }; - - static ObjectMapper objectMapper = new ObjectMapper(); - - static InputStream getInputStreamForTypeMappingResource(String resourceName) { - return TypeMappingsExcisionTest.class.getResourceAsStream("/sampleJsonDocuments/typeMappings/" + resourceName); - } - - @Test - public void removesTypeMappingsFrom_indexCreation() throws Exception { - var json = parseJsonFromResourceName("put_index_input.txt"); - transformAndVerifyResult(json, "put_index_output.txt"); - } - - @Test - public void removesTypeMappingsFrom_documentPut() throws Exception { - var json = parseJsonFromResourceName("put_document_input.txt"); - transformAndVerifyResult(json, "put_document_output.txt"); - } - - @Test - public void removesTypeMappingsFrom_queryGet() throws Exception { - var json = parseJsonFromResourceName("get_query_input.txt"); - transformAndVerifyResult(json, "get_query_output.txt"); - } - - private static Map parseJsonFromResourceName(String resourceName) throws Exception { - var jsonAccumulator = new JsonAccumulator(); - try ( - var resourceStream = getInputStreamForTypeMappingResource(resourceName); - var isr = new InputStreamReader(resourceStream, StandardCharsets.UTF_8) - ) { - var expectedBytes = CharStreams.toString(isr).getBytes(StandardCharsets.UTF_8); - return (Map) jsonAccumulator.consumeByteBufferForSingleObject(ByteBuffer.wrap(expectedBytes)); - } - } - - private static void transformAndVerifyResult(Map json, String expectedValueSource) - throws Exception { - var jsonTransformer = getJsonTransformer(); - json = jsonTransformer.transformJson(json); - var jsonAsStr = objectMapper.writeValueAsString(json); - Object expectedObject = parseJsonFromResourceName(expectedValueSource); - var expectedValue = objectMapper.writeValueAsString(expectedObject); - Assertions.assertEquals(expectedValue, jsonAsStr); - } - - static IJsonTransformer getJsonTransformer() { - return new JsonTypeMappingTransformer(); - } -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/log4j2.properties b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/log4j2.properties deleted file mode 100644 index 6adca47b5..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/log4j2.properties +++ /dev/null @@ -1,18 +0,0 @@ -status = WARN - -property.ownedPackagesLogLevel=${sys:migrationLogLevel:-INFO} - -appender.console.type = Console -appender.console.name = Console -appender.console.target = SYSTEM_OUT -appender.console.layout.type = PatternLayout -appender.console.layout.pattern = %d{yyyy-MM-dd HH:mm:ss,SSS}{UTC} %p %c{1.} [%t] %m%n - -rootLogger.level = info -rootLogger.appenderRef.console.ref = Console - -# Allow customization of owned package logs -logger.rfs.name = org.opensearch.migrations.bulkload -logger.rfs.level = ${ownedPackagesLogLevel} -logger.migration.name = org.opensearch.migrations -logger.migration.level = ${ownedPackagesLogLevel} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/get_query_input.txt b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/get_query_input.txt deleted file mode 100644 index 14318a64b..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/get_query_input.txt +++ /dev/null @@ -1,9 +0,0 @@ -{ - "method": "GET", - "URI": "/oldStyleIndex/oldType/_search", - "payload": { - "inlinedJsonBody": { - "query": { "match": { "field1": "VALUE_1" } } - } - } -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/get_query_output.txt b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/get_query_output.txt deleted file mode 100644 index 33ba1bc3a..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/get_query_output.txt +++ /dev/null @@ -1,10 +0,0 @@ -{ - "method": "GET", - "URI": "/oldStyleIndex/_search", - "payload": { - "inlinedJsonBody": { - "query": { "match": { "field1": "VALUE_1" } - } - } - } -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_document_input.txt b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_document_input.txt deleted file mode 100644 index 1e169fcfd..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_document_input.txt +++ /dev/null @@ -1,10 +0,0 @@ -{ - "method": "PUT", - "URI": "/oldStyleIndex/oldType/1", - "payload": { - "inlinedJsonBody": { - "field1": "VALUE1", - "field2": "VALUE2" - } - } -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_document_output.txt b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_document_output.txt deleted file mode 100644 index 24902fc0a..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_document_output.txt +++ /dev/null @@ -1,10 +0,0 @@ -{ - "method": "PUT", - "URI": "/oldStyleIndex/_doc/1", - "payload": { - "inlinedJsonBody": { - "field1": "VALUE1", - "field2": "VALUE2" - } - } -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_index_input.txt b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_index_input.txt deleted file mode 100644 index beed65ea3..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_index_input.txt +++ /dev/null @@ -1,20 +0,0 @@ -{ - "method": "PUT", - "URI": "/oldStyleIndex", - "payload": { - "inlinedJsonBody": { - "mappings": { - "oldType": { - "properties": { - "field1": { - "type": "text" - }, - "field2": { - "type": "keyword" - } - } - } - } - } - } -} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_index_output.txt b/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_index_output.txt deleted file mode 100644 index 3ae3b4b2f..000000000 --- a/transformation/transformationPlugins/jsonMessageTransformers/openSearch23PlusTargetTransformerProvider/src/test/resources/sampleJsonDocuments/typeMappings/put_index_output.txt +++ /dev/null @@ -1,18 +0,0 @@ -{ - "method": "PUT", - "URI": "/oldStyleIndex", - "payload": { - "inlinedJsonBody": { - "mappings": { - "properties": { - "field1": { - "type": "text" - }, - "field2": { - "type": "keyword" - } - } - } - } - } -} From 59fd4d9a07a151c7caac58cc0040183534bc47a7 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Tue, 3 Dec 2024 21:42:05 -0500 Subject: [PATCH 14/26] Simple bugfixes, especially around more carefully staying away from requests that don't need to be transformed for type mappings excision. Improved some tests as well. Signed-off-by: Greg Schohn --- .../src/main/docker/docker-compose.yml | 4 +- .../migrations/testutils/JsonNormalizer.java | 23 ++++++ .../transform/JinjavaTransformer.java | 2 +- .../jinjava/JavaRegexReplaceFilter.java | 2 +- .../TypeMappingsSanitizationTransformer.java | 2 +- .../jinjava/typeMappings/replayer.j2 | 4 +- ...ppingsSanitizationTransformerBulkTest.java | 14 +--- ...peMappingsSanitizationTransformerTest.java | 53 +++++++++++--- .../TypeMappingsSanitizationProviderTest.java | 71 ++++++++----------- 9 files changed, 106 insertions(+), 69 deletions(-) create mode 100644 testHelperFixtures/src/testFixtures/java/org/opensearch/migrations/testutils/JsonNormalizer.java diff --git a/TrafficCapture/dockerSolution/src/main/docker/docker-compose.yml b/TrafficCapture/dockerSolution/src/main/docker/docker-compose.yml index 3a3212b83..407fa7a9f 100644 --- a/TrafficCapture/dockerSolution/src/main/docker/docker-compose.yml +++ b/TrafficCapture/dockerSolution/src/main/docker/docker-compose.yml @@ -78,8 +78,8 @@ services: condition: service_started opensearchtarget: condition: service_started - command: /bin/sh -c "/runJavaWithClasspath.sh org.opensearch.migrations.replay.TrafficReplayer --speedup-factor 2 https://opensearchtarget:9200 --auth-header-value Basic\\ YWRtaW46bXlTdHJvbmdQYXNzd29yZDEyMyE= --insecure --kafka-traffic-brokers kafka:9092 --kafka-traffic-topic logging-traffic-topic --kafka-traffic-group-id logging-group-default --otelCollectorEndpoint http://otel-collector:4317" #--transformer-config-base64 W3sgIkpzb25Kb2x0VHJhbnNmb3JtZXJQcm92aWRlciI6ClsKICB7CiAgICAic2NyaXB0IjogewogICAgICAib3BlcmF0aW9uIjogInNoaWZ0IiwKICAgICAgInNwZWMiOiB7CiAgICAgICAgIm1ldGhvZCI6ICJtZXRob2QiLAogICAgICAgICJVUkkiOiAiVVJJIiwKICAgICAgICAiaGVhZGVycyI6ICJoZWFkZXJzIiwKICAgICAgICAicGF5bG9hZCI6IHsKICAgICAgICAgICJpbmxpbmVkSnNvbkJvZHkiOiB7CiAgICAgICAgICAgICJ0b3AiOiB7CiAgICAgICAgICAgICAgInRhZ1RvRXhjaXNlIjogewogICAgICAgICAgICAgICAgIioiOiAicGF5bG9hZC5pbmxpbmVkSnNvbkJvZHkudG9wLiYiIAogICAgICAgICAgICAgIH0sCiAgICAgICAgICAgICAgIioiOiAicGF5bG9hZC5pbmxpbmVkSnNvbkJvZHkudG9wLiYiCiAgICAgICAgICAgIH0sCiAgICAgICAgICAiKiI6ICJwYXlsb2FkLmlubGluZWRKc29uQm9keS4mIgogICAgICAgICAgfQogICAgICAgIH0KICAgICAgfQogICAgfQogIH0sIAogewogICAic2NyaXB0IjogewogICAgICJvcGVyYXRpb24iOiAibW9kaWZ5LW92ZXJ3cml0ZS1iZXRhIiwKICAgICAic3BlYyI6IHsKICAgICAgICJVUkkiOiAiPXNwbGl0KCcvZXh0cmFUaGluZ1RvUmVtb3ZlJyxAKDEsJikpIgogICAgIH0KICB9CiB9LAogewogICAic2NyaXB0IjogewogICAgICJvcGVyYXRpb24iOiAibW9kaWZ5LW92ZXJ3cml0ZS1iZXRhIiwKICAgICAic3BlYyI6IHsKICAgICAgICJVUkkiOiAiPWpvaW4oJycsQCgxLCYpKSIKICAgICB9CiAgfQogfQpdCn1dCg==" - +# command: /bin/sh -c "/runJavaWithClasspath.sh org.opensearch.migrations.replay.TrafficReplayer --speedup-factor 2 https://opensearchtarget:9200 --auth-header-value Basic\\ YWRtaW46bXlTdHJvbmdQYXNzd29yZDEyMyE= --insecure --kafka-traffic-brokers kafka:9092 --kafka-traffic-topic logging-traffic-topic --kafka-traffic-group-id logging-group-default --otelCollectorEndpoint http://otel-collector:4317 --transformer-config " + command: /bin/sh -c "/runJavaWithClasspath.sh org.opensearch.migrations.replay.TrafficReplayer --speedup-factor 2 https://opensearchtarget:9200 --auth-header-value Basic\\ YWRtaW46bXlTdHJvbmdQYXNzd29yZDEyMyE= --insecure --kafka-traffic-brokers kafka:9092 --kafka-traffic-topic logging-traffic-topic --kafka-traffic-group-id logging-group-default --otelCollectorEndpoint http://otel-collector:4317 --transformer-config '[{\"TypeMappingSanitizationTransformerProvider\":\"\"}]'" opensearchtarget: image: 'opensearchproject/opensearch:2.15.0' environment: diff --git a/testHelperFixtures/src/testFixtures/java/org/opensearch/migrations/testutils/JsonNormalizer.java b/testHelperFixtures/src/testFixtures/java/org/opensearch/migrations/testutils/JsonNormalizer.java new file mode 100644 index 000000000..b84219354 --- /dev/null +++ b/testHelperFixtures/src/testFixtures/java/org/opensearch/migrations/testutils/JsonNormalizer.java @@ -0,0 +1,23 @@ +package org.opensearch.migrations.testutils; + +import java.util.SortedMap; + +import com.fasterxml.jackson.databind.ObjectMapper; +import com.fasterxml.jackson.databind.SerializationFeature; +import lombok.SneakyThrows; + +public class JsonNormalizer { + private static final ObjectMapper OBJECT_MAPPER = new ObjectMapper() + .configure(SerializationFeature.ORDER_MAP_ENTRIES_BY_KEYS, true) + .configure(SerializationFeature.INDENT_OUTPUT, true); + + @SneakyThrows + public static String fromString(String input) { + return OBJECT_MAPPER.writeValueAsString(OBJECT_MAPPER.readValue(input, SortedMap.class)); + } + + @SneakyThrows + public static String fromObject(Object obj) { + return fromString(OBJECT_MAPPER.writeValueAsString(obj)); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index af23be1cb..2d24f6a74 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -83,7 +83,7 @@ private void findAndReplacePreserves(Map incomingRoot, Map) parsedRoot.get(JsonKeysForHttpMessage.PRESERVE_KEY); if (preserveKeys != null) { preserveKeys.forEach(preservedKey -> - parsedRoot.put(preservedKey, incomingRoot.get(preservedKey))); + Optional.ofNullable(incomingRoot.get(preservedKey)).ifPresent(v->parsedRoot.put(preservedKey, v))); parsedRoot.remove(JsonKeysForHttpMessage.PRESERVE_KEY); } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java index 537698de3..46d346946 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java @@ -41,7 +41,7 @@ public Object filter(Object inputObject, JinjavaInterpreter interpreter, String. try { Matcher matcher = getCompiledPattern(pattern).matcher(input); var rval = matcher.replaceAll(replacement); - log.atError().setMessage("replaced value {}").addArgument(rval).log(); + log.atError().setMessage("replaced value {} with {}").addArgument(input).addArgument(rval).log(); return rval; } catch (Exception e) { return null; diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java index c6344b9c4..bc98fda37 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java @@ -41,7 +41,7 @@ public TypeMappingsSanitizationTransformer(String variantName, var featureFlags = featureFlagsIncoming != null ? featureFlagsIncoming : Map.of(); var indexMappings = indexMappingsIncoming != null ? indexMappingsIncoming : Map.of(); var regexIndexMappings = Optional.ofNullable(regexIndexMappingsIncoming) - .orElseGet(() -> (indexMappingsIncoming == null ? List.of(List.of("(.*)", "(.*)", "\\1_\\2")) : List.of())); + .orElseGet(() -> (indexMappingsIncoming == null ? List.of(List.of("(.*)", ".*", "$1")) : List.of())); return incomingJson -> Map.of("request", incomingJson, "index_mappings", indexMappings, diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 index f6cbdcdd2..28c499b93 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 @@ -10,10 +10,10 @@ 'index_mappings': index_mappings, 'regex_index_mappings': regex_index_mappings} -%} -{{- rscope.route(source_and_mappings, request.method + " " + request.URI, flags, 'make_keep_json', +{{- rscope.route(source_and_mappings, request.method + " " + request.URI, flags, 'preserve.make_keep_json', [ ('(?:PUT|POST) /([^/]*)/([^/]*)/(.*)', 'rewrite_doc_request', 'rewrite_add_request_to_strip_types'), - ( 'GET /([^/]*)/([^/]*)/.*', 'rewrite_doc_request', 'rewrite_get_request_to_strip_types'), + ( 'GET /((?!\\.\\.$)[^-_+\\p{Lu}\\\\/*?\\\"<>|,# ][^\\p{Lu}\\\\/*?\\\"<>|,# ]*)/((?!\\.\\.$)[^-_+\\p{Lu}\\\\/*?\\\"<>|,# ][^\\p{Lu}\\\\/*?\\\"<>|,# ]*)/([^/]+)$', 'rewrite_doc_request', 'rewrite_get_request_to_strip_types'), ('(?:PUT|POST) /_bulk', 'rewrite_bulk', 'rewrite_bulk'), ('(?:PUT|POST) /([^/]*)', 'rewrite_create_index', 'rewrite_create_index') ]) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java index dd057c6f6..136eea570 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java @@ -5,16 +5,15 @@ import java.util.List; import java.util.Map; +import org.opensearch.migrations.testutils.JsonNormalizer; + import com.fasterxml.jackson.core.JsonProcessingException; import com.fasterxml.jackson.databind.ObjectMapper; -import com.fasterxml.jackson.databind.SerializationFeature; import lombok.extern.slf4j.Slf4j; import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.api.Test; -import static org.hamcrest.Matchers.*; - @Slf4j public class TypeMappingsSanitizationTransformerBulkTest { @@ -110,14 +109,7 @@ public void testBulk() throws Exception { throw new RuntimeException(e); } }).log(); - Assertions.assertEquals(normalize(OBJECT_MAPPER.readValue(expectedString, LinkedHashMap.class)), - normalize(resultObj)); + Assertions.assertEquals(JsonNormalizer.fromString(expectedString), JsonNormalizer.fromObject(resultObj)); } - static String normalize(Object obj) throws Exception { - return new ObjectMapper() - .configure(SerializationFeature.ORDER_MAP_ENTRIES_BY_KEYS, true) - .configure(SerializationFeature.INDENT_OUTPUT, true) - .writeValueAsString(obj); - } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java index d809eeaee..731d9058c 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java @@ -6,16 +6,21 @@ import java.util.List; import java.util.Map; +import org.opensearch.migrations.testutils.JsonNormalizer; + +import com.fasterxml.jackson.core.type.TypeReference; import com.fasterxml.jackson.databind.ObjectMapper; import com.fasterxml.jackson.databind.node.ObjectNode; import lombok.extern.slf4j.Slf4j; import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.api.Test; +import org.junit.jupiter.params.ParameterizedTest; +import org.junit.jupiter.params.provider.ValueSource; @Slf4j class TypeMappingsSanitizationTransformerTest { - private static final ObjectMapper objMapper = new ObjectMapper(); + private static final ObjectMapper OBJECT_MAPPER = new ObjectMapper(); private static TypeMappingsSanitizationTransformer indexTypeMappingRewriter; @BeforeAll @@ -49,8 +54,8 @@ public void testPutDoc() throws Exception { " }\n" + " }\n" + "}"; - var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, LinkedHashMap.class)); - var resultStr = objMapper.writeValueAsString(resultObj); + var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + var resultStr = OBJECT_MAPPER.writeValueAsString(resultObj); log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); } @@ -68,9 +73,21 @@ public void testPutDocRegex() throws Exception { " }\n" + " }\n" + "}"; - var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, LinkedHashMap.class)); - var resultStr = objMapper.writeValueAsString(resultObj); + var expectedString = "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\":\"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/time-1-2/_doc/doc2\",\n" + + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\":{" + + " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\":{" + + " \"name\":\"Some User\"," + + " \"user_name\":\"user\"," + + " \"email\":\"user@example.com\"" + + " }" + + " }" + + "}"; + var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + var resultStr = OBJECT_MAPPER.writeValueAsString(resultObj); log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); + Assertions.assertEquals(JsonNormalizer.fromString(expectedString), JsonNormalizer.fromObject(resultObj)); } private static String makeMultiTypePutIndexRequest(String indexName) { @@ -113,22 +130,22 @@ private static String makeMultiTypePutIndexRequest(String indexName) { Map doPutIndex(String indexName) throws Exception { var testString = makeMultiTypePutIndexRequest(indexName); - return indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, LinkedHashMap.class)); + return indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); } @Test public void testPutSingleTypeIndex() throws Exception { final String index = "indexA"; var result = doPutIndex(index); - Assertions.assertEquals(objMapper.readValue(makeMultiTypePutIndexRequest(index), LinkedHashMap.class), - result); + Assertions.assertEquals(JsonNormalizer.fromString(makeMultiTypePutIndexRequest(index)), + JsonNormalizer.fromObject(result)); } @Test public void testMultiTypeIndex() throws Exception { final String index = "socialTypes"; var result = doPutIndex(index); - var expected = objMapper.readTree(makeMultiTypePutIndexRequest(index)); + var expected = OBJECT_MAPPER.readTree(makeMultiTypePutIndexRequest(index)); var mappings = ((ObjectNode) expected.path(JsonKeysForHttpMessage.PAYLOAD_KEY) .path(JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY) .path("mappings")); @@ -139,8 +156,22 @@ public void testMultiTypeIndex() throws Exception { user.path("properties").fields().forEachRemaining(e -> newProperties.put(e.getKey(), e.getValue())); var tweet = mappings.remove("tweet"); tweet.path("properties").fields().forEachRemaining(e -> newProperties.put(e.getKey(), e.getValue())); - mappings.set("properties", objMapper.valueToTree(newProperties)); + mappings.set("properties", OBJECT_MAPPER.valueToTree(newProperties)); ((ObjectNode)expected).put(JsonKeysForHttpMessage.URI_KEY, "/communal"); - Assertions.assertEquals(expected, objMapper.readTree(objMapper.writeValueAsString(result))); + Assertions.assertEquals(JsonNormalizer.fromObject(expected), JsonNormalizer.fromObject(result)); + } + + @ParameterizedTest + @ValueSource(strings = {"status", "_cat/indices", "_cat/indices/nov-*"} ) + public void testDefaultActionPreservesRequest(String uri) throws Exception { + final String bespokeRequest = "" + + "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"GET\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/" + uri + "\"" + + "}"; + var transformedResult = indexTypeMappingRewriter.transformJson( + OBJECT_MAPPER.readValue(bespokeRequest, new TypeReference<>(){})); + Assertions.assertEquals(JsonNormalizer.fromString(bespokeRequest), + JsonNormalizer.fromObject(transformedResult)); } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java index 4050664c6..c0b66acb6 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java @@ -3,6 +3,7 @@ import java.util.List; import java.util.Map; +import org.opensearch.migrations.testutils.JsonNormalizer; import org.opensearch.migrations.testutils.WrapWithNettyLeakDetection; import org.opensearch.migrations.transform.TypeMappingSanitizationTransformerProvider; @@ -17,33 +18,8 @@ @WrapWithNettyLeakDetection(disableLeakChecks = true) public class TypeMappingsSanitizationProviderTest { - static final String TEST_INPUT_REQUEST = "{\n" - + " \"method\": \"PUT\",\n" - + " \"URI\": \"/indexA/type2/someuser\",\n" - + " \"headers\": {\n" - + " \"host\": \"127.0.0.1\"\n" - + " },\n" - + " \"payload\": {\n" - + " \"inlinedJsonBody\": {\n" - + " \"name\": \"Some User\",\n" - + " \"user_name\": \"user\",\n" - + " \"email\": \"user@example.com\"\n" - + " }\n" - + " }\n" - + "}\n"; - - ObjectMapper mapper = new ObjectMapper(); - static String normalize(ObjectMapper mapper, String input) throws JsonProcessingException { - return mapper.writeValueAsString(mapper.readTree(input)); - } - - static String emitJson(ObjectMapper mapper, Object transformedDocument) throws JsonProcessingException { - mapper.configure(com.fasterxml.jackson.core.JsonParser.Feature.ALLOW_COMMENTS, true); // optional - return mapper.writeValueAsString(transformedDocument); - } - @Test public void testSimpleTransform() throws JsonProcessingException { var config = Map.of("staticMappings", @@ -56,16 +32,22 @@ public void testSimpleTransform() throws JsonProcessingException { "type2", "indexB"), "indexC", Map.of( "type2", "indexC")), - "regexMappings", List.of(List.of("(time*)", "(type*)", "$1_And_$2"))); - var provider = new TypeMappingSanitizationTransformerProvider(); - var transformer = provider.createTransformer(config); - var transformedDocument = - transformer.transformJson(mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>() { - })); - var outputStr = emitJson(mapper, transformedDocument); - - log.atInfo().setMessage("output={}").addArgument(outputStr).log(); - final String TEST_OUTPUT_REQUEST = "{\n" + "regexMappings", List.of(List.of("(time.*)", "(type.*)", "$1_And_$2"))); + final String TEST_INPUT_REQUEST = "{\n" + + " \"method\": \"PUT\",\n" + + " \"URI\": \"/indexA/type2/someuser\",\n" + + " \"headers\": {\n" + + " \"host\": \"127.0.0.1\"\n" + + " },\n" + + " \"payload\": {\n" + + " \"inlinedJsonBody\": {\n" + + " \"name\": \"Some User\",\n" + + " \"user_name\": \"user\",\n" + + " \"email\": \"user@example.com\"\n" + + " }\n" + + " }\n" + + "}\n"; + final String EXPECTED = "{\n" + " \"method\": \"PUT\",\n" + " \"URI\": \"/indexA_2/_doc/someuser\",\n" + " \"headers\": {\n" @@ -80,15 +62,24 @@ public void testSimpleTransform() throws JsonProcessingException { + " }\n" + "}\n"; - var normalizedOutput = normalize(mapper, TEST_OUTPUT_REQUEST); - Assertions.assertEquals(normalizedOutput, normalize(mapper, outputStr)); + var provider = new TypeMappingSanitizationTransformerProvider(); + + { + var transformedDocument = provider.createTransformer(config) + .transformJson(mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>() {})); + Assertions.assertEquals(JsonNormalizer.fromString(EXPECTED), + JsonNormalizer.fromObject(transformedDocument)); + } { var resultFromNullConfig = provider.createTransformer(null) .transformJson(mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>() { })); - Assertions.assertEquals(normalizedOutput - .replace("/indexA_2/_doc/someuser", "/1_2/_doc/someuser"), - normalize(mapper, emitJson(mapper, resultFromNullConfig))); + Assertions.assertEquals( + JsonNormalizer.fromString( + EXPECTED.replace( + "/indexA_2/_doc/someuser", + "/indexA/_doc/someuser")), + JsonNormalizer.fromObject(resultFromNullConfig)); } } } From fb9c20c2c730b973ec14ae3579662650b6a43ea1 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Tue, 3 Dec 2024 22:54:32 -0500 Subject: [PATCH 15/26] Remove YAML support for feature flags - nobody is using it and no reason to force it - just the POJO structure matters anyway. Signed-off-by: Greg Schohn --- .../jsonMessageTransformerLoaders/build.gradle | 1 - .../migrations/transform/flags/FeatureFlags.java | 10 ---------- 2 files changed, 11 deletions(-) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle index 006dcdd34..d0ba8e706 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/build.gradle @@ -25,7 +25,6 @@ plugins { dependencies { implementation group: 'org.slf4j', name: 'slf4j-api' implementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' - implementation group: 'com.fasterxml.jackson.dataformat', name: 'jackson-dataformat-yaml' api project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlags.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlags.java index c3b14a3cd..d415c18f7 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlags.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/flags/FeatureFlags.java @@ -5,7 +5,6 @@ import com.fasterxml.jackson.databind.ObjectMapper; import com.fasterxml.jackson.databind.annotation.JsonDeserialize; -import com.fasterxml.jackson.dataformat.yaml.YAMLFactory; import lombok.Getter; import lombok.Setter; @@ -18,7 +17,6 @@ public class FeatureFlags extends HashMap { // Static ObjectMappers for JSON and YAML private static final ObjectMapper jsonMapper = new ObjectMapper(); - private static final ObjectMapper yamlMapper = new ObjectMapper(new YAMLFactory()); // Parsing methods @@ -26,18 +24,10 @@ public static FeatureFlags parseJson(String contents) throws IOException { return jsonMapper.readValue(contents, FeatureFlags.class); } - public static FeatureFlags parseYaml(String contents) throws IOException { - return yamlMapper.readValue(contents, FeatureFlags.class); - } - public String writeJson() throws IOException { return jsonMapper.writeValueAsString(this); } - public String writeYaml() throws IOException { - return yamlMapper.writeValueAsString(this); - } - @Override public String toString() { return "FeatureFlags{" + From f5c4fedce5b9ed1bda32dda1f4f70e4c0f0ed23d Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Wed, 4 Dec 2024 10:54:04 -0500 Subject: [PATCH 16/26] Change how the transformation netty pipeline discovers if the payload was accessed. When the PayloadAccessFaultingMap throws a PayloadNotLoadedException, set a flag to show that. The Preliminary Transformation handler now checks the flag to determine if the payload needs to be parsed instead of relying upon the type of the exception that was thrown. The exception might be wrapped or eaten any number of ways. Jinjava does a nice job of packing all of the exception into an aggregate exception w/ line numbers, etc. It doesn't make sense to throw that away just to get a signal across a number of different unknown boundaries. Doing the direct connection w/ the flag makes a lot more sense. Signed-off-by: Greg Schohn --- .../PayloadAccessFaultingMap.java | 22 +++++++++-- ...ttpRequestPreliminaryTransformHandler.java | 27 ++++++++------ .../replay/PayloadNotFoundTest.java | 37 +++++++++++++++++++ 3 files changed, 70 insertions(+), 16 deletions(-) create mode 100644 TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/PayloadNotFoundTest.java diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java index ff8c3f665..76a6b7783 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java @@ -32,6 +32,7 @@ public class PayloadAccessFaultingMap extends AbstractMap { @Getter @Setter private boolean disableThrowingPayloadNotLoaded; + private boolean payloadWasAccessed; public PayloadAccessFaultingMap(StrictCaseInsensitiveHttpHeadersMap headers) { underlyingMap = new TreeMap<>(); @@ -51,19 +52,19 @@ public Iterator> iterator() { return new Iterator<>() { @Override public boolean hasNext() { - throw PayloadNotLoadedException.getInstance(); + throw makeFault(); } @Override public Map.Entry next() { - throw PayloadNotLoadedException.getInstance(); + throw makeFault(); } }; } @Override public int size() { - throw PayloadNotLoadedException.getInstance(); + throw makeFault(); } }; } else { @@ -80,8 +81,21 @@ public Object put(String key, Object value) { public Object get(Object key) { var value = super.get(key); if (value == null && !disableThrowingPayloadNotLoaded) { - throw PayloadNotLoadedException.getInstance(); + throw makeFault(); } return value; } + + public boolean missingPaylaodWasAccessed() { + return payloadWasAccessed; + } + + public void resetMissingPaylaodWasAccessed() { + payloadWasAccessed = false; + } + + private PayloadNotLoadedException makeFault() throws PayloadNotLoadedException { + payloadWasAccessed = true; + return PayloadNotLoadedException.getInstance(); + } } diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java index 9c452ac52..a8ead48f7 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java @@ -7,7 +7,6 @@ import java.util.Optional; import org.opensearch.migrations.replay.datahandlers.PayloadAccessFaultingMap; -import org.opensearch.migrations.replay.datahandlers.PayloadNotLoadedException; import org.opensearch.migrations.replay.tracing.IReplayContexts; import org.opensearch.migrations.transform.IAuthTransformer; import org.opensearch.migrations.transform.IJsonTransformer; @@ -70,18 +69,22 @@ public void channelRead(@NonNull ChannelHandlerContext ctx, @NonNull Object msg) HttpJsonRequestWithFaultingPayload transformedMessage = null; try { transformedMessage = transform(transformer, httpJsonMessage); - } catch (PayloadNotLoadedException pnle) { - log.atDebug().setMessage("The transforms for this message require payload manipulation, " - + "all content handlers are being loaded.").log(); - // make a fresh message and its headers - requestPipelineOrchestrator.addJsonParsingHandlers( - ctx, - transformer, - getAuthTransformerAsStreamingTransformer(authTransformer) - ); - ctx.fireChannelRead(handleAuthHeaders(httpJsonMessage, authTransformer)); } catch (Exception e) { - throw new TransformationException(e); + var payload = (PayloadAccessFaultingMap) httpJsonMessage.payload(); + if (payload.missingPaylaodWasAccessed()) { + payload.resetMissingPaylaodWasAccessed(); + log.atDebug().setMessage("The transforms for this message require payload manipulation, " + + "all content handlers are being loaded.").log(); + // make a fresh message and its headers + requestPipelineOrchestrator.addJsonParsingHandlers( + ctx, + transformer, + getAuthTransformerAsStreamingTransformer(authTransformer) + ); + ctx.fireChannelRead(handleAuthHeaders(httpJsonMessage, authTransformer)); + } else{ + throw new TransformationException(e); + } } if (transformedMessage != null) { diff --git a/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/PayloadNotFoundTest.java b/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/PayloadNotFoundTest.java new file mode 100644 index 000000000..3d44f283c --- /dev/null +++ b/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/PayloadNotFoundTest.java @@ -0,0 +1,37 @@ +package org.opensearch.migrations.replay; + + +import org.opensearch.migrations.replay.datahandlers.PayloadAccessFaultingMap; +import org.opensearch.migrations.replay.datahandlers.http.HttpJsonRequestWithFaultingPayload; +import org.opensearch.migrations.replay.datahandlers.http.ListKeyAdaptingCaseInsensitiveHeadersMap; +import org.opensearch.migrations.replay.datahandlers.http.StrictCaseInsensitiveHttpHeadersMap; +import org.opensearch.migrations.transform.TransformationLoader; + +import com.fasterxml.jackson.core.JsonProcessingException; +import org.junit.jupiter.api.Assertions; +import org.junit.jupiter.api.Test; + +public class PayloadNotFoundTest { + @Test + public void testTransformsPropagateExceptionProperly() throws JsonProcessingException { + final HttpJsonRequestWithFaultingPayload FAULTING_MAP = new HttpJsonRequestWithFaultingPayload(); + FAULTING_MAP.setMethod("PUT"); + FAULTING_MAP.setPath("/_bulk"); + FAULTING_MAP.setHeaders(new ListKeyAdaptingCaseInsensitiveHeadersMap(new StrictCaseInsensitiveHttpHeadersMap())); + FAULTING_MAP.headers().put("Content-Type", "application/json"); + FAULTING_MAP.setPayloadFaultMap(new PayloadAccessFaultingMap(FAULTING_MAP.headers().asStrictMap())); + final String EXPECTED = "{\n" + + " \"method\": \"PUT\",\n" + + " \"URI\": \"/_bulk\",\n" + + " \"headers\": {\n" + + " \"Content-Type\": \"application/json\"\n" + + " }\n" + + "}\n"; + + var transformer = new TransformationLoader().getTransformerFactoryLoader("newhost", null, + "[{\"TypeMappingSanitizationTransformerProvider\":\"\"}]"); + var e = Assertions.assertThrows(Exception.class, + () -> transformer.transformJson(FAULTING_MAP)); + Assertions.assertTrue(((PayloadAccessFaultingMap)FAULTING_MAP.payload()).missingPaylaodWasAccessed()); + } +} From 5be3ddc30c9816d990d09bb70d6c790c8f56bb04 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Wed, 4 Dec 2024 10:56:11 -0500 Subject: [PATCH 17/26] Minor cleanup + the addition of a resource cache for jinjava java resource streams Signed-off-by: Greg Schohn --- .../NameMappingClasspathResourceLocator.java | 34 ++++++++++++++++++- .../build.gradle | 1 - .../TypeMappingsSanitizationProviderTest.java | 9 ++--- 3 files changed, 36 insertions(+), 8 deletions(-) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java index 24e6bb85f..071bab0bd 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java @@ -3,15 +3,43 @@ import java.io.IOException; import java.nio.charset.Charset; import java.nio.charset.StandardCharsets; +import java.util.concurrent.ExecutionException; import java.util.stream.Collectors; +import com.google.common.cache.CacheBuilder; +import com.google.common.cache.CacheLoader; +import com.google.common.cache.LoadingCache; import com.google.common.io.Resources; import com.hubspot.jinjava.interpret.JinjavaInterpreter; import com.hubspot.jinjava.loader.ClasspathResourceLocator; +import com.hubspot.jinjava.loader.ResourceNotFoundException; +import lombok.AllArgsConstructor; +import lombok.EqualsAndHashCode; +import lombok.Getter; import lombok.extern.slf4j.Slf4j; @Slf4j public class NameMappingClasspathResourceLocator extends ClasspathResourceLocator { + @AllArgsConstructor + @Getter + @EqualsAndHashCode + private static class ResourceCacheKey { + private String fullName; + private Charset encoding; + } + + private final LoadingCache resourceCache = CacheBuilder.newBuilder() + .build(new CacheLoader<>() { + @Override + public String load(ResourceCacheKey key) throws IOException { + try { + String versionedName = getDefaultVersion("jinjava/" + key.getFullName()); + return Resources.toString(Resources.getResource(versionedName), key.getEncoding()); + } catch (IllegalArgumentException e) { + throw new ResourceNotFoundException("Couldn't find resource: " + key.getFullName()); + } + } + }); private String getDefaultVersion(final String fullName) throws IOException { try { @@ -31,6 +59,10 @@ private String getDefaultVersion(final String fullName) throws IOException { @Override public String getString(String fullName, Charset encoding, JinjavaInterpreter interpreter) throws IOException { - return super.getString(getDefaultVersion("jinjava/" + fullName), encoding, interpreter); + try { + return resourceCache.get(new ResourceCacheKey(fullName, encoding)); + } catch (ExecutionException e) { + throw new IOException("Failed to get resource content from cache", e); + } } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle index 128adb34c..ff5c69557 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle @@ -14,7 +14,6 @@ dependencies { testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformer') testImplementation project(':coreUtilities') - testImplementation project(':TrafficCapture:trafficReplayer') testImplementation testFixtures(project(path: ':coreUtilities')) testImplementation testFixtures(project(path: ':testHelperFixtures')) testImplementation testFixtures(project(path: ':TrafficCapture:trafficReplayer')) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java index c0b66acb6..cde31e360 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java @@ -63,17 +63,14 @@ public void testSimpleTransform() throws JsonProcessingException { + "}\n"; var provider = new TypeMappingSanitizationTransformerProvider(); - + Map inputMap = mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>() {}); { - var transformedDocument = provider.createTransformer(config) - .transformJson(mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>() {})); + var transformedDocument = provider.createTransformer(config).transformJson(inputMap); Assertions.assertEquals(JsonNormalizer.fromString(EXPECTED), JsonNormalizer.fromObject(transformedDocument)); } { - var resultFromNullConfig = provider.createTransformer(null) - .transformJson(mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>() { - })); + var resultFromNullConfig = provider.createTransformer(null).transformJson(inputMap); Assertions.assertEquals( JsonNormalizer.fromString( EXPECTED.replace( From 73c8e13e29dca1304a6f4f1754ad5c91460d6ac5 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Sat, 7 Dec 2024 18:45:03 -0500 Subject: [PATCH 18/26] Lots of improvements for jinjava and type mappings transformations and other findings along the way * JsonAccumulator (replayer) no longer throws when numeric values are > 32 bit ranges - now we use longs and doubles to parse the string sequences into, so some tuple transformation exceptions cease. * regex replace filters now can be configured via the jinjava config to specify what format the replacement strings should be in. The format is controlled by a series of regex replacements on the replacement string itself - e.g. to convert \\# to $# so that python-style regexes can be used. Notice that this was done the way that it was so that it's a easier to override and let users tweak for their own specific needs. Things get really sticky on malformed input and I don't have an interest in fully supporting that we behave the same on malformed escape sequences. Letting users have the option to specify the exact escaping seems like it's a hedge. * template files (resources) are still loaded from the jarfile, but users can add more templates and override existing ones. New templates can be passed through the json config to the provider in a simple key->template dictionary. * VARIANTs of top-level templates are gone. Now there's a top-level transformByType.j2 that does some tests on the incoming document and routes switches for the replayer template or the document backfill one (implementation and tests are still pending). That simplifies contextual awareness where this transformer no longer needs to have it. To round that change out, replayer.j2 was renamed httpRequests.j2 since that's a more accurate name now. * log_value and log_value_and_return are bound for jinjava templates to log through Slf4j. * There's still more work to be done in rewriteCreateIndexRequest to work w/ various versions of ES so that we can figure out when type mappings should/shouldn't be present and do the right thing. Now that we have source properties, that's just a matter of pulling a field and writing some more template code. * Converted all of the test indices and types to NOT include upper-case characters to avoid confusion and exercising transforms in ways that they'll never need to be tested. Signed-off-by: Greg Schohn --- RFS/build.gradle | 2 + TrafficCapture/trafficReplayer/build.gradle | 1 + .../replay/datahandlers/JsonAccumulator.java | 4 +- .../PayloadAccessFaultingMap.java | 4 +- ...ttpRequestPreliminaryTransformHandler.java | 4 +- .../replay/PayloadNotFoundTest.java | 2 +- .../HttpJsonTransformingConsumerTest.java | 13 +-- .../transform/JinjavaTransformer.java | 39 +++++--- .../jinjava/JavaRegexReplaceFilter.java | 46 +++++++++- .../transform/jinjava/JinjavaConfig.java | 20 +++++ .../transform/jinjava/LogFunction.java | 28 ++++++ .../NameMappingClasspathResourceLocator.java | 14 ++- .../jinjava/RegexReplaceException.java | 31 +++++++ .../jinjava/common/featureEnabled.j2 | 7 +- .../main/resources/jinjava/common/route.j2 | 2 +- .../transform/JinjavaTransformerTest.java | 89 ++++++++++++++----- .../jinjava/JavaRegexReplaceFilterTest.java | 29 ++++++ .../build.gradle | 2 + .../JsonJinjavaTransformerProvider.java | 11 ++- .../transform/IJsonTransformerProvider.java | 1 + .../transform/TransformationLoader.java | 6 +- .../README.md | 6 +- .../build.gradle | 3 + .../TypeMappingsSanitizationTransformer.java | 51 ++++++----- .../typemappings/SourceProperties.java | 20 +++++ .../typeMappings/documentBackfillItems.j2 | 0 .../typeMappings/elasticVersionProperties.j2 | 0 .../{replayer.j2 => httpRequests.j2} | 7 +- .../jinjava/typeMappings/preserveAll.j2 | 2 +- .../typeMappings/rewriteBulkRequest.j2 | 15 +++- .../typeMappings/rewriteCreateIndexRequest.j2 | 26 +++--- .../jinjava/typeMappings/transformByType.j2 | 12 +++ ...ppingsSanitizationTransformerBulkTest.java | 54 ++++++----- ...peMappingsSanitizationTransformerTest.java | 78 +++++++++++++--- .../build.gradle | 3 + ...appingSanitizationTransformerProvider.java | 29 ++++-- .../TypeMappingsSanitizationProviderTest.java | 2 +- 37 files changed, 519 insertions(+), 144 deletions(-) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JinjavaConfig.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/LogFunction.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexReplaceException.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilterTest.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/typemappings/SourceProperties.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/documentBackfillItems.j2 create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/elasticVersionProperties.j2 rename transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/{replayer.j2 => httpRequests.j2} (79%) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/transformByType.j2 diff --git a/RFS/build.gradle b/RFS/build.gradle index 57637bdad..e40d7f6ae 100644 --- a/RFS/build.gradle +++ b/RFS/build.gradle @@ -21,7 +21,9 @@ dependencies { implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJMESPathMessageTransformerProvider') + runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJinjavaTransformerProvider') runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJoltMessageTransformerProvider') + runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformerProvider') implementation group: 'org.jcommander', name: 'jcommander' implementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' diff --git a/TrafficCapture/trafficReplayer/build.gradle b/TrafficCapture/trafficReplayer/build.gradle index cda888d16..0bf34d63c 100644 --- a/TrafficCapture/trafficReplayer/build.gradle +++ b/TrafficCapture/trafficReplayer/build.gradle @@ -22,6 +22,7 @@ dependencies { implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerLoaders') implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJMESPathMessageTransformerProvider') + runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJinjavaTransformerProvider') runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJoltMessageTransformerProvider') runtimeOnly project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformerProvider') diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/JsonAccumulator.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/JsonAccumulator.java index 3c57dbb6b..cb7e5025d 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/JsonAccumulator.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/JsonAccumulator.java @@ -116,10 +116,10 @@ public Object getNextTopLevelObject() throws IOException { pushCompletedValue(parser.getText()); break; case VALUE_NUMBER_INT: - pushCompletedValue(parser.getIntValue()); + pushCompletedValue(parser.getLongValue()); break; case VALUE_NUMBER_FLOAT: - pushCompletedValue(parser.getFloatValue()); + pushCompletedValue(parser.getDoubleValue()); break; case NOT_AVAILABLE: // pipeline stall - need more data diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java index 76a6b7783..75c85f19b 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java @@ -86,11 +86,11 @@ public Object get(Object key) { return value; } - public boolean missingPaylaodWasAccessed() { + public boolean missingPayloadWasAccessed() { return payloadWasAccessed; } - public void resetMissingPaylaodWasAccessed() { + public void resetMissingPayloadWasAccessed() { payloadWasAccessed = false; } diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java index a8ead48f7..f1b4b5b58 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java @@ -71,8 +71,8 @@ public void channelRead(@NonNull ChannelHandlerContext ctx, @NonNull Object msg) transformedMessage = transform(transformer, httpJsonMessage); } catch (Exception e) { var payload = (PayloadAccessFaultingMap) httpJsonMessage.payload(); - if (payload.missingPaylaodWasAccessed()) { - payload.resetMissingPaylaodWasAccessed(); + if (payload.missingPayloadWasAccessed()) { + payload.resetMissingPayloadWasAccessed(); log.atDebug().setMessage("The transforms for this message require payload manipulation, " + "all content handlers are being loaded.").log(); // make a fresh message and its headers diff --git a/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/PayloadNotFoundTest.java b/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/PayloadNotFoundTest.java index 3d44f283c..0308c9b8b 100644 --- a/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/PayloadNotFoundTest.java +++ b/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/PayloadNotFoundTest.java @@ -32,6 +32,6 @@ public void testTransformsPropagateExceptionProperly() throws JsonProcessingExce "[{\"TypeMappingSanitizationTransformerProvider\":\"\"}]"); var e = Assertions.assertThrows(Exception.class, () -> transformer.transformJson(FAULTING_MAP)); - Assertions.assertTrue(((PayloadAccessFaultingMap)FAULTING_MAP.payload()).missingPaylaodWasAccessed()); + Assertions.assertTrue(((PayloadAccessFaultingMap)FAULTING_MAP.payload()).missingPayloadWasAccessed()); } } diff --git a/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/datahandlers/http/HttpJsonTransformingConsumerTest.java b/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/datahandlers/http/HttpJsonTransformingConsumerTest.java index 745d869e3..7babdb434 100644 --- a/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/datahandlers/http/HttpJsonTransformingConsumerTest.java +++ b/TrafficCapture/trafficReplayer/src/test/java/org/opensearch/migrations/replay/datahandlers/http/HttpJsonTransformingConsumerTest.java @@ -25,6 +25,7 @@ import org.opensearch.migrations.transform.TransformationLoader; import org.opensearch.migrations.utils.TrackedFuture; +import com.fasterxml.jackson.databind.ObjectMapper; import io.netty.buffer.ByteBuf; import io.netty.buffer.Unpooled; import io.netty.util.ReferenceCountUtil; @@ -331,8 +332,11 @@ public void testMalformedPayload_andThrowingTransformation_IsPassedThrough() thr new TransformationLoader().getTransformerFactoryLoader( HOST_NAME, null, - "[{\"TypeMappingSanitizationTransformerProvider\":\"\"}]" - ), + new ObjectMapper().writeValueAsString(List.of( + Map.of("JsonJinjavaTransformerProvider", Map.of( + "template", "{%- throw \"intentional exception\" -%}" + )) + ))), null, testPacketCapture, rootContext.getTestConnectionRequestContext(0) @@ -362,10 +366,7 @@ public void testMalformedPayload_andThrowingTransformation_IsPassedThrough() thr ); var outputAndResult = finalizationFuture.get(); Assertions.assertInstanceOf(TransformationException.class, - TrackedFuture.unwindPossibleCompletionException(outputAndResult.transformationStatus.getException()), - "It's acceptable for now that the OpenSearch upgrade transformation can't handle non-json " + - "content. If that Transform wants to handle this on its own, we'll need to use another transform " + - "configuration so that it throws and we can do this test."); + TrackedFuture.unwindPossibleCompletionException(outputAndResult.transformationStatus.getException())); var combinedOutputBuf = outputAndResult.transformedOutput.getResponseAsByteBuf(); Assertions.assertTrue(combinedOutputBuf.readableBytes() == 0); combinedOutputBuf.release(); diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index 2d24f6a74..8a1acb398 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -10,6 +10,8 @@ import org.opensearch.migrations.transform.jinjava.DynamicMacroFunction; import org.opensearch.migrations.transform.jinjava.JavaRegexCaptureFilter; import org.opensearch.migrations.transform.jinjava.JavaRegexReplaceFilter; +import org.opensearch.migrations.transform.jinjava.JinjavaConfig; +import org.opensearch.migrations.transform.jinjava.LogFunction; import org.opensearch.migrations.transform.jinjava.NameMappingClasspathResourceLocator; import org.opensearch.migrations.transform.jinjava.ThrowTag; @@ -17,6 +19,7 @@ import com.hubspot.jinjava.Jinjava; import com.hubspot.jinjava.lib.fn.ELFunctionDefinition; import com.hubspot.jinjava.loader.ResourceLocator; +import lombok.NonNull; import lombok.SneakyThrows; import lombok.extern.slf4j.Slf4j; @@ -24,6 +27,7 @@ public class JinjavaTransformer implements IJsonTransformer { protected static final ObjectMapper objectMapper = new ObjectMapper(); + public static final String REGEX_REPLACEMENT_CONVERSION_PATTERNS = "regex_replacement_conversion_patterns"; protected final Jinjava jinjava; protected final Function, Map> createContextWithSourceFunction; @@ -31,12 +35,22 @@ public class JinjavaTransformer implements IJsonTransformer { public JinjavaTransformer(String templateString, UnaryOperator> contextProviderFromSource) { - this(templateString, contextProviderFromSource, new NameMappingClasspathResourceLocator()); + this(templateString, contextProviderFromSource, new JinjavaConfig()); + } + + public JinjavaTransformer(String templateString, + UnaryOperator> contextProviderFromSource, + @NonNull JinjavaConfig jinjavaConfig) { + this(templateString, + contextProviderFromSource, + new NameMappingClasspathResourceLocator(jinjavaConfig.getNamedScripts()), + jinjavaConfig.getRegexReplacementConversionPatterns()); } public JinjavaTransformer(String templateString, UnaryOperator> createContextWithSource, - ResourceLocator resourceLocator) + ResourceLocator resourceLocator, + List> regexReplacementConversionPatterns) { jinjava = new Jinjava(); this.createContextWithSourceFunction = createContextWithSource; @@ -44,15 +58,20 @@ public JinjavaTransformer(String templateString, jinjava.getGlobalContext().registerFilter(new JavaRegexCaptureFilter()); jinjava.getGlobalContext().registerFilter(new JavaRegexReplaceFilter()); - jinjava.getGlobalContext().registerFunction(new ELFunctionDefinition( - "", - "invoke_macro", - DynamicMacroFunction.class, - "invokeMacro", - String.class, - Object[].class - )); + jinjava.getGlobalContext().registerFunction( + new ELFunctionDefinition("", "invoke_macro", DynamicMacroFunction.class, "invokeMacro", + String.class, Object[].class)); + jinjava.getGlobalContext().registerFunction( + new ELFunctionDefinition("", "log_value_and_return", LogFunction.class, "logValueAndReturn", + String.class, Object.class, Object.class)); + jinjava.getGlobalContext().registerFunction( + new ELFunctionDefinition("", "log_value", LogFunction.class, "logValue", + String.class, Object.class)); + jinjava.getGlobalContext().registerTag(new ThrowTag()); + jinjava.getGlobalContext().put(REGEX_REPLACEMENT_CONVERSION_PATTERNS, + Optional.ofNullable(regexReplacementConversionPatterns) + .orElse(JavaRegexReplaceFilter.DEFAULT_REGEX_REPLACE_FILTER)); this.templateStr = templateString; } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java index 46d346946..b2175aa84 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java @@ -1,21 +1,34 @@ package org.opensearch.migrations.transform.jinjava; +import java.util.List; +import java.util.Map; +import java.util.Optional; import java.util.regex.Matcher; import java.util.regex.Pattern; +import org.opensearch.migrations.transform.JinjavaTransformer; + import com.google.common.base.Function; import com.google.common.cache.CacheBuilder; import com.google.common.cache.CacheLoader; import com.google.common.cache.LoadingCache; import com.hubspot.jinjava.interpret.JinjavaInterpreter; import com.hubspot.jinjava.lib.filter.Filter; +import lombok.AllArgsConstructor; +import lombok.EqualsAndHashCode; import lombok.SneakyThrows; import lombok.extern.slf4j.Slf4j; @Slf4j public class JavaRegexReplaceFilter implements Filter { - private static LoadingCache regexCache = + public static final List> JAVA_REGEX_REPLACE_FILTER = List.of(); + public static final List> PYTHONESQUE_REGEX_REPLACE_FILTER = List.of( + Map.entry("(\\$)", "\\\\\\$"), + Map.entry("((?:\\\\\\\\)*)(\\\\)(?=\\d)", "\\$")); + public static final List> DEFAULT_REGEX_REPLACE_FILTER = PYTHONESQUE_REGEX_REPLACE_FILTER; + + private static final LoadingCache regexCache = CacheBuilder.newBuilder().build(CacheLoader.from((Function)Pattern::compile)); @SneakyThrows @@ -23,6 +36,25 @@ private static Pattern getCompiledPattern(String pattern) { return regexCache.get(pattern); } + @AllArgsConstructor + @EqualsAndHashCode + private static class ReplacementAndTransform { + String replacement; + List> substitutions; + } + + private static final LoadingCache replacementCache = + CacheBuilder.newBuilder().build(CacheLoader.from(rat -> { + var r = rat.replacement; + if (rat.substitutions != null) { + for (var kvp : rat.substitutions) { + r = r.replaceAll(kvp.getKey(), kvp.getValue()); + } + } + return r; + })); + + @Override public String getName() { return "regex_replace"; @@ -38,13 +70,21 @@ public Object filter(Object inputObject, JinjavaInterpreter interpreter, String. String pattern = args[0]; String replacement = args[1]; + String rewritten = null; try { Matcher matcher = getCompiledPattern(pattern).matcher(input); - var rval = matcher.replaceAll(replacement); + rewritten = replacementCache.get( + new ReplacementAndTransform(replacement, + Optional.ofNullable(interpreter) + .flatMap(ji->Optional.ofNullable(ji.getContext())) + .flatMap(c-> Optional.ofNullable((List>) + c.get(JinjavaTransformer.REGEX_REPLACEMENT_CONVERSION_PATTERNS))) + .orElse(DEFAULT_REGEX_REPLACE_FILTER))); + var rval = matcher.replaceAll(rewritten); log.atError().setMessage("replaced value {} with {}").addArgument(input).addArgument(rval).log(); return rval; } catch (Exception e) { - return null; + throw new RegexReplaceException(e, input, pattern, replacement, rewritten); } } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JinjavaConfig.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JinjavaConfig.java new file mode 100644 index 000000000..e8ddf58f6 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JinjavaConfig.java @@ -0,0 +1,20 @@ +package org.opensearch.migrations.transform.jinjava; + +import java.util.List; +import java.util.Map; + +import com.fasterxml.jackson.annotation.JsonProperty; +import lombok.AllArgsConstructor; +import lombok.Data; +import lombok.NoArgsConstructor; + +@Data +@NoArgsConstructor +@AllArgsConstructor +public class JinjavaConfig { + @JsonProperty("regexReplacementConversionPatterns") + private List> regexReplacementConversionPatterns; + + @JsonProperty("regexReplacementConversionPatterns") + Map namedScripts; +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/LogFunction.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/LogFunction.java new file mode 100644 index 000000000..4f8ea6c5b --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/LogFunction.java @@ -0,0 +1,28 @@ +package org.opensearch.migrations.transform.jinjava; + +import lombok.extern.slf4j.Slf4j; +import org.slf4j.event.Level; + +@Slf4j +public class LogFunction { + + /** + * Called from templates through the registration in the JinjavaTransformer class + */ + public static Object logValueAndReturn(String levelStr, Object valueToLog, Object valueToReturn) { + Level level; + try { + level = Level.valueOf(levelStr); + } catch (IllegalArgumentException e) { + log.atError().setMessage("Could not parse the level as it was passed in, so using ERROR. Level={}") + .addArgument(levelStr).log(); + level = Level.ERROR; + } + log.atLevel(level).setMessage("{}").addArgument(valueToLog).log(); + return valueToReturn; + } + + public static void logValue(String level, Object valueToLog) { + logValueAndReturn(level, valueToLog, null); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java index 071bab0bd..137d4387d 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java @@ -3,6 +3,8 @@ import java.io.IOException; import java.nio.charset.Charset; import java.nio.charset.StandardCharsets; +import java.util.Map; +import java.util.Optional; import java.util.concurrent.ExecutionException; import java.util.stream.Collectors; @@ -20,6 +22,8 @@ @Slf4j public class NameMappingClasspathResourceLocator extends ClasspathResourceLocator { + final Map overrideResourceMap; + @AllArgsConstructor @Getter @EqualsAndHashCode @@ -41,7 +45,11 @@ public String load(ResourceCacheKey key) throws IOException { } }); - private String getDefaultVersion(final String fullName) throws IOException { + public NameMappingClasspathResourceLocator(Map overrideResourceMap) { + this.overrideResourceMap = Optional.ofNullable(overrideResourceMap).orElse(Map.of()); + } + + private static String getDefaultVersion(final String fullName) throws IOException { try { var versionFile = fullName + "/defaultVersion"; var versionLines = Resources.readLines(Resources.getResource(versionFile), StandardCharsets.UTF_8).stream() @@ -59,6 +67,10 @@ private String getDefaultVersion(final String fullName) throws IOException { @Override public String getString(String fullName, Charset encoding, JinjavaInterpreter interpreter) throws IOException { + var overrideResource = overrideResourceMap.get(fullName); + if (overrideResource != null) { + return overrideResource; + } try { return resourceCache.get(new ResourceCacheKey(fullName, encoding)); } catch (ExecutionException e) { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexReplaceException.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexReplaceException.java new file mode 100644 index 000000000..e0369cbce --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexReplaceException.java @@ -0,0 +1,31 @@ +package org.opensearch.migrations.transform.jinjava; + +import java.util.StringJoiner; + +import lombok.Getter; + +@Getter +public class RegexReplaceException extends RuntimeException { + final String input; + final String pattern; + final String replacement; + final String rewrittenReplacement; + + public RegexReplaceException(Throwable cause, String input, String pattern, String replacement, String rewrittenReplacement) { + super(cause); + this.input = input; + this.pattern = pattern; + this.replacement = replacement; + this.rewrittenReplacement = rewrittenReplacement; + } + + @Override + public String getMessage() { + return super.getMessage() + + new StringJoiner(", ", "{", "}") + .add("input='" + input + "'") + .add("pattern='" + pattern + "'") + .add("replacement='" + replacement + "'") + .add("rewrittenReplacement='" + rewrittenReplacement + "'"); + } +} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 index a7c2f6222..a674884c4 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 @@ -3,19 +3,14 @@ true {%- else -%} {%- set ns = namespace(value=features) -%} - {%- set debug = namespace(log=[]) -%} {%- for key in (path | split('.')) -%} - {%- set debug.log = debug.log + ["k:"+key] -%} - {%- set debug.log = debug.log + ["ismapping?:"+(ns.value is mapping)] -%} +{# {{- log_value('ERROR', "my logged key:"+key) -}}{{- log_value('INFO', "ismapping:") -}}#} {%- if ns.value is mapping and key in ns.value -%} {%- set ns.value = ns.value[key] -%} {%- else -%} {%- set ns.value = None -%} {%- endif -%} {%- endfor -%} - {%- set debug.log = debug.log + ["val=" + (ns.value)] -%} - {%- set debug.log = debug.log + ["is map?=" + (ns.value is map)] -%} - {%- set debug.log = debug.log + ["enabled val=" + (ns.value.enabled)] -%} {%- if ns.value is boolean and ns.value -%} true {%- elif ns.value is mapping and ns.value.get('enabled') is boolean -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 index 47543b7ca..f1d606d41 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/route.j2 @@ -1,5 +1,5 @@ {%- import "common/featureEnabled.j2" as fscope -%} -{%- import "common/featureEnabled.j2" as fscope -%} + {%- macro route(input, field_to_match, feature_flags, default_action, routes) -%} {%- set ns = namespace(result=none, matched=false) -%} {%- for pattern, action_fn, feature_name_param in routes if not ns.matched -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java index 85bfa2d53..c45733eaf 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/JinjavaTransformerTest.java @@ -1,16 +1,25 @@ package org.opensearch.migrations.transform; import java.util.Map; +import java.util.stream.Collectors; + +import org.opensearch.migrations.testutils.CloseableLogSetup; +import org.opensearch.migrations.testutils.JsonNormalizer; +import org.opensearch.migrations.transform.jinjava.JinjavaConfig; +import org.opensearch.migrations.transform.jinjava.LogFunction; import lombok.extern.slf4j.Slf4j; -import org.junit.jupiter.api.BeforeAll; +import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.Test; import org.testcontainers.shaded.com.fasterxml.jackson.databind.ObjectMapper; + @Slf4j class JinjavaTransformerTest { - private static final String TEMPLATE = "" + + private static final ObjectMapper OBJECT_MAPPER = new ObjectMapper(); + + private static final String INDEX_TYPE_MAPPING_SAMPLE_TEMPLATE = "" + "{# First, parse the URI to check if it matches the pattern we want to transform #}\n" + "{% set uri_parts = request.uri.split('/') %}\n" + "{% set is_type_request = uri_parts | length == 2 %}\n" + @@ -50,9 +59,18 @@ class JinjavaTransformerTest { " {{ request | tojson }}\n" + "{% endif %}"; - private static JinjavaTransformer indexTypeMappingRewriter; - @BeforeAll - static void initialize() { + @Test + public void testTypeMappingSample() throws Exception { + var testString = + "{\n" + + " \"verb\": \"PUT\",\n" + + " \"uri\": \"indexA/type2/someuser\",\n" + + " \"body\": {\n" + + " \"name\": \"Some User\",\n" + + " \"user_name\": \"user\",\n" + + " \"email\": \"user@example.com\"\n" + + " }\n" + + "}"; var indexMappings = Map.of( "indexA", Map.of( "type1", "indexA_1", @@ -62,27 +80,54 @@ static void initialize() { "type2", "indexB"), "indexC", Map.of( "type2", "indexC")); - indexTypeMappingRewriter = new JinjavaTransformer(TEMPLATE, + var indexTypeMappingRewriter = new JinjavaTransformer(INDEX_TYPE_MAPPING_SAMPLE_TEMPLATE, request -> Map.of( "index_mappings", indexMappings, - "request", request)); + "request", request), + new JinjavaConfig(null, + Map.of("hello", "{%- macro hello() -%} hi {%- endmacro -%}\n"))); + + var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, Map.class)); + Assertions.assertEquals(JsonNormalizer.fromString(testString.replace("indexA/type2/", "indexA_2/_doc/")), + JsonNormalizer.fromObject(resultObj)); } @Test - public void test() throws Exception { - var testString = - "{\n" + - " \"verb\": \"PUT\",\n" + - " \"uri\": \"indexA/type2/someuser\",\n" + - " \"body\": {\n" + - " \"name\": \"Some User\",\n" + - " \"user_name\": \"user\",\n" + - " \"email\": \"user@example.com\"\n" + - " }\n" + - "}"; - var objMapper = new ObjectMapper(); - var resultObj = indexTypeMappingRewriter.transformJson(objMapper.readValue(testString, Map.class)); - var resultStr = objMapper.writeValueAsString(resultObj); - log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); + public void testCustomScript() throws Exception { + var indexTypeMappingRewriter = new JinjavaTransformer("" + + "{%- include \"hello\" -%}" + + "{{invoke_macro('hello')}}", + request -> Map.of("request", request), + new JinjavaConfig(null, + Map.of("hello", "{%- macro hello() -%}{\"hi\": \"world\"}{%- endmacro -%}\n"))); + + var resultObj = indexTypeMappingRewriter.transformJson(Map.of()); + var resultStr = OBJECT_MAPPER.writeValueAsString(resultObj); + Assertions.assertEquals("{\"hi\":\"world\"}", resultStr); + } + + @Test + public void debugLoggingWorks() throws Exception { + try (var closeableLogSetup = new CloseableLogSetup(LogFunction.class.getName())) { + final String FIRST_LOG_VAL = "LOGGED_VALUE=16"; + final String SECOND_LOG_VAL = "next one"; + final String THIRD_LOG_VAL = "LAST"; + + var indexTypeMappingRewriter = new JinjavaTransformer("" + + "{{ log_value_and_return('ERROR', log_value_and_return('ERROR', '" + FIRST_LOG_VAL + "', '" + SECOND_LOG_VAL + "'), '') }}" + + "{{ log_value('ERROR', '" + THIRD_LOG_VAL + "') }} " + + "{}", + request -> Map.of("request", request), + new JinjavaConfig(null, + Map.of("hello", "{%- macro hello() -%}{\"hi\": \"world\"}{%- endmacro -%}\n"))); + + var resultObj = indexTypeMappingRewriter.transformJson(Map.of()); + var resultStr = OBJECT_MAPPER.writeValueAsString(resultObj); + Assertions.assertEquals("{}", resultStr); + + var logEvents = closeableLogSetup.getLogEvents(); + Assertions.assertEquals(String.join("\n", new String[]{FIRST_LOG_VAL, SECOND_LOG_VAL, THIRD_LOG_VAL}), + logEvents.stream().collect(Collectors.joining("\n"))); + } } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilterTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilterTest.java new file mode 100644 index 000000000..0b310bf8e --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/test/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilterTest.java @@ -0,0 +1,29 @@ +package org.opensearch.migrations.transform.jinjava; + +import org.junit.jupiter.api.Assertions; +import org.junit.jupiter.api.Test; + +class JavaRegexReplaceFilterTest { + JavaRegexReplaceFilter replaceFilter = new JavaRegexReplaceFilter(); + + String makeReplacementFromKnownMatch(String replacementPattern) { + final var source = "Known Pattern 1234, and a note."; + final var capturingPattern = "(([^ \\d]*) )*(\\d*)[^\\d]*(no.e)\\."; + return (String) replaceFilter.filter(source, null, capturingPattern, replacementPattern); + } + + @Test + public void test() { + Assertions.assertEquals("somethingNew", makeReplacementFromKnownMatch("somethingNew")); + Assertions.assertEquals("Pattern$amount", makeReplacementFromKnownMatch("\\2$amount")); + Assertions.assertEquals("Pattern$1", makeReplacementFromKnownMatch("\\2$1")); + + // other things to try +// Assertions.assertEquals("Pattern\\$$1", makeReplacementFromKnownMatch("\\2\\$$\\1")); +// Assertions.assertEquals("$1\\$amount", "\\1$amount", replacement); +// "\\\\1$50", // -> \\1\$50 +// "\\\\\\1$total$", // -> \\$1\$total\$ +// "cost$1$price$2" // -> cost$1\$price$2 + + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/build.gradle index 3e02184bb..4bd547e57 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/build.gradle @@ -13,6 +13,8 @@ dependencies { implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJinjavaTransformer') implementation group: 'org.apache.commons', name: 'commons-collections4', version: '4.4' + implementation group: 'com.fasterxml.jackson.core', name: 'jackson-core' + implementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' testImplementation project(':TrafficCapture:trafficReplayer') testImplementation testFixtures(project(path: ':testHelperFixtures')) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonJinjavaTransformerProvider.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonJinjavaTransformerProvider.java index b8cc45eca..c579e8efc 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonJinjavaTransformerProvider.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformerProvider/src/main/java/org/opensearch/migrations/transform/JsonJinjavaTransformerProvider.java @@ -2,7 +2,11 @@ import java.util.Collections; import java.util.Map; +import java.util.Optional; +import org.opensearch.migrations.transform.jinjava.JinjavaConfig; + +import com.fasterxml.jackson.databind.ObjectMapper; import org.apache.commons.collections4.map.CompositeMap; @@ -10,6 +14,9 @@ public class JsonJinjavaTransformerProvider implements IJsonTransformerProvider public static final String REQUEST_KEY = "request"; public static final String TEMPLATE_KEY = "template"; + public static final String JINJAVA_CONFIG_KEY = "jinjavaConfig"; + + public final static ObjectMapper mapper = new ObjectMapper(); @Override public IJsonTransformer createTransformer(Object jsonConfig) { @@ -30,7 +37,9 @@ public IJsonTransformer createTransformer(Object jsonConfig) { try { var templateString = (String) config.get(TEMPLATE_KEY); return new JinjavaTransformer(templateString, - source -> new CompositeMap<>(Map.of(REQUEST_KEY, source), immutableBaseConfig)); + source -> new CompositeMap<>(Map.of(REQUEST_KEY, source), immutableBaseConfig), + Optional.ofNullable(config.get(JINJAVA_CONFIG_KEY)).map(jinjavaConfig -> + mapper.convertValue(jinjavaConfig, JinjavaConfig.class)).orElse(new JinjavaConfig())); } catch (ClassCastException e) { throw new IllegalArgumentException(getConfigUsageStr(), e); } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/IJsonTransformerProvider.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/IJsonTransformerProvider.java index c406b15d9..402eea157 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/IJsonTransformerProvider.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerInterface/src/main/java/org/opensearch/migrations/transform/IJsonTransformerProvider.java @@ -7,6 +7,7 @@ public interface IJsonTransformerProvider { * Create a new transformer from the given configuration. This transformer * will be used repeatedly and concurrently from different threads to modify * messages. + * * @param jsonConfig is a List, Map, String, or null that should be used to configure the * IJsonTransformer that is being created * @return diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/TransformationLoader.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/TransformationLoader.java index 136815c7b..1f30ae7ad 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/TransformationLoader.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonMessageTransformerLoaders/src/main/java/org/opensearch/migrations/transform/TransformationLoader.java @@ -148,7 +148,11 @@ private static class HostTransformer implements IJsonTransformer { @Override public Map transformJson(Map incomingJson) { var headers = (Map) incomingJson.get(JsonKeysForHttpMessage.HEADERS_KEY); - headers.replace("host", newHostName); + if (headers != null) { + headers.replace("host", newHostName); + } else { + log.atDebug().setMessage("Host header is null in incoming message: {}").addArgument(incomingJson).log(); + } return incomingJson; } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md index 2ff97492b..9e88dda81 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md @@ -1,6 +1,8 @@ This transformer converts routes for various requests (see below) to indices that used [multi-type mappings](https://www.elastic.co/guide/en/elasticsearch/reference/5.6/mapping.html) (configured from ES 5.x -and earlier clusters) to work with newer versions of Elasticsearch and OpenSearch. +and earlier clusters) to work with newer versions of Elasticsearch and OpenSearch. +See "[Removal of Type Mappings](https://www.elastic.co/guide/en/elasticsearch/reference/7.10/removal-of-types.html)" +to understand how type mappings are treated differently through different versions of Elasticsearch. ## Usage Prior to Elasticsearch 6 @@ -79,7 +81,7 @@ activity: Any _indices_ that are NOT specified won't be modified - all additions, changes, and queries on those other indices not specified at the root level will remain untouched by the static mapping rewriter. However, missing types from a -specified index _**will**_ be removed. To remove ALL the activity for a given index, specify an empty index with no +specified index will be removed. To remove ALL the activity for a given index, specify an index with no children types. ``` activity: {} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle index f0912fded..fa989278e 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle @@ -7,6 +7,9 @@ dependencies { api project(':transformation:transformationPlugins:jsonMessageTransformers:jsonJinjavaTransformer') implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') + implementation group: 'com.fasterxml.jackson.core', name: 'jackson-annotations' + implementation group: 'com.fasterxml.jackson.core', name: 'jackson-core' + implementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' implementation group: 'com.google.guava', name: 'guava' testImplementation project(':TrafficCapture:trafficReplayer') diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java index bc98fda37..94225d5ac 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java @@ -7,49 +7,58 @@ import java.util.Optional; import java.util.function.UnaryOperator; +import org.opensearch.migrations.transform.jinjava.JinjavaConfig; +import org.opensearch.migrations.transform.typemappings.SourceProperties; + import com.google.common.io.Resources; public class TypeMappingsSanitizationTransformer extends JinjavaTransformer { - public static final String REPLAYER_VARIANT = "jinjava/typeMappings/replayer.j2"; + public static final String ENTRYPOINT_JINJA_TEMPLATE = "jinjava/typeMappings/transformByType.j2"; - public TypeMappingsSanitizationTransformer() + public TypeMappingsSanitizationTransformer( + Map> indexMappings, + List> regexIndexMappings) throws IOException { - this(REPLAYER_VARIANT, null, null, null); + this(indexMappings, regexIndexMappings, null, null, null); } - public TypeMappingsSanitizationTransformer(Map> indexMappings, - List> regexIndexMappings) - throws IOException { - this(REPLAYER_VARIANT, null, indexMappings, regexIndexMappings); - } - - public TypeMappingsSanitizationTransformer(String variantName, - Map featureFlags, - Map> indexMappings, - List> regexIndexMappings) throws IOException { + public TypeMappingsSanitizationTransformer( + Map> indexMappings, + List> regexIndexMappings, + SourceProperties sourceProperties, + Map featureFlags, + JinjavaConfig jinjavaSettings) + throws IOException + { super( - makeTemplate(variantName), - makeSourceWrapperFunction(featureFlags, indexMappings, regexIndexMappings)); + makeTemplate(), + makeSourceWrapperFunction(sourceProperties, featureFlags, indexMappings, regexIndexMappings), + Optional.ofNullable(jinjavaSettings).orElse(new JinjavaConfig())); } private static UnaryOperator> - makeSourceWrapperFunction(Map featureFlagsIncoming, + makeSourceWrapperFunction(SourceProperties sourceProperties, + Map featureFlagsIncoming, Map> indexMappingsIncoming, List> regexIndexMappingsIncoming) { var featureFlags = featureFlagsIncoming != null ? featureFlagsIncoming : Map.of(); var indexMappings = indexMappingsIncoming != null ? indexMappingsIncoming : Map.of(); + // By NOT including a backreference, we're a bit more efficient, but it also lets us be agnostic to what + // types of patterns are being used. + // This regex says, match the type part and reduce it to nothing, leave the index part untouched. var regexIndexMappings = Optional.ofNullable(regexIndexMappingsIncoming) - .orElseGet(() -> (indexMappingsIncoming == null ? List.of(List.of("(.*)", ".*", "$1")) : List.of())); + .orElseGet(() -> (indexMappingsIncoming == null ? List.of(List.of("", ".*", "")) : List.of())); - return incomingJson -> Map.of("request", incomingJson, + return incomingJson -> Map.of("source_document", incomingJson, "index_mappings", indexMappings, "regex_index_mappings", regexIndexMappings, - "featureFlags", featureFlags); + "featureFlags", featureFlags, + "source_properties", sourceProperties == null ? Map.of() : sourceProperties); } - private static String makeTemplate(String variantName) throws IOException { - return Resources.toString(Resources.getResource(variantName), StandardCharsets.UTF_8); + private static String makeTemplate() throws IOException { + return Resources.toString(Resources.getResource(ENTRYPOINT_JINJA_TEMPLATE), StandardCharsets.UTF_8); } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/typemappings/SourceProperties.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/typemappings/SourceProperties.java new file mode 100644 index 000000000..1f100ffa3 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/typemappings/SourceProperties.java @@ -0,0 +1,20 @@ +package org.opensearch.migrations.transform.typemappings; + +import lombok.AllArgsConstructor; +import lombok.Data; +import lombok.NoArgsConstructor; + +@Data +@NoArgsConstructor +@AllArgsConstructor +public class SourceProperties { + private Version version; + + @Data + @NoArgsConstructor + @AllArgsConstructor + public static class Version { + private int major; + private int minor; + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/documentBackfillItems.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/documentBackfillItems.j2 new file mode 100644 index 000000000..e69de29bb diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/elasticVersionProperties.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/elasticVersionProperties.j2 new file mode 100644 index 000000000..e69de29bb diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/httpRequests.j2 similarity index 79% rename from transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 rename to transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/httpRequests.j2 index 28c499b93..145bdcb38 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/replayer.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/httpRequests.j2 @@ -6,11 +6,12 @@ {%- set source_and_mappings = { - 'request': request, + 'request': source_document, 'index_mappings': index_mappings, - 'regex_index_mappings': regex_index_mappings} + 'regex_index_mappings': regex_index_mappings, + 'properties': source_properties} -%} -{{- rscope.route(source_and_mappings, request.method + " " + request.URI, flags, 'preserve.make_keep_json', +{{- rscope.route(source_and_mappings, source_document.method + " " + source_document.URI, flags, 'preserve.make_keep_json', [ ('(?:PUT|POST) /([^/]*)/([^/]*)/(.*)', 'rewrite_doc_request', 'rewrite_add_request_to_strip_types'), ( 'GET /((?!\\.\\.$)[^-_+\\p{Lu}\\\\/*?\\\"<>|,# ][^\\p{Lu}\\\\/*?\\\"<>|,# ]*)/((?!\\.\\.$)[^-_+\\p{Lu}\\\\/*?\\\"<>|,# ][^\\p{Lu}\\\\/*?\\\"<>|,# ]*)/([^/]+)$', 'rewrite_doc_request', 'rewrite_get_request_to_strip_types'), diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/preserveAll.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/preserveAll.j2 index 009f4b094..6de7ba27e 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/preserveAll.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/preserveAll.j2 @@ -1,3 +1,3 @@ -{%- macro make_keep_json(source_and_mappings) -%} +{%- macro make_keep_json() -%} { "preserve": "*" } {%- endmacro -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 index 8496ca7b8..1050cbd51 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 @@ -57,12 +57,21 @@ {%- if operation.type -%} {%- set parameters = item[operation.type] -%} - {%- set target_index = transidx.convert_source_index_to_target(parameters['_index'], parameters['_type'], input_map.index_mappings, input_map.regex_index_mappings) -%} + {%- set type_name = parameters['_type'] -%} + {%- set target_index = transidx.convert_source_index_to_target(parameters['_index'], type_name, input_map.index_mappings, input_map.regex_index_mappings) if type_name -%} {%- if operation.type == 'delete' -%} - {%- set operation.output = run_delete(parameters, target_index) -%} + {%- if type_name -%} + {%- set operation.output = run_delete(parameters, target_index) -%} + {%- else -%} + {%- set operation.output = (item | tojson) -%} + {%- endif -%} {%- else -%} {%- if loop.index < operations|length -%} - {%- set operation.output = rewrite_command(operation.type, parameters, target_index, operations[loop.index]) -%} + {%- if type_name -%} + {%- set operation.output = rewrite_command(operation.type, parameters, target_index, operations[loop.index]) -%} + {%- else -%} + {%- set operation.output = (item | tojson) ~ "," ~ (operations[loop.index] | tojson) -%} + {%- endif -%} {%- set loopcontrol.skipnext = true -%} {%- else -%} {%- throw "Handle case where there's no next item but one was expected for item {{ item }}" -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 index 498454e57..81eda2b89 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 @@ -44,15 +44,21 @@ } {%- endmacro -%} {%- macro rewrite_create_index(match, input_map) -%} - {%- set source_index_name = match.group1 -%} - {%- set target_indices = (input_map.index_mappings[source_index_name] | default({})).values() | unique() -%} - {%- set num_mappings = target_indices | length -%} - {%- if num_mappings == 0 -%} - {{- noop.make_request() -}} - {%- elif num_mappings == 1 -%} - {{- rewrite_create_index_as_unioned_excise(source_index_name, (target_indices | first), input_map) -}} - {%- elif num_mappings > 1 -%} - {# Need to extend the replayer to allow multiple requests since this needs to become multiple requests #} - {{- preserve.make_keep_json(input_mappings) -}} + {%- set orig_mappings = input_map.request.payload.inlinedJsonBody.mappings -%} + + {%- if orig_mappings -%} + {%- set source_index_name = match.group1 -%} + {%- set target_indices = (input_map.index_mappings[source_index_name] | default({})).values() | unique() -%} + {%- set num_mappings = target_indices | length -%} + {%- if num_mappings == 0 -%} + {{- noop.make_request() -}} + {%- elif num_mappings == 1 -%} + {{- rewrite_create_index_as_unioned_excise(source_index_name, (target_indices | first), input_map) -}} + {%- elif num_mappings > 1 -%} + {# Need to extend the replayer to allow multiple requests since this needs to become multiple requests #} + {{- preserve.make_keep_json() -}} + {%- endif -%} + {%- else -%} + {{- preserve.make_keep_json() -}} {%- endif -%} {%- endmacro -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/transformByType.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/transformByType.j2 new file mode 100644 index 000000000..df26b6b26 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/transformByType.j2 @@ -0,0 +1,12 @@ +{%- if not source_document -%} + {%- throw "No source_document was defined - nothing to transform!" -%} +{%- endif -%} + +{%- if ("method" in source_document and "URI" in source_document) -%} + {%- include "typeMappings/httpRequests.j2" -%} +{%- elif ("index" in source_document and "source" in source_document) -%} + {%- include "typeMappings/documentBackfillItems.j2" -%} +{%- else -%} + {%- import "typeMappings/preserveAll.j2" as preserve -%} + {{- preserve.make_keep_json() -}} +{%- endif -%} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java index 136eea570..4a863eb8a 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java @@ -22,16 +22,16 @@ public class TypeMappingsSanitizationTransformerBulkTest { @BeforeAll static void initialize() throws IOException { var indexMappings = Map.of( - "indexA", Map.of( - "type1", "indexA_1", - "type2", "indexA_2"), - "indexB", Map.of( - "type1", "indexB", - "type2", "indexB"), - "indexC", Map.of( - "type2", "indexC")); + "indexa", Map.of( + "type1", "indexa_1", + "type2", "indexa_2"), + "indexb", Map.of( + "type1", "indexb", + "type2", "indexb"), + "indexc", Map.of( + "type2", "indexc")); var regexIndexMappings = List.of( - List.of("time-(.*)", "(.*)", "time-$1-$2")); + List.of("time-(.*)", "(.*)", "time-\\1-\\2")); indexTypeMappingRewriter = new TypeMappingsSanitizationTransformer(indexMappings, regexIndexMappings); } @@ -45,30 +45,35 @@ public void testBulk() throws Exception { " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {},\n" + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + " \"" + JsonKeysForHttpMessage.INLINED_NDJSON_BODIES_DOCUMENT_KEY + "\": [\n" + - "{ \"index\": { \"_index\": \"indexA\", \"_type\": \"type1\", \"_id\": \"1\" } },\n" + + "{ \"index\": { \"_index\": \"indexa\", \"_type\": \"type1\", \"_id\": \"1\" } },\n" + "{ \"field1\": \"value1\" },\n" + - "{ \"index\": { \"_index\": \"indexA\", \"_type\": \"typeDontMap\", \"_id\": \"1\" } },\n" + + "{ \"index\": { \"_index\": \"indexa\", \"_type\": \"typeDontMap\", \"_id\": \"1\" } },\n" + "{ \"field1\": \"value9\" },\n" + "{ \"delete\": { \"_index\": \"test\", \"_type\": \"type1\", \"_id\": \"2\" } },\n" + "{ \"delete\": { \"_index\": \"time-January_1970\", \"_type\": \"cpu\", \"_id\": \"8\" } },\n" + - "{ \"create\": { \"_index\": \"indexC\", \"_type\": \"type1\", \"_id\": \"3\" } },\n" + + "{ \"create\": { \"_index\": \"indexc\", \"_type\": \"type1\", \"_id\": \"3\" } },\n" + "{ \"field1\": \"value3\" },\n" + - "{ \"create\": { \"_index\": \"indexC\", \"_type\": \"type2\", \"_id\": \"14\" } },\n" + + "{ \"create\": { \"_index\": \"indexc\", \"_type\": \"type2\", \"_id\": \"14\" } },\n" + "{ \"field14\": \"value14\" },\n" + - "{ \"update\": {\"_id\": \"1\", \"_type\": \"type1\", \"_index\": \"indexB\"} },\n" + + "{ \"update\": {\"_id\": \"1\", \"_type\": \"type1\", \"_index\": \"indexb\"} },\n" + "{ \"doc\": {\"field2\": \"value2\"} },\n" + - "{ \"update\": {\"_id\": \"1\", \"_type\": \"type2\", \"_index\": \"indexB\"} },\n" + + "{ \"update\": {\"_id\": \"1\", \"_type\": \"type2\", \"_index\": \"indexb\"} },\n" + "{ \"doc\": {\"field10\": \"value10\"} },\n" + - "{ \"update\": {\"_id\": \"1\", \"_type\": \"type3\", \"_index\": \"indexB\"} },\n" + - "{ \"doc\": {\"field10\": \"value11\"} }\n" + + "{ \"update\": {\"_id\": \"1\", \"_type\": \"type3\", \"_index\": \"indexb\"} },\n" + + "{ \"doc\": {\"field11\": \"value11\"} },\n" + + + "{ \"delete\": {\"_id\": \"12\", \"_index\": \"index_without_typemappings\"} },\n" + + + "{ \"update\": {\"_id\": \"13\", \"_index\": \"index_without_typemappings\"} },\n" + + "{ \"doc\": {\"field13\": \"value11\"} }\n" + " ]\n" + " }\n" + @@ -82,19 +87,24 @@ public void testBulk() throws Exception { " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {},\n" + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + " \"" + JsonKeysForHttpMessage.INLINED_NDJSON_BODIES_DOCUMENT_KEY + "\": [\n" + - "{ \"index\": { \"_index\": \"indexA_1\", \"_id\": \"1\" } },\n" + + "{ \"index\": { \"_index\": \"indexa_1\", \"_id\": \"1\" } },\n" + "{ \"field1\": \"value1\" },\n" + "{ \"delete\": { \"_index\": \"time-January_1970-cpu\", \"_id\": \"8\" } },\n" + - "{ \"create\": { \"_index\": \"indexC\", \"_id\": \"14\" } },\n" + + "{ \"create\": { \"_index\": \"indexc\", \"_id\": \"14\" } },\n" + "{ \"field14\": \"value14\" },\n" + - "{ \"update\": {\"_id\": \"1\", \"_index\": \"indexB\"} },\n" + + "{ \"update\": {\"_id\": \"1\", \"_index\": \"indexb\"} },\n" + "{ \"doc\": {\"field2\": \"value2\"} },\n" + - "{ \"update\": {\"_id\": \"1\", \"_index\": \"indexB\"} },\n" + - "{ \"doc\": {\"field10\": \"value10\"} }\n" + + "{ \"update\": {\"_id\": \"1\", \"_index\": \"indexb\"} },\n" + + "{ \"doc\": {\"field10\": \"value10\"} },\n" + + + "{ \"delete\": {\"_id\": \"12\", \"_index\": \"index_without_typemappings\"} },\n" + + + "{ \"update\": {\"_id\": \"13\", \"_index\": \"index_without_typemappings\"} },\n" + + "{ \"doc\": {\"field13\": \"value11\"} }\n" + " ]\n" + " }\n" + diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java index 731d9058c..d5081f3b0 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java @@ -26,12 +26,12 @@ class TypeMappingsSanitizationTransformerTest { @BeforeAll static void initialize() throws IOException { var indexMappings = Map.of( - "indexA", Map.of( - "type1", "indexA_1", - "type2", "indexA_2"), - "indexB", Map.of( - "type1", "indexB", - "type2", "indexB"), + "indexa", Map.of( + "type1", "indexa_1", + "type2", "indexa_2"), + "indexb", Map.of( + "type1", "indexb", + "type2", "indexb"), "socialTypes", Map.of( "tweet", "communal", "user", "communal")); @@ -40,12 +40,13 @@ static void initialize() throws IOException { indexTypeMappingRewriter = new TypeMappingsSanitizationTransformer(indexMappings, regexIndexMappings); } + @Test public void testPutDoc() throws Exception { var testString = "{\n" + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + - " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/indexA/type2/someuser\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/indexa/type2/someuser\",\n" + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\": {" + " \"name\": \"Some User\",\n" + @@ -55,8 +56,8 @@ public void testPutDoc() throws Exception { " }\n" + "}"; var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); - var resultStr = OBJECT_MAPPER.writeValueAsString(resultObj); - log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); + Assertions.assertEquals(JsonNormalizer.fromString(testString.replace("indexa/type2/", "indexa_2/_doc/")), + JsonNormalizer.fromObject(resultObj)); } @Test @@ -75,7 +76,7 @@ public void testPutDocRegex() throws Exception { "}"; var expectedString = "{\n" + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\":\"PUT\",\n" + - " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/time-1-2/_doc/doc2\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/time-nov11-cpu/_doc/doc2\",\n" + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\":{" + " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\":{" + " \"name\":\"Some User\"," + @@ -85,9 +86,9 @@ public void testPutDocRegex() throws Exception { " }" + "}"; var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); - var resultStr = OBJECT_MAPPER.writeValueAsString(resultObj); - log.atInfo().setMessage("resultStr = {}").setMessage(resultStr).log(); - Assertions.assertEquals(JsonNormalizer.fromString(expectedString), JsonNormalizer.fromObject(resultObj)); + log.atInfo().setMessage("resultStr = {}").setMessage(OBJECT_MAPPER.writeValueAsString(resultObj)).log(); + Assertions.assertEquals(JsonNormalizer.fromString(expectedString), + JsonNormalizer.fromObject(resultObj)); } private static String makeMultiTypePutIndexRequest(String indexName) { @@ -135,7 +136,7 @@ Map doPutIndex(String indexName) throws Exception { @Test public void testPutSingleTypeIndex() throws Exception { - final String index = "indexA"; + final String index = "indexa"; var result = doPutIndex(index); Assertions.assertEquals(JsonNormalizer.fromString(makeMultiTypePutIndexRequest(index)), JsonNormalizer.fromObject(result)); @@ -161,6 +162,55 @@ public void testMultiTypeIndex() throws Exception { Assertions.assertEquals(JsonNormalizer.fromObject(expected), JsonNormalizer.fromObject(result)); } + @Test + public void testCreateIndexWithoutTypeButWithMappings() throws Exception{ + var testString = "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/geonames\",\n" + + " \"" + JsonKeysForHttpMessage.PROTOCOL_KEY + "\": \"HTTP/1.1\"," + + " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {\n" + + " \"Host\": \"capture-proxy:9200\"\n" + + " }," + + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + + " \"settings\": {\n" + + " \"index\": {\n" + + " \"number_of_shards\": 3, \n" + + " \"number_of_replicas\": 2 \n" + + " }\n" + + " }," + + " \"mappings\": {" + + " \"properties\": {\n" + + " \"field1\": { \"type\": \"text\" }\n" + + " }" + + " }\n" + + " }\n" + + "}"; + var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + Assertions.assertEquals(JsonNormalizer.fromString(testString), JsonNormalizer.fromObject(resultObj)); + } + + @Test + public void testCreateIndexWithoutType() throws Exception{ + var testString = "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/geonames\",\n" + + " \"" + JsonKeysForHttpMessage.PROTOCOL_KEY + "\": \"HTTP/1.1\"," + + " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {\n" + + " \"Host\": \"capture-proxy:9200\"\n" + + " }," + + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + + " \"settings\": {\n" + + " \"index\": {\n" + + " \"number_of_shards\": 3, \n" + + " \"number_of_replicas\": 2 \n" + + " }\n" + + " }\n" + + " }\n" + + "}"; + var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + Assertions.assertEquals(JsonNormalizer.fromString(testString), JsonNormalizer.fromObject(resultObj)); + } + @ParameterizedTest @ValueSource(strings = {"status", "_cat/indices", "_cat/indices/nov-*"} ) public void testDefaultActionPreservesRequest(String uri) throws Exception { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle index ff5c69557..cfb8a9cad 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle @@ -12,6 +12,9 @@ dependencies { implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformer') + implementation group: 'com.fasterxml.jackson.core', name: 'jackson-core' + implementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' + testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformer') testImplementation project(':coreUtilities') testImplementation testFixtures(project(path: ':coreUtilities')) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java index 0b3405f89..338c1d639 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java @@ -2,7 +2,12 @@ import java.util.List; import java.util.Map; +import java.util.Optional; +import org.opensearch.migrations.transform.jinjava.JinjavaConfig; +import org.opensearch.migrations.transform.typemappings.SourceProperties; + +import com.fasterxml.jackson.databind.ObjectMapper; import lombok.SneakyThrows; public class TypeMappingSanitizationTransformerProvider implements IJsonTransformerProvider { @@ -11,25 +16,31 @@ public class TypeMappingSanitizationTransformerProvider implements IJsonTransfor public static final String STATIC_MAPPINGS = "staticMappings"; public static final String REGEX_MAPPINGS = "regexMappings"; + public static final String JINJAVA_CONFIG_KEY = "jinjavaConfig"; + public static final String SOURCE_PROPERTIES_KEY = "sourceProperties"; + + public final static ObjectMapper mapper = new ObjectMapper(); + @SneakyThrows @Override public IJsonTransformer createTransformer(Object jsonConfig) { try { - if (jsonConfig == null) { - return new TypeMappingsSanitizationTransformer(TypeMappingsSanitizationTransformer.REPLAYER_VARIANT, - null, null, null); - } else if (jsonConfig instanceof String && ((String) jsonConfig).isEmpty()) { - return new TypeMappingsSanitizationTransformer(TypeMappingsSanitizationTransformer.REPLAYER_VARIANT, - null, null, null); + if ((jsonConfig == null) || + (jsonConfig instanceof String && ((String) jsonConfig).isEmpty())) { + return new TypeMappingsSanitizationTransformer(null, null, null, null, null); } else if (!(jsonConfig instanceof Map)) { throw new IllegalArgumentException(getConfigUsageStr()); } var config = (Map) jsonConfig; - return new TypeMappingsSanitizationTransformer(TypeMappingsSanitizationTransformer.REPLAYER_VARIANT, - (Map) config.get(FEATURE_FLAGS), + return new TypeMappingsSanitizationTransformer( (Map>) config.get(STATIC_MAPPINGS), - (List>) config.get(REGEX_MAPPINGS)); + (List>) config.get(REGEX_MAPPINGS), + Optional.ofNullable(config.get(SOURCE_PROPERTIES_KEY)).map(jinjavaConfig -> + mapper.convertValue(jinjavaConfig, SourceProperties.class)).orElse(null), + (Map) config.get(FEATURE_FLAGS), + Optional.ofNullable(config.get(JINJAVA_CONFIG_KEY)).map(jinjavaConfig -> + mapper.convertValue(jinjavaConfig, JinjavaConfig.class)).orElse(null)); } catch (ClassCastException e) { throw new IllegalArgumentException(getConfigUsageStr(), e); } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java index cde31e360..7c642b4c4 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java @@ -32,7 +32,7 @@ public void testSimpleTransform() throws JsonProcessingException { "type2", "indexB"), "indexC", Map.of( "type2", "indexC")), - "regexMappings", List.of(List.of("(time.*)", "(type.*)", "$1_And_$2"))); + "regexMappings", List.of(List.of("(time.*)", "(type.*)", "\\1_And_\\2"))); final String TEST_INPUT_REQUEST = "{\n" + " \"method\": \"PUT\",\n" + " \"URI\": \"/indexA/type2/someuser\",\n" From 739d5d7ca0648e167e577791d8854c05e20b5fb6 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Sun, 8 Dec 2024 01:24:42 -0500 Subject: [PATCH 19/26] Implement a simple take on translating RFS bulk requests to use index-type rewrite rules from the type mappings sanitization transformer. Signed-off-by: Greg Schohn --- .../NameMappingClasspathResourceLocator.java | 2 +- .../jinjava/RegexReplaceException.java | 2 +- .../typeMappings/documentBackfillItems.j2 | 21 +++++++++ .../typeMappings/rewriteBulkRequest.j2 | 12 +++++- ...peMappingsSanitizationDocBackfillTest.java | 43 +++++++++++++++++++ ...ppingsSanitizationTransformerBulkTest.java | 2 +- 6 files changed, 78 insertions(+), 4 deletions(-) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationDocBackfillTest.java diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java index 137d4387d..e69fcc2ff 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/NameMappingClasspathResourceLocator.java @@ -74,7 +74,7 @@ public String getString(String fullName, Charset encoding, JinjavaInterpreter in try { return resourceCache.get(new ResourceCacheKey(fullName, encoding)); } catch (ExecutionException e) { - throw new IOException("Failed to get resource content from cache", e); + throw new IOException("Failed to get resource content named `" + fullName + "`from cache", e); } } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexReplaceException.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexReplaceException.java index e0369cbce..7931e820d 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexReplaceException.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/RegexReplaceException.java @@ -28,4 +28,4 @@ public String getMessage() { .add("replacement='" + replacement + "'") .add("rewrittenReplacement='" + rewrittenReplacement + "'"); } -} \ No newline at end of file +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/documentBackfillItems.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/documentBackfillItems.j2 index e69de29bb..2e5e85cda 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/documentBackfillItems.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/documentBackfillItems.j2 @@ -0,0 +1,21 @@ +{# see https://github.com/opensearch-project/opensearch-migrations/pull/1110 for the format of these messages #} +{%- include "typeMappings/rewriteBulkRequest.j2" -%} +{%- import "typeMappings/rewriteIndexForTarget.j2" as transidx -%} + +{%- set parameters = source_document.index -%} +{{ log_value('ERROR', parameters) }} +{{ log_value('WARN', source_document.source) }} + +{%- set type_name = parameters['_type'] -%} +{%- if type_name -%} + {%- set target_index = transidx.convert_source_index_to_target(parameters['_index'], type_name, input_map.index_mappings, input_map.regex_index_mappings) if type_name -%} + {%- if target_index -%} + { + {{ rewrite_index_parameters(parameters, target_index) }}, + "source": {{ source_document.source | tojson }} + } + {%- endif -%} +{%- else -%} + {%- import "typeMappings/preserveAll.j2" as preserve -%} + {{- preserve.make_keep_json() -}} +{%- endif -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 index 1050cbd51..08f05c639 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 @@ -19,9 +19,19 @@ {%- macro get_index() -%}index{% endmacro %} {%- macro get_update() -%}update{% endmacro %} +{%- macro rewrite_command_parameters(command, parameters, target_index) -%} + {%- if target_index -%} + "{{ invoke_macro("get_"+command) }}": {{ retarget_command_parameters(parameters, target_index) }} + {%- endif -%} +{%- endmacro -%} + +{%- macro rewrite_index_parameters(parameters, target_index) -%} + {{ rewrite_command_parameters('index', parameters, target_index) }} +{%- endmacro -%} + {%- macro rewrite_command(command, parameters, target_index, doc) -%} {%- if target_index -%} - { "{{ invoke_macro("get_"+command) }}": {{ retarget_command_parameters(parameters, target_index) }} }, + { {{ rewrite_command_parameters(command, parameters, target_index) }} }, {{ doc | tojson }} {%- endif -%} {%- endmacro -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationDocBackfillTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationDocBackfillTest.java new file mode 100644 index 000000000..be9d53909 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationDocBackfillTest.java @@ -0,0 +1,43 @@ +package org.opensearch.migrations.transform; + +import java.util.LinkedHashMap; +import java.util.List; + +import org.opensearch.migrations.testutils.JsonNormalizer; + +import lombok.Lombok; +import lombok.extern.slf4j.Slf4j; +import org.junit.jupiter.api.Assertions; +import org.junit.jupiter.api.Test; +import org.testcontainers.shaded.com.fasterxml.jackson.databind.ObjectMapper; + +@Slf4j +public class TypeMappingsSanitizationDocBackfillTest { + private static final ObjectMapper OBJECT_MAPPER = new ObjectMapper(); + + @Test + public void test() throws Exception { + var testString = "{\n" + + " \"index\": { \"_index\": \"performance\", \"_type\": \"network\", \"_id\": \"1\" },\n" + + " \"source\": { \"field1\": \"value1\" }\n" + + "}"; + + var expectedString = "{\n" + + " \"index\": { \"_index\": \"network\", \"_id\": \"1\" },\n" + + " \"source\": { \"field1\": \"value1\" }\n" + + "}"; + + + var regexIndexMappings = List.of(List.of(".*", "", "")); + var indexTypeMappingRewriter = new TypeMappingsSanitizationTransformer(null, regexIndexMappings); + var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + log.atInfo().setMessage("resultStr = {}").addArgument(() -> { + try { + return OBJECT_MAPPER.writeValueAsString(resultObj); + } catch (Exception e) { + throw Lombok.sneakyThrow(e); + } + }).log(); + Assertions.assertEquals(JsonNormalizer.fromString(expectedString), JsonNormalizer.fromObject(resultObj)); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java index 4a863eb8a..2b715504a 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerBulkTest.java @@ -36,7 +36,7 @@ static void initialize() throws IOException { } @Test - public void testBulk() throws Exception { + public void testBulkRequest() throws Exception { var testString = "{\n" + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + From 95b71f4fd23e485d6b8a809273ca37e19a57694f Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Mon, 9 Dec 2024 00:59:26 -0500 Subject: [PATCH 20/26] Checkpoint with further refactoring improvements, mostly around tests. I still need to do a sweep over the tests to make sure none of the tests are miswired Signed-off-by: Greg Schohn --- .../jsonJinjavaTransformer/build.gradle | 4 +- .../jinjava/common/featureEnabled.j2 | 1 - .../build.gradle | 4 + .../TypeMappingsSanitizationTransformer.java | 2 +- .../typemappings/SourceProperties.java | 17 +- .../typeMappings/documentBackfillItems.j2 | 2 - .../typeMappings/elasticVersionProperties.j2 | 0 .../typeMappings/rewriteCreateIndexRequest.j2 | 51 +++++- .../typeMappings/rewriteIndexForTarget.j2 | 8 +- ...ype.j2 => transformByTypeOfSourceInput.j2} | 0 ...peMappingsSanitizationCreateIndexTest.java | 166 ++++++++++++++++++ ...peMappingsSanitizationTransformerTest.java | 122 ------------- .../transform/TestRequestBuilder.java | 53 ++++++ .../build.gradle | 1 + .../TypeMappingsSanitizationProviderTest.java | 87 ++++++++- 15 files changed, 368 insertions(+), 150 deletions(-) delete mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/elasticVersionProperties.j2 rename transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/{transformByType.j2 => transformByTypeOfSourceInput.j2} (100%) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/testFixtures/java/org/opensearch/migrations/transform/TestRequestBuilder.java diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle index 8fdff96aa..5a83cfa2f 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/build.gradle @@ -1,12 +1,14 @@ plugins { + id 'org.opensearch.migrations.java-library-conventions' id 'io.freefair.lombok' } dependencies { implementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') + api group: 'com.hubspot.jinjava', name: 'jinjava', version: "2.7.3" + implementation group: 'com.google.guava', name: 'guava' - implementation group: 'com.hubspot.jinjava', name: 'jinjava', version: "2.7.3" testImplementation project(':TrafficCapture:trafficReplayer') testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerLoaders') diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 index a674884c4..16c7f8d0f 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/resources/jinjava/common/featureEnabled.j2 @@ -4,7 +4,6 @@ {%- else -%} {%- set ns = namespace(value=features) -%} {%- for key in (path | split('.')) -%} -{# {{- log_value('ERROR', "my logged key:"+key) -}}{{- log_value('INFO', "ismapping:") -}}#} {%- if ns.value is mapping and key in ns.value -%} {%- set ns.value = ns.value[key] -%} {%- else -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle index fa989278e..ccec1a158 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/build.gradle @@ -1,6 +1,7 @@ plugins { id 'io.freefair.lombok' id 'java-library' + id 'java-test-fixtures' } dependencies { @@ -12,6 +13,9 @@ dependencies { implementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' implementation group: 'com.google.guava', name: 'guava' + testFixturesImplementation project(':TrafficCapture:trafficReplayer') + testFixturesImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonMessageTransformerInterface') + testImplementation project(':TrafficCapture:trafficReplayer') testImplementation testFixtures(project(path: ':testHelperFixtures')) testImplementation testFixtures(project(path: ':TrafficCapture:trafficReplayer')) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java index 94225d5ac..226b858b9 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java @@ -14,7 +14,7 @@ public class TypeMappingsSanitizationTransformer extends JinjavaTransformer { - public static final String ENTRYPOINT_JINJA_TEMPLATE = "jinjava/typeMappings/transformByType.j2"; + public static final String ENTRYPOINT_JINJA_TEMPLATE = "jinjava/typeMappings/transformByTypeOfSourceInput.j2"; public TypeMappingsSanitizationTransformer( Map> indexMappings, diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/typemappings/SourceProperties.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/typemappings/SourceProperties.java index 1f100ffa3..28c21f9ca 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/typemappings/SourceProperties.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/typemappings/SourceProperties.java @@ -8,13 +8,14 @@ @NoArgsConstructor @AllArgsConstructor public class SourceProperties { - private Version version; + private String type; + private Version version; - @Data - @NoArgsConstructor - @AllArgsConstructor - public static class Version { - private int major; - private int minor; - } + @Data + @NoArgsConstructor + @AllArgsConstructor + public static class Version { + private int major; + private int minor; + } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/documentBackfillItems.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/documentBackfillItems.j2 index 2e5e85cda..eba19784d 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/documentBackfillItems.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/documentBackfillItems.j2 @@ -3,8 +3,6 @@ {%- import "typeMappings/rewriteIndexForTarget.j2" as transidx -%} {%- set parameters = source_document.index -%} -{{ log_value('ERROR', parameters) }} -{{ log_value('WARN', source_document.source) }} {%- set type_name = parameters['_type'] -%} {%- if type_name -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/elasticVersionProperties.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/elasticVersionProperties.j2 deleted file mode 100644 index e69de29bb..000000000 diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 index 81eda2b89..d1129872e 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 @@ -5,6 +5,7 @@ {%- set source_input_types = input_map.index_mappings[source_index_name] -%} {%- set source_type_name = source_input_types.keys() | first() -%} { + "preserve": ["protocol", "headers"], "method": "{{ input_map.request.method }}", "URI": "/{{ target_index_name }}", "payload": { @@ -43,20 +44,52 @@ } } {%- endmacro -%} + +{%- macro uses_type_names(input_map) -%} + {%- set uri_flag_match = input_map.request.URI | regex_capture("[?&]include_type_name=([^&#]*)") -%} + {%- if uri_flag_match -%} + {{- uri_flag_match.group1 | lower -}} + {%- else -%} + {%- set major_version = ((input_map.properties | default({})).version | default({})).major -%} + {%- if major_version >= 7-%} + false + {%- elif major_version <= 6 -%} + true + {%- else -%} + {%- throw "include_type_name was not set on the incoming URI." + + "The template needs to know what version the original request was targeted for " + + "in order to properly understand the semantics and what was intended. " + + "Without that, this transformation cannot map the request " + + "to an unambiguous request for the target" -%} + {%- endif -%} + {%- endif -%} +{%- endmacro -%} + {%- macro rewrite_create_index(match, input_map) -%} {%- set orig_mappings = input_map.request.payload.inlinedJsonBody.mappings -%} - {%- if orig_mappings -%} - {%- set source_index_name = match.group1 -%} - {%- set target_indices = (input_map.index_mappings[source_index_name] | default({})).values() | unique() -%} - {%- set num_mappings = target_indices | length -%} - {%- if num_mappings == 0 -%} + {%- if orig_mappings and uses_type_names(input_map).trim() == 'true' -%} + {%- set source_index_name = match.group1 | regex_replace("[?].*", "") -%} + + {%- set ns = namespace(accum_target_indices=[]) -%} + {%- for source_type, mapping in orig_mappings.items() -%} + {%- set target_index = convert_source_index_to_target(source_index_name, source_type, + input_map.index_mappings, + input_map.regex_index_mappings) | trim -%} + {%- if target_index -%} + {%- set ns.accum_target_indices = ns.accum_target_indices + [target_index] -%} + {%- endif -%} + {%- endfor -%} + + {%- set target_indices = ns.accum_target_indices | unique() -%} + {%- set num_target_mappings = target_indices | length -%} + {%- if num_target_mappings == 0 -%} {{- noop.make_request() -}} - {%- elif num_mappings == 1 -%} + {%- elif num_target_mappings == 1 -%} {{- rewrite_create_index_as_unioned_excise(source_index_name, (target_indices | first), input_map) -}} - {%- elif num_mappings > 1 -%} - {# Need to extend the replayer to allow multiple requests since this needs to become multiple requests #} - {{- preserve.make_keep_json() -}} + {%- else -%} + {%- throw "Cannot specify multiple indices to create with a single request and cannot yet " + + "represent multiple requests with the request format." -%} {%- endif -%} {%- else -%} {{- preserve.make_keep_json() -}} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 index 588d809ca..f0606d83f 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 @@ -16,9 +16,9 @@ {%- macro convert_source_index_to_target(source_index, source_type, index_mappings, regex_index_mappings) -%} {%- set ns = namespace(target_index=none) -%} - {%- set ns.target_index2 = (index_mappings[source_index] | default({}))[source_type] -%} - {%- if ns.target_index2 is none -%} - {%- set ns.target_index2 = convert_source_index_to_target_via_regex(source_index, source_type, regex_index_mappings) -%} + {%- set ns.target_index = (index_mappings[source_index] | default({}))[source_type] -%} + {%- if ns.target_index is none -%} + {%- set ns.target_index = convert_source_index_to_target_via_regex(source_index, source_type, regex_index_mappings) -%} {%- endif -%} - {{ ns.target_index2 }} + {{- ns.target_index -}} {%- endmacro -%} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/transformByType.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/transformByTypeOfSourceInput.j2 similarity index 100% rename from transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/transformByType.j2 rename to transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/transformByTypeOfSourceInput.j2 diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java new file mode 100644 index 000000000..cfd6acf22 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java @@ -0,0 +1,166 @@ +package org.opensearch.migrations.transform; + +import java.util.HashMap; +import java.util.LinkedHashMap; +import java.util.List; +import java.util.Map; + +import org.opensearch.migrations.testutils.JsonNormalizer; + +import com.fasterxml.jackson.databind.ObjectMapper; +import com.fasterxml.jackson.databind.node.ObjectNode; +import org.junit.jupiter.api.Assertions; +import org.junit.jupiter.api.Test; + +public class TypeMappingsSanitizationCreateIndexTest { + + private static final ObjectMapper OBJECT_MAPPER = new ObjectMapper(); + + private static TypeMappingsSanitizationTransformer makeIndexTypeMappingRewriter() throws Exception { + var indexMappings = Map.of( + "indexa", Map.of( + "type1", "indexa_1", + "type2", "indexa_2", + "user", "a_user"), + "indexb", Map.of( + "type1", "indexb", + "type2", "indexb"), + "socialTypes", Map.of( + "tweet", "communal", + "user", "communal")); + var regexIndexMappings = List.of( + List.of("time-(.*)", "(.*)", "time-\\1-\\2")); + return new TypeMappingsSanitizationTransformer(indexMappings, regexIndexMappings); + } + + private static String makeMultiTypePutIndexRequest(String indexName, Boolean includeTypeName) { + return TestRequestBuilder.makePutIndexRequest(indexName, true, includeTypeName); + } + + @Test + public void testPutSingleTypeToMissingTarget() throws Exception { + final String index = "indexb"; // has multiple indices for its types + var testString = TestRequestBuilder.makePutIndexRequest(index, false, true); + var indexTypeMappingRewriter = makeIndexTypeMappingRewriter(); + var result = (Map) + indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + Assertions.assertEquals(JsonNormalizer.fromString("{ \"method\": \"GET\", \"URI\": \"/\" }"), + JsonNormalizer.fromObject(result)); + } + + @Test + public void testPutSingleTypeIndex() throws Exception { + final String index = "indexa"; // has multiple indices for its types + var testString = TestRequestBuilder.makePutIndexRequest(index, false, true); + var indexTypeMappingRewriter = makeIndexTypeMappingRewriter(); + var result = (Map) + indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + var expectedString = "{\n" + + " \"URI\" : \"/a_user\",\n" + + " \"method\" : \"PUT\",\n" + + " \"payload\" : {\n" + + " \"inlinedJsonBody\" : {\n" + + " \"mappings\" : {\n" + + " \"properties\" : {\n" + + " \"email\" : {\n" + + " \"type\" : \"keyword\"\n" + + " },\n" + + " \"name\" : {\n" + + " \"type\" : \"text\"\n" + + " },\n" + + " \"type\" : {\n" + + " \"type\" : \"keyword\"\n" + + " },\n" + + " \"user_name\" : {\n" + + " \"type\" : \"keyword\"\n" + + " }\n" + + " }\n" + + " },\n" + + " \"settings\" : {\n" + + " \"number_of_shards\" : 1\n" + + " }\n" + + " }\n" + + " }\n" + + "}"; + Assertions.assertEquals(JsonNormalizer.fromString(expectedString), + JsonNormalizer.fromObject(result)); + } + + @Test + public void testMultiTypeIndexMerged() throws Exception { + final String index = "socialTypes"; + var testString = makeMultiTypePutIndexRequest(index, true); + var indexTypeMappingRewriter = makeIndexTypeMappingRewriter(); + var result = (Map) + indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + var expected = OBJECT_MAPPER.readTree(makeMultiTypePutIndexRequest(index, null)); + var mappings = ((ObjectNode) expected.path(JsonKeysForHttpMessage.PAYLOAD_KEY) + .path(JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY) + .path("mappings")); + mappings.remove("following"); + var newProperties = new HashMap(); + newProperties.put("type", Map.of("type", "keyword")); + var user = mappings.remove("user"); + user.path("properties").fields().forEachRemaining(e -> newProperties.put(e.getKey(), e.getValue())); + var tweet = mappings.remove("tweet"); + tweet.path("properties").fields().forEachRemaining(e -> newProperties.put(e.getKey(), e.getValue())); + mappings.set("properties", OBJECT_MAPPER.valueToTree(newProperties)); + ((ObjectNode)expected).put(JsonKeysForHttpMessage.URI_KEY, "/communal"); + Assertions.assertEquals(JsonNormalizer.fromObject(expected), JsonNormalizer.fromObject(result)); + } + + @Test + public void testCreateIndexWithoutTypeButWithMappings() throws Exception{ + var uri = TestRequestBuilder.formatCreateIndexUri("geonames", false);; + var testString = "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"" + uri + "\",\n" + + " \"" + JsonKeysForHttpMessage.PROTOCOL_KEY + "\": \"HTTP/1.1\"," + + " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {\n" + + " \"Host\": \"capture-proxy:9200\"\n" + + " }," + + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + + " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\": {\n" + + " \"settings\": {\n" + + " \"index\": {\n" + + " \"number_of_shards\": 3, \n" + + " \"number_of_replicas\": 2 \n" + + " }\n" + + " }," + + " \"mappings\": {" + + " \"properties\": {\n" + + " \"field1\": { \"type\": \"text\" }\n" + + " }" + + " }\n" + + " }\n" + + " }\n" + + "}"; + var indexTypeMappingRewriter = makeIndexTypeMappingRewriter(); + var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + Assertions.assertEquals(JsonNormalizer.fromString(testString), JsonNormalizer.fromObject(resultObj)); + } + + @Test + public void testCreateIndexWithoutType() throws Exception{ + var testString = "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/geonames\",\n" + + " \"" + JsonKeysForHttpMessage.PROTOCOL_KEY + "\": \"HTTP/1.1\"," + + " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {\n" + + " \"Host\": \"capture-proxy:9200\"\n" + + " }," + + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + + " \"settings\": {\n" + + " \"index\": {\n" + + " \"number_of_shards\": 3, \n" + + " \"number_of_replicas\": 2 \n" + + " }\n" + + " }\n" + + " }\n" + + "}"; + var indexTypeMappingRewriter = makeIndexTypeMappingRewriter(); + var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + Assertions.assertEquals(JsonNormalizer.fromString(testString), JsonNormalizer.fromObject(resultObj)); + } + +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java index d5081f3b0..d0a738283 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformerTest.java @@ -1,7 +1,6 @@ package org.opensearch.migrations.transform; import java.io.IOException; -import java.util.HashMap; import java.util.LinkedHashMap; import java.util.List; import java.util.Map; @@ -10,7 +9,6 @@ import com.fasterxml.jackson.core.type.TypeReference; import com.fasterxml.jackson.databind.ObjectMapper; -import com.fasterxml.jackson.databind.node.ObjectNode; import lombok.extern.slf4j.Slf4j; import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.BeforeAll; @@ -91,126 +89,6 @@ public void testPutDocRegex() throws Exception { JsonNormalizer.fromObject(resultObj)); } - private static String makeMultiTypePutIndexRequest(String indexName) { - return "{\n" + - " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + - " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/" + indexName + "\",\n" + - " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + - " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\": " + - "{\n" + - " \"settings\" : {\n" + - " \"number_of_shards\" : 1\n" + - " }," + - " \"mappings\": {\n" + - " \"user\": {\n" + - " \"properties\": {\n" + - " \"name\": { \"type\": \"text\" },\n" + - " \"user_name\": { \"type\": \"keyword\" },\n" + - " \"email\": { \"type\": \"keyword\" }\n" + - " }\n" + - " },\n" + - " \"tweet\": {\n" + - " \"properties\": {\n" + - " \"content\": { \"type\": \"text\" },\n" + - " \"user_name\": { \"type\": \"keyword\" },\n" + - " \"tweeted_at\": { \"type\": \"date\" }\n" + - " }\n" + - " },\n" + - " \"following\": {\n" + - " \"properties\": {\n" + - " \"count\": { \"type\": \"integer\" },\n" + - " \"followers\": { \"type\": \"string\" }\n" + - " }\n" + - " }\n" + - " }\n" + - "}" + - "\n" + - " }\n" + - "}"; - } - - Map doPutIndex(String indexName) throws Exception { - var testString = makeMultiTypePutIndexRequest(indexName); - return indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); - } - - @Test - public void testPutSingleTypeIndex() throws Exception { - final String index = "indexa"; - var result = doPutIndex(index); - Assertions.assertEquals(JsonNormalizer.fromString(makeMultiTypePutIndexRequest(index)), - JsonNormalizer.fromObject(result)); - } - - @Test - public void testMultiTypeIndex() throws Exception { - final String index = "socialTypes"; - var result = doPutIndex(index); - var expected = OBJECT_MAPPER.readTree(makeMultiTypePutIndexRequest(index)); - var mappings = ((ObjectNode) expected.path(JsonKeysForHttpMessage.PAYLOAD_KEY) - .path(JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY) - .path("mappings")); - mappings.remove("following"); - var newProperties = new HashMap(); - newProperties.put("type", Map.of("type", "keyword")); - var user = mappings.remove("user"); - user.path("properties").fields().forEachRemaining(e -> newProperties.put(e.getKey(), e.getValue())); - var tweet = mappings.remove("tweet"); - tweet.path("properties").fields().forEachRemaining(e -> newProperties.put(e.getKey(), e.getValue())); - mappings.set("properties", OBJECT_MAPPER.valueToTree(newProperties)); - ((ObjectNode)expected).put(JsonKeysForHttpMessage.URI_KEY, "/communal"); - Assertions.assertEquals(JsonNormalizer.fromObject(expected), JsonNormalizer.fromObject(result)); - } - - @Test - public void testCreateIndexWithoutTypeButWithMappings() throws Exception{ - var testString = "{\n" + - " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + - " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/geonames\",\n" + - " \"" + JsonKeysForHttpMessage.PROTOCOL_KEY + "\": \"HTTP/1.1\"," + - " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {\n" + - " \"Host\": \"capture-proxy:9200\"\n" + - " }," + - " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + - " \"settings\": {\n" + - " \"index\": {\n" + - " \"number_of_shards\": 3, \n" + - " \"number_of_replicas\": 2 \n" + - " }\n" + - " }," + - " \"mappings\": {" + - " \"properties\": {\n" + - " \"field1\": { \"type\": \"text\" }\n" + - " }" + - " }\n" + - " }\n" + - "}"; - var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); - Assertions.assertEquals(JsonNormalizer.fromString(testString), JsonNormalizer.fromObject(resultObj)); - } - - @Test - public void testCreateIndexWithoutType() throws Exception{ - var testString = "{\n" + - " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + - " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/geonames\",\n" + - " \"" + JsonKeysForHttpMessage.PROTOCOL_KEY + "\": \"HTTP/1.1\"," + - " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {\n" + - " \"Host\": \"capture-proxy:9200\"\n" + - " }," + - " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + - " \"settings\": {\n" + - " \"index\": {\n" + - " \"number_of_shards\": 3, \n" + - " \"number_of_replicas\": 2 \n" + - " }\n" + - " }\n" + - " }\n" + - "}"; - var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); - Assertions.assertEquals(JsonNormalizer.fromString(testString), JsonNormalizer.fromObject(resultObj)); - } - @ParameterizedTest @ValueSource(strings = {"status", "_cat/indices", "_cat/indices/nov-*"} ) public void testDefaultActionPreservesRequest(String uri) throws Exception { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/testFixtures/java/org/opensearch/migrations/transform/TestRequestBuilder.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/testFixtures/java/org/opensearch/migrations/transform/TestRequestBuilder.java new file mode 100644 index 000000000..0952f3a25 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/testFixtures/java/org/opensearch/migrations/transform/TestRequestBuilder.java @@ -0,0 +1,53 @@ +package org.opensearch.migrations.transform; + +import java.util.Optional; + +import lombok.NonNull; + +public class TestRequestBuilder { + public static String makePutIndexRequest(String indexName, Boolean useMultiple, Boolean includeTypeName) { + var uri = formatCreateIndexUri(indexName, includeTypeName); + return "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"" + uri + "\",\n" + + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + + " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\": " + + "{\n" + + " \"settings\" : {\n" + + " \"number_of_shards\" : 1\n" + + " }," + + " \"mappings\": {\n" + + " \"user\": {\n" + + " \"properties\": {\n" + + " \"name\": { \"type\": \"text\" },\n" + + " \"user_name\": { \"type\": \"keyword\" },\n" + + " \"email\": { \"type\": \"keyword\" }\n" + + " }\n" + + " }" + + (useMultiple ? ",\n" + + " \"tweet\": {\n" + + " \"properties\": {\n" + + " \"content\": { \"type\": \"text\" },\n" + + " \"user_name\": { \"type\": \"keyword\" },\n" + + " \"tweeted_at\": { \"type\": \"date\" }\n" + + " }\n" + + " },\n" + + " \"following\": {\n" + + " \"properties\": {\n" + + " \"count\": { \"type\": \"integer\" },\n" + + " \"followers\": { \"type\": \"string\" }\n" + + " }\n" + + " }\n" + : "") + + " }\n" + + "}" + + "\n" + + " }\n" + + "}"; + } + + public static @NonNull String formatCreateIndexUri(String indexName, Boolean includeTypeName) { + return "/" + indexName + + Optional.ofNullable(includeTypeName).map(b -> "?include_type_name=" + b).orElse(""); + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle index cfb8a9cad..672949366 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/build.gradle @@ -16,6 +16,7 @@ dependencies { implementation group: 'com.fasterxml.jackson.core', name: 'jackson-databind' testImplementation project(':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformer') + testImplementation testFixtures(project(path:':transformation:transformationPlugins:jsonMessageTransformers:jsonTypeMappingsSanitizationTransformer')) testImplementation project(':coreUtilities') testImplementation testFixtures(project(path: ':coreUtilities')) testImplementation testFixtures(project(path: ':testHelperFixtures')) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java index 7c642b4c4..f8f576298 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java @@ -1,15 +1,22 @@ package org.opensearch.migrations.replay; +import java.util.LinkedHashMap; import java.util.List; import java.util.Map; +import java.util.function.Predicate; import org.opensearch.migrations.testutils.JsonNormalizer; import org.opensearch.migrations.testutils.WrapWithNettyLeakDetection; +import org.opensearch.migrations.transform.JsonKeysForHttpMessage; +import org.opensearch.migrations.transform.TestRequestBuilder; import org.opensearch.migrations.transform.TypeMappingSanitizationTransformerProvider; +import org.opensearch.migrations.transform.jinjava.ThrowTag; import com.fasterxml.jackson.core.JsonProcessingException; import com.fasterxml.jackson.core.type.TypeReference; import com.fasterxml.jackson.databind.ObjectMapper; +import com.hubspot.jinjava.interpret.FatalTemplateErrorsException; +import lombok.NonNull; import lombok.extern.slf4j.Slf4j; import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.Test; @@ -18,7 +25,7 @@ @WrapWithNettyLeakDetection(disableLeakChecks = true) public class TypeMappingsSanitizationProviderTest { - ObjectMapper mapper = new ObjectMapper(); + private static final ObjectMapper OBJECT_MAPPER = new ObjectMapper(); @Test public void testSimpleTransform() throws JsonProcessingException { @@ -63,7 +70,8 @@ public void testSimpleTransform() throws JsonProcessingException { + "}\n"; var provider = new TypeMappingSanitizationTransformerProvider(); - Map inputMap = mapper.readValue(TEST_INPUT_REQUEST, new TypeReference<>() {}); + Map inputMap = OBJECT_MAPPER.readValue(TEST_INPUT_REQUEST, new TypeReference<>() { + }); { var transformedDocument = provider.createTransformer(config).transformJson(inputMap); Assertions.assertEquals(JsonNormalizer.fromString(EXPECTED), @@ -79,4 +87,79 @@ public void testSimpleTransform() throws JsonProcessingException { JsonNormalizer.fromObject(resultFromNullConfig)); } } + + @Test + public void testMappingWithoutTypesAndLatestSourceInfoDoesNothing() throws Exception { + var testString = TestRequestBuilder.makePutIndexRequest("commingled_docs", true, false); + var fullTransformerConfig = + Map.of("sourceProperties", + Map.of("version", + Map.of("major", (Object) 6, + "minor", (Object) 10))); + var transformer = new TypeMappingSanitizationTransformerProvider().createTransformer(fullTransformerConfig); + var resultObj = transformer.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + Assertions.assertEquals(JsonNormalizer.fromString(testString), JsonNormalizer.fromObject(resultObj)); + } + + @Test + public void testTypeMappingsWithSourcePropertiesWorks() throws Exception { + var testString = TestRequestBuilder.makePutIndexRequest("commingled_docs", true, false); + var fullTransformerConfig = + Map.of("sourceProperties", Map.of("version", + Map.of("major", (Object) 5, + "minor", (Object) 10)), + "regex_index_mappings", List.of(List.of("", "", ""))); + var transformer = new TypeMappingSanitizationTransformerProvider().createTransformer(fullTransformerConfig); + var resultObj = transformer.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); + Assertions.assertEquals(JsonNormalizer.fromString(testString), JsonNormalizer.fromObject(resultObj)); + } + + @Test + public void testMappingsButNoSourcePropertiesThrows() throws Exception { + var testString = makeCreateIndexRequestWithoutTypes(); + var noopString = "{\n" + + " \"URI\" : \"/\",\n" + + " \"method\" : \"GET\"\n" + + "}"; + var transformer = new TypeMappingSanitizationTransformerProvider().createTransformer(null); + var thrownException = + Assertions.assertThrows(FatalTemplateErrorsException.class, () -> + transformer.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class))); + Assertions.assertNotNull( + findCausalException(thrownException.getErrors().iterator().next().getException(), + e->e==null || e instanceof ThrowTag.JinjavaThrowTagException)); + } + + private static @NonNull String makeCreateIndexRequestWithoutTypes() { + return "{\n" + + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"/geonames\",\n" + + " \"" + JsonKeysForHttpMessage.PROTOCOL_KEY + "\": \"HTTP/1.1\"," + + " \"" + JsonKeysForHttpMessage.HEADERS_KEY + "\": {\n" + + " \"Host\": \"capture-proxy:9200\"\n" + + " }," + + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + + " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\": {\n" + + " \"settings\": {\n" + + " \"index\": {\n" + + " \"number_of_shards\": 3, \n" + + " \"number_of_replicas\": 2 \n" + + " }\n" + + " }," + + " \"mappings\": {" + + " \"properties\": {\n" + + " \"field1\": { \"type\": \"text\" }\n" + + " }" + + " }\n" + + " }\n" + + " }\n" + + "}"; + } + + public static Throwable findCausalException(Throwable t, Predicate p) { + while (!p.test(t)) { + t = t.getCause(); + } + return t; + } } From 2b1f3e062390ffedc98772ffa93e5a3eab73f0f8 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Mon, 9 Dec 2024 08:26:24 -0500 Subject: [PATCH 21/26] Add a new preserve tag (preserveWhenMissing) to copy only when the key wasn't in the target's doc. That makes it a bit easier to write '"preserveWhenMissing": "*"' and not have to spend us much effort to be more specific. Signed-off-by: Greg Schohn --- .../transform/JinjavaTransformer.java | 25 +-------- .../transform/PreservesProcessor.java | 56 +++++++++++++++++++ .../typeMappings/rewriteCreateIndexRequest.j2 | 2 +- ...peMappingsSanitizationCreateIndexTest.java | 1 + .../transform/TestRequestBuilder.java | 1 + 5 files changed, 60 insertions(+), 25 deletions(-) create mode 100644 transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/PreservesProcessor.java diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index 8a1acb398..9761b5cee 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -81,29 +81,6 @@ public Map transformJson(Map incomingJson) { var resultStr = jinjava.render(templateStr, createContextWithSourceFunction.apply(incomingJson)); log.atInfo().setMessage("output from jinjava... {}").addArgument(resultStr).log(); var parsedObj = (Map) objectMapper.readValue(resultStr, LinkedHashMap.class); - return doFinalSubstitutions(incomingJson, parsedObj); - } - - private Map doFinalSubstitutions(Map incomingJson, Map parsedObj) { - return Optional.ofNullable(parsedObj.get(JsonKeysForHttpMessage.PRESERVE_KEY)).filter(v->v.equals("*")) - .map(star -> incomingJson) - .orElseGet(() -> { - findAndReplacePreserves(incomingJson, parsedObj); - findAndReplacePreserves((Map) incomingJson.get(JsonKeysForHttpMessage.PAYLOAD_KEY), - (Map) parsedObj.get(JsonKeysForHttpMessage.PAYLOAD_KEY)); - return parsedObj; - }); - } - - private void findAndReplacePreserves(Map incomingRoot, Map parsedRoot) { - if (parsedRoot == null || incomingRoot == null) { - return; - } - var preserveKeys = (List) parsedRoot.get(JsonKeysForHttpMessage.PRESERVE_KEY); - if (preserveKeys != null) { - preserveKeys.forEach(preservedKey -> - Optional.ofNullable(incomingRoot.get(preservedKey)).ifPresent(v->parsedRoot.put(preservedKey, v))); - parsedRoot.remove(JsonKeysForHttpMessage.PRESERVE_KEY); - } + return PreservesProcessor.doFinalSubstitutions(incomingJson, parsedObj); } } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/PreservesProcessor.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/PreservesProcessor.java new file mode 100644 index 000000000..a5d346c27 --- /dev/null +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/PreservesProcessor.java @@ -0,0 +1,56 @@ +package org.opensearch.migrations.transform; + +import java.util.List; +import java.util.Map; + +public class PreservesProcessor { + private static final String PRESERVE_KEY = "preserve"; + private static final String PRESERVE_WHEN_MISSING_KEY = "preserveWhenMissing"; + + private PreservesProcessor() {} + + @SuppressWarnings("unchecked") + public static Map doFinalSubstitutions(Map incomingJson, Map parsedObj) { + processPreserves(incomingJson, parsedObj); + + processPreserves( + (Map) incomingJson.get(JsonKeysForHttpMessage.PAYLOAD_KEY), + (Map) parsedObj.get(JsonKeysForHttpMessage.PAYLOAD_KEY) + ); + + return parsedObj; + } + + private static void processPreserves(Map source, Map target) { + if (target == null || source == null) { + return; + } + + copyValues(source, target, PRESERVE_KEY, true); + copyValues(source, target, PRESERVE_WHEN_MISSING_KEY, false); + } + + private static void copyValues(Map source, Map target, + String directiveKey, boolean forced) { + Object directive = target.remove(directiveKey); + if (directive == null) { + return; + } + + if (directive.equals("*")) { + source.forEach((key, value) -> { + if (forced || !target.containsKey(key)) { + target.put(key, value); + } + }); + } else if (directive instanceof List) { + ((List) directive).forEach(key -> { + if (source.containsKey(key) && + (forced || !target.containsKey(key))) + { + target.put(key, source.get(key)); + } + }); + } + } +} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 index d1129872e..63f37fc76 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteCreateIndexRequest.j2 @@ -5,7 +5,7 @@ {%- set source_input_types = input_map.index_mappings[source_index_name] -%} {%- set source_type_name = source_input_types.keys() | first() -%} { - "preserve": ["protocol", "headers"], + "preserveWhenMissing": "*", "method": "{{ input_map.request.method }}", "URI": "/{{ target_index_name }}", "payload": { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java index cfd6acf22..895ebe7e9 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java @@ -58,6 +58,7 @@ public void testPutSingleTypeIndex() throws Exception { var expectedString = "{\n" + " \"URI\" : \"/a_user\",\n" + " \"method\" : \"PUT\",\n" + + " \"protocol\" : \"HTTP/1.1\",\n" + " \"payload\" : {\n" + " \"inlinedJsonBody\" : {\n" + " \"mappings\" : {\n" + diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/testFixtures/java/org/opensearch/migrations/transform/TestRequestBuilder.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/testFixtures/java/org/opensearch/migrations/transform/TestRequestBuilder.java index 0952f3a25..025aa6ed0 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/testFixtures/java/org/opensearch/migrations/transform/TestRequestBuilder.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/testFixtures/java/org/opensearch/migrations/transform/TestRequestBuilder.java @@ -9,6 +9,7 @@ public static String makePutIndexRequest(String indexName, Boolean useMultiple, var uri = formatCreateIndexUri(indexName, includeTypeName); return "{\n" + " \"" + JsonKeysForHttpMessage.METHOD_KEY + "\": \"PUT\",\n" + + " \"" + JsonKeysForHttpMessage.PROTOCOL_KEY + "\": \"HTTP/1.1\",\n" + " \"" + JsonKeysForHttpMessage.URI_KEY + "\": \"" + uri + "\",\n" + " \"" + JsonKeysForHttpMessage.PAYLOAD_KEY + "\": {\n" + " \"" + JsonKeysForHttpMessage.INLINED_JSON_BODY_DOCUMENT_KEY + "\": " + From 4e599651ce033d2a96e53a35b06a762581e40eb6 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Mon, 9 Dec 2024 09:24:15 -0500 Subject: [PATCH 22/26] Enable type mappings transform for the replayer in the docker-compose file + logging improvements & cleanup. Most useful logging improvement - add the URI of the source request to the end of the progess log's lines. E.g 2024-12-09 14:19:34,024: 921, 0242acfffe120008-00000007-00000065-c88ca66f1bf2aa5a-a978504d.16, 2024-12-09T14:19:33.757503Z, 2872/2890, 200/500,500,500,500, 2866/486,486,486,486, 9/3,2,2,3, /_search/scroll 2024-12-09 14:19:41,602: 950, 0242acfffe120008-00000007-00000065-c88ca66f1bf2aa5a-a978504d.17, 2024-12-09T14:19:33.767614Z, 2862/2880, 200/404,404,404,404, 119/125,125,125,125, 10/1,1,1,1, /_search/scroll Signed-off-by: Greg Schohn --- .../src/main/docker/docker-compose.yml | 4 ++-- .../replay/ParsedHttpMessagesAsDicts.java | 16 ++++++++++------ .../migrations/replay/ResultsToLogsConsumer.java | 6 ++++++ .../migrations/transform/JinjavaTransformer.java | 2 +- .../jinjava/JavaRegexReplaceFilter.java | 2 +- ...peMappingSanitizationTransformerProvider.java | 8 ++++---- 6 files changed, 24 insertions(+), 14 deletions(-) diff --git a/TrafficCapture/dockerSolution/src/main/docker/docker-compose.yml b/TrafficCapture/dockerSolution/src/main/docker/docker-compose.yml index 407fa7a9f..dc637f7a6 100644 --- a/TrafficCapture/dockerSolution/src/main/docker/docker-compose.yml +++ b/TrafficCapture/dockerSolution/src/main/docker/docker-compose.yml @@ -78,8 +78,8 @@ services: condition: service_started opensearchtarget: condition: service_started -# command: /bin/sh -c "/runJavaWithClasspath.sh org.opensearch.migrations.replay.TrafficReplayer --speedup-factor 2 https://opensearchtarget:9200 --auth-header-value Basic\\ YWRtaW46bXlTdHJvbmdQYXNzd29yZDEyMyE= --insecure --kafka-traffic-brokers kafka:9092 --kafka-traffic-topic logging-traffic-topic --kafka-traffic-group-id logging-group-default --otelCollectorEndpoint http://otel-collector:4317 --transformer-config " - command: /bin/sh -c "/runJavaWithClasspath.sh org.opensearch.migrations.replay.TrafficReplayer --speedup-factor 2 https://opensearchtarget:9200 --auth-header-value Basic\\ YWRtaW46bXlTdHJvbmdQYXNzd29yZDEyMyE= --insecure --kafka-traffic-brokers kafka:9092 --kafka-traffic-topic logging-traffic-topic --kafka-traffic-group-id logging-group-default --otelCollectorEndpoint http://otel-collector:4317 --transformer-config '[{\"TypeMappingSanitizationTransformerProvider\":\"\"}]'" +# command: /bin/sh -c "/runJavaWithClasspath.sh org.opensearch.migrations.replay.TrafficReplayer --speedup-factor 2 https://opensearchtarget:9200 --auth-header-value Basic\\ YWRtaW46bXlTdHJvbmdQYXNzd29yZDEyMyE= --insecure --kafka-traffic-brokers kafka:9092 --kafka-traffic-topic logging-traffic-topic --kafka-traffic-group-id logging-group-default --otelCollectorEndpoint http://otel-collector:4317 " + command: /bin/sh -c "/runJavaWithClasspath.sh org.opensearch.migrations.replay.TrafficReplayer --speedup-factor 2 https://opensearchtarget:9200 --auth-header-value Basic\\ YWRtaW46bXlTdHJvbmdQYXNzd29yZDEyMyE= --insecure --kafka-traffic-brokers kafka:9092 --kafka-traffic-topic logging-traffic-topic --kafka-traffic-group-id logging-group-default --otelCollectorEndpoint http://otel-collector:4317 --transformer-config '[{\"TypeMappingSanitizationTransformerProvider\":{\"sourceProperties\":{\"version\":{\"major\":7,\"minor\":10}}}}]'" opensearchtarget: image: 'opensearchproject/opensearch:2.15.0' environment: diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ParsedHttpMessagesAsDicts.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ParsedHttpMessagesAsDicts.java index 4a0f87609..ae598fd77 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ParsedHttpMessagesAsDicts.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ParsedHttpMessagesAsDicts.java @@ -42,6 +42,10 @@ public class ParsedHttpMessagesAsDicts { public static final String STATUS_CODE_KEY = "Status-Code"; public static final String RESPONSE_TIME_MS_KEY = "response_time_ms"; public static final String EXCEPTION_KEY_STRING = "Exception"; + public static final String REQUEST_URI_KEY = "Request-URI"; + public static final String METHOD_KEY = "Method"; + public static final String HTTP_VERSION_KEY = "HTTP-Version"; + public static final String PAYLOAD_KEY = "payload"; public final Optional> sourceRequestOp; public final Optional> sourceResponseOp; @@ -183,15 +187,15 @@ private static Map convertRequest( var message = (HttpJsonRequestWithFaultingPayload) messageHolder.get(); if (message != null) { var map = new LinkedHashMap<>(message.headers()); - map.put("Request-URI", message.path()); - map.put("Method", message.method()); - map.put("HTTP-Version", message.protocol()); + map.put(REQUEST_URI_KEY, message.path()); + map.put(METHOD_KEY, message.method()); + map.put(HTTP_VERSION_KEY, message.protocol()); context.setMethod(message.method()); context.setEndpoint(message.path()); context.setHttpVersion(message.protocol()); encodeBinaryPayloadIfExists(message); if (!message.payload().isEmpty()) { - map.put("payload", message.payload()); + map.put(PAYLOAD_KEY, message.payload()); } return map; } else { @@ -223,14 +227,14 @@ private static Map convertResponse( var message = (HttpJsonResponseWithFaultingPayload) messageHolder.get(); if (message != null) { var map = new LinkedHashMap<>(message.headers()); - map.put("HTTP-Version", message.protocol()); + map.put(HTTP_VERSION_KEY, message.protocol()); map.put(STATUS_CODE_KEY, Integer.parseInt(message.code())); map.put("Reason-Phrase", message.reason()); map.put(RESPONSE_TIME_MS_KEY, latency.toMillis()); context.setHttpVersion(message.protocol()); encodeBinaryPayloadIfExists(message); if (!message.payload().isEmpty()) { - map.put("payload", message.payload()); + map.put(PAYLOAD_KEY, message.payload()); } return map; } else { diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ResultsToLogsConsumer.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ResultsToLogsConsumer.java index 4ef0c825a..89ca4354f 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ResultsToLogsConsumer.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ResultsToLogsConsumer.java @@ -161,6 +161,7 @@ public static String getTransactionSummaryStringPreamble() { .add("SOURCE_STATUS_CODE/TARGET_STATUS_CODE...") .add("SOURCE_RESPONSE_SIZE_BYTES/TARGET_RESPONSE_SIZE_BYTES...") .add("SOURCE_LATENCY_MS/TARGET_LATENCY_MS...") + .add("URI...") .toString(); } @@ -218,6 +219,11 @@ public static String toTransactionSummaryString( transformStreamToString(parsed.targetResponseList.stream(), r -> "" + r.get(ParsedHttpMessagesAsDicts.RESPONSE_TIME_MS_KEY)) ) + // uri + .add( + parsed.sourceRequestOp + .map(r -> (String) r.get(ParsedHttpMessagesAsDicts.REQUEST_URI_KEY)) + .orElse(MISSING_STR)) .toString(); } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java index 9761b5cee..2a5254799 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/JinjavaTransformer.java @@ -79,7 +79,7 @@ public JinjavaTransformer(String templateString, @Override public Map transformJson(Map incomingJson) { var resultStr = jinjava.render(templateStr, createContextWithSourceFunction.apply(incomingJson)); - log.atInfo().setMessage("output from jinjava... {}").addArgument(resultStr).log(); + log.atDebug().setMessage("output from jinjava... {}").addArgument(resultStr).log(); var parsedObj = (Map) objectMapper.readValue(resultStr, LinkedHashMap.class); return PreservesProcessor.doFinalSubstitutions(incomingJson, parsedObj); } diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java index b2175aa84..035c5a001 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonJinjavaTransformer/src/main/java/org/opensearch/migrations/transform/jinjava/JavaRegexReplaceFilter.java @@ -81,7 +81,7 @@ public Object filter(Object inputObject, JinjavaInterpreter interpreter, String. c.get(JinjavaTransformer.REGEX_REPLACEMENT_CONVERSION_PATTERNS))) .orElse(DEFAULT_REGEX_REPLACE_FILTER))); var rval = matcher.replaceAll(rewritten); - log.atError().setMessage("replaced value {} with {}").addArgument(input).addArgument(rval).log(); + log.atTrace().setMessage("replaced value {} with {}").addArgument(input).addArgument(rval).log(); return rval; } catch (Exception e) { throw new RegexReplaceException(e, input, pattern, replacement, rewritten); diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java index 338c1d639..d5dc23796 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/main/java/org/opensearch/migrations/transform/TypeMappingSanitizationTransformerProvider.java @@ -36,11 +36,11 @@ public IJsonTransformer createTransformer(Object jsonConfig) { return new TypeMappingsSanitizationTransformer( (Map>) config.get(STATIC_MAPPINGS), (List>) config.get(REGEX_MAPPINGS), - Optional.ofNullable(config.get(SOURCE_PROPERTIES_KEY)).map(jinjavaConfig -> - mapper.convertValue(jinjavaConfig, SourceProperties.class)).orElse(null), + Optional.ofNullable(config.get(SOURCE_PROPERTIES_KEY)).map(m -> + mapper.convertValue(m, SourceProperties.class)).orElse(null), (Map) config.get(FEATURE_FLAGS), - Optional.ofNullable(config.get(JINJAVA_CONFIG_KEY)).map(jinjavaConfig -> - mapper.convertValue(jinjavaConfig, JinjavaConfig.class)).orElse(null)); + Optional.ofNullable(config.get(JINJAVA_CONFIG_KEY)).map(m -> + mapper.convertValue(m, JinjavaConfig.class)).orElse(null)); } catch (ClassCastException e) { throw new IllegalArgumentException(getConfigUsageStr(), e); } From 09377de54991582a2317c4faf6bfd1f53b2a045d Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Tue, 3 Dec 2024 22:45:11 -0500 Subject: [PATCH 23/26] Flip the default should throw behavior for HttpJsonMessageWithFaultingPayload to opt-in rather than opt-out. HttpJsonMessageWithFaultingPayload throws by default - so it could be run even if it wasn't within a transform - like from within a LoggingHandler, which is what I was observing when I added some more logging. The worst part was that it created other errors which then caused the message to be processed in a very different way. Signed-off-by: Greg Schohn --- .../datahandlers/PayloadAccessFaultingMap.java | 1 + ...edHttpRequestPreliminaryTransformHandler.java | 4 ++++ .../http/NettyJsonBodyAccumulateHandler.java | 16 ++++++++++++---- 3 files changed, 17 insertions(+), 4 deletions(-) diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java index ff8c3f665..57abfe43c 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/PayloadAccessFaultingMap.java @@ -34,6 +34,7 @@ public class PayloadAccessFaultingMap extends AbstractMap { private boolean disableThrowingPayloadNotLoaded; public PayloadAccessFaultingMap(StrictCaseInsensitiveHttpHeadersMap headers) { + disableThrowingPayloadNotLoaded = true; underlyingMap = new TreeMap<>(); isJson = Optional.ofNullable(headers.get("content-type")) .map(list -> list.stream().anyMatch(s -> s.startsWith("application/json"))) diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java index 3d74c42ca..3992d34a3 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyDecodedHttpRequestPreliminaryTransformHandler.java @@ -67,7 +67,9 @@ public void channelRead(@NonNull ChannelHandlerContext ctx, @NonNull Object msg) IAuthTransformer authTransformer = requestPipelineOrchestrator.authTransfomerFactory.getAuthTransformer( httpJsonMessage ); + final var payloadMap = (PayloadAccessFaultingMap) httpJsonMessage.payload(); try { + payloadMap.setDisableThrowingPayloadNotLoaded(false); handlePayloadNeutralTransformationOrThrow( ctx, originalHttpJsonMessage, @@ -86,6 +88,8 @@ public void channelRead(@NonNull ChannelHandlerContext ctx, @NonNull Object msg) getAuthTransformerAsStreamingTransformer(authTransformer) ); ctx.fireChannelRead(handleAuthHeaders(httpJsonMessage, authTransformer)); + } finally { + payloadMap.setDisableThrowingPayloadNotLoaded(true); } } else if (msg instanceof HttpContent) { ctx.fireChannelRead(msg); diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyJsonBodyAccumulateHandler.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyJsonBodyAccumulateHandler.java index 754ac2a4e..35ed26b68 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyJsonBodyAccumulateHandler.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/datahandlers/http/NettyJsonBodyAccumulateHandler.java @@ -8,6 +8,7 @@ import java.util.ArrayList; import java.util.List; import java.util.Optional; +import java.util.function.Predicate; import org.opensearch.migrations.replay.datahandlers.JsonAccumulator; import org.opensearch.migrations.replay.tracing.IReplayContexts; @@ -24,6 +25,7 @@ import io.netty.util.ReferenceCountUtil; import lombok.SneakyThrows; import lombok.extern.slf4j.Slf4j; +import org.slf4j.event.Level; /** * This accumulates HttpContent messages through a JsonAccumulator and eventually fires off a @@ -93,7 +95,10 @@ public void channelRead(ChannelHandlerContext ctx, Object msg) throws Exception } } } catch (JacksonException e) { - log.atInfo().setCause(e).setMessage("Error parsing json body. " + + log.atLevel(hasRequestContentTypeMatching(capturedHttpJsonMessage, + // a JacksonException for non-json data doesn't need to be surfaced to a user + v -> v.startsWith("application/json")) ? Level.INFO : Level.TRACE) + .setCause(e).setMessage("Error parsing json body. " + "Will pass all payload bytes directly as a ByteBuf within the payload map").log(); jsonWasInvalid = true; parsedJsonObjects.clear(); @@ -123,7 +128,9 @@ public void channelRead(ChannelHandlerContext ctx, Object msg) throws Exception var leftoverBody = accumulatedBody.slice(jsonBodyByteLength, accumulatedBody.readableBytes() - jsonBodyByteLength); - if (jsonBodyByteLength == 0 && isRequestContentTypeNotText(capturedHttpJsonMessage)) { + if (jsonBodyByteLength == 0 && + hasRequestContentTypeMatching(capturedHttpJsonMessage, v -> !v.startsWith("text/"))) + { context.onPayloadSetBinary(); capturedHttpJsonMessage.payload() .put(JsonKeysForHttpMessage.INLINED_BINARY_BODY_DOCUMENT_KEY, @@ -157,12 +164,13 @@ public void channelRead(ChannelHandlerContext ctx, Object msg) throws Exception } } - private boolean isRequestContentTypeNotText(HttpJsonMessageWithFaultingPayload message) { + private boolean hasRequestContentTypeMatching(HttpJsonMessageWithFaultingPayload message, + Predicate contentTypeFilter) { // ContentType not text if specified and has a value with / and that value does not start with text/ return Optional.ofNullable(capturedHttpJsonMessage.headers().insensitiveGet(HttpHeaderNames.CONTENT_TYPE.toString())) .map(s -> s.stream() .filter(v -> v.contains("/")) - .filter(v -> !v.startsWith("text/")) + .filter(contentTypeFilter) .count() > 1 ) .orElse(false); From fcf6bbc0178193037a5fe7145cd1711d834edb8b Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Mon, 9 Dec 2024 09:36:43 -0500 Subject: [PATCH 24/26] Update type mapping sanitization READMEs to use backslash backreferences instead of '$' ones. Backslashes are the default behavior. Signed-off-by: Greg Schohn --- .../jsonTypeMappingsSanitizationTransformer/README.md | 6 +++--- .../README.md | 2 +- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md index 9e88dda81..61eae7074 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md @@ -101,7 +101,7 @@ The following sample shows how indices that start with 'time-' will be migrated already matched will be dropped. ``` [ - ["time-(.*)", "(cpu)", "time-$1-$2"] + ["time-(.*)", "(cpu)", "time-\\1-\\2"] ] ``` @@ -109,8 +109,8 @@ The following example preserves all other non-matched items, merging all types into a single index with the same name as the source index. ``` [ - ["time-(.*)", "(cpu)", "time-$1-$2"], - ["(.*)", ".*", "$1"] + ["time-(.*)", "(cpu)", "time-\\1-\\2"], + ["", ".*", ""] ] ``` diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/README.md b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/README.md index 327343e76..9adf06e4d 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/README.md +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/README.md @@ -32,7 +32,7 @@ Patterns are ONLY supported via regexMappings. } }, "regexMappings": [ - [ "(time*)", "(type*)", "$1_And_$2" ] + [ "(time*)", "(type*)", "\\1_And_\\2" ] ] } ``` \ No newline at end of file From fbc0291ecbbb90b0d0272a6cc07e8769bbc387c6 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Mon, 9 Dec 2024 14:25:15 -0500 Subject: [PATCH 25/26] Update remaining preserve calls so that protocol will be carried forward. Notice that headers are required to contain 'host' for http/1.1, so strictly speaking, copying headers AND protocol should be safer so that we stay in compliance. Signed-off-by: Greg Schohn --- .../src/main/resources/jinjava/typeMappings/makeNoop.j2 | 2 +- .../main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 | 2 +- .../resources/jinjava/typeMappings/rewriteDocumentRequest.j2 | 2 +- .../transform/TypeMappingsSanitizationCreateIndexTest.java | 3 ++- 4 files changed, 5 insertions(+), 4 deletions(-) diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/makeNoop.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/makeNoop.j2 index e34232799..96ba372b0 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/makeNoop.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/makeNoop.j2 @@ -1,3 +1,3 @@ {%- macro make_request() -%} - { "method": "GET", "URI": "/" } + { "method": "GET", "URI": "/", "protocol": "HTTP/1.0" } {%- endmacro -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 index 08f05c639..b0acfd8a7 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteBulkRequest.j2 @@ -44,7 +44,7 @@ {%- macro rewrite_bulk_for_default_source_index(uri_match, input_map, source_index) -%} { - "preserve": ["headers","method","URI","protocol"], + "preserveWhenMissing": "*", "payload": { "inlinedJsonSequenceBodies": [ {%- set operation_types = ['delete', 'update', 'index', 'create'] -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 index f35fb3f0d..6fc665bb2 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 @@ -9,7 +9,7 @@ { "method": "{{ input_map.request.method }}", "URI": "/{{ target_index }}/_doc/{{ match.group3 }}", - "preserve": ["headers","payload"] + "preserveWhenMissing": ["headers","payload"] } {%- endif -%} {%- endmacro -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java index 895ebe7e9..8186411fb 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationCreateIndexTest.java @@ -44,7 +44,8 @@ public void testPutSingleTypeToMissingTarget() throws Exception { var indexTypeMappingRewriter = makeIndexTypeMappingRewriter(); var result = (Map) indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); - Assertions.assertEquals(JsonNormalizer.fromString("{ \"method\": \"GET\", \"URI\": \"/\" }"), + var expected = "{ \"method\": \"GET\", \"URI\": \"/\", \"protocol\" : \"HTTP/1.0\" }"; + Assertions.assertEquals(JsonNormalizer.fromString(expected), JsonNormalizer.fromObject(result)); } From c13ef4a279696200d0923f3619d7ee9050f0d0e9 Mon Sep 17 00:00:00 2001 From: Greg Schohn Date: Tue, 10 Dec 2024 01:17:06 -0500 Subject: [PATCH 26/26] Bugfixes for type mappings removal transformations, README + other simple improvements Signed-off-by: Greg Schohn --- .../replay/HttpByteBufFormatter.java | 21 +-- .../replay/ResultsToLogsConsumer.java | 6 + .../README.md | 127 +++++++++--------- .../TypeMappingsSanitizationTransformer.java | 2 +- .../typeMappings/rewriteDocumentRequest.j2 | 2 +- .../typeMappings/rewriteIndexForTarget.j2 | 14 +- ...peMappingsSanitizationDocBackfillTest.java | 6 +- .../TypeMappingsSanitizationProviderTest.java | 24 ++-- 8 files changed, 106 insertions(+), 96 deletions(-) diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/HttpByteBufFormatter.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/HttpByteBufFormatter.java index e2e807818..c01925b46 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/HttpByteBufFormatter.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/HttpByteBufFormatter.java @@ -197,7 +197,8 @@ public void channelRead(ChannelHandlerContext ctx, Object msg) throws Exception } else { content.release(); } - } else if (msg instanceof HttpMessage) { + } + if (msg instanceof HttpMessage) { // this & HttpContent are interfaces & 'Full' messages implement both message = (HttpMessage) msg; } if (msg instanceof LastHttpContent) { @@ -206,16 +207,16 @@ public void channelRead(ChannelHandlerContext ctx, Object msg) throws Exception } var finalMsg = (message instanceof HttpRequest) ? new DefaultFullHttpRequest(message.protocolVersion(), - ((HttpRequest) message).method(), - ((HttpRequest) message).uri(), - aggregatedContents, - message.headers(), - ((LastHttpContent) msg).trailingHeaders()) + ((HttpRequest) message).method(), + ((HttpRequest) message).uri(), + aggregatedContents, + message.headers(), + ((LastHttpContent) msg).trailingHeaders()) : new DefaultFullHttpResponse(message.protocolVersion(), - ((HttpResponse)message).status(), - aggregatedContents, - message.headers(), - ((LastHttpContent) msg).trailingHeaders()); + ((HttpResponse)message).status(), + aggregatedContents, + message.headers(), + ((LastHttpContent) msg).trailingHeaders()); super.channelRead(ctx, finalMsg); } } diff --git a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ResultsToLogsConsumer.java b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ResultsToLogsConsumer.java index 89ca4354f..528e89b93 100644 --- a/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ResultsToLogsConsumer.java +++ b/TrafficCapture/trafficReplayer/src/main/java/org/opensearch/migrations/replay/ResultsToLogsConsumer.java @@ -161,6 +161,7 @@ public static String getTransactionSummaryStringPreamble() { .add("SOURCE_STATUS_CODE/TARGET_STATUS_CODE...") .add("SOURCE_RESPONSE_SIZE_BYTES/TARGET_RESPONSE_SIZE_BYTES...") .add("SOURCE_LATENCY_MS/TARGET_LATENCY_MS...") + .add("METHOD...") .add("URI...") .toString(); } @@ -219,6 +220,11 @@ public static String toTransactionSummaryString( transformStreamToString(parsed.targetResponseList.stream(), r -> "" + r.get(ParsedHttpMessagesAsDicts.RESPONSE_TIME_MS_KEY)) ) + // method + .add( + parsed.sourceRequestOp + .map(r -> (String) r.get(ParsedHttpMessagesAsDicts.METHOD_KEY)) + .orElse(MISSING_STR)) // uri .add( parsed.sourceRequestOp diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md index 61eae7074..b47b75e54 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/README.md @@ -55,47 +55,71 @@ GET activity/post/_search ## Routing data to new indices -The structure of the documents and indices need to change. Some options are to use separate indices, drop some of +The structure of the documents and indices need to change. Options are to use separate indices, drop some of the types to make an index single-purpose, or to create an index that's the union of all the types' fields. -With a simple mapping directive, we can define each of these three behaviors. The following yaml shows how to map -documents into two different indices named users and posts: +Specific instances of those behaviors can be expressed via a map (or dictionary) or indices to types to target indices. +The following sample json shows how to map documents from the 'activity' index into two different indices +('users' and 'posts'): ``` -activity: - user: new_users - post: new_posts +{ + "activity": { + "user: "new_users", + "post": "new_posts" + } ``` -To drop one type, just leave it out: +To drop the 'post' type, just leave it out: ``` -activity: - user: only_users +{ + "activity": { + "user": "only_users" + } +} ``` -To merge types together, use the same value: +To merge types into a single index, use the same value: ``` -activity: - user: any_activity - post: any_activity +{ + "activity": { + "user": "any_activity", + "post": "any_activity", + } +} ``` -Any _indices_ that are NOT specified won't be modified - all additions, changes, and queries on those other indices not -specified at the root level will remain untouched by the static mapping rewriter. However, missing types from a -specified index will be removed. To remove ALL the activity for a given index, specify an index with no -children types. +To remove ALL the activity for a given index, specify an index with no children types. ``` -activity: {} +{ + "activity": {} +} ``` -In addition to static source/target mappings, users can specify source and type pairs as a regex and use any captured -groups in the target index name. Regex rules take precedent _after_ the static rules and are only applied when there -was no index match in the static mappings. +Those regex rules take precedence **after** the static mappings specified above. + +In addition to static source/target mappings, users can specify source and type pairs as regex patterns and +use captured groups in the target index name. +Any source _indices_ that are NOT specified in the maps will be processed through the regex route rules. +The regex rules are only applied if the source index doesn't match a key in the static route map -Regex replacement is controlled via an ordered list of `[indexNamePattern, typeNamePattern, replacementString]`. -The transformer will use the replacement for the first matched item found. -If none are found, unlike missing indices for static mappings, the system presumes that the index and type are -**NOT** to be propagated to the target - any reference to those types and their corresponding data will be suppressed. -To preserve all items, a default rule will need to be included. +Regex replace rules are evaluated by concatenating the source index and source types into a single string. +The pattern components are also concatenated into a corresponding match string. +The replacement value will replace the _matched_ part of the source index + typename and replace it with the +specified value. +If that specified value contains (numerical) backreferences, those will pull from the captured groups of the +concatenated pattern. +The concatenated pattern is the index pattern followed by the type pattern, meaning that the groups in the index are +numbered from 1 and the type pattern group numbers start after all the groups from the index. + +Missing types from a specified index will be removed. +When the regex pattern isn't defined `["(.*)", "(.*)", "\\1_\\2"]` is used to map each type into its own isolated +index, preserving all data and its separation. + +For more details about regexes, see the [Python](https://docs.python.org/3/library/re.html#re.sub) or +[Java](https://docs.oracle.com/javase/8/docs/api/java/util/regex/Pattern.html) documentation. +This transform uses python-style backreferences (`'`\1`) for replacement patterns. +Notice that regexes can NOT be specified in the index-type map. +They can _only_ be used via the list, which will be evaluated in the order of the list until a match is found. The following sample shows how indices that start with 'time-' will be migrated and every other index and type not already matched will be dropped. @@ -114,41 +138,18 @@ merging all types into a single index with the same name as the source index. ] ``` -## Final Results - -``` -PUT any_activity -{ - "mappings": { - "properties": { - "type": { - "type": "keyword" - }, - "name": { - "type": "text" - }, - "user_name": { - "type": "keyword" - }, - "email": { - "type": "keyword" - }, - "content": { - "type": "text" - }, - "tweeted_at": { - "type": "date" - } - } - } -} - -PUT any_activity/_doc/someuser -{ - "name": "Some User", - "user_name": "user", - "email": "user@example.com" -} - +For more examples, compare the following cases. +Though note that anything matched by the static maps shown above will block any of these rules from being evaluated. + +| Regex Entry | Source Index | Source Type | Target Index | PUT Doc URL | Bulk Index Command | +|--------------------------------------------------------------------------------|-------------|-------------|-------------------|--------------------------------|----------------------------------------------------------------| +| `[["time-(.*)", "(cpu)", "time-\\1-\\2"]]` | time-nov11 | cpu | time-nov11-cpu | /time-nov11-cpu/_doc/doc512 | `{"index": {"_index": "time-nov11-cpu", "_id": "doc512" }}` | +| `[["time-(.*)", "(cpu)", "time-\\1-\\2"]]` | logs | access | [DELETED] | [DELETED] | [DELETED] | +| `[["time-(.*)", "(cpu)", "time-\\1-\\2"],`
` ["(.*)", "(.*)", "\\1-\\2"]]` | logs | access | logs_access | /logs_access/_doc/doc513 | `{"index": {"_index": "logs_access", "_id": "doc513" }}` | +| `[["time-(.*)", "(cpu)", "time-\\1-\\2"],`
`[["", ".*", ""]]` | everything | widgets | everything | /everything/_doc/doc514 | `{"index": {"_index": "everything", "_id": "doc514" }}` | +| `[["time-(.*)", "(cpu)", "time-\\1-\\2"],`
`[["", ".*", ""]]` | everything | sprockets | everything | /everything/_doc/doc515 | `{"index": {"_index": "everything", "_id": "doc515" }}` | +| `[["time-(.*)", "(.*)-(cpu)", "\\2-\\3-\\1"]]` | time-nov11 | host123-cpu | host123-cpu-nov11 | /host123-cpu-nov11/_doc/doc512 | `{"index": {"_index": "host123-cpu-nov11", "_id": "doc512" }}` | +| `[["", ".*", ""]]` | metadata | users | metadata | /metadata/_doc/doc516 | `{"index": {"_index": "metadata", "_id": "doc516" }}` | +| `[[".*", ".*", "leftovers"]]` | logs | access | leftovers | /leftovers/_doc/doc517 | `{"index": {"_index": "leftovers", "_id": "doc517" }}` | +| `[[".*", ".*", "leftovers"]]` | permissions | access | leftovers | /leftovers/_doc/doc517 | `{"index": {"_index": "leftovers", "_id": "doc517" }}` | -``` \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java index 226b858b9..0ea6d409e 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/java/org/opensearch/migrations/transform/TypeMappingsSanitizationTransformer.java @@ -49,7 +49,7 @@ public TypeMappingsSanitizationTransformer( // types of patterns are being used. // This regex says, match the type part and reduce it to nothing, leave the index part untouched. var regexIndexMappings = Optional.ofNullable(regexIndexMappingsIncoming) - .orElseGet(() -> (indexMappingsIncoming == null ? List.of(List.of("", ".*", "")) : List.of())); + .orElseGet(() -> (indexMappingsIncoming == null ? List.of(List.of("(.*)", "(.*)", "\\1_\\2")) : List.of())); return incomingJson -> Map.of("source_document", incomingJson, "index_mappings", indexMappings, diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 index 6fc665bb2..97475c5be 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteDocumentRequest.j2 @@ -9,7 +9,7 @@ { "method": "{{ input_map.request.method }}", "URI": "/{{ target_index }}/_doc/{{ match.group3 }}", - "preserveWhenMissing": ["headers","payload"] + "preserveWhenMissing": "*" } {%- endif -%} {%- endmacro -%} diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 index f0606d83f..150f6d1a9 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/main/resources/jinjava/typeMappings/rewriteIndexForTarget.j2 @@ -15,10 +15,14 @@ {%- endmacro -%} {%- macro convert_source_index_to_target(source_index, source_type, index_mappings, regex_index_mappings) -%} - {%- set ns = namespace(target_index=none) -%} - {%- set ns.target_index = (index_mappings[source_index] | default({}))[source_type] -%} - {%- if ns.target_index is none -%} - {%- set ns.target_index = convert_source_index_to_target_via_regex(source_index, source_type, regex_index_mappings) -%} + {%- if source_type == "_doc" -%} + {{- source_index -}} + {%- else -%} + {%- set ns = namespace(target_index=none) -%} + {%- set ns.target_index = (index_mappings[source_index] | default({}))[source_type] -%} + {%- if ns.target_index is none -%} + {%- set ns.target_index = convert_source_index_to_target_via_regex(source_index, source_type, regex_index_mappings) -%} + {%- endif -%} + {{- ns.target_index -}} {%- endif -%} - {{- ns.target_index -}} {%- endmacro -%} \ No newline at end of file diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationDocBackfillTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationDocBackfillTest.java index be9d53909..7318d25c9 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationDocBackfillTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformer/src/test/java/org/opensearch/migrations/transform/TypeMappingsSanitizationDocBackfillTest.java @@ -1,7 +1,6 @@ package org.opensearch.migrations.transform; import java.util.LinkedHashMap; -import java.util.List; import org.opensearch.migrations.testutils.JsonNormalizer; @@ -23,13 +22,12 @@ public void test() throws Exception { "}"; var expectedString = "{\n" + - " \"index\": { \"_index\": \"network\", \"_id\": \"1\" },\n" + + " \"index\": { \"_index\": \"performance_network\", \"_id\": \"1\" },\n" + " \"source\": { \"field1\": \"value1\" }\n" + "}"; - var regexIndexMappings = List.of(List.of(".*", "", "")); - var indexTypeMappingRewriter = new TypeMappingsSanitizationTransformer(null, regexIndexMappings); + var indexTypeMappingRewriter = new TypeMappingsSanitizationTransformer(null, null); var resultObj = indexTypeMappingRewriter.transformJson(OBJECT_MAPPER.readValue(testString, LinkedHashMap.class)); log.atInfo().setMessage("resultStr = {}").addArgument(() -> { try { diff --git a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java index f8f576298..d2500e656 100644 --- a/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java +++ b/transformation/transformationPlugins/jsonMessageTransformers/jsonTypeMappingsSanitizationTransformerProvider/src/test/java/org/opensearch/migrations/replay/TypeMappingsSanitizationProviderTest.java @@ -31,18 +31,18 @@ public class TypeMappingsSanitizationProviderTest { public void testSimpleTransform() throws JsonProcessingException { var config = Map.of("staticMappings", Map.of( - "indexA", Map.of( - "type1", "indexA_1", - "type2", "indexA_2"), - "indexB", Map.of( - "type1", "indexB", - "type2", "indexB"), - "indexC", Map.of( - "type2", "indexC")), + "indexa", Map.of( + "type1", "indexa_1", + "type2", "indexa_2"), + "indexb", Map.of( + "type1", "indexb", + "type2", "indexb"), + "indexc", Map.of( + "type2", "indexc")), "regexMappings", List.of(List.of("(time.*)", "(type.*)", "\\1_And_\\2"))); final String TEST_INPUT_REQUEST = "{\n" + " \"method\": \"PUT\",\n" - + " \"URI\": \"/indexA/type2/someuser\",\n" + + " \"URI\": \"/indexa/type2/someuser\",\n" + " \"headers\": {\n" + " \"host\": \"127.0.0.1\"\n" + " },\n" @@ -56,7 +56,7 @@ public void testSimpleTransform() throws JsonProcessingException { + "}\n"; final String EXPECTED = "{\n" + " \"method\": \"PUT\",\n" - + " \"URI\": \"/indexA_2/_doc/someuser\",\n" + + " \"URI\": \"/indexa_2/_doc/someuser\",\n" + " \"headers\": {\n" + " \"host\": \"127.0.0.1\"\n" + " },\n" @@ -82,8 +82,8 @@ public void testSimpleTransform() throws JsonProcessingException { Assertions.assertEquals( JsonNormalizer.fromString( EXPECTED.replace( - "/indexA_2/_doc/someuser", - "/indexA/_doc/someuser")), + "/indexa_2/_doc/someuser", + "/indexa_type2/_doc/someuser")), JsonNormalizer.fromObject(resultFromNullConfig)); } }