Skip to content

Commit

Permalink
[INLONG-11223][SDK] Transform support JSON_VALUE() function (#11269)
Browse files Browse the repository at this point in the history
  • Loading branch information
emptyOVO authored Oct 8, 2024
1 parent eed150f commit 5205340
Show file tree
Hide file tree
Showing 2 changed files with 217 additions and 0 deletions.
Original file line number Diff line number Diff line change
@@ -0,0 +1,70 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.apache.inlong.sdk.transform.process.function;

import org.apache.inlong.sdk.transform.decode.SourceData;
import org.apache.inlong.sdk.transform.process.Context;
import org.apache.inlong.sdk.transform.process.operator.OperatorTools;
import org.apache.inlong.sdk.transform.process.parser.ValueParser;

import com.alibaba.fastjson.JSONException;
import com.alibaba.fastjson.JSONPath;
import net.sf.jsqlparser.expression.Expression;
import net.sf.jsqlparser.expression.Function;

import java.util.List;

/**
 * JsonValueFunction
 * description: JSON_VALUE(jsonValue, path)--Extracts a scalar from a JSON string.
 * Returns null when either argument evaluates to null, when the path is empty, when the JSON text
 * or the path cannot be parsed, or when the path resolves to anything other than a string, a number
 * or a boolean (for example an object, an array, JSON null or a missing key).
 * for example: json_value({"a": 1}, $.a)--return 1
 *              json_value({"person": {"name": "Alice" ,"age": 30}}, $.person.name)--return Alice
 */
@TransformFunction(names = {"json_value"})
public class JsonValueFunction implements ValueParser {

    /** Parser for the first argument: the JSON text to search. */
    private final ValueParser jsonParser;

    /** Parser for the second argument: the JSONPath expression to evaluate. */
    private final ValueParser pathParser;

    /**
     * Builds the two argument parsers from the SQL function call.
     *
     * @param expr the parsed function expression; its first parameter is the JSON text and its
     *             second parameter is the path
     */
    public JsonValueFunction(Function expr) {
        List<Expression> expressions = expr.getParameters().getExpressions();
        this.jsonParser = OperatorTools.buildParser(expressions.get(0));
        this.pathParser = OperatorTools.buildParser(expressions.get(1));
    }

    /**
     * Evaluates the path against the JSON text for one row.
     *
     * @param sourceData the decoded source record
     * @param rowIndex   index of the row being processed
     * @param context    the transform context
     * @return the string form of the scalar found at the path, or null when no scalar is available
     */
    @Override
    public Object parse(SourceData sourceData, int rowIndex, Context context) {
        Object jsonObj = jsonParser.parse(sourceData, rowIndex, context);
        Object pathObj = pathParser.parse(sourceData, rowIndex, context);
        if (jsonObj == null || pathObj == null) {
            return null;
        }
        String path = OperatorTools.parseString(pathObj);
        String json = OperatorTools.parseString(jsonObj);

        if (path.isEmpty()) {
            return null;
        }
        Object res;
        try {
            res = JSONPath.read(json, path);
        } catch (JSONException ignored) {
            // Malformed JSON text or an unparsable path is treated like any other
            // "no scalar found" outcome: the function yields NULL instead of failing the row.
            return null;
        }
        // check if it is a scalar
        if (res instanceof String || res instanceof Number || res instanceof Boolean) {
            return res.toString();
        }
        return null;
    }
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,147 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.apache.inlong.sdk.transform.process.function.string;

import org.apache.inlong.sdk.transform.decode.SourceDecoderFactory;
import org.apache.inlong.sdk.transform.encode.SinkEncoderFactory;
import org.apache.inlong.sdk.transform.pojo.TransformConfig;
import org.apache.inlong.sdk.transform.process.TransformProcessor;

import org.junit.Assert;
import org.junit.Test;

import java.util.HashMap;
import java.util.List;

/**
 * Unit test for the json_value transform function.
 * Every case feeds one '|'-delimited record whose first two fields are bound to string1 (the JSON
 * text) and string2 (the path) by the SQL below, then checks the single encoded output line.
 * NOTE(review): the delimiter and the "result=" key presumably come from csvSource / kvSink in the
 * base class -- confirm there.
 */
public class TestJsonValueFunction extends AbstractFunctionStringTestBase {

    @Test
    public void testJsonValueFunction() throws Exception {
        TransformConfig config = new TransformConfig("select json_value(string1,string2) from source");
        TransformProcessor<String, String> processor = TransformProcessor
                .create(config, SourceDecoderFactory.createCsvDecoder(csvSource),
                        SinkEncoderFactory.createKvEncoder(kvSink));

        // case1: json_value({"a": 1}, $.a)
        assertSingleResult(processor, "{\"a\": 1}|$.a|3|5", "result=1");

        // case2: json_value({"a": null}, $.a)
        assertSingleResult(processor, "{\"a\": null}|$.a|3|5", "result=");

        // case3: json_value({"a": true}, $.b)
        assertSingleResult(processor, "{\"a\": true}|$.b|3|5", "result=");

        // case4: json_value(null, $.a)
        assertSingleResult(processor, "|$.a|3|5", "result=");

        // case5: json_value({"a": true}, null)
        assertSingleResult(processor, "{\"a\": true}||3|5", "result=");

        // case6: json_value({\"person\": {\"name\": \"Alice\" ,\"age\": 30}}, $.person.name)
        assertSingleResult(processor,
                "{\\\"person\\\": {\\\"name\\\": \\\"Alice\\\" ,\\\"age\\\": 30}}|$.person.name|3|5",
                "result=Alice");

        // case7: json_value({\"person\": {\"name\": \"Alice\", \"age\": 30}}, $.person.address)
        assertSingleResult(processor,
                "{\\\"person\\\": {\\\"name\\\": \\\"Alice\\\", \\\"age\\\": 30}}|$.person.address|3|5",
                "result=");

        // case8: json_value({\"person\" : {\"name\" : \"Amy\" }}, $.person.name)
        assertSingleResult(processor,
                "{\\\"person\\\" : {\\\"name\\\" : \\\"Amy\\\" }}|$.person.name|3|5",
                "result=Amy");

        // case9: json_value({\"people\": [{\"name\": \"Alice\"}, {\"name\": \"Bob\"}]}, $.people)
        assertSingleResult(processor,
                "{\\\"people\\\": [{\\\"name\\\": \\\"Alice\\\"}, {\\\"name\\\": \\\"Bob\\\"}]}|$.people|3|5",
                "result=");

        // case10: json_value({\"people\": [{\"name\": \"Alice\"}, {\"name\": \"Bob\"}]}, $.people[2].name)
        assertSingleResult(processor,
                "{\\\"people\\\": [{\\\"name\\\": \\\"Alice\\\"}, {\\\"name\\\": \\\"Bob\\\"}]}|$.people[2].name|3|5",
                "result=");

        // case11: json_value({\"data\": [{\"details\": {\"status\": \"active\"}},
        // {\"details\": {\"status\": \"inactive\"}}]}, $.data[1].details.status)
        assertSingleResult(processor,
                "{\\\"data\\\": [{\\\"details\\\": {\\\"status\\\": \\\"active\\\"}}, " +
                        "{\\\"details\\\": {\\\"status\\\": \\\"inactive\\\"}}]}|$.data[1].details.status|3|5",
                "result=inactive");

        // case12: json_value({\"records\": [{\"id\": 1, \"info\": {\"valid\": true}},
        // {\"id\": 2, \"info\": {\"valid\": false}}]}, $.records[0].info.valid)
        assertSingleResult(processor,
                "{\\\"records\\\": [{\\\"id\\\": 1, \\\"info\\\": {\\\"valid\\\": true}}, " +
                        "{\\\"id\\\": 2, \\\"info\\\": {\\\"valid\\\": false}}]}|$.records[0].info.valid|3|5",
                "result=true");

        // case13: json_value({"data": {"items": [{"id": 1, "details": {"price": 100}},
        // {"id": 2, "details": {"price": 200}}]}}, $.data.items[1].details.discount)
        assertSingleResult(processor,
                "{\"data\": {\"items\": [{\"id\": 1, \"details\": {\"price\": 100}}, " +
                        "{\"id\": 2, \"details\": {\"price\": 200}}]}}|$.data.items[1].details.discount|3|5",
                "result=");

        // case14: json_value({"items": []}, $.items[0])
        assertSingleResult(processor, "{\"items\": []}|$.items[0]|3|5", "result=");

        // case15: json_value({\"list\": [null, {\"name\": \"John\"}]}, $.list[0])
        assertSingleResult(processor,
                "{\\\"list\\\": [null, {\\\"name\\\": \\\"John\\\"}]}|$.list[0]|3|5",
                "result=");

        // case16: json_value({\"list\": [null, {\"name\": \"John\"}]}, $.list[1].name)
        assertSingleResult(processor,
                "{\\\"list\\\": [null, {\\\"name\\\": \\\"John\\\"}]}|$.list[1].name|3|5",
                "result=John");
    }

    /**
     * Transforms one raw record and asserts that exactly one output line equal to
     * {@code expected} is produced.
     *
     * @param processor the processor under test
     * @param record    the raw input record
     * @param expected  the expected single output line
     */
    private void assertSingleResult(TransformProcessor<String, String> processor, String record,
            String expected) throws Exception {
        List<String> lines = processor.transform(record, new HashMap<>());
        Assert.assertEquals(1, lines.size());
        Assert.assertEquals(expected, lines.get(0));
    }
}

0 comments on commit 5205340

Please sign in to comment.