/* * Copyright 2017 StreamSets Inc. * * Licensed under the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.streamsets.pipeline.lib.parser.json; import com.google.common.base.Strings; import com.google.common.collect.ImmutableList; import com.streamsets.pipeline.api.OnRecordError; import com.streamsets.pipeline.api.Stage; import com.streamsets.pipeline.api.ext.io.CountingReader; import com.streamsets.pipeline.api.ext.io.ObjectLengthException; import com.streamsets.pipeline.api.ext.io.OverrunException; import com.streamsets.pipeline.api.ext.io.OverrunReader; import com.streamsets.pipeline.api.ext.json.Mode; import com.streamsets.pipeline.lib.json.OverrunStreamingJsonParser; import com.streamsets.pipeline.lib.json.StreamingJsonParser; import com.streamsets.pipeline.sdk.ContextInfoCreator; import org.junit.After; import org.junit.Assert; import org.junit.Before; import org.junit.Test; import java.io.InputStream; import java.io.InputStreamReader; import java.io.StringReader; import java.util.Collections; import java.util.List; public class TestOverrunStreamingJsonParser { @Before public void setUp() { System.getProperties().remove(OverrunReader.READ_LIMIT_SYS_PROP); } @After public void cleanUp() { setUp(); } private CountingReader getJsonReader(String name) throws Exception { InputStream is = Thread.currentThread().getContextClassLoader().getResourceAsStream(name); return (is != null) ? new CountingReader(new InputStreamReader(is)) : null; } private Stage.Context getContext() { return ContextInfoCreator.createSourceContext("i", false, OnRecordError.TO_ERROR, Collections.emptyList()); } // Parser level overrun, Array @Test public void testArrayOfObjects() throws Exception { StreamingJsonParser parser = new OverrunStreamingJsonParser( getContext(), getJsonReader("TestOverrunStreamingJsonParser-arrayOfObjects.json"), Mode.ARRAY_OBJECTS, 50); List a1 = (List) parser.read(); Assert.assertNotNull(a1); try { parser.read(); Assert.fail(); } catch (ObjectLengthException ex) { //NOP } List a2 = (List) parser.read(); Assert.assertNotNull(a2); Assert.assertNull(parser.read()); Assert.assertEquals(ImmutableList.of("a", "A"), a1); Assert.assertEquals(ImmutableList.of("b", "B"), a2); } // Parser level overrun, Objects @Test public void testMultipleObjects() throws Exception { StreamingJsonParser parser = new OverrunStreamingJsonParser( getContext(), getJsonReader("TestOverrunStreamingJsonParser-multipleObjects.json"), Mode.MULTIPLE_OBJECTS, 50); List a1 = (List) parser.read(); Assert.assertNotNull(a1); try { parser.read(); Assert.fail(); } catch (ObjectLengthException ex) { //NOP } List a2 = (List) parser.read(); Assert.assertNotNull(a2); Assert.assertNull(parser.read()); Assert.assertEquals(ImmutableList.of("a", "A"), a1); Assert.assertEquals(ImmutableList.of("b", "B"), a2); } // Stream level overrun, Array public void testStreamLevelOverrunArray(boolean attemptNextRead) throws Exception { System.setProperty(OverrunReader.READ_LIMIT_SYS_PROP, "10000"); String json = "[[\"a\"],[\"" + Strings.repeat("a", 20000) + "\"],[\"b\"]]"; StreamingJsonParser parser = new OverrunStreamingJsonParser(getContext(), new CountingReader(new StringReader(json)), Mode.ARRAY_OBJECTS, 50); List a1 = (List) parser.read(); Assert.assertNotNull(a1); Assert.assertEquals(ImmutableList.of("a"), a1); if (!attemptNextRead) { parser.read(); } else { try { parser.read(); } catch (OverrunException ex) { //NOP } parser.read(); } } @Test(expected = OverrunException.class) public void testStreamLevelOverrunArray() throws Exception { testStreamLevelOverrunArray(false); } @Test(expected = IllegalStateException.class) public void testStreamLevelOverrunArrayAttemptNextRead() throws Exception { testStreamLevelOverrunArray(true); } // Stream level overrun, Object public void testStreamLevelOverrunMultipleObjects(boolean attemptNextRead) throws Exception { System.setProperty(OverrunReader.READ_LIMIT_SYS_PROP, "10000"); String json = "[\"a\"][\"" + Strings.repeat("a", 20000) + "\"][\"b\"]"; StreamingJsonParser parser = new OverrunStreamingJsonParser(getContext(), new CountingReader(new StringReader(json)), Mode.MULTIPLE_OBJECTS, 50); List a1 = (List) parser.read(); Assert.assertNotNull(a1); Assert.assertEquals(ImmutableList.of("a"), a1); if (!attemptNextRead) { parser.read(); } else { try { parser.read(); } catch (OverrunException ex) { //NOP } parser.read(); } } @Test(expected = OverrunException.class) public void testStreamLevelOverrunMultipleObjects() throws Exception { testStreamLevelOverrunMultipleObjects(false); } @Test(expected = IllegalStateException.class) public void testStreamLevelOverrunMultipleObjectsAttemptNextRead() throws Exception { testStreamLevelOverrunMultipleObjects(true); } @Test public void testFastForwardBeyondOverrunMultipleObjects() throws Exception { System.setProperty(OverrunReader.READ_LIMIT_SYS_PROP, "10000"); String json = "[\"a\"][\"" + Strings.repeat("a", 10000) + "\"][\"b\"]"; json += "[\"a\"][\"" + Strings.repeat("a", 20000) + "\"][\"b\"]"; int initialPos = json.length(); json += "[\"x\"]"; StreamingJsonParser parser = new OverrunStreamingJsonParser(getContext(), new CountingReader(new StringReader(json)), initialPos, Mode.MULTIPLE_OBJECTS, 50); List a1 = (List) parser.read(); Assert.assertNotNull(a1); Assert.assertEquals(ImmutableList.of("x"), a1); } @Test public void testArrayPositionable() throws Exception { StreamingJsonParser parser = new OverrunStreamingJsonParser( getContext(), getJsonReader("TestOverrunStreamingJsonParser-arrayOfObjects.json"), Mode.ARRAY_OBJECTS, 50); List l1 = (List) parser.read(); long firstObjectPos = parser.getReaderPosition(); Assert.assertNotNull(l1); try { parser.read(); Assert.fail(); } catch (ObjectLengthException ex) { //NOP } List l2 = (List) parser.read(); long secondObjectPos = parser.getReaderPosition(); Assert.assertNotNull(l1); Assert.assertNotNull(l2); long lastObjectPos = parser.getReaderPosition(); Assert.assertNotNull(l1); Assert.assertNull(parser.read()); long endPos = parser.getReaderPosition(); Assert.assertNotNull(l1); parser = new OverrunStreamingJsonParser(getContext(), getJsonReader("TestOverrunStreamingJsonParser-arrayOfObjects.json"), firstObjectPos, Mode.ARRAY_OBJECTS, 50); Assert.assertEquals(firstObjectPos, parser.getReaderPosition()); try { parser.read(); Assert.fail(); } catch (ObjectLengthException ex) { //NOP } List l2a = (List) parser.read(); Assert.assertEquals(l2, l2a); Assert.assertEquals(lastObjectPos, parser.getReaderPosition()); Assert.assertNull(parser.read()); Assert.assertEquals(endPos, parser.getReaderPosition()); parser = new OverrunStreamingJsonParser(getContext(), getJsonReader("TestOverrunStreamingJsonParser-arrayOfObjects.json"), secondObjectPos, Mode.ARRAY_OBJECTS, 50); Assert.assertEquals(secondObjectPos, parser.getReaderPosition()); Assert.assertEquals(l2, l2a); Assert.assertEquals(lastObjectPos, parser.getReaderPosition()); Assert.assertNull(parser.read()); Assert.assertEquals(endPos, parser.getReaderPosition()); parser = new OverrunStreamingJsonParser(getContext(), getJsonReader("TestOverrunStreamingJsonParser-arrayOfObjects.json"), lastObjectPos, Mode.ARRAY_OBJECTS, 50); Assert.assertEquals(lastObjectPos, parser.getReaderPosition()); Assert.assertNull(parser.read()); Assert.assertEquals(endPos, parser.getReaderPosition()); parser = new OverrunStreamingJsonParser(getContext(), getJsonReader("TestOverrunStreamingJsonParser-arrayOfObjects.json"), endPos, Mode.ARRAY_OBJECTS, 50); Assert.assertEquals(endPos, parser.getReaderPosition()); Assert.assertNull(parser.read()); Assert.assertEquals(endPos, parser.getReaderPosition()); } @Test public void testMultipleObjectsPositionable() throws Exception { StreamingJsonParser parser = new OverrunStreamingJsonParser(getContext(), getJsonReader("TestOverrunStreamingJsonParser-multipleObjects.json"), Mode.MULTIPLE_OBJECTS, 50); List l1 = (List) parser.read(); long firstObjectPos = parser.getReaderPosition(); Assert.assertNotNull(l1); try { parser.read(); Assert.fail(); } catch (ObjectLengthException ex) { //NOP } List l2 = (List) parser.read(); long secondObjectPos = parser.getReaderPosition(); Assert.assertNotNull(l1); Assert.assertNotNull(l2); long lastObjectPos = parser.getReaderPosition(); Assert.assertNotNull(l1); parser = new OverrunStreamingJsonParser(getContext(), getJsonReader("TestOverrunStreamingJsonParser-multipleObjects.json"), firstObjectPos, Mode.MULTIPLE_OBJECTS, 50); Assert.assertEquals(firstObjectPos, parser.getReaderPosition()); try { parser.read(); Assert.fail(); } catch (ObjectLengthException ex) { //NOP } List l2a = (List) parser.read(); Assert.assertEquals(secondObjectPos, parser.getReaderPosition()); Assert.assertEquals(l2, l2a); Assert.assertEquals(lastObjectPos, parser.getReaderPosition()); Assert.assertNull(parser.read()); parser = new OverrunStreamingJsonParser(getContext(), getJsonReader("TestOverrunStreamingJsonParser-multipleObjects.json"), secondObjectPos, Mode.MULTIPLE_OBJECTS, 50); Assert.assertEquals(secondObjectPos, parser.getReaderPosition()); Assert.assertEquals(l2, l2a); Assert.assertEquals(lastObjectPos, parser.getReaderPosition()); Assert.assertNull(parser.read()); parser = new OverrunStreamingJsonParser(getContext(), getJsonReader("TestOverrunStreamingJsonParser-multipleObjects.json"), lastObjectPos, Mode.MULTIPLE_OBJECTS, 50); Assert.assertEquals(lastObjectPos, parser.getReaderPosition()); Assert.assertNull(parser.read()); } }