org.apache.beam.runners.flink.PipelineOptionsTest.java Source code

Java tutorial

Introduction

Here is the source code for org.apache.beam.runners.flink.PipelineOptionsTest.java

Source

/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.beam.runners.flink;

import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertNotNull;
import static org.junit.Assert.assertNull;
import static org.junit.Assert.assertTrue;

import com.fasterxml.jackson.core.JsonGenerator;
import com.fasterxml.jackson.core.JsonParser;
import com.fasterxml.jackson.core.JsonProcessingException;
import com.fasterxml.jackson.databind.DeserializationContext;
import com.fasterxml.jackson.databind.JsonDeserializer;
import com.fasterxml.jackson.databind.JsonSerializer;
import com.fasterxml.jackson.databind.Module;
import com.fasterxml.jackson.databind.SerializerProvider;
import com.fasterxml.jackson.databind.annotation.JsonDeserialize;
import com.fasterxml.jackson.databind.annotation.JsonSerialize;
import com.fasterxml.jackson.databind.module.SimpleModule;
import com.google.auto.service.AutoService;
import java.io.ByteArrayInputStream;
import java.io.ByteArrayOutputStream;
import java.io.IOException;
import java.io.ObjectInputStream;
import java.io.ObjectOutputStream;
import java.util.Collections;
import java.util.HashMap;
import org.apache.beam.runners.flink.translation.utils.SerializedPipelineOptions;
import org.apache.beam.runners.flink.translation.wrappers.streaming.DoFnOperator;
import org.apache.beam.sdk.coders.StringUtf8Coder;
import org.apache.beam.sdk.options.Default;
import org.apache.beam.sdk.options.Description;
import org.apache.beam.sdk.options.PipelineOptions;
import org.apache.beam.sdk.options.PipelineOptionsFactory;
import org.apache.beam.sdk.transforms.DoFn;
import org.apache.beam.sdk.transforms.windowing.GlobalWindow;
import org.apache.beam.sdk.transforms.windowing.PaneInfo;
import org.apache.beam.sdk.util.WindowedValue;
import org.apache.beam.sdk.values.PCollectionView;
import org.apache.beam.sdk.values.TupleTag;
import org.apache.beam.sdk.values.WindowingStrategy;
import org.apache.commons.lang3.SerializationUtils;
import org.apache.flink.api.common.ExecutionConfig;
import org.apache.flink.api.common.typeinfo.TypeHint;
import org.apache.flink.api.common.typeinfo.TypeInformation;
import org.apache.flink.runtime.state.memory.MemoryStateBackend;
import org.apache.flink.streaming.runtime.streamrecord.StreamRecord;
import org.apache.flink.streaming.util.OneInputStreamOperatorTestHarness;
import org.joda.time.Instant;
import org.junit.Assert;
import org.junit.BeforeClass;
import org.junit.Test;

/**
 * Tests for serialization and deserialization of {@link PipelineOptions} in {@link DoFnOperator}.
 */
public class PipelineOptionsTest {

    /**
     * Pipeline options.
     */
    public interface MyOptions extends FlinkPipelineOptions {
        @Description("Bla bla bla")
        @Default.String("Hello")
        String getTestOption();

        void setTestOption(String value);
    }

    private static MyOptions options;
    private static SerializedPipelineOptions serializedOptions;

    private static final String[] args = new String[] { "--testOption=nothing" };

    @BeforeClass
    public static void beforeTest() {
        options = PipelineOptionsFactory.fromArgs(args).as(MyOptions.class);
        serializedOptions = new SerializedPipelineOptions(options);
    }

    @Test
    public void testDeserialization() {
        MyOptions deserializedOptions = serializedOptions.getPipelineOptions().as(MyOptions.class);
        assertEquals("nothing", deserializedOptions.getTestOption());
    }

    @Test
    public void testIgnoredFieldSerialization() {
        FlinkPipelineOptions options = PipelineOptionsFactory.as(FlinkPipelineOptions.class);
        options.setStateBackend(new MemoryStateBackend());

        FlinkPipelineOptions deserialized = new SerializedPipelineOptions(options).getPipelineOptions()
                .as(FlinkPipelineOptions.class);

        assertNull(deserialized.getStateBackend());
    }

    @Test
    public void testEnableMetrics() {
        FlinkPipelineOptions options = PipelineOptionsFactory.as(FlinkPipelineOptions.class);
        options.setEnableMetrics(false);
        assertFalse(options.getEnableMetrics());
    }

    @Test
    public void testCaching() {
        PipelineOptions deserializedOptions = serializedOptions.getPipelineOptions().as(PipelineOptions.class);

        assertNotNull(deserializedOptions);
        assertTrue(deserializedOptions == serializedOptions.getPipelineOptions());
        assertTrue(deserializedOptions == serializedOptions.getPipelineOptions());
        assertTrue(deserializedOptions == serializedOptions.getPipelineOptions());
    }

    @Test(expected = Exception.class)
    public void testNonNull() {
        new SerializedPipelineOptions(null);
    }

    @Test(expected = Exception.class)
    public void parDoBaseClassPipelineOptionsNullTest() {
        DoFnOperator<String, String, String> doFnOperator = new DoFnOperator<>(new TestDoFn(), "stepName",
                WindowedValue.getValueOnlyCoder(StringUtf8Coder.of()), new TupleTag<String>("main-output"),
                Collections.<TupleTag<?>>emptyList(), new DoFnOperator.DefaultOutputManagerFactory<String>(),
                WindowingStrategy.globalDefault(), new HashMap<Integer, PCollectionView<?>>(),
                Collections.<PCollectionView<?>>emptyList(), null, null);

    }

    /**
     * Tests that PipelineOptions are present after serialization.
     */
    @Test
    public void parDoBaseClassPipelineOptionsSerializationTest() throws Exception {

        DoFnOperator<String, String, String> doFnOperator = new DoFnOperator<>(new TestDoFn(), "stepName",
                WindowedValue.getValueOnlyCoder(StringUtf8Coder.of()), new TupleTag<String>("main-output"),
                Collections.<TupleTag<?>>emptyList(), new DoFnOperator.DefaultOutputManagerFactory<String>(),
                WindowingStrategy.globalDefault(), new HashMap<Integer, PCollectionView<?>>(),
                Collections.<PCollectionView<?>>emptyList(), options, null);

        final byte[] serialized = SerializationUtils.serialize(doFnOperator);

        @SuppressWarnings("unchecked")
        DoFnOperator<Object, Object, Object> deserialized = (DoFnOperator<Object, Object, Object>) SerializationUtils
                .deserialize(serialized);

        TypeInformation<WindowedValue<Object>> typeInformation = TypeInformation
                .of(new TypeHint<WindowedValue<Object>>() {
                });

        OneInputStreamOperatorTestHarness<WindowedValue<Object>, Object> testHarness = new OneInputStreamOperatorTestHarness<>(
                deserialized, typeInformation.createSerializer(new ExecutionConfig()));

        testHarness.open();

        // execute once to access options
        testHarness.processElement(new StreamRecord<>(
                WindowedValue.of(new Object(), Instant.now(), GlobalWindow.INSTANCE, PaneInfo.NO_FIRING)));

        testHarness.close();

    }

    @Test
    public void testExternalizedCheckpointsConfigs() {
        String[] args = new String[] { "--externalizedCheckpointsEnabled=true",
                "--retainExternalizedCheckpointsOnCancellation=false" };
        final FlinkPipelineOptions options = PipelineOptionsFactory.fromArgs(args).as(FlinkPipelineOptions.class);
        assertEquals(options.isExternalizedCheckpointsEnabled(), true);
        assertEquals(options.getRetainExternalizedCheckpointsOnCancellation(), false);
    }

    private static class TestDoFn extends DoFn<String, String> {

        @ProcessElement
        public void processElement(ProcessContext c) throws Exception {
            Assert.assertNotNull(c.getPipelineOptions());
            Assert.assertEquals(options.getTestOption(),
                    c.getPipelineOptions().as(MyOptions.class).getTestOption());
        }
    }

    /** PipelineOptions used to test auto registration of Jackson modules. */
    public interface JacksonIncompatibleOptions extends PipelineOptions {
        JacksonIncompatible getJacksonIncompatible();

        void setJacksonIncompatible(JacksonIncompatible value);
    }

    /** A Jackson {@link Module} to test auto-registration of modules. */
    @AutoService(Module.class)
    public static class RegisteredTestModule extends SimpleModule {
        public RegisteredTestModule() {
            super("RegisteredTestModule");
            setMixInAnnotation(JacksonIncompatible.class, JacksonIncompatibleMixin.class);
        }
    }

    /** A class which Jackson does not know how to serialize/deserialize. */
    public static class JacksonIncompatible {
        private final String value;

        public JacksonIncompatible(String value) {
            this.value = value;
        }
    }

    /** A Jackson mixin used to add annotations to other classes. */
    @JsonDeserialize(using = JacksonIncompatibleDeserializer.class)
    @JsonSerialize(using = JacksonIncompatibleSerializer.class)
    public static final class JacksonIncompatibleMixin {
    }

    /** A Jackson deserializer for {@link JacksonIncompatible}. */
    public static class JacksonIncompatibleDeserializer extends JsonDeserializer<JacksonIncompatible> {

        @Override
        public JacksonIncompatible deserialize(JsonParser jsonParser, DeserializationContext deserializationContext)
                throws IOException, JsonProcessingException {
            return new JacksonIncompatible(jsonParser.readValueAs(String.class));
        }
    }

    /** A Jackson serializer for {@link JacksonIncompatible}. */
    public static class JacksonIncompatibleSerializer extends JsonSerializer<JacksonIncompatible> {

        @Override
        public void serialize(JacksonIncompatible jacksonIncompatible, JsonGenerator jsonGenerator,
                SerializerProvider serializerProvider) throws IOException, JsonProcessingException {
            jsonGenerator.writeString(jacksonIncompatible.value);
        }
    }

    @Test
    public void testSerializingPipelineOptionsWithCustomUserType() throws Exception {
        String expectedValue = "testValue";
        PipelineOptions options = PipelineOptionsFactory.fromArgs("--jacksonIncompatible=\"" + expectedValue + "\"")
                .as(JacksonIncompatibleOptions.class);
        SerializedPipelineOptions context = new SerializedPipelineOptions(options);

        ByteArrayOutputStream baos = new ByteArrayOutputStream();
        try (ObjectOutputStream outputStream = new ObjectOutputStream(baos)) {
            outputStream.writeObject(context);
        }
        try (ObjectInputStream inputStream = new ObjectInputStream(new ByteArrayInputStream(baos.toByteArray()))) {
            SerializedPipelineOptions copy = (SerializedPipelineOptions) inputStream.readObject();
            assertEquals(expectedValue,
                    copy.getPipelineOptions().as(JacksonIncompatibleOptions.class).getJacksonIncompatible().value);
        }
    }
}