org.apache.avro.mapred.TestAvroTextOutputFormat.java Source code

Java tutorial

Introduction

Here is the source code for org.apache.avro.mapred.TestAvroTextOutputFormat.java

Source

/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.avro.mapred;

import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;

import java.io.File;
import java.io.UnsupportedEncodingException;
import java.nio.ByteBuffer;

import org.apache.avro.Schema;
import org.apache.avro.file.DataFileReader;
import org.apache.avro.file.DataFileWriter;
import org.apache.avro.generic.GenericDatumReader;
import org.apache.avro.generic.GenericDatumWriter;
import org.apache.avro.io.DatumReader;
import org.apache.avro.io.DatumWriter;
import org.apache.hadoop.io.NullWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapred.RecordWriter;
import org.junit.Test;

public class TestAvroTextOutputFormat {

    private static final String UTF8 = "UTF-8";

    @Test
    public void testAvroTextRecordWriter() throws Exception {
        File file = new File(System.getProperty("test.dir", "."), "writer");
        Schema schema = Schema.create(Schema.Type.BYTES);
        DatumWriter<ByteBuffer> datumWriter = new GenericDatumWriter<ByteBuffer>(schema);
        DataFileWriter<ByteBuffer> fileWriter = new DataFileWriter<ByteBuffer>(datumWriter);
        fileWriter.create(schema, file);
        RecordWriter<Object, Object> rw = new AvroTextOutputFormat<Object, Object>().new AvroTextRecordWriter(
                fileWriter, "\t".getBytes(UTF8));

        rw.write(null, null);
        rw.write(null, NullWritable.get());
        rw.write(NullWritable.get(), null);
        rw.write(NullWritable.get(), NullWritable.get());

        rw.write("k1", null);
        rw.write("k2", NullWritable.get());

        rw.write(null, "v1");
        rw.write(NullWritable.get(), "v2");

        rw.write("k3", "v3");
        rw.write(new Text("k4"), new Text("v4"));

        rw.close(null);

        DatumReader<ByteBuffer> reader = new GenericDatumReader<ByteBuffer>();
        DataFileReader<ByteBuffer> fileReader = new DataFileReader<ByteBuffer>(file, reader);
        assertEquals("k1", asString(fileReader.next()));
        assertEquals("k2", asString(fileReader.next()));
        assertEquals("v1", asString(fileReader.next()));
        assertEquals("v2", asString(fileReader.next()));
        assertEquals("k3\tv3", asString(fileReader.next()));
        assertEquals("k4\tv4", asString(fileReader.next()));
        assertFalse("End", fileReader.hasNext());
    }

    private String asString(ByteBuffer buf) throws UnsupportedEncodingException {
        byte[] b = new byte[buf.remaining()];
        buf.get(b);
        return new String(b, UTF8);
    }

}