org.dswarm.graph.gdm.test.GDMResource3Test.java Source code

Java tutorial

Introduction

Here is the source code for org.dswarm.graph.gdm.test.GDMResource3Test.java

Source

/**
 * This file is part of d:swarm graph extension.
 *
 * d:swarm graph extension is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * d:swarm graph extension is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with d:swarm graph extension.  If not, see <http://www.gnu.org/licenses/>.
 */
package org.dswarm.graph.gdm.test;

import java.io.BufferedInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.net.URL;
import java.util.Iterator;
import java.util.Optional;

import javax.ws.rs.core.MediaType;

import com.fasterxml.jackson.databind.ObjectMapper;
import com.fasterxml.jackson.databind.SerializationFeature;
import com.fasterxml.jackson.databind.node.ArrayNode;
import com.fasterxml.jackson.databind.node.ObjectNode;
import com.google.common.io.ByteSource;
import com.google.common.io.Resources;
import com.sun.jersey.api.client.ClientResponse;
import com.sun.jersey.multipart.BodyPart;
import com.sun.jersey.multipart.MultiPart;
import org.junit.Assert;
import org.junit.Ignore;
import org.junit.Test;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import rx.Observable;

import org.dswarm.common.DMPStatics;
import org.dswarm.graph.json.stream.ModelParser;
import org.dswarm.graph.json.util.Util;
import org.dswarm.graph.test.Neo4jDBWrapper;

/**
 * @author tgaengler
 */
public abstract class GDMResource3Test extends BaseGDMResourceTest {

    private static final Logger LOG = LoggerFactory.getLogger(GDMResource3Test.class);

    public GDMResource3Test(final Neo4jDBWrapper neo4jDBWrapper, final String dbTypeArg) {

        super(neo4jDBWrapper, dbTypeArg);
    }

    @Ignore
    @Test
    public void mabxmlVersioningTest() throws IOException {

        final ObjectNode requestJson = getMABXMLContentSchema();

        // 157, 149
        readGDMFromDBThatWasWrittenAsGDM(Optional.of(requestJson), "versioning/mabxml_dmp.gson",
                "versioning/mabxml_dmp2.gson", "http://data.slub-dresden.de/resources/1",
                "http://www.ddb.de/professionell/mabxml/mabxml-1.xsd#datensatzType", 157, 149, false,
                Optional.empty());
    }

    @Test
    public void csvVersioningTest() throws IOException {

        final ObjectNode requestJson = objectMapper.createObjectNode();
        requestJson.put("record_identifier_attribute_path",
                "http://data.slub-dresden.de/resources/1/schema#EBL+ID");

        readGDMFromDBThatWasWrittenAsGDM(Optional.of(requestJson),
                "versioning/Testtitel_MDunitz-US-TitleSummaryReport132968_01.csv.gson",
                "versioning/Testtitel_MDunitz-US-TitleSummaryReport132968_02.csv.gson",
                "http://data.slub-dresden.de/resources/2",
                "http://data.slub-dresden.de/resources/1/schema#RecordType", 36, 35, false, Optional.empty());
    }

    /**
     * no changes are between the data models
     *
     * @throws IOException
     */
    @Test
    public void csvVersioning01Test2() throws IOException {

        final ObjectNode requestJson = objectMapper.createObjectNode();
        requestJson.put("record_identifier_attribute_path",
                "http://data.slub-dresden.de/resources/1/schema#EZB-Id");

        readGDMFromDBThatWasWrittenAsGDM(Optional.of(requestJson), "versioning/lic_dmp_01_v1.csv.gson",
                "versioning/lic_dmp_01_v2.csv.gson", "http://data.slub-dresden.de/resources/9",
                "http://data.slub-dresden.de/resources/1/schema#RecordType", 23, 23, false, Optional.empty());
    }

    /**
     * one record is missing in the updated data model
     *
     * @throws IOException
     */
    @Ignore
    @Test
    public void csvVersioning02Test2() throws IOException {

        final ObjectNode requestJson = objectMapper.createObjectNode();
        requestJson.put("record_identifier_attribute_path",
                "http://data.slub-dresden.de/resources/1/schema#EZB-Id");

        readGDMFromDBThatWasWrittenAsGDM(Optional.of(requestJson), "versioning/lic_dmp_02_v1.csv.gson",
                "versioning/lic_dmp_02_v2.csv.gson", "http://data.slub-dresden.de/resources/10",
                "http://data.slub-dresden.de/resources/1/schema#RecordType", 46, 69, true,
                Optional.of("http://data.slub-dresden.de/resources/1/schema#RecordType"));
    }

    @Ignore
    @Test
    public void csvVersioningTest2() throws IOException {

        final ObjectNode requestJson = objectMapper.createObjectNode();
        requestJson.put("record_identifier_attribute_path",
                "http://data.slub-dresden.de/resources/1/schema#EZB-Id");

        readGDMFromDBThatWasWrittenAsGDM(Optional.of(requestJson), "versioning/lic_dmp_v1.csv.gson",
                "versioning/lic_dmp_v2.csv.gson", "http://data.slub-dresden.de/resources/8",
                "http://data.slub-dresden.de/resources/1/schema#RecordType", 759, 621, true,
                Optional.of("http://data.slub-dresden.de/resources/1/schema#RecordType"));
    }

    /**
     * without content schema + makes use of record URI as record identifier
     *
     * @throws IOException
     */
    @Ignore
    @Test
    public void csvVersioningTest3() throws IOException {

        readGDMFromDBThatWasWrittenAsGDM(Optional.empty(), "versioning/csv.gdm.v1.json",
                "versioning/csv.gdm.v2.json", "http://data.slub-dresden.de/resources/18",
                "http://data.slub-dresden.de/resources/1/schema#RecordType", 107, 113, true,
                Optional.of("http://data.slub-dresden.de/resources/1/schema#RecordType"));
    }

    @Test
    public void selectedMabxmlVersioning01Test() throws IOException {

        final ObjectNode requestJson = getMABXMLContentSchema();

        readGDMFromDBThatWasWrittenAsGDM(Optional.of(requestJson),
                "versioning/selectedOriginalsDump2011_01_v1.xml.gson", "versioning/selectedUpdates_01_v2.xml.gson",
                "http://data.slub-dresden.de/resources/3",
                "http://www.ddb.de/professionell/mabxml/mabxml-1.xsd#datensatzType", 113, 95, false,
                Optional.empty());
    }

    @Test
    public void selectedMabxmlVersioning02Test() throws IOException {

        final ObjectNode requestJson = getMABXMLContentSchema();

        readGDMFromDBThatWasWrittenAsGDM(Optional.of(requestJson),
                "versioning/selectedOriginalsDump2011_02_v1.xml.gson", "versioning/selectedUpdates_02_v2.xml.gson",
                "http://data.slub-dresden.de/resources/4",
                "http://www.ddb.de/professionell/mabxml/mabxml-1.xsd#datensatzType", 75, 55, false,
                Optional.empty());
    }

    @Test
    public void selectedMabxmlVersioning03Test() throws IOException {

        final ObjectNode requestJson = getMABXMLContentSchema();

        readGDMFromDBThatWasWrittenAsGDM(Optional.of(requestJson),
                "versioning/selectedOriginalsDump2011_03_v1.xml.gson", "versioning/selectedUpdates_03_v2.xml.gson",
                "http://data.slub-dresden.de/resources/5",
                "http://www.ddb.de/professionell/mabxml/mabxml-1.xsd#datensatzType", 223, 180, false,
                Optional.empty());
    }

    @Test
    public void selectedMabxmlVersioning04Test() throws IOException {

        final ObjectNode requestJson = getMABXMLContentSchema();

        readGDMFromDBThatWasWrittenAsGDM(Optional.of(requestJson),
                "versioning/selectedOriginalsDump2011_04_v1.xml.gson", "versioning/selectedUpdates_04_v2.xml.gson",
                "http://data.slub-dresden.de/resources/6",
                "http://www.ddb.de/professionell/mabxml/mabxml-1.xsd#datensatzType", 423, 310, false,
                Optional.empty());
    }

    @Ignore
    @Test
    public void selectedMabxmlVersioningTest() throws IOException {

        final ObjectNode requestJson = getMABXMLContentSchema();

        readGDMFromDBThatWasWrittenAsGDM(Optional.of(requestJson),
                "versioning/selectedOriginalsDump2011_v1.xml.gson", "versioning/selectedUpdates_v2.xml.gson",
                "http://data.slub-dresden.de/resources/7",
                "http://www.ddb.de/professionell/mabxml/mabxml-1.xsd#datensatzType", 834, 640, false,
                Optional.empty());
    }

    private void readGDMFromDBThatWasWrittenAsGDM(final Optional<ObjectNode> optionalContentSchemaRequestJSON,
            final String resourcePathV1, final String resourcePathV2, final String dataModelURI,
            final String recordClassURI, final long statementCountCurrentVersion, final long statementCountV1,
            final boolean deprecateMissingRecords, final Optional<String> optionalRecordClassUri)
            throws IOException {

        LOG.debug("start read test for GDM resource at {} DB", dbType);

        writeGDMToDBInternal(dataModelURI, resourcePathV1);
        writeGDMToDBInternalWithContentSchema(resourcePathV2, dataModelURI, optionalContentSchemaRequestJSON,
                deprecateMissingRecords, optionalRecordClassUri);

        final ObjectMapper objectMapper = Util.getJSONObjectMapper();
        objectMapper.enable(SerializationFeature.INDENT_OUTPUT);
        final ObjectNode requestJson = objectMapper.createObjectNode();

        requestJson.put(DMPStatics.RECORD_CLASS_URI_IDENTIFIER, recordClassURI);
        requestJson.put(DMPStatics.DATA_MODEL_URI_IDENTIFIER, dataModelURI);

        final String requestJsonString = objectMapper.writeValueAsString(requestJson);

        // POST the request
        final ClientResponse response = target().path("/get").type(MediaType.APPLICATION_JSON_TYPE)
                .accept(MediaType.APPLICATION_JSON).post(ClientResponse.class, requestJsonString);

        Assert.assertEquals("expected 200", 200, response.getStatus());

        final InputStream actualResult = response.getEntity(InputStream.class);
        final BufferedInputStream bis = new BufferedInputStream(actualResult, 1024);
        final ModelParser modelParser = new ModelParser(bis);
        final org.dswarm.graph.json.Model model = new org.dswarm.graph.json.Model();

        final Observable<Void> parseObservable = modelParser.parse().map(resource1 -> {

            model.addResource(resource1);

            return null;
        });

        final Iterator<Void> iterator = parseObservable.toBlocking().getIterator();

        Assert.assertTrue(iterator.hasNext());

        while (iterator.hasNext()) {

            iterator.next();
        }

        bis.close();
        actualResult.close();

        LOG.debug("read '{}' statements", model.size());

        Assert.assertEquals("the number of statements should be " + statementCountCurrentVersion,
                statementCountCurrentVersion, model.size());

        // read first version
        final ObjectNode requestJson2 = objectMapper.createObjectNode();

        requestJson2.put(DMPStatics.RECORD_CLASS_URI_IDENTIFIER, recordClassURI);
        requestJson2.put(DMPStatics.DATA_MODEL_URI_IDENTIFIER, dataModelURI);
        requestJson2.put(DMPStatics.VERSION_IDENTIFIER, 1);

        final String requestJsonString2 = objectMapper.writeValueAsString(requestJson2);

        // POST the request
        final ClientResponse response2 = target().path("/get").type(MediaType.APPLICATION_JSON_TYPE)
                .accept(MediaType.APPLICATION_JSON).post(ClientResponse.class, requestJsonString2);

        Assert.assertEquals("expected 200", 200, response2.getStatus());

        final InputStream actualResult2 = response2.getEntity(InputStream.class);
        final BufferedInputStream bis2 = new BufferedInputStream(actualResult2, 1024);
        final ModelParser modelParser2 = new ModelParser(bis2);
        final org.dswarm.graph.json.Model model2 = new org.dswarm.graph.json.Model();

        final Observable<Void> parseObservable2 = modelParser2.parse().map(resource1 -> {

            model2.addResource(resource1);

            return null;
        });

        final Iterator<Void> iterator2 = parseObservable2.toBlocking().getIterator();

        Assert.assertTrue(iterator2.hasNext());

        while (iterator2.hasNext()) {

            iterator2.next();
        }

        bis2.close();
        actualResult2.close();

        LOG.debug("read '{}' statements", model2.size());

        Assert.assertEquals("the number of statements should be " + statementCountV1, statementCountV1,
                model2.size());

        LOG.debug("finished read test for GDM resource at {} DB", dbType);
    }

    private void writeGDMToDBInternalWithContentSchema(final String dataResourceFileName, final String dataModelURI,
            final Optional<ObjectNode> optionalContentSchemaRequestJSON, final boolean deprecateMissingRecords,
            final Optional<String> optionalRecordClassUri) throws IOException {

        LOG.debug("start writing GDM statements for GDM resource at {} DB", dbType);

        final URL fileURL = Resources.getResource(dataResourceFileName);
        final ByteSource byteSource = Resources.asByteSource(fileURL);
        final InputStream is = byteSource.openStream();
        final BufferedInputStream bis = new BufferedInputStream(is, 1024);

        final ObjectNode metadata = objectMapper.createObjectNode();
        metadata.put(DMPStatics.DATA_MODEL_URI_IDENTIFIER, dataModelURI);

        if (optionalContentSchemaRequestJSON.isPresent()) {

            metadata.set(DMPStatics.CONTENT_SCHEMA_IDENTIFIER, optionalContentSchemaRequestJSON.get());
        }

        metadata.put(DMPStatics.DEPRECATE_MISSING_RECORDS_IDENTIFIER,
                Boolean.valueOf(deprecateMissingRecords).toString());

        if (optionalRecordClassUri.isPresent()) {

            metadata.put(DMPStatics.RECORD_CLASS_URI_IDENTIFIER, optionalRecordClassUri.get());
        }

        final String requestJsonString = objectMapper.writeValueAsString(metadata);

        // Construct a MultiPart with two body parts
        final MultiPart multiPart = new MultiPart();
        multiPart.bodyPart(new BodyPart(requestJsonString, MediaType.APPLICATION_JSON_TYPE))
                .bodyPart(new BodyPart(bis, MediaType.APPLICATION_OCTET_STREAM_TYPE));

        // POST the request
        final ClientResponse response = target().path("/put").type("multipart/mixed").post(ClientResponse.class,
                multiPart);

        Assert.assertEquals("expected 200", 200, response.getStatus());

        multiPart.close();
        bis.close();
        is.close();

        LOG.debug("finished writing GDM statements for GDM resource at {} DB", dbType);
    }

    private ObjectNode getMABXMLContentSchema() {

        final ObjectNode requestJson = objectMapper.createObjectNode();
        requestJson.put("record_identifier_attribute_path",
                "http://www.ddb.de/professionell/mabxml/mabxml-1.xsd#id");
        final ArrayNode keyAttributePaths = objectMapper.createArrayNode();
        keyAttributePaths.add(
                "http://www.ddb.de/professionell/mabxml/mabxml-1.xsd#feld\u001Ehttp://www.ddb.de/professionell/mabxml/mabxml-1.xsd#nr");
        keyAttributePaths.add(
                "http://www.ddb.de/professionell/mabxml/mabxml-1.xsd#feld\u001Ehttp://www.ddb.de/professionell/mabxml/mabxml-1.xsd#ind");
        requestJson.set("key_attribute_paths", keyAttributePaths);
        requestJson.put("value_attribute_path",
                "http://www.ddb.de/professionell/mabxml/mabxml-1.xsd#feld\u001Ehttp://www.w3.org/1999/02/22-rdf-syntax-ns#value");

        return requestJson;
    }
}