org.apache.solr.common.util.TestJsonRecordReader.java Source code

Java tutorial

Introduction

Here is the source code for org.apache.solr.common.util.TestJsonRecordReader.java

Source

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.solr.common.util;

import java.io.IOException;
import java.io.StringReader;
import java.lang.invoke.MethodHandles;
import java.lang.ref.WeakReference;
import java.util.Arrays;
import java.util.Collections;
import java.util.List;
import java.util.Map;
import java.util.concurrent.atomic.AtomicReference;

import org.apache.commons.lang.StringUtils;
import org.apache.solr.SolrTestCaseJ4;
import org.apache.solr.util.RecordingJSONParser;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

public class TestJsonRecordReader extends SolrTestCaseJ4 {
    private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());

    public void testOneLevelSplit() throws IOException {
        String json = "{\n" + " \"a\":\"A\" ,\n" + " \"b\":[\n" + "     {\"c\":\"C\",\"d\":\"D\" ,\"e\": {\n"
                + "                         \"s\":\"S\",\n" + "                         \"t\":3}},\n"
                + "     {\"c\":\"C1\",\"d\":\"D1\"},\n" + "     {\"c\":\"C2\",\"d\":\"D2\"}\n" + " ]\n" + "}";
        JsonRecordReader streamer = JsonRecordReader.getInst("/b",
                Arrays.asList("a_s:/a", "c_s:/b/c", "d_s:/b/d", "e_s:/b/e/s", "e_i:/b/e/t"));

        List<Map<String, Object>> records = streamer.getAllRecords(new StringReader(json));
        assertEquals(3, records.size());
        assertEquals(3l, ((Map) records.get(0)).get("e_i"));
        assertEquals("D2", ((Map) records.get(2)).get("d_s"));
        assertNull(((Map) records.get(1)).get("e_s"));
        assertNull(((Map) records.get(2)).get("e_s"));
        assertNull(((Map) records.get(1)).get("e_i"));
        assertNull(((Map) records.get(2)).get("e_i"));

        //    All parameters but /b/c is omitted
        streamer = JsonRecordReader.getInst("/b", Arrays.asList("a:/a", "d:/b/d", "s:/b/e/s", "t:/b/e/t"));
        records = streamer.getAllRecords(new StringReader(json));
        for (Map<String, Object> record : records) {
            assertNull(record.get("c"));

        }

        //one nested /b/e/* object is completely ignored
        streamer = JsonRecordReader.getInst("/b", Arrays.asList("a:/a", "c:/b/c", "d:/b/d"));
        records = streamer.getAllRecords(new StringReader(json));
        for (Map<String, Object> record : records) {
            assertNull(record.get("s"));
            assertNull(record.get("t"));
        }

        //nested /b/e/* object is completely ignored even though /b/e is mapped
        streamer = JsonRecordReader.getInst("/b", Arrays.asList("a_s:/a", "c_s:/b/c", "d_s:/b/d", "e:/b/e"

        ));
        records = streamer.getAllRecords(new StringReader(json));
        for (Map<String, Object> record : records) {
            assertNull(record.get("s"));
            assertNull(record.get("t"));
            assertNull(record.get("e"));
        }

        streamer = JsonRecordReader.getInst("/b", Arrays.asList("a_s:/a", "c_s:/b/c", "d_s:/b/d", "/b/e/*"));
        records = streamer.getAllRecords(new StringReader(json));
        assertEquals(3, records.size());
        assertEquals(3l, ((Map) records.get(0)).get("t"));
        assertEquals("S", ((Map) records.get(0)).get("s"));
        assertNull(((Map) records.get(1)).get("s"));
        assertNull(((Map) records.get(2)).get("s"));

    }

    public void testSrcField() throws Exception {
        String json = "{\n" + "  \"id\" : \"123\",\n" + "  \"description\": \"Testing /json/docs srcField 1\",\n"
                + "\n" + "  \"nested_data\" : {\n" + "    \"nested_inside\" : \"check check check 1\"\n" + "  }\n"
                + "}";

        String json2 = " {\n" + "  \"id\" : \"345\",\n" + "  \"payload\": \""
                + StringUtils.repeat("0123456789", 819) + "\",\n"
                + "  \"description\": \"Testing /json/docs srcField 2\",\n" + "\n" + "  \"nested_data\" : {\n"
                + "    \"nested_inside\" : \"check check check 2\"\n" + "  }\n" + "}";

        String json3 = " {\n" + "  \"id\" : \"678\",\n" + "  \"description\": \"Testing /json/docs srcField 3\",\n"
                + "\n" + "  \"nested_data\" : {\n" + "    \"nested_inside\" : \"check check check 3\"\n" + "  }\n"
                + "}";

        JsonRecordReader streamer = JsonRecordReader.getInst("/", Arrays.asList("id:/id"));
        RecordingJSONParser parser = new RecordingJSONParser(new StringReader(json + json2 + json3));

        streamer.streamRecords(parser, new JsonRecordReader.Handler() {
            int count = 0;

            @Override
            public void handle(Map<String, Object> record, String path) {
                count++;
                String buf = parser.getBuf();
                parser.resetBuf();

                Map m = (Map) Utils.fromJSONString(buf);
                if (count == 1) {
                    assertEquals(m.get("id"), "123");
                    assertEquals(m.get("description"), "Testing /json/docs srcField 1");
                    assertEquals(((Map) m.get("nested_data")).get("nested_inside"), "check check check 1");
                }
                if (count++ == 2) {
                    assertEquals(m.get("id"), "345");
                    assertEquals(m.get("description"), "Testing /json/docs srcField 2");
                    assertEquals(((Map) m.get("nested_data")).get("nested_inside"), "check check check 2");
                }
                if (count++ == 3) {
                    assertEquals(m.get("id"), "678");
                    assertEquals(m.get("description"), "Testing /json/docs srcField 3");
                    assertEquals(((Map) m.get("nested_data")).get("nested_inside"), "check check check 3");
                }

            }
        });

    }

    public void testRecursiveWildCard() throws IOException {
        String json = "{\n" + " \"a\":\"A\" ,\n" + " \"b\":[\n" + "     {\"c\":\"C\",\"d\":\"D\" ,\"e\": {\n"
                + "                         \"s\":\"S\",\n"
                + "                         \"t\":3 ,\"u\":{\"v\":3.1234,\"w\":false}}},\n"
                + "     {\"c\":\"C1\",\"d\":\"D1\"},\n" + "     {\"c\":\"C2\",\"d\":\"D2\"}\n" + " ]\n" + "}";
        JsonRecordReader streamer;
        List<Map<String, Object>> records;

        streamer = JsonRecordReader.getInst("/b", Collections.singletonList("/b/**"));
        records = streamer.getAllRecords(new StringReader(json));
        assertEquals(3, records.size());
        assertEquals("records " + records, 3l, ((Map) records.get(0)).get("t"));
        assertEquals("records " + records, "S", ((Map) records.get(0)).get("s"));
        assertEquals("records " + records, 3.1234, ((Map) records.get(0)).get("v"));
        assertEquals("records " + records, false, ((Map) records.get(0)).get("w"));
        for (Map<String, Object> record : records) {
            assertNotNull("records " + records, record.get("c"));
            assertNotNull("records " + records, record.get("d"));
        }

        streamer = JsonRecordReader.getInst("/", Collections.singletonList("/**"));
        records = streamer.getAllRecords(new StringReader(json));
        assertEquals(1, records.size());
        assertEquals(3, ((List) ((Map) records.get(0)).get("c")).size());
        assertEquals(3, ((List) ((Map) records.get(0)).get("d")).size());
        assertEquals("records " + records, 3l, ((Map) records.get(0)).get("t"));
        assertEquals("records " + records, "S", ((Map) records.get(0)).get("s"));
        assertEquals("records " + records, "A", ((Map) records.get(0)).get("a"));
        assertEquals("records " + records, false, ((Map) records.get(0)).get("w"));

    }

    public void testRecursiveWildcard2() throws Exception {
        String json = "{\n" + "  \"first\": \"John\",\n" + "  \"last\": \"Doe\",\n" + "  \"grade\": 8,\n"
                + "  \"exams\": [\n" + "      {\n" + "        \"subject\": \"Maths\",\n"
                + "        \"test\"   : \"term1\",\n" + "        \"marks\":90},\n" + "        {\n"
                + "         \"subject\": \"Biology\",\n" + "         \"test\"   : \"term1\",\n"
                + "         \"marks\":86}\n" + "      ]\n" + "}";

        JsonRecordReader streamer;
        List<Map<String, Object>> records;

        streamer = JsonRecordReader.getInst("/exams", Collections.singletonList("/**"));
        records = streamer.getAllRecords(new StringReader(json));
        assertEquals(2, records.size());
        for (Map<String, Object> record : records) {
            assertEquals(6, record.size());
            assertTrue(record.containsKey("subject"));
            assertTrue(record.containsKey("test"));
            assertTrue(record.containsKey("marks"));
        }

        streamer = JsonRecordReader.getInst("/exams", Collections.singletonList("$FQN:/**"));
        records = streamer.getAllRecords(new StringReader(json));
        assertEquals(2, records.size());
        for (Map<String, Object> record : records) {
            assertEquals(6, record.size());
            assertTrue(record.containsKey("exams.subject"));
            assertTrue(record.containsKey("exams.test"));
            assertTrue(record.containsKey("exams.marks"));
        }

        streamer = JsonRecordReader.getInst("/", Collections.singletonList("txt:/**"));
        records = streamer.getAllRecords(new StringReader(json));
        assertEquals(1, records.size());
        assertEquals(9, ((List) records.get(0).get("txt")).size());

    }

    public void testNestedDocs() throws Exception {
        String json = "{a:{" + "b:{c:d}," + "x:y" + "}}";
        JsonRecordReader streamer = JsonRecordReader.getInst("/|/a/b", Arrays.asList("/a/x", "/a/b/*"));
        streamer.streamRecords(new StringReader(json), (record, path) -> {
            assertEquals(record.get("x"), "y");
            assertEquals(((Map) record.get(null)).get("c"), "d");
        });
        json = "{a:{" + "b:[{c:c1, e:e1},{c:c2, e :e2, d:{p:q}}]," + "x:y" + "}}";
        streamer.streamRecords(new StringReader(json), (record, path) -> {
            assertEquals(record.get("x"), "y");
            List l = (List) record.get(null);
            Map m = (Map) l.get(0);
            assertEquals(m.get("c"), "c1");
            assertEquals(m.get("e"), "e1");
            m = (Map) l.get(1);
            assertEquals(m.get("c"), "c2");
            assertEquals(m.get("e"), "e2");
        });
        streamer = JsonRecordReader.getInst("/|/a/b", Arrays.asList("$FQN:/**"));
        streamer.streamRecords(new StringReader(json), (record, path) -> {
            assertEquals(record.get("a.x"), "y");
            List l = (List) record.get(null);
            Map m = (Map) l.get(0);
            assertEquals(m.get("c"), "c1");
            assertEquals(m.get("e"), "e1");
            m = (Map) l.get(1);
            assertEquals(m.get("c"), "c2");
            assertEquals(m.get("e"), "e2");
            assertEquals(m.get("d.p"), "q");
        });
    }

    public void testNestedJsonWithFloats() throws Exception {

        String json = "{\n" + "        \"a_string\" : \"abc\",\n" + "        \"a_num\" : 2.0,\n"
                + "        \"a\" : {\n" + "                        \"b\" : [\n"
                + "                                {\"id\":\"1\", \"title\" : \"test1\"},\n"
                + "                                {\"id\":\"2\", \"title\" : \"test2\"}\n"
                + "                        ]\n" + "                }\n" + "}\n";

        JsonRecordReader streamer;
        List<Map<String, Object>> records;

        streamer = JsonRecordReader.getInst("/a/b", Collections.singletonList("title_s:/a/b/title"));
        records = streamer.getAllRecords(new StringReader(json));
        assertEquals(2, records.size());
    }

    public void testClearPreviousRecordFields() throws Exception {
        String json = "{\n" + "'first': 'John',\n" + "'exams': [\n"
                + "{'subject': 'Maths', 'test'   : 'term1', 'marks':90},\n"
                + "{'subject': 'Biology', 'test'   : 'term1', 'marks':86}\n" + "]\n" + "}\n" + "{\n"
                + "'first': 'Bob',\n" + "'exams': [\n" + "{'subject': 'Maths', 'test': 'term1', 'marks': 95\n"
                + "}\n" + ",\n" + "{\n" + "'subject': 'Biology', 'test'   : 'term1', 'marks': 92}\n" + "]\n" + "}";

        JsonRecordReader streamer;
        List<Map<String, Object>> records;

        streamer = JsonRecordReader.getInst("/exams", Collections.singletonList("/**"));
        records = streamer.getAllRecords(new StringReader(json));
        assertEquals(4, records.size());

        for (Map<String, Object> record : records) {
            for (Map.Entry<String, Object> e : record.entrySet()) {
                assertFalse(e.getValue() instanceof List);
            }
        }
    }

    public void testArrayOfRootObjects() throws Exception {
        String json = "[{'fieldA':'A1'}, {'fieldB':'B2'}]";
        JsonRecordReader streamer;
        List<Map<String, Object>> records;

        final AtomicReference<WeakReference<String>> ref = new AtomicReference<>();
        streamer = JsonRecordReader.getInst("/", Collections.singletonList("$FQN:/**"));
        streamer.streamRecords(new StringReader(json), (record, path) -> {
            System.gc();
            if (ref.get() != null) {
                assertNull("This reference is still intact :" + ref.get().get(), ref.get().get());
            }
            String fName = record.keySet().iterator().next();
            ref.set(new WeakReference<>(fName));
        });

    }

    public void testAIOOBE() throws IOException {
        String json = "[   {\n" + "      \"taxon_group\" : {\n" + "         \"identifiers\" : {\n"
                + "            \"bioentry_id\" : 1876284,\n" + "            \"namespace\" : \"NCBI\",\n"
                + "            \"primary_id\" : \"AAAAA_ID_19303\",\n" + "            \"version\" : null,\n"
                + "            \"name\" : \"AAAAA_ID_19303\",\n"
                + "            \"description\" : \"Taxon group for NCBI taxon 1286265\",\n"
                + "            \"accession\" : \"AAAAA_ID_19303\"\n" + "         },\n" + "         \"source\" : [\n"
                + "            {\n" + "               \"ID\" : \"AAAAA_ID_19303_0\",\n"
                + "               \"segment_group_serotype\" : \"H3\",\n"
                + "               \"primary_key\" : 11877892,\n" + "               \"name\" : \"segment_group\",\n"
                + "               \"segment_group_NA_subtype\" : \"\",\n"
                + "               \"segmentgroup_sequence_count\" : \"1\",\n"
                + "               \"source_tag\" : \"EMBL/GenBank/SwissProt\",\n"
                + "               \"segment_group_submitter_lab\" : \"Microbiology, Faculty of Medicine Sebelas Maret University, Jl. Ir. Sutami 36A, Surakarta, Jawa Tengah 57126, Indonesia\",\n"
                + "               \"strand\" : \"1\",\n"
                + "               \"segment_group_submission_date\" : \"22-JAN-2013\",\n"
                + "               \"segment_group_HA_subtype\" : \"H3\",\n"
                + "               \"start-end\" : \"1..260\"\n" + "            },\n" + "            {\n"
                + "               \"taxon_group_serotype\" : \"H3\",\n"
                + "               \"taxon_group_sequence_count\" : \"1\",\n"
                + "               \"ID\" : \"AAAAA_ID_19303\",\n" + "               \"primary_key\" : 11877893,\n"
                + "               \"name\" : \"source\",\n" + "               \"db_xref\" : [\n"
                + "                  \"taxon:1286265\"\n" + "               ],\n"
                + "               \"taxon_group_HA_subtype\" : \"H3\",\n"
                + "               \"taxon_group_segment_group_count\" : \"1\",\n"
                + "               \"source_tag\" : \"EMBL/GenBank/SwissProt\",\n"
                + "               \"strand\" : \"1\",\n" + "               \"taxon_group_NA_subtype\" : \"\",\n"
                + "               \"start-end\" : \"1..260\"\n" + "            }\n" + "         ],\n"
                + "         \"segment_groups\" : [\n" + "            {\n" + "               \"identifiers\" : {\n"
                + "                  \"bioentry_id\" : 1876283,\n" + "                  \"namespace\" : \"NCBI\",\n"
                + "                  \"primary_id\" : \"AAAAA_ID_19303_0\",\n"
                + "                  \"version\" : null,\n" + "                  \"name\" : \"AAAAA_ID_19303_0\",\n"
                + "                  \"description\" : \"Segment group 0 for AAAAA_ID_19303 (NCBI taxon 1286265)\",\n"
                + "                  \"accession\" : \"AAAAA_ID_19303_0\"\n" + "               },\n"
                + "               \"source\" : [\n" + "                  {\n"
                + "                     \"ID\" : \"KC513508\",\n"
                + "                     \"primary_key\" : 22483564,\n"
                + "                     \"nucleotide_gi\" : \"451898947\",\n"
                + "                     \"name\" : \"gene\",\n" + "                     \"HA_subtype\" : \"H3\",\n"
                + "                     \"segment\" : \"4\",\n"
                + "                     \"collection_date\" : \"22-Mar-2010\",\n"
                + "                     \"NA_subtype\" : \"N2\",\n" + "                     \"subtype\" : \"H3\",\n"
                + "                     \"source_tag\" : \"EMBL/GenBank/SwissProt\",\n"
                + "                     \"standardized_collection_date\" : \"2010-03-22T00:00:00Z\",\n"
                + "                     \"segment_name\" : \"HA\",\n" + "                     \"strand\" : \"1\",\n"
                + "                     \"serotype\" : \"H3N2\",\n"
                + "                     \"ncbi_accession\" : \"KC513508\",\n"
                + "                     \"start-end\" : \"1..260\"\n" + "                  },\n"
                + "                  {\n" + "                     \"mol_type\" : \"viral cRNA\",\n"
                + "                     \"taxonomy_strain\" : \"A/Surakarta/1/2010\",\n"
                + "                     \"identified_by\" : \"Afiono Agung Prasetyo\",\n"
                + "                     \"HA_subtype\" : \"H3\",\n"
                + "                     \"collection_date\" : \"22-Mar-2010\",\n"
                + "                     \"standardized_collection_date\" : \"2010-03-22T00:00:00Z\",\n"
                + "                     \"strand\" : \"1\",\n" + "                     \"serotype\" : \"H3N2\",\n"
                + "                     \"organism\" : \"Influenza A virus (A/Surakarta/1/2010(H3N2))\",\n"
                + "                     \"country\" : \"Indonesia\",\n"
                + "                     \"primary_key\" : 22483566,\n"
                + "                     \"isolation_source\" : \"nasal and throat swab\",\n"
                + "                     \"collected_by\" : \"Afiono Agung Prasetyo\",\n"
                + "                     \"name\" : \"source\",\n" + "                     \"flu_type\" : \"A\",\n"
                + "                     \"host\" : \"Homo sapiens\",\n" + "                     \"db_xref\" : [\n"
                + "                        \"taxon:1286265\"\n" + "                     ],\n"
                + "                     \"NA_subtype\" : \"N2\",\n"
                + "                     \"strain\" : \"A/Surakarta/1/2010\",\n"
                + "                     \"source_tag\" : \"EMBL/GenBank/SwissProt\",\n"
                + "                     \"start-end\" : \"1..260\"\n" + "                  },\n"
                + "                  {\n" + "                     \"primary_key\" : 22483572,\n"
                + "                     \"name\" : \"standard_host\",\n"
                + "                     \"Host_NCBI_taxon_id\" : \"9605\",\n"
                + "                     \"curation_status_code\" : \"150\",\n"
                + "                     \"curation_date\" : \"2015-01-12\",\n"
                + "                     \"program_version\" : \"v1.1.7\",\n"
                + "                     \"source_tag\" : \"parse_host_v1\",\n"
                + "                     \"strand\" : \"1\",\n"
                + "                     \"curation_status_message\" : \"success, archive and add on next major program revision\",\n"
                + "                     \"start-end\" : \"1..260\",\n"
                + "                     \"curation_status\" : \"true\"\n" + "                  },\n"
                + "                  {\n" + "                     \"primary_key\" : 22483576,\n"
                + "                     \"Location_Lat_Long\" : \"-0.7892749906,113.9213256836\",\n"
                + "                     \"name\" : \"standardized_location\",\n"
                + "                     \"Location_Country_Alpha2\" : \"ID\",\n"
                + "                     \"curation_status_code\" : \"150\",\n"
                + "                     \"curation_date\" : \"2015-01-15\",\n"
                + "                     \"program_version\" : \"v0.1\",\n"
                + "                     \"source_tag\" : \"xxxxx_parse_location_v0\",\n"
                + "                     \"strand\" : \"1\",\n"
                + "                     \"curation_status_message\" : \"success, archive and add on next major program revision\",\n"
                + "                     \"start-end\" : 1,\n"
                + "                     \"curation_status\" : \"true\"\n" + "                  }\n"
                + "               ],\n" + "               \"sequence\" : {\n"
                + "                  \"string\" : \"CCCTTATGATGTGCCGGATTATGCCTCCCTTAGGTCACTAGTTGCCTCATCCGGCACACTGGAGTTTAACAGTGAAAGCTTCAATTGGACTGGAGTCACTCAAAACGGAACAAGCTCTGCTTGCATAAGGAGATCTAATAATAGTTTCTTTAGTAGATTGAATTGGTTGACCCACTTAAACTTCAAATACCCAGCATTGAACGTGACTATGCCAAACAATGAACAATTTGACAAATTGTACATTTGGGGGGTTCACCACC\"\n"
                + "               },\n" + "               \"references\" : [\n" + "                  {\n"
                + "                     \"authors\" : \"Prasetyo,A.A.\",\n"
                + "                     \"location\" : \"Unpublished\",\n"
                + "                     \"title\" : \"Molecular Epidemiology Study of Human Respiratory Virus in Surakarta Indonesia\"\n"
                + "                  },\n" + "                  {\n"
                + "                     \"authors\" : \"Prasetyo,A.A.\",\n"
                + "                     \"location\" : \"Submitted (22-JAN-2013) Microbiology, Faculty of Medicine Sebelas Maret University, Jl. Ir. Sutami 36A, Surakarta, Jawa Tengah 57126, Indonesia\",\n"
                + "                     \"title\" : \"Direct Submission\"\n" + "                  }\n"
                + "               ],\n" + "               \"name\" : \"AAAAA_ID_19303_0\",\n"
                + "               \"segments\" : [\n" + "                  {\n"
                + "                     \"identifiers\" : {\n"
                + "                        \"bioentry_id\" : 1588885,\n"
                + "                        \"namespace\" : \"NCBI\",\n"
                + "                        \"primary_id\" : \"KC513508\",\n"
                + "                        \"version\" : 1,\n"
                + "                        \"name\" : \"KC513508\",\n"
                + "                        \"description\" : \"Influenza A virus (A/Surakarta/1/2010(H3N2)) segment 4 hemagglutinin (HA) gene, partial cds.\",\n"
                + "                        \"accession\" : \"KC513508\"\n" + "                     },\n"
                + "                     \"source\" : [\n" + "                        {\n"
                + "                           \"mol_type\" : \"viral cRNA\",\n"
                + "                           \"identified_by\" : \"Afiono Agung Prasetyo\",\n"
                + "                           \"HA_subtype\" : \"H3\",\n"
                + "                           \"segment\" : \"4\",\n"
                + "                           \"collection_date\" : \"22-Mar-2010\",\n"
                + "                           \"strand\" : \"1\",\n"
                + "                           \"serotype\" : \"H3N2\",\n"
                + "                           \"organism\" : \"Influenza A virus (A/Surakarta/1/2010(H3N2))\",\n"
                + "                           \"country\" : \"Indonesia\",\n"
                + "                           \"primary_key\" : 22511042,\n"
                + "                           \"isolation_source\" : \"nasal and throat swab\",\n"
                + "                           \"collected_by\" : \"Afiono Agung Prasetyo\",\n"
                + "                           \"name\" : \"source\",\n"
                + "                           \"host\" : \"Homo sapiens\",\n"
                + "                           \"NA_subtype\" : \"N2\",\n"
                + "                           \"db_xref\" : [\n"
                + "                              \"taxon:1286265\"\n" + "                           ],\n"
                + "                           \"strain\" : \"A/Surakarta/1/2010\",\n"
                + "                           \"source_tag\" : \"EMBL/GenBank/SwissProt\",\n"
                + "                           \"start-end\" : \"1..260\"\n" + "                        },\n"
                + "                        {\n" + "                           \"primary_key\" : 22511045,\n"
                + "                           \"source_tag\" : \"EMBL/GenBank/SwissProt\",\n"
                + "                           \"gene\" : \"HA\",\n"
                + "                           \"strand\" : \"1\",\n"
                + "                           \"name\" : \"gene\",\n"
                + "                           \"start-end\" : \"1..260\"\n" + "                        },\n"
                + "                        {\n" + "                           \"primary_key\" : 22511046,\n"
                + "                           \"protein_id\" : \"AGF80141.1\",\n"
                + "                           \"gene\" : \"HA\",\n"
                + "                           \"name\" : \"CDS\",\n"
                + "                           \"db_xref\" : [\n"
                + "                              \"GI:451898948\"\n" + "                           ],\n"
                + "                           \"codon_start\" : \"2\",\n"
                + "                           \"source_tag\" : \"EMBL/GenBank/SwissProt\",\n"
                + "                           \"strand\" : \"1\",\n"
                + "                           \"translation\" : \"PYDVPDYASLRSLVASSGTLEFNSESFNWTGVTQNGTSSACIRRSNNSFFSRLNWLTHLNFKYPALNVTMPNNEQFDKLYIWGVHH\",\n"
                + "                           \"product\" : \"hemagglutinin\",\n"
                + "                           \"start-end\" : \"1..260\"\n" + "                        },\n"
                + "                        {\n" + "                           \"primary_key\" : 22511053,\n"
                + "                           \"name\" : \"asdf_typing\",\n"
                + "                           \"segment\" : \"4\",\n"
                + "                           \"flu_type\" : \"A\",\n"
                + "                           \"bitscore\" : \"277.3\",\n"
                + "                           \"full_lineage\" : \"X_XX_XX_XxxxxXxxxx\",\n"
                + "                           \"lineage\" : \"AAAAAAAAAA\",\n"
                + "                           \"curation_date\" : \"2015-01-07\",\n"
                + "                           \"subtype\" : \"H3\",\n"
                + "                           \"program_version\" : \"v2.8.2\",\n"
                + "                           \"source_tag\" : \"some_text_some\",\n"
                + "                           \"Evalue\" : \"4.6e-85\",\n"
                + "                           \"segment_name\" : \"HA\",\n"
                + "                           \"strand\" : \"1\",\n"
                + "                           \"start-end\" : \"1..260\",\n"
                + "                           \"curation_status\" : \"true\"\n" + "                        },\n"
                + "                        {\n" + "                           \"bitscore\" : \"464\",\n"
                + "                           \"subj_location\" : \"342..601\",\n"
                + "                           \"slen\" : \"1701\",\n"
                + "                           \"sseqid\" : \"someID_someID_some\",\n"
                + "                           \"mismatch\" : \"3\",\n"
                + "                           \"strand\" : \"1\",\n"
                + "                           \"qcovs\" : \"100\",\n"
                + "                           \"qlen\" : \"260\",\n"
                + "                           \"qcovhsp\" : \"100\",\n"
                + "                           \"primary_key\" : 22511048,\n"
                + "                           \"pident\" : \"98.85\",\n"
                + "                           \"name\" : \"segtypeAlign\",\n"
                + "                           \"qseqid\" : \"KC513508\",\n"
                + "                           \"gaps\" : \"0\",\n"
                + "                           \"curation_date\" : \"2015-01-15\",\n"
                + "                           \"typing\" : \"A_HA_H3\",\n"
                + "                           \"length\" : \"260\",\n"
                + "                           \"evalue\" : \"2e-132\",\n"
                + "                           \"source_tag\" : \"asdf_asdf_asdfv1\",\n"
                + "                           \"program_version\" : \"v1.1.2\",\n"
                + "                           \"curation_status\" : \"true\",\n"
                + "                           \"start-end\" : \"1..260\",\n"
                + "                           \"gapopen\" : \"0\"\n" + "                        },\n"
                + "                        {\n" + "                           \"primary_key\" : 22511060,\n"
                + "                           \"name\" : \"standard_host\",\n"
                + "                           \"Host_NCBI_taxon_id\" : \"9605\",\n"
                + "                           \"curation_status_code\" : \"150\",\n"
                + "                           \"curation_date\" : \"2015-01-12\",\n"
                + "                           \"program_version\" : \"v1.1.7\",\n"
                + "                           \"source_tag\" : \"parse_host_v1\",\n"
                + "                           \"strand\" : \"1\",\n"
                + "                           \"curation_status_message\" : \"success, archive and add on next major program revision\",\n"
                + "                           \"start-end\" : \"1..260\",\n"
                + "                           \"curation_status\" : \"true\"\n" + "                        },\n"
                + "                        {\n" + "                           \"primary_key\" : 22511052,\n"
                + "                           \"name\" : \"flu_segtype\",\n"
                + "                           \"flu_type\" : \"A\",\n"
                + "                           \"curation_date\" : \"2015-01-15\",\n"
                + "                           \"subtype\" : \"H3\",\n"
                + "                           \"program_version\" : \"v1.1.2\",\n"
                + "                           \"source_tag\" : \"asdf_asdf_asd_v1\",\n"
                + "                           \"strand\" : \"1\",\n"
                + "                           \"segtype\" : \"HA\",\n"
                + "                           \"start-end\" : \"1..260\",\n"
                + "                           \"curation_status\" : \"true\"\n" + "                        },\n"
                + "                        {\n" + "                           \"primary_key\" : 22511056,\n"
                + "                           \"prot_coord\" : \"115..87\",\n"
                + "                           \"name\" : \"exon\",\n"
                + "                           \"curation_date\" : \"2015-01-07\",\n"
                + "                           \"source_tag\" : \"asdf_asdfas_v2\",\n"
                + "                           \"program_version\" : \"v2.8.2\",\n"
                + "                           \"strand\" : \"1\",\n"
                + "                           \"start-end\" : \"2..259\",\n"
                + "                           \"curation_status\" : \"true\"\n" + "                        },\n"
                + "                        {\n" + "                           \"nstart\" : \"2\",\n"
                + "                           \"primary_key\" : 22511058,\n"
                + "                           \"pend\" : \"200\",\n"
                + "                           \"aaseq\" : \"PYDVPDYASLRSLVASSGTLEFNSESFNWTGVTQNGTSSACIRRSNNSFFSRLNWLTHLNFKYPALNVTMPNNEQFDKLYIWGVHH\",\n"
                + "                           \"p_pc_coverage\" : \"15.19\",\n"
                + "                           \"name\" : \"CDS\",\n"
                + "                           \"score\" : \"461\",\n"
                + "                           \"nend\" : \"259\",\n"
                + "                           \"curation_date\" : \"2015-01-07\",\n"
                + "                           \"program_version\" : \"v2.8.2\",\n"
                + "                           \"source_tag\" : \"asdf_asdfas_v2\",\n"
                + "                           \"strand\" : \"1\",\n"
                + "                           \"product\" : \"A_HA_H3\",\n"
                + "                           \"ntlength\" : \"258\",\n"
                + "                           \"start-end\" : \"1..260\",\n"
                + "                           \"curation_status\" : \"true\",\n"
                + "                           \"pstart\" : \"115\"\n" + "                        },\n"
                + "                        {\n" + "                           \"primary_key\" : 22511062,\n"
                + "                           \"Location_Lat_Long\" : \"-0.7892749906,113.9213256836\",\n"
                + "                           \"name\" : \"standardized_location\",\n"
                + "                           \"Location_Country_Alpha2\" : \"ID\",\n"
                + "                           \"curation_status_code\" : \"150\",\n"
                + "                           \"curation_date\" : \"2015-01-15\",\n"
                + "                           \"program_version\" : \"v0.1\",\n"
                + "                           \"source_tag\" : \"asdf_asdf_asdf_asdfn_v0\",\n"
                + "                           \"strand\" : \"1\",\n"
                + "                           \"curation_status_message\" : \"success, archive and add on next major program revision\",\n"
                + "                           \"start-end\" : 1,\n"
                + "                           \"curation_status\" : \"true\"\n" + "                        }\n"
                + "                     ],\n" + "                     \"sequence\" : {\n"
                + "                        \"length\" : 260,\n"
                + "                        \"string\" : \"CCCTTATGATGTGCCGGATTATGCCTCCCTTAGGTCACTAGTTGCCTCATCCGGCACACTGGAGTTTAACAGTGAAAGCTTCAATTGGACTGGAGTCACTCAAAACGGAACAAGCTCTGCTTGCATAAGGAGATCTAATAATAGTTTCTTTAGTAGATTGAATTGGTTGACCCACTTAAACTTCAAATACCCAGCATTGAACGTGACTATGCCAAACAATGAACAATTTGACAAATTGTACATTTGGGGGGTTCACCACC\"\n"
                + "                     },\n" + "                     \"name\" : \"KC513508\",\n"
                + "                     \"annotations\" : {\n" + "                        \"keyword\" : \"\",\n"
                + "                        \"curation_date\" : \"2015-01-03\",\n"
                + "                        \"comment\" : [\n"
                + "                           \"##Assembly-Data-START## Assembly Method :: CLC Main Workbench v. 6.8 Sequencing Technology :: Sanger dideoxy1 sequencing ##Assembly-Data-END## \"\n"
                + "                        ],\n" + "                        \"date_changed\" : \"25-FEB-2013\",\n"
                + "                        \"curation_status\" : \"false\"\n" + "                     }\n"
                + "                  }\n" + "               ],\n" + "               \"annotations\" : {\n"
                + "                  \"keyword\" : \"\",\n"
                + "                  \"curation_date\" : \"2015-01-05\",\n" + "                  \"comment\" : [\n"
                + "                     \"##Assembly-Data-START## Assembly Method :: CLC Main Workbench v. 6.8 Sequencing Technology :: Sanger dideoxy sequencing ##Assembly-Data-END## \"\n"
                + "                  ]\n" + "               }}]}}]";

        RecordingJSONParser parser = new RecordingJSONParser(new StringReader(json));
        JsonRecordReader recordReader = JsonRecordReader.getInst("/", Collections.singletonList("/**"));
        try {
            recordReader.streamRecords(parser, (record, path) -> {
            }); /*don't care*/
        } catch (RuntimeException e) {
            parser.error("").printStackTrace();
            throw e;
        }
    }
}