Github_349.java

/*******************************************************************************
 * Copyright 2019 Univocity Software Pty Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 ******************************************************************************/
package com.univocity.parsers.issues.github;


import com.univocity.parsers.common.*;
import com.univocity.parsers.common.record.*;
import com.univocity.parsers.csv.*;
import org.testng.annotations.*;

import java.io.*;
import java.util.*;

import static org.testng.Assert.*;

/**
 * From: https://github.com/univocity/univocity-parsers/issues/349
 *
 * @author Univocity Software Pty Ltd - <a href="mailto:dev@univocity.com">dev@univocity.com</a>
 */
public class Github_349 {

	/** Encoding used both to turn the test input into bytes and to tell the parser how to decode them. */
	private static final String ENCODING = "UTF-8";

	/**
	 * With three distinct headers, every header must map to the value found in its own column.
	 */
	@Test
	public void testNoDuplicates() {
		Map<String, String> parsedRow = parseFirstRow("notduplicate_1,notduplicate_2,notduplicate_3\r\nvalueForFirst,valueForSecond,valueForThird");

		assertEquals(parsedRow.size(), 3);
		assertEquals(parsedRow.get("notduplicate_1"), "valueForFirst");
		assertEquals(parsedRow.get("notduplicate_2"), "valueForSecond");
		assertEquals(parsedRow.get("notduplicate_3"), "valueForThird");
	}

	/**
	 * Two leading columns share the header "duplicate": the map must collapse them into a single entry.
	 * The test deliberately does not pin which of the two values is kept.
	 */
	@Test
	public void duplicatesNotAtEnd() {
		Map<String, String> parsedRow = parseFirstRow("duplicate,duplicate,notduplicate\r\nvalueForFirst,valueForSecond,valueForThird");

		assertEquals(parsedRow.size(), 2);
		assertValueIsOneOf(parsedRow, "duplicate", "valueForFirst", "valueForSecond");
		assertEquals(parsedRow.get("notduplicate"), "valueForThird");
	}

	/**
	 * The duplicated header is also the last one of the header row, i.e. it sits right before the
	 * "\r\n" line separator. The map must still contain exactly two entries.
	 */
	@Test
	public void duplicatesAtEnd() {
		Map<String, String> parsedRow = parseFirstRow("duplicate,notduplicate,duplicate\r\nvalueForFirst,valueForSecond,valueForThird");

		// NOTE(review): a disabled assertion used to sit here that looked up the key "duplicate\r" with the
		// remark "carriage return kept" - presumably the symptom reported in the issue; confirm against the
		// issue thread. The size check below already rules out such an extra key.
		assertEquals(parsedRow.size(), 2);
		assertValueIsOneOf(parsedRow, "duplicate", "valueForFirst", "valueForThird");
		assertEquals(parsedRow.get("notduplicate"), "valueForSecond");
	}

	/**
	 * Parses {@code input}, takes its first record and copies it into a map through
	 * {@link Record#fillFieldMap(Map, String...)}.
	 *
	 * @param input the CSV content, header row first, using "\r\n" as line separator
	 * @return the map populated from the first record
	 */
	private Map<String, String> parseFirstRow(String input) {
		ResultIterator<Record, ParsingContext> iterator = getParsedIteratorForResource(input);
		// Fail with a readable message instead of a NullPointerException further down.
		assertTrue(iterator.hasNext(), "Expected at least one record in the parsed input");

		Record row = iterator.next();
		return row.fillFieldMap(new HashMap<String, String>());
	}

	/**
	 * Asserts that the value stored under {@code key} equals one of the two accepted values.
	 * Comparisons start from the expected constants, so a missing key (null value) is reported
	 * as an assertion failure rather than as a NullPointerException.
	 *
	 * @param row         the map produced from the parsed record
	 * @param key         the header name to look up
	 * @param firstValue  one acceptable value
	 * @param secondValue the other acceptable value
	 */
	private void assertValueIsOneOf(Map<String, String> row, String key, String firstValue, String secondValue) {
		String actual = row.get(key);
		boolean matches = firstValue.equals(actual) || secondValue.equals(actual);
		assertTrue(matches, "Value of '" + key + "' should be '" + firstValue + "' or '" + secondValue + "' but was: " + actual);
	}

	/**
	 * Feeds {@code input} to a freshly configured {@link CsvParser} as a byte stream and returns
	 * the iterator over its records.
	 *
	 * @param input the CSV content to parse
	 * @return an iterator over the records of {@code input}
	 * @throws IllegalStateException if the encoding used by the test is not supported
	 */
	private ResultIterator<Record, ParsingContext> getParsedIteratorForResource(String input) {
		InputStream resource;
		try {
			resource = new ByteArrayInputStream(input.getBytes(ENCODING));
		} catch (UnsupportedEncodingException e) {
			// Only the byte conversion declares a checked exception; parser failures are left to
			// propagate untouched so the test report shows their real type.
			throw new IllegalStateException(e);
		}

		CsvParser parser = new CsvParser(buildSettings());
		return parser.iterateRecords(resource, ENCODING).iterator();
	}

	/**
	 * Builds the parser configuration shared by all tests: header extraction enabled, "\r\n" as
	 * line separator and reading of the input on a separate thread switched off.
	 *
	 * @return the settings to create the parser with
	 */
	private CsvParserSettings buildSettings() {
		CsvParserSettings settings = new CsvParserSettings();
		settings.setReadInputOnSeparateThread(false);
		settings.getFormat().setLineSeparator("\r\n");
		settings.setHeaderExtractionEnabled(true);
		return settings;
	}
}