// Github_337.java
/*******************************************************************************
* Copyright 2019 Univocity Software Pty Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
******************************************************************************/
package com.univocity.parsers.issues.github;
import com.univocity.parsers.csv.*;
import org.testng.annotations.*;
import static org.testng.Assert.*;
/**
 * Regression test for https://github.com/univocity/univocity-parsers/issues/337
 *
 * Parses a single CSV line whose quoted values contain delimiters and backslashes,
 * and checks that the same 23 column values come back for every
 * "max chars per column" setting supplied by {@link #maxProvider()}.
 *
 * @author Univocity Software Pty Ltd - <a href="mailto:dev@univocity.com">dev@univocity.com</a>
 */
public class Github_337 {

    /** Column values the parser is expected to produce for the sample line, in order. */
    private static final String[] EXPECTED_COLUMNS = {
            "18/01/2015",
            "c_Pg,%W\\",
            "Ci\\tHpSDgA",
            "!DLBpRjdV,",
            "306",
            "5",
            "!MuhlLqK",
            "SPC_nTA%uZG$",
            "SSC1_Vy\\K\\HEw",
            "SSC2_ktmaDk!b",
            "SSC3_#pbNlkTf",
            "SSC4_a@J\\%dDL",
            "PC_UfKoRZsI",
            "PSC2_oHyn\\hMn",
            "PSC3_\\QvO#,iy",
            "PSC4_x_KwV\\Z?",
            "PSC5_!W\\ZI#l!",
            "61.24",
            "4",
            "5",
            "7",
            "3",
            "False"
    };

    /**
     * Supplies the "max chars per column" values the test runs with.
     *
     * @return one row per test invocation, each holding a single int
     *         (-1 presumably means "no limit" -- confirm against the parser documentation)
     */
    @DataProvider
    public Object[][] maxProvider() {
        Object[][] limits = {
                {-1},
                {1000},
        };
        return limits;
    }

    /**
     * Parses the sample line with the given column-size limit and verifies
     * the number of columns and every individual column value.
     *
     * @param max value passed to {@code setMaxCharsPerColumn}
     */
    @Test(dataProvider = "maxProvider")
    public void testInconsistentParsing(int max) {
        String input = "18/01/2015,\"c_Pg,%W\\\",Ci\\tHpSDgA,\"!DLBpRjdV,\",306,5,!MuhlLqK,SPC_nTA%uZG$,SSC1_Vy\\K\\HEw,SSC2_ktmaDk!b,SSC3_#pbNlkTf,SSC4_a@J\\%dDL,PC_UfKoRZsI,PSC2_oHyn\\hMn,\"PSC3_\\QvO#,iy\",PSC4_x_KwV\\Z?,PSC5_!W\\ZI#l!,61.24,4,5,7,3,False\n";

        CsvParser parser = new CsvParser(buildSettings(max));
        String[] columns = parser.parseLine(input);

        // Check the column count first so a mismatch is reported before any index is read.
        assertEquals(columns.length, EXPECTED_COLUMNS.length);
        for (int i = 0; i < EXPECTED_COLUMNS.length; i++) {
            assertEquals(columns[i], EXPECTED_COLUMNS[i]);
        }
    }

    /** Builds the parser settings used by the test, applying the given column-size limit. */
    private static CsvParserSettings buildSettings(int max) {
        CsvParserSettings parserSettings = new CsvParserSettings();

        // Headers are handled by the caller, not by the parser.
        parserSettings.setHeaderExtractionEnabled(false);
        parserSettings.setReadInputOnSeparateThread(false);
        parserSettings.setInputBufferSize(1024 * 1024);

        // Assume the EOL of the first line indicates what the other lines use as well.
        parserSettings.setLineSeparatorDetectionEnabled(true);
        parserSettings.setUnescapedQuoteHandling(UnescapedQuoteHandling.RAISE_ERROR);
        parserSettings.setMaxCharsPerColumn(max);

        CsvFormat csvFormat = parserSettings.getFormat();
        csvFormat.setDelimiter(',');
        csvFormat.setCharToEscapeQuoteEscaping('\\');

        return parserSettings;
    }
}