Skip to content

Commit

Permalink
Merge pull request #640 from data-integrations/fixit-excel-date
Browse files Browse the repository at this point in the history
Fix date type handling when parsing excel files
  • Loading branch information
vanathi-g authored May 22, 2023
2 parents ddf3059 + a7117a3 commit 5886a9f
Show file tree
Hide file tree
Showing 3 changed files with 24 additions and 6 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -42,6 +42,7 @@
import org.apache.poi.hssf.usermodel.HSSFDateUtil;
import org.apache.poi.ss.usermodel.Cell;
import org.apache.poi.ss.usermodel.CellType;
import org.apache.poi.ss.usermodel.DataFormatter;
import org.apache.poi.xssf.usermodel.XSSFSheet;
import org.apache.poi.xssf.usermodel.XSSFWorkbook;
import org.slf4j.Logger;
Expand Down Expand Up @@ -101,6 +102,7 @@ public List<Row> execute(List<Row> records, final ExecutorContext context)
throws DirectiveExecutionException, ErrorRowException {
List<Row> results = new ArrayList<>();
ByteArrayInputStream input = null;
DataFormatter formatter = new DataFormatter();
try {
for (Row record : records) {
int idx = record.find(column);
Expand Down Expand Up @@ -159,25 +161,22 @@ public List<Row> execute(List<Row> records, final ExecutorContext context)
String value = "";
switch (cell.getCellTypeEnum()) {
case STRING:
newRow.add(name, cell.getStringCellValue());
value = cell.getStringCellValue();
break;

case NUMERIC:
if (HSSFDateUtil.isCellDateFormatted(cell)) {
newRow.add(name, cell.getDateCellValue());
value = cell.getDateCellValue().toString();
value = formatter.formatCellValue(cell);
} else {
newRow.add(name, cell.getNumericCellValue());
value = String.valueOf(cell.getNumericCellValue());
}
break;

case BOOLEAN:
newRow.add(name, cell.getBooleanCellValue());
value = String.valueOf(cell.getBooleanCellValue());
break;
}
newRow.add(name, value);

if (rows == 0 && firstRowAsHeader) {
columnNames.put(cell.getAddress().getColumn(), value);
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -67,5 +67,24 @@ public void testNoSheetName() throws Exception {
Assert.assertEquals(1, pipeline.getSecond().size());
}
}
}

@Test
public void testDateFormatting() throws Exception {
try (InputStream stream =
ParseAvroFileTest.class.getClassLoader().getResourceAsStream("date-formats-test-sheet.xlsx")) {
byte[] data = IOUtils.toByteArray(stream);

String[] directives = new String[]{
"parse-as-excel :body '0'",
};

List<Row> rows = new ArrayList<>();
rows.add(new Row("body", data));
List<Row> results = TestingRig.execute(directives, rows);

for (Row result : results) {
Assert.assertEquals(result.getValue("A"), result.getValue("B"));
}
}
}
}
Binary file not shown.

0 comments on commit 5886a9f

Please sign in to comment.