RowReaderImpl.java

  1. /*
  2.  * CSVeed (https://github.com/42BV/CSVeed)
  3.  *
  4.  * Copyright 2013-2023 CSVeed.
  5.  *
  6.  * All rights reserved. This program and the accompanying materials
  7.  * are made available under the terms of The Apache Software License,
  8.  * Version 2.0 which accompanies this distribution, and is available at
  9.  * https://www.apache.org/licenses/LICENSE-2.0.txt
  10.  */
  11. package org.csveed.row;

  12. import java.io.IOException;
  13. import java.io.Reader;
  14. import java.util.ArrayList;
  15. import java.util.List;

  16. import org.csveed.api.Header;
  17. import org.csveed.api.Row;
  18. import org.csveed.report.CsvException;
  19. import org.csveed.report.RowError;
  20. import org.csveed.token.ParseException;
  21. import org.csveed.token.ParseStateMachine;

  22. /**
  23.  * Builds up a List of cells (String) per read row. Note that this class is stateful, so it can support a per-row parse
  24.  * approach as well.
  25.  */
  26. public class RowReaderImpl implements RowReader {

  27.     /** The state machine. */
  28.     private ParseStateMachine stateMachine = new ParseStateMachine();

  29.     /** The row instructions. */
  30.     private RowInstructionsImpl rowInstructions;

  31.     /** The max number of columns. */
  32.     private int maxNumberOfColumns = -1;

  33.     /** The header. */
  34.     private HeaderImpl header;

  35.     /** The reader. */
  36.     private Reader reader;

  37.     /**
  38.      * Instantiates a new row reader impl.
  39.      *
  40.      * @param reader
  41.      *            the reader
  42.      */
  43.     public RowReaderImpl(Reader reader) {
  44.         this(reader, new RowInstructionsImpl());
  45.     }

  46.     /**
  47.      * Instantiates a new row reader impl.
  48.      *
  49.      * @param reader
  50.      *            the reader
  51.      * @param instructionsInterface
  52.      *            the instructions interface
  53.      */
  54.     public RowReaderImpl(Reader reader, RowInstructions instructionsInterface) {
  55.         this.reader = reader;
  56.         this.rowInstructions = (RowInstructionsImpl) instructionsInterface;
  57.         stateMachine.setSymbolMapping(rowInstructions.getSymbolMapping());
  58.     }

  59.     @Override
  60.     public List<Row> readRows() {
  61.         List<Row> allRows = new ArrayList<>();
  62.         while (!isFinished()) {
  63.             Row row = readRow();
  64.             if (row != null && row.size() > 0) {
  65.                 allRows.add(row);
  66.             }
  67.         }
  68.         return allRows;
  69.     }

  70.     @Override
  71.     public Row readRow() {
  72.         getHeader();
  73.         Line unmappedLine = readBareLine();
  74.         if (unmappedLine == null) {
  75.             return null;
  76.         }
  77.         checkNumberOfColumns(unmappedLine);
  78.         return new RowImpl(unmappedLine, getHeader());
  79.     }

  80.     @Override
  81.     public int getCurrentLine() {
  82.         return this.stateMachine.getCurrentLine();
  83.     }

  84.     @Override
  85.     public Header getHeader() {
  86.         return header == null && rowInstructions.isUseHeader() ? readHeader() : header;
  87.     }

  88.     /**
  89.      * Gets the max number of columns.
  90.      *
  91.      * @return the max number of columns
  92.      */
  93.     public int getMaxNumberOfColumns() {
  94.         return this.maxNumberOfColumns;
  95.     }

  96.     @Override
  97.     public Header readHeader() {
  98.         if (header != null) {
  99.             return header;
  100.         }
  101.         Line unmappedLine = readBareLine();
  102.         if (unmappedLine == null) {
  103.             return null;
  104.         }
  105.         header = new HeaderImpl(unmappedLine);
  106.         return header;
  107.     }

  108.     /**
  109.      * Check number of columns.
  110.      *
  111.      * @param unmappedLine
  112.      *            the unmapped line
  113.      */
  114.     private void checkNumberOfColumns(Line unmappedLine) {
  115.         if (maxNumberOfColumns == -1) {
  116.             maxNumberOfColumns = header == null ? unmappedLine.size() : header.size();
  117.         }
  118.         if (unmappedLine.size() != maxNumberOfColumns) {
  119.             throw new CsvException(new RowError("The expected number of columns is " + maxNumberOfColumns
  120.                     + ", whereas it was " + unmappedLine.size(), unmappedLine.reportOnEndOfLine(), getCurrentLine()));
  121.         }
  122.     }

  123.     @Override
  124.     public boolean isFinished() {
  125.         return stateMachine.isFinished();
  126.     }

  127.     /**
  128.      * Log settings.
  129.      */
  130.     protected void logSettings() {
  131.         rowInstructions.logSettings();
  132.         this.stateMachine.getSymbolMapping().logSettings();
  133.     }

  134.     /**
  135.      * Read bare line.
  136.      *
  137.      * @return the line
  138.      */
  139.     protected Line readBareLine() {
  140.         logSettings();

  141.         LineWithInfo line = null;
  142.         while (line == null && !stateMachine.isFinished()) {
  143.             line = new LineWithInfo();
  144.             while (!stateMachine.isFinished()) {
  145.                 final String token;
  146.                 final int symbol;
  147.                 try {
  148.                     symbol = reader.read();
  149.                 } catch (IOException err) {
  150.                     throw new RuntimeException(err);
  151.                 }
  152.                 try {
  153.                     token = stateMachine.offerSymbol(symbol);
  154.                 } catch (ParseException e) {
  155.                     throw new CsvException(new RowError(e.getMessage(), line.reportOnEndOfLine(), getCurrentLine()));
  156.                 }
  157.                 if (stateMachine.isTrash()) {
  158.                     continue;
  159.                 }
  160.                 if (stateMachine.isTokenStart()) {
  161.                     line.markStartOfColumn();
  162.                 }
  163.                 if (token != null) {
  164.                     line.addCell(token);
  165.                 }
  166.                 line.addCharacter(symbol);
  167.                 if (stateMachine.isLineFinished()) {
  168.                     break;
  169.                 }
  170.             }
  171.             line = stateMachine.ignoreLine() && rowInstructions.isSkipEmptyLines() ? null : line;
  172.         }
  173.         return line;
  174.     }

  175.     @Override
  176.     public RowInstructions getRowInstructions() {
  177.         return this.rowInstructions;
  178.     }

  179. }