teichmann@5844: /* Copyright (C) 2011, 2012, 2013 by Bundesanstalt für Gewässerkunde teichmann@5844: * Software engineering by Intevation GmbH teichmann@5844: * teichmann@5992: * This file is Free Software under the GNU AGPL (>=v3) teichmann@5844: * and comes with ABSOLUTELY NO WARRANTY! Check out the teichmann@5992: * documentation coming with Dive4Elements River for details. teichmann@5844: */ teichmann@5844: teichmann@5829: package org.dive4elements.river.importer.parsers; ingo@2850: ingo@2850: import java.io.File; ingo@2850: import java.io.IOException; felix@5229: import java.math.BigDecimal; ingo@2850: import java.text.NumberFormat; mschaefer@8991: import java.text.ParseException; ingo@2850: import java.util.ArrayList; ingo@2850: import java.util.List; ingo@2850: import java.util.regex.Matcher; ingo@2850: import java.util.regex.Pattern; ingo@2850: ingo@2850: import org.apache.log4j.Logger; mschaefer@8989: import org.dive4elements.river.backend.utils.DateUtil; felix@6291: import org.dive4elements.river.importer.ImportTimeInterval; teichmann@5829: import org.dive4elements.river.importer.ImportUnit; teichmann@5829: import org.dive4elements.river.importer.ImportWst; teichmann@5829: import org.dive4elements.river.importer.ImportWstColumn; felix@6320: import org.dive4elements.river.importer.ImportWstColumnValue; mschaefer@8989: import org.dive4elements.river.importer.ImportWstQRange; mschaefer@8989: import org.dive4elements.river.importer.common.AbstractParser; ingo@2850: felix@5229: felix@5229: /** felix@5229: * Parse WaterlevelDifferences CSV file. felix@5229: */ ingo@2850: public class WaterlevelDifferencesParser extends LineParser { ingo@2850: ingo@2850: private static final Logger log = mschaefer@8989: Logger.getLogger(WaterlevelDifferencesParser.class); ingo@2850: ingo@2850: private static final NumberFormat nf = mschaefer@8989: NumberFormat.getInstance(DEFAULT_LOCALE); ingo@2850: ingo@2850: public static final Pattern META_UNIT = mschaefer@8989: Pattern.compile("^Einheit: \\[(.*)\\].*"); ingo@2850: felix@6287: public static final Pattern YEARS_IN_COLUMN = mschaefer@8989: Pattern.compile(".*(\\d{4})-(\\d{4})$"); felix@6287: mschaefer@8989: public static final BigDecimal INTERVAL_GAP = new BigDecimal("0.00001"); tom@7377: felix@5233: /** List of parsed differences as ImportWst s. */ mschaefer@8989: private final List differences; ingo@2850: felix@5233: private ImportWstColumn[] columns; ingo@2850: felix@5233: /** The currently processed dataset. */ felix@5233: private ImportWst current; ingo@2850: ingo@2850: ingo@2850: public WaterlevelDifferencesParser() { mschaefer@8989: this.differences = new ArrayList<>(); ingo@2850: } ingo@2850: ingo@2850: felix@5233: /** Get the differences as wst parsed so far. */ felix@5233: public List getDifferences() { mschaefer@8989: return this.differences; ingo@2850: } ingo@2850: felix@5234: felix@5234: /** felix@5234: * Parse a csv waterleveldifferenceparser and create a ImportWst object felix@5234: * from it. felix@5234: */ ingo@2850: @Override mschaefer@8989: public void parse(final File file) throws IOException { mschaefer@8989: this.current = new ImportWst(file.getName()); mschaefer@8989: this.current.setKind(6); ingo@2850: ingo@2850: super.parse(file); ingo@2850: } ingo@2850: ingo@2850: felix@5234: /** No rewind implemented. */ ingo@2850: @Override ingo@2850: protected void reset() { ingo@2850: } ingo@2850: ingo@2850: ingo@2850: @Override ingo@2850: protected void finish() { mschaefer@8989: if (this.columns != null && this.current != null) { felix@5233: // TODO figure out if its needed, as the columns felix@5233: // are registered at their construction time. mschaefer@8989: for (final ImportWstColumn col: this.columns) { felix@5233: // TODO place a current.addColumn(col); here? ingo@2850: } ingo@2850: mschaefer@8989: this.differences.add(this.current); ingo@2850: } ingo@2850: felix@6320: // For all differences columns, add a single Q-Range with tom@7377: // -1. tom@7377: // Expand range to minimal length in case it would be 0 teichmann@7883: // TODO: should otherwise be extended to teichmann@7883: // (first station of next range - INTERVAL_GAP), tom@7377: // assuming always ascending stations mschaefer@8989: for (final ImportWstColumn column: this.columns) { mschaefer@8989: final List cValues = column.getColumnValues(); mschaefer@8989: final BigDecimal a = cValues.get(0).getPosition(); tom@7377: BigDecimal b = cValues.get(cValues.size() - 1).getPosition(); tom@7377: if (a.compareTo(b) == 0) { mschaefer@8989: b = b.add(INTERVAL_GAP); tom@7377: } felix@6320: column.addColumnQRange( mschaefer@8989: new ImportWstQRange( mschaefer@8989: a, mschaefer@8989: b, mschaefer@8989: new BigDecimal(-1d)) mschaefer@8989: ); felix@6320: } mschaefer@8989: this.current = null; mschaefer@8989: this.columns = null; ingo@2850: } ingo@2850: felix@5234: ingo@2850: @Override mschaefer@8989: protected void handleLine(final int lineNum, final String line) { ingo@2850: if (line.startsWith(START_META_CHAR)) { ingo@2850: handleMetaLine(stripMetaLine(line)); ingo@2850: } ingo@2850: else { ingo@2850: handleDataLine(line); ingo@2850: } ingo@2850: } ingo@2850: ingo@2850: mschaefer@8989: private void handleMetaLine(final String meta) { ingo@2850: if (handleMetaUnit(meta)) { ingo@2850: return; ingo@2850: } ingo@2850: else { ingo@2850: handleMetaColumnNames(meta); ingo@2850: } ingo@2850: } ingo@2850: ingo@2850: mschaefer@8989: private boolean handleMetaUnit(final String meta) { mschaefer@8989: final Matcher m = META_UNIT.matcher(meta); ingo@2850: ingo@2850: if (m.matches()) { mschaefer@8989: final String unit = m.group(1); ingo@2850: log.debug("Found unit: '" + unit + "'"); ingo@2850: mschaefer@8989: this.current.setUnit(new ImportUnit(unit)); ingo@2850: ingo@2850: return true; ingo@2850: } ingo@2850: ingo@2850: return false; ingo@2850: } ingo@2850: ingo@2850: mschaefer@8989: private boolean handleMetaColumnNames(final String meta) { mschaefer@8989: final Pattern META_COLUMN_NAMES = Pattern.compile("Fluss-km;(.*)"); mschaefer@8989: final Matcher m = META_COLUMN_NAMES.matcher(meta); ingo@2850: ingo@2850: if (m.matches()) { mschaefer@8989: final String colStr = m.group(1); mschaefer@8989: final String[] cols = colStr.split(SEPERATOR_CHAR); ingo@2850: ingo@2850: log.debug("Found " + cols.length + " columns."); ingo@2850: ingo@2850: initColumns(cols); ingo@2850: ingo@2850: return true; ingo@2850: } ingo@2850: ingo@2850: return false; ingo@2850: } ingo@2850: ingo@2850: felix@6286: /** Setup column structures with name, description and time interval. */ mschaefer@8989: private void initColumns(final String[] cols) { mschaefer@8989: this.current.setNumberColumns(cols.length); mschaefer@8989: this.columns = this.current.getColumns().toArray( mschaefer@8989: new ImportWstColumn[cols.length]); ingo@2850: ingo@2850: for (int i = 0; i < cols.length; i++) { mschaefer@8989: final String name = cols[i].replace("\"", ""); ingo@2850: ingo@2850: log.debug("Create new column '" + name + "'"); mschaefer@8989: final ImportWstColumn column = this.current.getColumn(i); felix@6290: column.setName(name); felix@6290: column.setDescription(name); felix@6287: mschaefer@8989: final Matcher m = YEARS_IN_COLUMN.matcher(name); felix@6287: felix@6287: if (m.matches()) { mschaefer@8989: final int startYear = Integer.parseInt(m.group(1)); mschaefer@8989: final int endYear = Integer.parseInt(m.group(2)); mschaefer@8989: final ImportTimeInterval time = new ImportTimeInterval( mschaefer@8989: DateUtil.getStartDateFromYear(startYear), mschaefer@8989: DateUtil.getEndDateFromYear(endYear) mschaefer@8989: ); felix@6291: column.setTimeInterval(time); felix@6287: } else { felix@6287: log.debug("No time interval in column header found: " + name); felix@6287: } ingo@2850: } ingo@2850: } ingo@2850: ingo@2850: felix@6752: /** Handle one line of data, add one value for all columns. felix@6752: * @param line the line to parse felix@6752: */ mschaefer@8989: private void handleDataLine(final String line) { felix@6753: // Split by separator, do not exclude trailing empty string. mschaefer@8989: final String[] cols = line.split(SEPERATOR_CHAR, -1); ingo@2850: ingo@2850: if (cols == null || cols.length < 2) { felix@5230: log.warn("skip invalid waterlevel-diff line: '" + line + "'"); ingo@2850: return; ingo@2850: } ingo@2850: ingo@2850: try { tom@8856: // The first value in a line like 12,9;4,3;4,5 is the station, tom@8856: // later real values. mschaefer@8989: final BigDecimal station = AbstractParser.parseDecimal(cols[0]); ingo@2850: mschaefer@8989: for (int i = 0; i < this.columns.length; i++) { mschaefer@8989: final int idx = i+1; ingo@3940: ingo@3940: if (idx >= cols.length) { ingo@3940: log.warn("Insufficient column numbers: " + line); ingo@3940: continue; ingo@3940: } ingo@3940: mschaefer@8989: final String value = cols[idx]; ingo@2850: felix@6752: if (value != null && !value.equals("")) { felix@6752: try { mschaefer@8989: this.columns[i].addColumnValue( mschaefer@8989: station, mschaefer@8989: AbstractParser.parseDecimal(value)); felix@6752: } mschaefer@8991: catch (final ParseException pe) { felix@6752: log.warn("Could not parse value: '" + value + "'"); felix@6752: } ingo@2850: } ingo@2850: } ingo@2850: } mschaefer@8991: catch (final ParseException pe) { tom@5490: log.warn("Could not parse station: '" + line + "'"); ingo@2850: } ingo@2850: } ingo@2850: } ingo@2850: // vim:set ts=4 sw=4 si et sta sts=4 fenc=utf8 :