/* Copyright (C) 2011, 2012, 2013 by Bundesanstalt für Gewässerkunde
 * Software engineering by Intevation GmbH
 *
 * This file is Free Software under the GNU AGPL (>=v3)
 * and comes with ABSOLUTELY NO WARRANTY! Check out the
 * documentation coming with Dive4Elements River for details.
 */

package org.dive4elements.river.importer.parsers;

import java.io.File;
import java.io.IOException;
import java.math.BigDecimal;
import java.text.NumberFormat;
import java.text.ParseException;
import java.util.ArrayList;
import java.util.List;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

import org.apache.log4j.Logger;

import org.dive4elements.river.importer.ImportUnit;

import org.dive4elements.river.importer.ImportWst;
import org.dive4elements.river.importer.ImportWstColumn;


/**
 * Parse WaterlevelDifferences CSV file.
 *
 * Meta lines (those starting with START_META_CHAR) carry either the unit
 * ("Einheit: [...]") or the column header ("Fluss-km;..."). Every other
 * line is treated as a data line: station followed by one value per column.
 */
public class WaterlevelDifferencesParser extends LineParser {

    private static final Logger log =
        Logger.getLogger(WaterlevelDifferencesParser.class);

    // NOTE(review): NumberFormat instances are not thread-safe; this shared
    // instance assumes the importer parses files from a single thread.
    private static final NumberFormat nf =
        NumberFormat.getInstance(DEFAULT_LOCALE);

    /** Matches the unit meta line; group 1 is the unit name. */
    public static final Pattern META_UNIT =
        Pattern.compile("^Einheit: \\[(.*)\\].*");

    /** Matches a column name ending in "YYYY-YYYY"; groups 1 and 2. */
    public static final Pattern YEARS_IN_COLUMN =
        Pattern.compile(".*(\\d{4})-(\\d{4})$");

    /**
     * Matches the column header meta line; group 1 holds the separated
     * column names following the station column.
     */
    private static final Pattern META_COLUMN_NAMES =
        Pattern.compile("Fluss-km;(.*)");

    /** List of parsed differences as ImportWst s. */
    private List<ImportWst> differences;

    /** Columns of the currently processed dataset, null before header. */
    private ImportWstColumn[] columns;

    /** The currently processed dataset. */
    private ImportWst current;


    public WaterlevelDifferencesParser() {
        differences = new ArrayList<ImportWst>();
    }


    /** Get the differences as wst parsed so far. */
    public List<ImportWst> getDifferences() {
        return differences;
    }


    /**
     * Parse a waterlevel differences CSV file and create an ImportWst
     * object from it.
     *
     * @param file the CSV file to parse; its name becomes the wst name.
     * @throws IOException if reading the file fails.
     */
    @Override
    public void parse(File file) throws IOException {
        current = new ImportWst(file.getName());
        // NOTE(review): 6 is presumably the wst kind used for waterlevel
        // differences -- confirm against the kind definitions.
        current.setKind(6);

        super.parse(file);
    }


    /** No rewind implemented. */
    @Override
    protected void reset() {
    }


    /**
     * Store the current dataset if a column header was seen, then clear
     * the per-file state.
     */
    @Override
    protected void finish() {
        if (columns != null && current != null) {
            // TODO figure out if a current.addColumn(col) per column is
            // needed, as the columns are registered at their construction
            // time.
            differences.add(current);
        }

        current = null;
        columns = null;
    }


    /** Dispatch a line to the meta or the data handler. */
    @Override
    protected void handleLine(int lineNum, String line) {
        if (line.startsWith(START_META_CHAR)) {
            handleMetaLine(stripMetaLine(line));
        }
        else {
            handleDataLine(line);
        }
    }


    /** Try the unit pattern first, then the column header pattern. */
    private void handleMetaLine(String meta) {
        if (!handleMetaUnit(meta)) {
            handleMetaColumnNames(meta);
        }
    }


    /**
     * Set the unit of the current dataset if meta is a unit line.
     *
     * @return true if meta matched META_UNIT.
     */
    private boolean handleMetaUnit(String meta) {
        Matcher m = META_UNIT.matcher(meta);

        if (!m.matches()) {
            return false;
        }

        String unit = m.group(1);
        log.debug("Found unit: '" + unit + "'");

        current.setUnit(new ImportUnit(unit));

        return true;
    }


    /**
     * Initialize the columns if meta is the column header line.
     *
     * @return true if meta matched the column header pattern.
     */
    private boolean handleMetaColumnNames(String meta) {
        Matcher m = META_COLUMN_NAMES.matcher(meta);

        if (!m.matches()) {
            return false;
        }

        String[] cols = m.group(1).split(SEPERATOR_CHAR);

        log.debug("Found " + cols.length + " columns.");

        initColumns(cols);

        return true;
    }


    /** Setup column structures with name, description and time interval. */
    private void initColumns(String[] cols) {
        current.setNumberColumns(cols.length);
        columns = current.getColumns().toArray(
            new ImportWstColumn[cols.length]);

        for (int i = 0; i < cols.length; i++) {
            String name = cols[i].replace("\"", "");

            log.debug("Create new column '" + name + "'");
            ImportWstColumn column = current.getColumn(i);
            column.setName(name);
            column.setDescription(name);

            Matcher m = YEARS_IN_COLUMN.matcher(name);

            if (m.matches()) {
                // TODO create and set ImportTimeInterval from the start
                // year (group 1) and the end year (group 2).
            } else {
                log.debug("No time interval in column header found: " + name);
            }
        }
    }


    /**
     * Parse a data line (station followed by one value per column) and add
     * the values to the columns. Unparseable lines and values are logged
     * and skipped.
     */
    private void handleDataLine(String line) {
        String[] cols = line.split(SEPERATOR_CHAR);

        if (cols.length < 2) {
            log.warn("skip invalid waterlevel-diff line: '" + line + "'");
            return;
        }

        if (columns == null) {
            // Data before the "Fluss-km;..." header: there are no columns
            // to add values to, so skip instead of failing with a
            // NullPointerException.
            log.warn("skip waterlevel-diff line without column header: '"
                + line + "'");
            return;
        }

        BigDecimal station;
        try {
            // valueOf() uses the canonical decimal representation of the
            // double instead of its exact binary expansion.
            station = BigDecimal.valueOf(nf.parse(cols[0]).doubleValue());
        }
        catch (ParseException pe) {
            log.warn("Could not parse station: '" + line + "'");
            return;
        }

        for (int i = 0; i < columns.length; i++) {
            int idx = i+1;

            if (idx >= cols.length) {
                log.warn("Insufficient column numbers: " + line);
                continue;
            }

            String value = cols[idx];

            try {
                columns[i].addColumnValue(
                    station,
                    BigDecimal.valueOf(nf.parse(value).doubleValue()));
            }
            catch (ParseException pe) {
                log.warn("Could not parse value: '" + value + "'");
            }
        }
    }
}
// vim:set ts=4 sw=4 si et sta sts=4 fenc=utf8 :