Mercurial > dive4elements > river
comparison backend/src/main/java/org/dive4elements/river/importer/sinfo/parsers/DailyDischargeParser.java @ 8971:50416a0df385
Importer for the Schifffahrt (S-INFO) and Oekologie (U-INFO) files
author | mschaefer |
---|---|
date | Tue, 03 Apr 2018 10:18:30 +0200 |
parents | |
children | ae76f618d990 |
comparison
equal
deleted
inserted
replaced
8970:da5dc7446652 | 8971:50416a0df385 |
---|---|
1 /* Copyright (C) 2017 by Bundesanstalt für Gewässerkunde | |
2 * Software engineering by | |
3 * Björnsen Beratende Ingenieure GmbH | |
4 * Dr. Schumacher Ingenieurbüro für Wasser und Umwelt | |
5 * | |
6 * This file is Free Software under the GNU AGPL (>=v3) | |
7 * and comes with ABSOLUTELY NO WARRANTY! Check out the | |
8 * documentation coming with Dive4Elements River for details. | |
9 */ | |
10 | |
11 package org.dive4elements.river.importer.sinfo.parsers; | |
12 | |
13 import java.io.File; | |
14 import java.io.FilenameFilter; | |
15 import java.text.DateFormat; | |
16 import java.text.SimpleDateFormat; | |
17 import java.util.ArrayList; | |
18 import java.util.Date; | |
19 import java.util.List; | |
20 import java.util.regex.Matcher; | |
21 import java.util.regex.Pattern; | |
22 | |
23 import org.apache.log4j.Logger; | |
24 import org.dive4elements.river.importer.Config; | |
25 import org.dive4elements.river.importer.ImportRiver; | |
26 import org.dive4elements.river.importer.common.AbstractParser; | |
27 import org.dive4elements.river.importer.common.ParsingState; | |
28 import org.dive4elements.river.importer.sinfo.importitem.DailyDischargeDayLineImport; | |
29 import org.dive4elements.river.importer.sinfo.importitem.DailyDischargeSeriesImport; | |
30 import org.dive4elements.river.model.sinfo.DailyDischarge; | |
31 import org.dive4elements.river.model.sinfo.DailyDischargeValue; | |
32 | |
33 /** | |
34 * Reads and parses a daily discharge file | |
35 * | |
36 * @author Matthias Schäfer | |
37 * | |
38 */ | |
39 public class DailyDischargeParser extends AbstractParser<DailyDischarge, DailyDischargeValue, DailyDischargeDayLineImport, DailyDischargeSeriesImport> { | |
40 | |
41 /***** FIELDS *****/ | |
42 | |
43 private static final Logger log = Logger.getLogger(DailyDischargeParser.class); | |
44 | |
45 static final Pattern IMPORT_FILENAME = Pattern.compile("^(.+)_mittlerer_Tagesabfluss.csv", Pattern.CASE_INSENSITIVE); | |
46 | |
47 private static final Pattern META_GAUGENAME = Pattern.compile("^#\\s*Stations-*Name:\\s*(\\S[^;]*).*", Pattern.CASE_INSENSITIVE); | |
48 | |
49 private static final Pattern META_GAUGENUMBER = Pattern.compile("^#\\s*Stations-*Nummer:\\s*(\\S[^;]*).*", Pattern.CASE_INSENSITIVE); | |
50 | |
51 private static final Pattern META_COLUMNTITLES = Pattern.compile("^#*\\s*Datum\\s*;\\s*Q.*", Pattern.CASE_INSENSITIVE); | |
52 | |
53 private static final DateFormat dateFormat = new SimpleDateFormat("dd.MM.yyyy"); | |
54 | |
55 | |
56 /***** CONSTRUCTORS *****/ | |
57 | |
58 public DailyDischargeParser(final File importPath, final File rootRelativePath, final ImportRiver river) { | |
59 super(importPath, rootRelativePath, river); | |
60 } | |
61 | |
62 | |
63 /***** METHODS *****/ | |
64 | |
65 @Override | |
66 protected Logger getLog() { | |
67 return log; | |
68 } | |
69 | |
70 /** | |
71 * Whether this import type shall be skipped | |
72 */ | |
73 public static boolean shallSkip() { | |
74 return Config.INSTANCE.skipSInfoDailyDischarge(); | |
75 } | |
76 | |
77 /** | |
78 * Creates a list of parsers for all daily discharge import files in a directory | |
79 */ | |
80 public static List<DailyDischargeParser> createParsers(final File importDir, final File relativeDir, final ImportRiver river) { | |
81 final List<DailyDischargeParser> parsers = new ArrayList<>(); | |
82 final File[] files = importDir.listFiles(new FilenameFilter() { | |
83 @Override | |
84 public boolean accept(final File dir, final String name) { | |
85 return IMPORT_FILENAME.matcher(name).matches(); | |
86 } | |
87 }); | |
88 for (final File file : files) | |
89 parsers.add(new DailyDischargeParser(file, new File(relativeDir, file.getName()), river)); | |
90 return parsers; | |
91 } | |
92 | |
93 @Override | |
94 protected boolean kmMustBeUnique() { | |
95 return false; | |
96 } | |
97 | |
98 @Override | |
99 protected DailyDischargeSeriesImport createSeriesImport(final String filename) { | |
100 return new DailyDischargeSeriesImport(filename); | |
101 } | |
102 | |
103 @Override | |
104 protected DailyDischargeDayLineImport createKmLineImport(final Double km, final String[] values) { | |
105 Date day = null; | |
106 try { | |
107 day = dateFormat.parse(values[0]); | |
108 } | |
109 catch (final Exception e) { | |
110 logError("Invalid date in line " + this.in.getLineNumber()); | |
111 return null; | |
112 } | |
113 if (parseDoubleWithNull(values[1]) == null) { | |
114 logError("Invalid discharge value in line " + this.in.getLineNumber()); | |
115 return null; | |
116 } | |
117 return new DailyDischargeDayLineImport(day, Double.valueOf(parseDoubleWithNull(values[1]).doubleValue())); | |
118 } | |
119 | |
120 @Override | |
121 protected boolean handleMetaOther() { | |
122 if (handleMetaGaugeName()) | |
123 return true; | |
124 else if (handleMetaGaugeNumber()) | |
125 return true; | |
126 else | |
127 return false; | |
128 } | |
129 | |
130 private boolean handleMetaGaugeName() { | |
131 final Matcher m = META_GAUGENAME.matcher(this.currentLine); | |
132 if (m.matches()) { | |
133 this.metaPatternsMatched.add(META_GAUGENAME); | |
134 this.seriesHeader.setGaugeName(m.group(1).trim()); | |
135 return true; | |
136 } | |
137 return false; | |
138 } | |
139 | |
140 private boolean handleMetaGaugeNumber() { | |
141 final Matcher m = META_GAUGENUMBER.matcher(this.currentLine); | |
142 if (m.matches()) { | |
143 this.metaPatternsMatched.add(META_GAUGENUMBER); | |
144 this.seriesHeader.setGaugeNumber(Long.parseLong(m.group(1))); | |
145 return true; | |
146 } | |
147 return false; | |
148 } | |
149 | |
150 @Override | |
151 protected boolean handleMetaColumnTitles() { | |
152 if (!META_COLUMNTITLES.matcher(this.currentLine).matches()) | |
153 return false; | |
154 this.metaPatternsMatched.add(META_COLUMNTITLES); | |
155 this.columnTitles.clear(); | |
156 final String[] titles = this.currentLine.split(SEPARATOR_CHAR, 0); | |
157 for (int i = 0; i <= titles.length - 1; i++) | |
158 this.columnTitles.add(titles[i].trim()); | |
159 this.seriesHeader.setGauge(this.river.getPeer().findGauge(this.seriesHeader.getGaugeNumber(), this.seriesHeader.getGaugeName())); | |
160 if (this.seriesHeader.getGauge() == null) { | |
161 logError("Gauge not found, file skipped"); | |
162 this.headerParsingState = ParsingState.STOP; | |
163 } | |
164 return true; | |
165 } | |
166 } |