view artifacts/src/main/java/org/dive4elements/river/artifacts/sinfo/tkhcalculation/BedQualityD50KmValueFinder.java @ 9665:8a84c9fef8ec

S-info/tkh: d50 average changed from median to arithmetic mean
author mschaefer
date Wed, 06 May 2020 16:17:38 +0200
parents 8e6b9cb9486a
children
line wrap: on
line source
/* Copyright (C) 2017 by Bundesanstalt für Gewässerkunde
 * Software engineering by
 *  Björnsen Beratende Ingenieure GmbH
 *  Dr. Schumacher Ingenieurbüro für Wasser und Umwelt
 *
 * This file is Free Software under the GNU AGPL (>=v3)
 * and comes with ABSOLUTELY NO WARRANTY! Check out the
 * documentation coming with Dive4Elements River for details.
 */

package org.dive4elements.river.artifacts.sinfo.tkhcalculation;

import java.io.IOException;
import java.util.Date;
import java.util.List;

import org.apache.commons.lang.math.DoubleRange;
import org.apache.commons.math.ArgumentOutsideDomainException;
import org.apache.commons.math.analysis.interpolation.LinearInterpolator;
import org.apache.commons.math.analysis.polynomials.PolynomialSplineFunction;
import org.apache.log4j.Logger;
import org.dive4elements.river.artifacts.math.Utils;
import org.dive4elements.river.artifacts.model.Calculation;
import org.dive4elements.river.artifacts.model.DateRange;
import org.dive4elements.river.artifacts.sinfo.tkhstate.BedQualityD50TimeRangeConfig;
import org.dive4elements.river.artifacts.sinfo.tkhstate.TsvHelper.TsvReaderException;
import org.dive4elements.river.backend.SedDBSessionHolder;
import org.dive4elements.river.model.River;
import org.hibernate.SQLQuery;
import org.hibernate.Session;
import org.hibernate.type.StandardBasicTypes;

import gnu.trove.TDoubleArrayList;

/**
 * Searchable sorted km array with parallel bed measurements value array and linear interpolation for km and d50 between
 * the array elements.<br />
 * <br />
 * The d50 values of all sub layer measurements found for a km are aggregated into their arithmetic mean; see the comment
 * of the SQL command on how the measurements are filtered.
 *
 * @author Matthias Schäfer
 *
 */
public class BedQualityD50KmValueFinder {

    /***** FIELDS *****/

    /**
     * Private log to use here.
     */
    private static final Logger log = Logger.getLogger(BedQualityD50KmValueFinder.class);

    /**
     * Query selecting all sub layer bed measurements with their d50 for a river and a time period<br />
     * <br />
     * A km may have bed measurements for multiple dates, multiple distances from the river bank, and multiple depth layers.
     * The query filters by river name, time period and layer (sub layer: below bed to max. 50 cm depth). It does NOT
     * filter by km; all kms of the river are fetched.<br />
     * <br />
     * The rows are ordered by km, so that the measurements of one km are adjacent and can be aggregated (arithmetic mean)
     * in a single pass over the result.
     */
    private static final String SQL_BED_D50_SUBLAYER_MEASUREMENT = //
            "SELECT s.km, t.datum, p.tiefevon, p.tiefebis, a.d50" //
                    + " FROM sohltest t INNER JOIN station s ON t.stationid = s.stationid" //
                    + "    INNER JOIN gewaesser g ON s.gewaesserid = g.gewaesserid" //
                    + "    INNER JOIN sohlprobe p ON t.sohltestid = p.sohltestid" //
                    + "    INNER JOIN siebanalyse a ON p.sohlprobeid = a.sohlprobeid" //
                    + " WHERE (g.name = :name)" //
                    + "    AND (p.tiefevon > 0.0) AND (p.tiefebis <= 0.5)" //
                    + "    AND (t.datum BETWEEN :fromdate AND :todate)" //
                    + " ORDER BY s.km ASC, a.d50 ASC";

    /**
     * Tolerance within which the kms of two adjacent result rows are regarded as the same km.
     */
    private static final double KM_EPSILON = 0.0001;

    /**
     * Earliest date used for queries. Database does not cope with Long.MIN/Long.Max, so we go just a few hundred years
     * back/forward.
     */
    public static final Date MIN_DATE = new Date(-10000000000000L);

    /**
     * Latest date used for queries, see {@link #MIN_DATE}.
     */
    public static final Date MAX_DATE = new Date(10000000000000L);

    /**
     * Receiver of the "missing value" problem; set to null after the first report so that it is reported only once.
     */
    private Calculation problems;

    /**
     * Real linear interpolator for kms and d50 values (m)
     */
    private final PolynomialSplineFunction interpolator;

    /***** CONSTRUCTORS *****/

    /**
     * Builds the linear interpolator from the parallel km and d50 arrays.
     *
     * @param problems
     *            receiver of problems reported by {@link #findD50(double)}
     * @param kms
     *            kms in ascending order
     * @param values
     *            d50 value (m) for each km
     */
    private BedQualityD50KmValueFinder(final Calculation problems, final double[] kms, final double[] values) {
        this.problems = problems;

        this.interpolator = new LinearInterpolator().interpolate(kms, values);
    }

    /***** METHODS *****/

    /**
     * Loads the bed quality (d50 grain diameter from the SedDB) of a river, for the time range configured for the
     * sounding year.
     *
     * @param problems
     *            receiver of any problems detected while loading
     * @param river
     *            the river to load the measurements for
     * @param kmRange
     *            km range of interest; currently only written to the debug log, the query is not restricted by km
     * @param soundingYear
     *            the sounding year selecting the configured time range
     * @return the finder, or null if no time range is configured, fewer than two kms with measurements were found, or the
     *         interpolator could not be created
     */
    public static BedQualityD50KmValueFinder loadBedMeasurements(final Calculation problems, final River river, final DoubleRange kmRange,
            final int soundingYear) {

        final DateRange dateRange = BedQualityD50TimeRangeConfig.getDefaults(river, soundingYear, problems);
        if (dateRange == null)
            return null;

        return loadBedMeasurements(problems, river, kmRange, dateRange, soundingYear);
    }

    /**
     * Queries the sub layer measurements of the river within the date range, aggregates them per km and creates the
     * finder.
     *
     * @return the finder, or null (with a problem added) if fewer than two kms were found or the interpolator could not
     *         be created
     */
    private static BedQualityD50KmValueFinder loadBedMeasurements(final Calculation problems, final River river, final DoubleRange kmRange,
            final DateRange dateRange, final int soundingYear) {

        final Date startTime = dateRange.getFrom();
        final Date endTime = dateRange.getTo();

        final String seddbRiver = river.nameForSeddb();
        if (log.isDebugEnabled()) {
            log.debug(String.format("loadValues '%s' km %.3f - %.3f %tF - %tF", seddbRiver, kmRange.getMinimumDouble(), kmRange.getMaximumDouble(),
                    startTime, endTime));
        }

        final Session session = SedDBSessionHolder.HOLDER.get();
        final SQLQuery sqlQuery = session.createSQLQuery(SQL_BED_D50_SUBLAYER_MEASUREMENT).addScalar("km", StandardBasicTypes.DOUBLE)
                .addScalar("datum", StandardBasicTypes.DATE).addScalar("tiefevon", StandardBasicTypes.DOUBLE).addScalar("tiefebis", StandardBasicTypes.DOUBLE)
                .addScalar("d50", StandardBasicTypes.DOUBLE);
        sqlQuery.setString("name", seddbRiver);
        sqlQuery.setDate("fromdate", startTime);
        sqlQuery.setDate("todate", endTime);

        // The query declares five scalar columns, so each row is delivered as an Object[]
        @SuppressWarnings("unchecked")
        final List<Object[]> rows = sqlQuery.list();

        // Aggregate d50 values for each km
        final TDoubleArrayList kms = new TDoubleArrayList();
        final TDoubleArrayList values = new TDoubleArrayList();
        if (rows != null)
            aggregateMeanPerKm(rows, kms, values);

        if (log.isDebugEnabled()) {
            if (kms.size() >= 1)
                log.debug(String.format("loadValues: %d kms found from %.3f to %.3f", kms.size(), kms.get(0), kms.get(kms.size() - 1)));
            else
                log.debug("loadValues: no kms found");
        }

        // Linear interpolation needs at least two supporting points
        if (kms.size() < 2 || values.size() < 2) {
            problems.addProblem("bedqualityd50kmvaluefinder.empty", Integer.toString(soundingYear));
            return null;
        }

        try {
            return new BedQualityD50KmValueFinder(problems, kms.toNativeArray(), values.toNativeArray());
        }
        catch (final Exception e) {
            log.error("loadValues: creating the d50 interpolator failed", e);
            problems.addProblem("bedqualityd50kmvaluefinder.error", e.getLocalizedMessage());
            return null;
        }
    }

    /**
     * Computes the arithmetic mean of the d50 values of each km and appends km and mean (converted by 1/1000, mm to m
     * according to the log output) to the parallel output lists.<br />
     * <br />
     * The rows must be ordered by km. Adjacent rows whose kms differ by no more than {@link #KM_EPSILON} form one group;
     * the km of the last row of a group is recorded for the group. Rows without km or d50 are skipped, they cannot
     * contribute to a mean.
     *
     * @param rows
     *            query result rows, km at index 0 and d50 at index 4
     * @param kms
     *            receives one km per group
     * @param values
     *            receives the mean d50 per group
     */
    private static void aggregateMeanPerKm(final List<Object[]> rows, final TDoubleArrayList kms, final TDoubleArrayList values) {
        double sum = 0;
        int count = 0;
        double groupKm = Double.NaN;

        for (final Object[] row : rows) {
            final Double rowKm = (Double) row[0];
            final Double rowD50 = (Double) row[4];
            if (rowKm == null || rowD50 == null) {
                log.debug("loadValues: skipping row without km or d50");
                continue;
            }

            final double km = rowKm.doubleValue();
            // A km differing from the previous row's km closes the current group
            if (count > 0 && !Utils.epsilonEquals(groupKm, km, KM_EPSILON)) {
                addMean(kms, values, groupKm, sum, count);
                sum = 0;
                count = 0;
            }

            groupKm = km;
            sum += rowD50.doubleValue();
            count++;
        }

        // Close the trailing group
        if (count > 0)
            addMean(kms, values, groupKm, sum, count);
    }

    /**
     * Appends the km and the mean of one km group to the output lists and logs the result.
     */
    private static void addMean(final TDoubleArrayList kms, final TDoubleArrayList values, final double km, final double sum, final int count) {
        final double mean = (sum / count) / 1000;
        kms.add(km);
        values.add(mean);
        if (log.isDebugEnabled())
            log.debug(String.format("loadValues km %.3f d50(mm) %.1f count %d", km, mean * 1000, count));
    }

    /**
     * Returns the d50 value interpolated according to a km.<br />
     * <br />
     * A km outside of the range of the loaded kms yields NaN; the corresponding problem is added only for the first such
     * km.
     *
     * @param km
     *            the km to get the d50 for
     * @return d50 (m) of the km, or NaN
     */
    public double findD50(final double km) {
        try {
            return this.interpolator.value(km);
        }
        catch (final ArgumentOutsideDomainException e) {
            // No stack trace because this might happen a lot (intended) and we produce an error message anyways.

            if (this.problems != null) {
                this.problems.addProblem(km, "bedqualityd50kmvaluefinder.missing");
                // Report only once
                this.problems = null;
            }

            return Double.NaN;
        }
    }
}

http://dive4elements.wald.intevation.org