/*************************************************************************** qgsstringstatisticalsummary.h ----------------------------- Date : May 2016 Copyright : (C) 2016 by Nyall Dawson Email : nyall dot dawson at gmail dot com *************************************************************************** * * * This program is free software; you can redistribute it and/or modify * * it under the terms of the GNU General Public License as published by * * the Free Software Foundation; either version 2 of the License, or * * (at your option) any later version. * * * ***************************************************************************/ #ifndef QGSSTRINGSTATISTICALSUMMARY_H #define QGSSTRINGSTATISTICALSUMMARY_H #include #include #include "qgis_core.h" /*************************************************************************** * This class is considered CRITICAL and any change MUST be accompanied with * full unit tests in test_qgsstringstatisticalsummary.py. * See details in QEP #17 ****************************************************************************/ /** * \ingroup core * \class QgsStringStatisticalSummary * \brief Calculator for summary statistics and aggregates for a list of strings. * * Statistics are calculated by calling calculate() and passing a list of strings. The * individual statistics can then be retrieved using the associated methods. Note that not all statistics * are calculated by default. Statistics which require slower computations are only calculated by * specifying the statistic in the constructor or via setStatistics(). * * \since QGIS 2.16 */ class CORE_EXPORT QgsStringStatisticalSummary { public: //! Enumeration of flags that specify statistics to be calculated enum Statistic { Count = 1, //!< Count CountDistinct = 2, //!< Number of distinct string values CountMissing = 4, //!< Number of missing (null) values Min = 8, //!< Minimum string value Max = 16, //!< Maximum string value MinimumLength = 32, //!< Minimum length of string MaximumLength = 64, //!< Maximum length of string MeanLength = 128, //!< Mean length of strings All = Count | CountDistinct | CountMissing | Min | Max | MinimumLength | MaximumLength | MeanLength, //! All statistics }; Q_DECLARE_FLAGS( Statistics, Statistic ) /** * Constructor for QgsStringStatistics * \param stats flags for statistics to calculate */ QgsStringStatisticalSummary( QgsStringStatisticalSummary::Statistics stats = QgsStringStatisticalSummary::All ); /** * Returns flags which specify which statistics will be calculated. Some statistics * are always calculated (e.g., count). * \see setStatistics */ Statistics statistics() const { return mStatistics; } /** * Sets flags which specify which statistics will be calculated. Some statistics * are always calculated (e.g., count). * \param stats flags for statistics to calculate * \see statistics */ void setStatistics( QgsStringStatisticalSummary::Statistics stats ) { mStatistics = stats; } /** * Resets the calculated values */ void reset(); /** * Calculates summary statistics for an entire list of strings at once. * \param values list of strings * \see calculateFromVariants() * \see addString() */ void calculate( const QStringList &values ); /** * Calculates summary statistics for an entire list of variants at once. Any * non-string variants will be ignored. * \param values list of variants * \see calculate() * \see addValue() */ void calculateFromVariants( const QVariantList &values ); /** * Adds a single string to the statistics calculation. Calling this method * allows strings to be added to the calculation one at a time. For large * quantities of strings this may be more efficient then first adding all the * strings to a list and calling calculate(). * \param string string to add * \note call reset() before adding the first string using this method * to clear the results from any previous calculations * \note finalize() must be called after adding the final string and before * retrieving calculated statistics. * \see calculate() * \see addValue() * \see finalize() */ void addString( const QString &string ); /** * Adds a single variant to the statistics calculation. Calling this method * allows variants to be added to the calculation one at a time. For large * quantities of variants this may be more efficient then first adding all the * variants to a list and calling calculateFromVariants(). * \param value variant to add * \note call reset() before adding the first string using this method * to clear the results from any previous calculations * \note finalize() must be called after adding the final value and before * retrieving calculated statistics. * \see calculateFromVariants() * \see finalize() */ void addValue( const QVariant &value ); /** * Must be called after adding all strings with addString() and before retrieving * any calculated string statistics. * \see addString() */ void finalize(); /** * Returns the value of a specified statistic * \param stat statistic to return * \returns calculated value of statistic */ QVariant statistic( QgsStringStatisticalSummary::Statistic stat ) const; /** * Returns the calculated count of values. */ int count() const { return mCount; } /** * Returns the number of distinct string values. * \see distinctValues() */ int countDistinct() const { return mValues.count(); } /** * Returns the set of distinct string values. * \see countDistinct() */ QSet< QString > distinctValues() const { return mValues; } /** * Returns the number of missing (null) string values. */ int countMissing() const { return mCountMissing; } /** * Returns the minimum (non-null) string value. */ QString min() const { return mMin; } /** * Returns the maximum (non-null) string value. */ QString max() const { return mMax; } /** * Returns the minimum length of strings. */ int minLength() const { return mMinLength; } /** * Returns the maximum length of strings. */ int maxLength() const { return mMaxLength; } /** * Returns the mean length of strings. * \since QGIS 3.0 */ double meanLength() const { return mMeanLength; } /** * Returns the friendly display name for a statistic * \param statistic statistic to return name for */ static QString displayName( QgsStringStatisticalSummary::Statistic statistic ); private: Statistics mStatistics; int mCount; QSet< QString > mValues; int mCountMissing; QString mMin; QString mMax; int mMinLength; int mMaxLength; long mSumLengths; double mMeanLength; void testString( const QString &string ); }; Q_DECLARE_OPERATORS_FOR_FLAGS( QgsStringStatisticalSummary::Statistics ) #endif // QGSSTRINGSTATISTICALSUMMARY_H