# -*- coding: utf-8 -*- """ *************************************************************************** StatisticsByCategories.py --------------------- Date : September 2012 Copyright : (C) 2012 by Victor Olaya Email : volayaf at gmail dot com *************************************************************************** * * * This program is free software; you can redistribute it and/or modify * * it under the terms of the GNU General Public License as published by * * the Free Software Foundation; either version 2 of the License, or * * (at your option) any later version. * * * *************************************************************************** """ __author__ = 'Victor Olaya' __date__ = 'September 2012' __copyright__ = '(C) 2012, Victor Olaya' # This will get replaced with a git SHA1 when you do a git archive __revision__ = '$Format:%H$' import math from PyQt4.QtCore import * from qgis.core import * from processing.outputs.OutputTable import OutputTable from processing.core.GeoAlgorithm import GeoAlgorithm from processing.core.QGisLayers import QGisLayers from processing.parameters.ParameterVector import ParameterVector from processing.parameters.ParameterTableField import ParameterTableField class StatisticsByCategories(GeoAlgorithm): INPUT_LAYER = "INPUT_LAYER" VALUES_FIELD_NAME = "VALUES_FIELD_NAME" CATEGORIES_FIELD_NAME = "CATEGORIES_FIELD_NAME" OUTPUT = "OUTPUT" def defineCharacteristics(self): self.name = "Statistics by categories" self.group = "Vector table tools" self.addParameter(ParameterVector(self.INPUT_LAYER, "Input vector layer", [ParameterVector.VECTOR_TYPE_ANY], False)) self.addParameter(ParameterTableField(self.VALUES_FIELD_NAME, "Field to calculate statistics on", self.INPUT_LAYER, ParameterTableField.DATA_TYPE_NUMBER)) self.addParameter(ParameterTableField(self.CATEGORIES_FIELD_NAME, "Field with categories", self.INPUT_LAYER, ParameterTableField.DATA_TYPE_ANY)) self.addOutput(OutputTable(self.OUTPUT, "Statistics")) def processAlgorithm(self, progress): layer = QGisLayers.getObjectFromUri(self.getParameterValue(self.INPUT_LAYER)) valuesFieldName = self.getParameterValue(self.VALUES_FIELD_NAME) categoriesFieldName = self.getParameterValue(self.CATEGORIES_FIELD_NAME) output = self.getOutputFromName(self.OUTPUT) valuesField = layer.fieldNameIndex(valuesFieldName) categoriesField = layer.fieldNameIndex(categoriesFieldName) features = QGisLayers.features(layer) nFeats = len(features) values = {} nFeat = 0 for feat in features: nFeat += 1 progress.setPercentage(int((100 * nFeats) / nFeat)) attrs = feat.attributes() try: value = float(attrs[valuesField]) cat = unicode(attrs[categoriesField]) if cat not in values: values[cat] = [] values[cat].append(value) except: pass #fields = [QgsField("category", QVariant.String), QgsField("min", QVariant.Double), # QgsField("max", QVariant.Double), QgsField("mean", QVariant.Double), # QgsField("stddev", QVariant.Double)] fields = ["category", "min", "max", "mean", "stddev"] writer = output.getTableWriter(fields) for cat, v in values.items(): min, max, mean, stddev = calculateStats(v) record = [cat, min, max, mean, stddev] writer.addRecord(record) def calculateStats(values): n = 0 sum = 0 mean = 0 M2 = 0 minvalue = None maxvalue = None for v in values: sum += v n = n + 1 delta = v - mean mean = mean + delta/n M2 = M2 + delta*(v - mean) if minvalue is None: minvalue = v maxvalue = v else: minvalue = min(v, minvalue) maxvalue = max(v, maxvalue) if n > 1: variance = M2/(n - 1) else: variance = 0; stddev = math.sqrt(variance) return minvalue,maxvalue, mean, stddev