mirror of
https://github.com/qgis/QGIS.git
synced 2025-03-03 00:02:25 -05:00
349 lines
15 KiB
Python
349 lines
15 KiB
Python
# -*- coding: utf-8 -*-
|
|
|
|
"""
|
|
***************************************************************************
|
|
SpatialJoin.py
|
|
---------------------
|
|
Date : September 2017
|
|
Copyright : (C) 2017 by Nyall Dawson
|
|
Email : nyall dot dawson at gmail dot com
|
|
***************************************************************************
|
|
* *
|
|
* This program is free software; you can redistribute it and/or modify *
|
|
* it under the terms of the GNU General Public License as published by *
|
|
* the Free Software Foundation; either version 2 of the License, or *
|
|
* (at your option) any later version. *
|
|
* *
|
|
***************************************************************************
|
|
"""
|
|
from builtins import range
|
|
|
|
__author__ = 'Nyall Dawson'
|
|
__date__ = 'September 2017'
|
|
__copyright__ = '(C) 2017, Nyall Dawson'
|
|
|
|
# This will get replaced with a git SHA1 when you do a git archive
|
|
|
|
__revision__ = '$Format:%H$'
|
|
|
|
import os
|
|
|
|
from collections import defaultdict
|
|
|
|
from qgis.PyQt.QtGui import QIcon
|
|
from qgis.PyQt.QtCore import QVariant
|
|
from qgis.core import (NULL,
|
|
QgsField,
|
|
QgsFields,
|
|
QgsFeatureSink,
|
|
QgsFeatureRequest,
|
|
QgsGeometry,
|
|
QgsCoordinateTransform,
|
|
QgsStatisticalSummary,
|
|
QgsDateTimeStatisticalSummary,
|
|
QgsStringStatisticalSummary,
|
|
QgsProcessing,
|
|
QgsProcessingUtils,
|
|
QgsProcessingParameterBoolean,
|
|
QgsProcessingParameterFeatureSource,
|
|
QgsProcessingParameterEnum,
|
|
QgsProcessingParameterField,
|
|
QgsProcessingParameterFeatureSink)
|
|
|
|
from processing.algs.qgis.QgisAlgorithm import QgisAlgorithm
|
|
from processing.tools import vector
|
|
|
|
pluginPath = os.path.split(os.path.split(os.path.dirname(__file__))[0])[0]
|
|
|
|
|
|
class SpatialJoinSummary(QgisAlgorithm):
|
|
INPUT = "INPUT"
|
|
JOIN = "JOIN"
|
|
PREDICATE = "PREDICATE"
|
|
JOIN_FIELDS = "JOIN_FIELDS"
|
|
SUMMARIES = "SUMMARIES"
|
|
DISCARD_NONMATCHING = "DISCARD_NONMATCHING"
|
|
OUTPUT = "OUTPUT"
|
|
|
|
def icon(self):
|
|
return QIcon(os.path.join(pluginPath, 'images', 'ftools', 'join_location.png'))
|
|
|
|
def group(self):
|
|
return self.tr('Vector general')
|
|
|
|
def __init__(self):
|
|
super().__init__()
|
|
|
|
def initAlgorithm(self, config=None):
|
|
self.predicates = (
|
|
('intersects', self.tr('intersects')),
|
|
('contains', self.tr('contains')),
|
|
('equals', self.tr('equals')),
|
|
('touches', self.tr('touches')),
|
|
('overlaps', self.tr('overlaps')),
|
|
('within', self.tr('within')),
|
|
('crosses', self.tr('crosses')))
|
|
|
|
self.statistics = [
|
|
('count', self.tr('count')),
|
|
('unique', self.tr('unique')),
|
|
('min', self.tr('min')),
|
|
('max', self.tr('max')),
|
|
('range', self.tr('range')),
|
|
('sum', self.tr('sum')),
|
|
('mean', self.tr('mean')),
|
|
('median', self.tr('median')),
|
|
('stddev', self.tr('stddev')),
|
|
('minority', self.tr('minority')),
|
|
('majority', self.tr('majority')),
|
|
('q1', self.tr('q1')),
|
|
('q3', self.tr('q3')),
|
|
('iqr', self.tr('iqr')),
|
|
('empty', self.tr('empty')),
|
|
('filled', self.tr('filled')),
|
|
('min_length', self.tr('min_length')),
|
|
('max_length', self.tr('max_length')),
|
|
('mean_length', self.tr('mean_length'))]
|
|
|
|
self.addParameter(QgsProcessingParameterFeatureSource(self.INPUT,
|
|
self.tr('Input layer'),
|
|
[QgsProcessing.TypeVectorAnyGeometry]))
|
|
self.addParameter(QgsProcessingParameterFeatureSource(self.JOIN,
|
|
self.tr('Join layer'),
|
|
[QgsProcessing.TypeVectorAnyGeometry]))
|
|
predicate = QgsProcessingParameterEnum(self.PREDICATE,
|
|
self.tr('Geometric predicate'),
|
|
options=[p[1] for p in self.predicates],
|
|
allowMultiple=True, defaultValue=[0])
|
|
predicate.setMetadata({
|
|
'widget_wrapper': {
|
|
'class': 'processing.gui.wrappers.EnumWidgetWrapper',
|
|
'useCheckBoxes': True,
|
|
'columns': 2}})
|
|
self.addParameter(predicate)
|
|
self.addParameter(QgsProcessingParameterField(self.JOIN_FIELDS,
|
|
self.tr('Fields to summarise (leave empty to use all fields)'),
|
|
parentLayerParameterName=self.JOIN,
|
|
allowMultiple=True, optional=True))
|
|
self.addParameter(QgsProcessingParameterEnum(self.SUMMARIES,
|
|
self.tr(
|
|
'Summaries to calculate (leave empty to use all available)'),
|
|
options=[p[1] for p in self.statistics],
|
|
allowMultiple=True, optional=True))
|
|
self.addParameter(QgsProcessingParameterBoolean(self.DISCARD_NONMATCHING,
|
|
self.tr('Discard records which could not be joined'),
|
|
defaultValue=False))
|
|
self.addParameter(QgsProcessingParameterFeatureSink(self.OUTPUT,
|
|
self.tr('Joined layer')))
|
|
|
|
def name(self):
|
|
return 'joinbylocationsummary'
|
|
|
|
def displayName(self):
|
|
return self.tr('Join attributes by location (summary)')
|
|
|
|
def tags(self):
|
|
return self.tr(
|
|
"summary,aggregate,join,intersects,intersecting,touching,within,contains,overlaps,relation,spatial").split(
|
|
',')
|
|
|
|
def processAlgorithm(self, parameters, context, feedback):
|
|
source = self.parameterAsSource(parameters, self.INPUT, context)
|
|
join_source = self.parameterAsSource(parameters, self.JOIN, context)
|
|
join_fields = self.parameterAsFields(parameters, self.JOIN_FIELDS, context)
|
|
discard_nomatch = self.parameterAsBool(parameters, self.DISCARD_NONMATCHING, context)
|
|
summaries = [self.statistics[i][0] for i in
|
|
sorted(self.parameterAsEnums(parameters, self.SUMMARIES, context))]
|
|
|
|
if not summaries:
|
|
# none selected, so use all
|
|
summaries = [s[0] for s in self.statistics]
|
|
|
|
source_fields = source.fields()
|
|
fields_to_join = QgsFields()
|
|
join_field_indexes = []
|
|
if not join_fields:
|
|
# no fields selected, use all
|
|
join_fields = [join_source.fields().at(i).name() for i in range(len(join_source.fields()))]
|
|
|
|
def addFieldKeepType(original, stat):
|
|
"""
|
|
Adds a field to the output, keeping the same data type as the original
|
|
"""
|
|
field = QgsField(original)
|
|
field.setName(field.name() + '_' + stat)
|
|
fields_to_join.append(field)
|
|
|
|
def addField(original, stat, type):
|
|
"""
|
|
Adds a field to the output, with a specified type
|
|
"""
|
|
field = QgsField(original)
|
|
field.setName(field.name() + '_' + stat)
|
|
field.setType(type)
|
|
if type == QVariant.Double:
|
|
field.setLength(20)
|
|
field.setPrecision(6)
|
|
fields_to_join.append(field)
|
|
|
|
numeric_fields = (
|
|
('count', QVariant.Int, 'count'),
|
|
('unique', QVariant.Int, 'variety'),
|
|
('min', QVariant.Double, 'min'),
|
|
('max', QVariant.Double, 'max'),
|
|
('range', QVariant.Double, 'range'),
|
|
('sum', QVariant.Double, 'sum'),
|
|
('mean', QVariant.Double, 'mean'),
|
|
('median', QVariant.Double, 'median'),
|
|
('stddev', QVariant.Double, 'stDev'),
|
|
('minority', QVariant.Double, 'minority'),
|
|
('majority', QVariant.Double, 'majority'),
|
|
('q1', QVariant.Double, 'firstQuartile'),
|
|
('q3', QVariant.Double, 'thirdQuartile'),
|
|
('iqr', QVariant.Double, 'interQuartileRange')
|
|
)
|
|
|
|
datetime_fields = (
|
|
('count', QVariant.Int, 'count'),
|
|
('unique', QVariant.Int, 'countDistinct'),
|
|
('empty', QVariant.Int, 'countMissing'),
|
|
('filled', QVariant.Int),
|
|
('min', None),
|
|
('max', None)
|
|
)
|
|
|
|
string_fields = (
|
|
('count', QVariant.Int, 'count'),
|
|
('unique', QVariant.Int, 'countDistinct'),
|
|
('empty', QVariant.Int, 'countMissing'),
|
|
('filled', QVariant.Int),
|
|
('min', None, 'min'),
|
|
('max', None, 'max'),
|
|
('min_length', QVariant.Int, 'minLength'),
|
|
('max_length', QVariant.Int, 'maxLength'),
|
|
('mean_length', QVariant.Double, 'meanLength')
|
|
)
|
|
|
|
field_types = []
|
|
for f in join_fields:
|
|
idx = join_source.fields().lookupField(f)
|
|
if idx >= 0:
|
|
join_field_indexes.append(idx)
|
|
|
|
join_field = join_source.fields().at(idx)
|
|
if join_field.isNumeric():
|
|
field_types.append('numeric')
|
|
field_list = numeric_fields
|
|
elif join_field.type() in (QVariant.Date, QVariant.Time, QVariant.DateTime):
|
|
field_types.append('datetime')
|
|
field_list = datetime_fields
|
|
else:
|
|
field_types.append('string')
|
|
field_list = string_fields
|
|
|
|
for f in field_list:
|
|
if f[0] in summaries:
|
|
if f[1] is not None:
|
|
addField(join_field, f[0], f[1])
|
|
else:
|
|
addFieldKeepType(join_field, f[0])
|
|
|
|
out_fields = QgsProcessingUtils.combineFields(source_fields, fields_to_join)
|
|
|
|
(sink, dest_id) = self.parameterAsSink(parameters, self.OUTPUT, context,
|
|
out_fields, source.wkbType(), source.sourceCrs())
|
|
|
|
# do the join
|
|
predicates = [self.predicates[i][0] for i in self.parameterAsEnums(parameters, self.PREDICATE, context)]
|
|
|
|
features = source.getFeatures()
|
|
total = 100.0 / source.featureCount() if source.featureCount() else 0
|
|
|
|
# bounding box transform
|
|
bbox_transform = QgsCoordinateTransform(source.sourceCrs(), join_source.sourceCrs())
|
|
|
|
for current, f in enumerate(features):
|
|
if feedback.isCanceled():
|
|
break
|
|
|
|
if not f.hasGeometry():
|
|
if not discard_nomatch:
|
|
sink.addFeature(f, QgsFeatureSink.FastInsert)
|
|
continue
|
|
|
|
bbox = bbox_transform.transformBoundingBox(f.geometry().boundingBox())
|
|
engine = None
|
|
|
|
values = []
|
|
|
|
request = QgsFeatureRequest().setFilterRect(bbox).setSubsetOfAttributes(join_field_indexes).setDestinationCrs(source.sourceCrs())
|
|
for test_feat in join_source.getFeatures(request):
|
|
if feedback.isCanceled():
|
|
break
|
|
|
|
join_attributes = []
|
|
for a in join_field_indexes:
|
|
join_attributes.append(test_feat.attributes()[a])
|
|
|
|
if engine is None:
|
|
engine = QgsGeometry.createGeometryEngine(f.geometry().constGet())
|
|
engine.prepareGeometry()
|
|
|
|
for predicate in predicates:
|
|
if getattr(engine, predicate)(test_feat.geometry().constGet()):
|
|
values.append(join_attributes)
|
|
break
|
|
|
|
feedback.setProgress(int(current * total))
|
|
|
|
if len(values) == 0:
|
|
if discard_nomatch:
|
|
continue
|
|
else:
|
|
sink.addFeature(f, QgsFeatureSink.FastInsert)
|
|
else:
|
|
attrs = f.attributes()
|
|
for i in range(len(join_field_indexes)):
|
|
attribute_values = [v[i] for v in values]
|
|
field_type = field_types[i]
|
|
if field_type == 'numeric':
|
|
stat = QgsStatisticalSummary()
|
|
for v in attribute_values:
|
|
stat.addVariant(v)
|
|
stat.finalize()
|
|
for s in numeric_fields:
|
|
if s[0] in summaries:
|
|
attrs.append(getattr(stat, s[2])())
|
|
elif field_type == 'datetime':
|
|
stat = QgsDateTimeStatisticalSummary()
|
|
stat.calculate(attribute_values)
|
|
for s in datetime_fields:
|
|
if s[0] in summaries:
|
|
if s[0] == 'filled':
|
|
attrs.append(stat.count() - stat.countMissing())
|
|
elif s[0] == 'min':
|
|
attrs.append(stat.statistic(QgsDateTimeStatisticalSummary.Min))
|
|
elif s[0] == 'max':
|
|
attrs.append(stat.statistic(QgsDateTimeStatisticalSummary.Max))
|
|
else:
|
|
attrs.append(getattr(stat, s[2])())
|
|
else:
|
|
stat = QgsStringStatisticalSummary()
|
|
for v in attribute_values:
|
|
if v == NULL:
|
|
stat.addString('')
|
|
else:
|
|
stat.addString(str(v))
|
|
stat.finalize()
|
|
for s in string_fields:
|
|
if s[0] in summaries:
|
|
if s[0] == 'filled':
|
|
attrs.append(stat.count() - stat.countMissing())
|
|
else:
|
|
attrs.append(getattr(stat, s[2])())
|
|
|
|
f.setAttributes(attrs)
|
|
sink.addFeature(f, QgsFeatureSink.FastInsert)
|
|
|
|
return {self.OUTPUT: dest_id}
|