QGIS API Documentation 4.1.0-Master (5bf3c20f3c9)
Loading...
Searching...
No Matches
qgsalgorithmjoinbynearest.cpp
Go to the documentation of this file.
1/***************************************************************************
2 qgsalgorithmjoinbynearest.cpp
3 ---------------------
4 begin : April 2017
5 copyright : (C) 2017 by Nyall Dawson
6 email : nyall dot dawson at gmail dot com
7 ***************************************************************************/
8
9/***************************************************************************
10 * *
11 * This program is free software; you can redistribute it and/or modify *
12 * it under the terms of the GNU General Public License as published by *
13 * the Free Software Foundation; either version 2 of the License, or *
14 * (at your option) any later version. *
15 * *
16 ***************************************************************************/
17
19
20#include <algorithm>
21
22#include "qgslinestring.h"
24#include "qgsspatialindex.h"
25
26#include <QString>
27
28using namespace Qt::StringLiterals;
29
31
32QString QgsJoinByNearestAlgorithm::name() const
33{
34 return u"joinbynearest"_s;
35}
36
37QString QgsJoinByNearestAlgorithm::displayName() const
38{
39 return QObject::tr( "Join attributes by nearest" );
40}
41
42QStringList QgsJoinByNearestAlgorithm::tags() const
43{
44 return QObject::tr( "join,connect,attributes,values,fields,tables,proximity,closest,neighbour,neighbor,n-nearest,distance" ).split( ',' );
45}
46
47QString QgsJoinByNearestAlgorithm::group() const
48{
49 return QObject::tr( "Vector general" );
50}
51
52QString QgsJoinByNearestAlgorithm::groupId() const
53{
54 return u"vectorgeneral"_s;
55}
56
57void QgsJoinByNearestAlgorithm::initAlgorithm( const QVariantMap & )
58{
59 addParameter( new QgsProcessingParameterFeatureSource( u"INPUT"_s, QObject::tr( "Input layer" ) ) );
60 addParameter( new QgsProcessingParameterFeatureSource( u"INPUT_2"_s, QObject::tr( "Input layer 2" ) ) );
61
62 addParameter(
63 new QgsProcessingParameterField( u"FIELDS_TO_COPY"_s, QObject::tr( "Layer 2 fields to copy (leave empty to copy all fields)" ), QVariant(), u"INPUT_2"_s, Qgis::ProcessingFieldParameterDataType::Any, true, true )
64 );
65
66 addParameter( new QgsProcessingParameterBoolean( u"DISCARD_NONMATCHING"_s, QObject::tr( "Discard records which could not be joined" ), false ) );
67
68 addParameter( new QgsProcessingParameterString( u"PREFIX"_s, QObject::tr( "Joined field prefix" ), QVariant(), false, true ) );
69
70 addParameter( new QgsProcessingParameterNumber( u"NEIGHBORS"_s, QObject::tr( "Maximum nearest neighbors" ), Qgis::ProcessingNumberParameterType::Integer, 1, false, 1 ) );
71
72 addParameter( new QgsProcessingParameterDistance( u"MAX_DISTANCE"_s, QObject::tr( "Maximum distance" ), QVariant(), u"INPUT"_s, true, 0 ) );
73
74 addParameter( new QgsProcessingParameterFeatureSink( u"OUTPUT"_s, QObject::tr( "Joined layer" ), Qgis::ProcessingSourceType::VectorAnyGeometry, QVariant(), true, true ) );
75
76 auto nonMatchingSink
77 = std::make_unique<QgsProcessingParameterFeatureSink>( u"NON_MATCHING"_s, QObject::tr( "Unjoinable features from first layer" ), Qgis::ProcessingSourceType::VectorAnyGeometry, QVariant(), true, false );
78 // TODO GUI doesn't support advanced outputs yet
79 //nonMatchingSink->setFlags(nonMatchingSink->flags() | Qgis::ProcessingParameterFlag::Advanced );
80 addParameter( nonMatchingSink.release() );
81
82 addOutput( new QgsProcessingOutputNumber( u"JOINED_COUNT"_s, QObject::tr( "Number of joined features from input table" ) ) );
83 addOutput( new QgsProcessingOutputNumber( u"UNJOINABLE_COUNT"_s, QObject::tr( "Number of unjoinable features from input table" ) ) );
84}
85
86QString QgsJoinByNearestAlgorithm::shortHelpString() const
87{
88 return QObject::tr(
89 "This algorithm takes an input vector layer and creates a new vector layer that is an extended version of the "
90 "input one, with additional attributes in its attribute table.\n\n"
91 "The additional attributes and their values are taken from a second vector layer, where features are joined "
92 "by finding the closest features from each layer. By default only the single nearest feature is joined,"
93 "but optionally the join can use the n-nearest neighboring features instead. If multiple features are found "
94 "with identical distances these will all be returned (even if the total number of features exceeds the specified "
95 "maximum feature count).\n\n"
96 "If a maximum distance is specified, then only features which are closer than this distance "
97 "will be matched.\n\n"
98 "The output features will contain the selected attributes from the nearest feature, "
99 "along with new attributes for the distance to the near feature, the index of the feature, "
100 "and the coordinates of the closest point on the input feature (feature_x, feature_y) "
101 "to the matched nearest feature, and the coordinates of the closet point on the matched feature "
102 "(nearest_x, nearest_y).\n\n"
103 "This algorithm uses purely Cartesian calculations for distance, and does not consider "
104 "geodetic or ellipsoid properties when determining feature proximity."
105 );
106}
107
108QString QgsJoinByNearestAlgorithm::shortDescription() const
109{
110 return QObject::tr( "Joins a layer to another layer, using the closest features (nearest neighbors)." );
111}
112
113Qgis::ProcessingAlgorithmDocumentationFlags QgsJoinByNearestAlgorithm::documentationFlags() const
114{
116}
117
118QgsJoinByNearestAlgorithm *QgsJoinByNearestAlgorithm::createInstance() const
119{
120 return new QgsJoinByNearestAlgorithm();
121}
122
123QVariantMap QgsJoinByNearestAlgorithm::processAlgorithm( const QVariantMap &parameters, QgsProcessingContext &context, QgsProcessingFeedback *feedback )
124{
125 const int neighbors = parameterAsInt( parameters, u"NEIGHBORS"_s, context );
126 const bool discardNonMatching = parameterAsBoolean( parameters, u"DISCARD_NONMATCHING"_s, context );
127 const double maxDistance = parameters.value( u"MAX_DISTANCE"_s ).isValid() ? parameterAsDouble( parameters, u"MAX_DISTANCE"_s, context ) : std::numeric_limits<double>::quiet_NaN();
128 std::unique_ptr<QgsProcessingFeatureSource> input( parameterAsSource( parameters, u"INPUT"_s, context ) );
129 if ( !input )
130 throw QgsProcessingException( invalidSourceError( parameters, u"INPUT"_s ) );
131
132 std::unique_ptr<QgsProcessingFeatureSource> input2( parameterAsSource( parameters, u"INPUT_2"_s, context ) );
133 if ( !input2 )
134 throw QgsProcessingException( invalidSourceError( parameters, u"INPUT_2"_s ) );
135
136 const bool sameSourceAndTarget = parameters.value( u"INPUT"_s ) == parameters.value( u"INPUT_2"_s );
137
138 const QString prefix = parameterAsString( parameters, u"PREFIX"_s, context );
139 const QStringList fieldsToCopy = parameterAsStrings( parameters, u"FIELDS_TO_COPY"_s, context );
140
141 QgsFields outFields2;
142 QgsAttributeList fields2Indices;
143 if ( fieldsToCopy.empty() )
144 {
145 outFields2 = input2->fields();
146 fields2Indices.reserve( outFields2.count() );
147 for ( int i = 0; i < outFields2.count(); ++i )
148 {
149 fields2Indices << i;
150 }
151 }
152 else
153 {
154 fields2Indices.reserve( fieldsToCopy.count() );
155 for ( const QString &field : fieldsToCopy )
156 {
157 const int index = input2->fields().lookupField( field );
158 if ( index >= 0 )
159 {
160 fields2Indices << index;
161 outFields2.append( input2->fields().at( index ) );
162 }
163 }
164 }
165
166 if ( !prefix.isEmpty() )
167 {
168 for ( int i = 0; i < outFields2.count(); ++i )
169 {
170 outFields2.rename( i, prefix + outFields2[i].name() );
171 }
172 }
173
174 const QgsAttributeList fields2Fetch = fields2Indices;
175
176 QgsFields outFields = QgsProcessingUtils::combineFields( input->fields(), outFields2 );
177
178 QgsFields resultFields;
179 resultFields.append( QgsField( u"n"_s, QMetaType::Type::Int ) );
180 resultFields.append( QgsField( u"distance"_s, QMetaType::Type::Double ) );
181 resultFields.append( QgsField( u"feature_x"_s, QMetaType::Type::Double ) );
182 resultFields.append( QgsField( u"feature_y"_s, QMetaType::Type::Double ) );
183 resultFields.append( QgsField( u"nearest_x"_s, QMetaType::Type::Double ) );
184 resultFields.append( QgsField( u"nearest_y"_s, QMetaType::Type::Double ) );
185 outFields = QgsProcessingUtils::combineFields( outFields, resultFields );
186
187 QString dest;
188 std::unique_ptr<QgsFeatureSink> sink( parameterAsSink( parameters, u"OUTPUT"_s, context, dest, outFields, input->wkbType(), input->sourceCrs(), QgsFeatureSink::RegeneratePrimaryKey ) );
189 if ( parameters.value( u"OUTPUT"_s ).isValid() && !sink )
190 throw QgsProcessingException( invalidSinkError( parameters, u"OUTPUT"_s ) );
191
192 QString destNonMatching1;
193 std::unique_ptr<QgsFeatureSink> sinkNonMatching1(
194 parameterAsSink( parameters, u"NON_MATCHING"_s, context, destNonMatching1, input->fields(), input->wkbType(), input->sourceCrs(), QgsFeatureSink::RegeneratePrimaryKey )
195 );
196 if ( parameters.value( u"NON_MATCHING"_s ).isValid() && !sinkNonMatching1 )
197 throw QgsProcessingException( invalidSinkError( parameters, u"NON_MATCHING"_s ) );
198
199 // make spatial index
200 const QgsFeatureIterator f2 = input2->getFeatures( QgsFeatureRequest().setDestinationCrs( input->sourceCrs(), context.transformContext() ).setSubsetOfAttributes( fields2Fetch ) );
201 QHash<QgsFeatureId, QgsAttributes> input2AttributeCache;
202 double step = input2->featureCount() > 0 ? 50.0 / input2->featureCount() : 1;
203 int i = 0;
204 const QgsSpatialIndex index(
205 f2,
206 [&]( const QgsFeature &f ) -> bool {
207 i++;
208 if ( feedback->isCanceled() )
209 return false;
210
211 feedback->setProgress( i * step );
212
213 if ( !f.hasGeometry() )
214 return true;
215
216 // only keep selected attributes
217 QgsAttributes attributes;
218 for ( int field2Index : fields2Indices )
219 {
220 attributes << f.attribute( field2Index );
221 }
222 input2AttributeCache.insert( f.id(), attributes );
223
224 return true;
225 },
227 );
228
229 QgsFeature f;
230
231 // create extra null attributes for non-matched records (the +2 is for the "n" and "distance", and start/end x/y fields)
232 QgsAttributes nullMatch;
233 nullMatch.reserve( fields2Indices.size() + 6 );
234 for ( int i = 0; i < fields2Indices.count() + 6; ++i )
235 nullMatch << QVariant();
236
237 long long joinedCount = 0;
238 long long unjoinedCount = 0;
239
240 // Create output vector layer with additional attributes
241 step = input->featureCount() > 0 ? 50.0 / input->featureCount() : 1;
242 QgsFeatureIterator features = input->getFeatures();
243 i = 0;
244 while ( features.nextFeature( f ) )
245 {
246 i++;
247 if ( feedback->isCanceled() )
248 {
249 break;
250 }
251
252 feedback->setProgress( 50 + i * step );
253
254 if ( !f.hasGeometry() )
255 {
256 unjoinedCount++;
257 if ( sinkNonMatching1 )
258 {
259 if ( !sinkNonMatching1->addFeature( f, QgsFeatureSink::FastInsert ) )
260 throw QgsProcessingException( writeFeatureError( sinkNonMatching1.get(), parameters, u"NON_MATCHING"_s ) );
261 }
262 if ( sink && !discardNonMatching )
263 {
264 QgsAttributes attr = f.attributes();
265 attr.append( nullMatch );
266 f.setAttributes( attr );
267 if ( !sink->addFeature( f, QgsFeatureSink::FastInsert ) )
268 throw QgsProcessingException( writeFeatureError( sink.get(), parameters, u"OUTPUT"_s ) );
269 }
270 }
271 else
272 {
273 // note - if using same source as target, we have to get one extra neighbor, since the first match will be the input feature
274
275 // if the user didn't specify a distance (isnan), then use 0 for nearestNeighbor() parameter
276 // if the user specified 0 exactly, then use the smallest positive double value instead
277 const double searchDistance = std::isnan( maxDistance ) ? 0 : std::max( std::numeric_limits<double>::min(), maxDistance );
278 const QList<QgsFeatureId> nearest = index.nearestNeighbor( f.geometry(), neighbors + ( sameSourceAndTarget ? 1 : 0 ), searchDistance );
279
280 if ( nearest.count() > neighbors + ( sameSourceAndTarget ? 1 : 0 ) )
281 {
282 feedback->pushInfo(
283 QObject::tr( "Multiple matching features found at same distance from search feature, found %n feature(s) instead of %1", nullptr, nearest.count() - ( sameSourceAndTarget ? 1 : 0 ) ).arg( neighbors )
284 );
285 }
286 QgsFeature out;
287 out.setGeometry( f.geometry() );
288 int j = 0;
289 for ( const QgsFeatureId id : nearest )
290 {
291 if ( sameSourceAndTarget && id == f.id() )
292 continue; // don't match to same feature if using a single input table
293 j++;
294 if ( sink )
295 {
296 QgsAttributes attr = f.attributes();
297 attr.append( input2AttributeCache.value( id ) );
298 attr.append( j );
299
300 const QgsGeometry closestLine = f.geometry().shortestLine( index.geometry( id ) );
301 if ( const QgsLineString *line = qgsgeometry_cast<const QgsLineString *>( closestLine.constGet() ) )
302 {
303 attr.append( line->length() );
304 attr.append( line->startPoint().x() );
305 attr.append( line->startPoint().y() );
306 attr.append( line->endPoint().x() );
307 attr.append( line->endPoint().y() );
308 }
309 else
310 {
311 attr.append( QVariant() ); //distance
312 attr.append( QVariant() ); //start x
313 attr.append( QVariant() ); //start y
314 attr.append( QVariant() ); //end x
315 attr.append( QVariant() ); //end y
316 }
317 out.setAttributes( attr );
318 if ( !sink->addFeature( out, QgsFeatureSink::FastInsert ) )
319 throw QgsProcessingException( writeFeatureError( sink.get(), parameters, u"OUTPUT"_s ) );
320 }
321 }
322 if ( j > 0 )
323 joinedCount++;
324 else
325 {
326 if ( sinkNonMatching1 )
327 {
328 if ( !sinkNonMatching1->addFeature( f, QgsFeatureSink::FastInsert ) )
329 throw QgsProcessingException( writeFeatureError( sinkNonMatching1.get(), parameters, u"NON_MATCHING"_s ) );
330 }
331 if ( !discardNonMatching && sink )
332 {
333 QgsAttributes attr = f.attributes();
334 attr.append( nullMatch );
335 f.setAttributes( attr );
336 if ( !sink->addFeature( f, QgsFeatureSink::FastInsert ) )
337 throw QgsProcessingException( writeFeatureError( sink.get(), parameters, u"OUTPUT"_s ) );
338 }
339 unjoinedCount++;
340 }
341 }
342 }
343
344 QVariantMap outputs;
345 outputs.insert( u"JOINED_COUNT"_s, joinedCount );
346 outputs.insert( u"UNJOINABLE_COUNT"_s, unjoinedCount );
347 if ( sink )
348 {
349 sink->finalize();
350 outputs.insert( u"OUTPUT"_s, dest );
351 }
352 if ( sinkNonMatching1 )
353 {
354 sinkNonMatching1->finalize();
355 outputs.insert( u"NON_MATCHING"_s, destNonMatching1 );
356 }
357 return outputs;
358}
359
360
@ VectorAnyGeometry
Any vector layer with geometry.
Definition qgis.h:3647
@ RegeneratesPrimaryKey
Algorithm always drops any existing primary keys or FID values and regenerates them in outputs.
Definition qgis.h:3734
QFlags< ProcessingAlgorithmDocumentationFlag > ProcessingAlgorithmDocumentationFlags
Flags describing algorithm behavior for documentation purposes.
Definition qgis.h:3745
A vector of attributes.
Wrapper for iterator of features from vector data provider or vector layer.
bool nextFeature(QgsFeature &f)
Fetch next feature and stores in f, returns true on success.
Wraps a request for features to a vector layer (or directly its vector data provider).
QgsFeatureRequest & setSubsetOfAttributes(const QgsAttributeList &attrs)
Set a subset of attributes that will be fetched.
@ FastInsert
Use faster inserts, at the cost of updating the passed features to reflect changes made at the provid...
@ RegeneratePrimaryKey
This flag indicates, that a primary key field cannot be guaranteed to be unique and the sink should i...
The feature class encapsulates a single feature including its unique ID, geometry and a list of field...
Definition qgsfeature.h:60
QgsFeatureId id
Definition qgsfeature.h:68
void setAttributes(const QgsAttributes &attrs)
Sets the feature's attributes.
bool hasGeometry() const
Returns true if the feature has an associated geometry.
Q_INVOKABLE QVariant attribute(const QString &name) const
Lookup attribute value by attribute name.
void setGeometry(const QgsGeometry &geometry)
Set the feature's geometry.
bool isCanceled() const
Tells whether the operation has been canceled already.
Definition qgsfeedback.h:56
void setProgress(double progress)
Sets the current progress for the feedback object.
Definition qgsfeedback.h:65
Encapsulate a field in an attribute table or data source.
Definition qgsfield.h:56
Container of fields for a vector layer.
Definition qgsfields.h:46
bool append(const QgsField &field, Qgis::FieldOrigin origin=Qgis::FieldOrigin::Provider, int originIndex=-1)
Appends a field.
Definition qgsfields.cpp:75
int count
Definition qgsfields.h:50
bool rename(int fieldIdx, const QString &name)
Renames a name of field.
A geometry is the spatial representation of a feature.
const QgsAbstractGeometry * constGet() const
Returns a non-modifiable (const) reference to the underlying abstract geometry primitive.
QgsGeometry shortestLine(const QgsGeometry &other) const
Returns the shortest line joining this geometry to another geometry.
Line string geometry type, with support for z-dimension and m-values.
Contains information about the context in which a processing algorithm is executed.
QgsCoordinateTransformContext transformContext() const
Returns the coordinate transform context.
Custom exception class for processing related exceptions.
Base class for providing feedback from a processing algorithm.
virtual void pushInfo(const QString &info)
Pushes a general informational message from the algorithm.
A numeric output for processing algorithms.
A boolean parameter for processing algorithms.
A double numeric parameter for distance values.
A feature sink output for processing algorithms.
An input feature source (such as vector layers) parameter for processing algorithms.
A vector layer or feature source field parameter for processing algorithms.
A numeric parameter for processing algorithms.
A string parameter for processing algorithms.
static QgsFields combineFields(const QgsFields &fieldsA, const QgsFields &fieldsB, const QString &fieldsBPrefix=QString())
Combines two field lists, avoiding duplicate field names (in a case-insensitive manner).
A spatial index for QgsFeature objects.
@ FlagStoreFeatureGeometries
Indicates that the spatial index should also store feature geometries. This requires more memory,...
T qgsgeometry_cast(QgsAbstractGeometry *geom)
qint64 QgsFeatureId
64 bit feature ids negative numbers are used for uncommitted/newly added features
QList< int > QgsAttributeList
Definition qgsfield.h:30