22 QString QgsRemoveDuplicatesByAttributeAlgorithm::name()
const 24 return QStringLiteral(
"removeduplicatesbyattribute" );
27 QString QgsRemoveDuplicatesByAttributeAlgorithm::displayName()
const 29 return QObject::tr(
"Delete duplicates by attribute" );
32 QStringList QgsRemoveDuplicatesByAttributeAlgorithm::tags()
const 34 return QObject::tr(
"drop,remove,field,value,same,filter" ).split(
',' );
37 QString QgsRemoveDuplicatesByAttributeAlgorithm::group()
const 39 return QObject::tr(
"Vector general" );
42 QString QgsRemoveDuplicatesByAttributeAlgorithm::groupId()
const 44 return QStringLiteral(
"vectorgeneral" );
47 void QgsRemoveDuplicatesByAttributeAlgorithm::initAlgorithm(
const QVariantMap & )
57 addParameter( failOutput );
59 addOutput(
new QgsProcessingOutputNumber( QStringLiteral(
"RETAINED_COUNT" ), QObject::tr(
"Count of retained records" ) ) );
60 addOutput(
new QgsProcessingOutputNumber( QStringLiteral(
"DUPLICATE_COUNT" ), QObject::tr(
"Count of discarded duplicate records" ) ) );
63 QString QgsRemoveDuplicatesByAttributeAlgorithm::shortHelpString()
const 65 return QObject::tr(
"Removes duplicate rows by a field value (or multiple field values). The first matching row will be retained, and duplicates will be discarded.\n\n" 66 "Optionally, these duplicate records can be saved to a separate output for analysis." );
69 QString QgsRemoveDuplicatesByAttributeAlgorithm::shortDescription()
const 71 return QObject::tr(
"Removes duplicate rows by a field value (or multiple field values)." );
74 QgsRemoveDuplicatesByAttributeAlgorithm *QgsRemoveDuplicatesByAttributeAlgorithm::createInstance()
const 76 return new QgsRemoveDuplicatesByAttributeAlgorithm();
81 std::unique_ptr< QgsProcessingFeatureSource > source( parameterAsSource( parameters, QStringLiteral(
"INPUT" ), context ) );
85 const QStringList fieldNames = parameterAsFields( parameters, QStringLiteral(
"FIELDS" ), context );
88 for (
const QString &field : fieldNames )
90 const int index = source->fields().lookupField( field );
92 feedback->
reportError( QObject::tr(
"Field %1 not found in INPUT layer, skipping" ).arg( field ) );
94 attributes.append( index );
96 if ( attributes.isEmpty() )
100 QString noDupeSinkId;
101 std::unique_ptr< QgsFeatureSink > noDupeSink( parameterAsSink( parameters, QStringLiteral(
"OUTPUT" ), context, noDupeSinkId, source->fields(),
102 source->wkbType(), source->sourceCrs() ) );
107 std::unique_ptr< QgsFeatureSink > dupesSink( parameterAsSink( parameters, QStringLiteral(
"DUPLICATES" ), context, dupeSinkId, source->fields(),
108 source->wkbType(), source->sourceCrs() ) );
110 const long count = source->featureCount();
111 double step = count > 0 ? 100.0 / count : 1;
114 long long keptCount = 0;
115 long long discardedCount = 0;
117 QSet< QVariantList > matched;
122 QVariantList dupeKey;
123 dupeKey.reserve( attributes.size() );
124 for (
int i : attributes )
127 dupeKey.append( QVariant() );
138 for (
int attr : attributes )
141 if ( matched.contains( dupeKey ) )
152 matched.insert( dupeKey );
161 outputs.insert( QStringLiteral(
"RETAINED_COUNT" ), keptCount );
162 outputs.insert( QStringLiteral(
"DUPLICATE_COUNT" ), discardedCount );
163 outputs.insert( QStringLiteral(
"OUTPUT" ), noDupeSinkId );
165 outputs.insert( QStringLiteral(
"DUPLICATES" ), dupeSinkId );
Wrapper for iterator of features from vector data provider or vector layer.
Use faster inserts, at the cost of updating the passed features to reflect changes made at the provid...
Base class for providing feedback from a processing algorithm.
Invalid geometry checks should always be skipped. This flag can be useful for algorithms which always...
A vector layer or feature source field parameter for processing algorithms.
void setProgress(double progress)
Sets the current progress for the feedback object.
A numeric output for processing algorithms.
The feature class encapsulates a single feature including its id, geometry and a list of field/values...
A feature sink output for processing algorithms.
This class wraps a request for features to a vector layer (or directly its vector data provider)...
Custom exception class for processing related exceptions.
void setCreateByDefault(bool createByDefault)
Sets whether the destination should be created by default.
bool isCanceled() const
Tells whether the operation has been canceled already.
An input feature source (such as vector layers) parameter for processing algorithms.
Tables (i.e. vector layers with or without geometry). When used for a sink this indicates the sink ha...
QList< int > QgsAttributeList
bool nextFeature(QgsFeature &f)
QVariant attribute(const QString &name) const
Lookup attribute value from attribute name.
Contains information about the context in which a processing algorithm is executed.
virtual void reportError(const QString &error, bool fatalError=false)
Reports that the algorithm encountered an error while executing.
Any vector layer with geometry.