22 QString QgsRemoveDuplicatesByAttributeAlgorithm::name()
 const 
   24   return QStringLiteral( 
"removeduplicatesbyattribute" );
 
   27 QString QgsRemoveDuplicatesByAttributeAlgorithm::displayName()
 const 
   29   return QObject::tr( 
"Delete duplicates by attribute" );
 
   32 QStringList QgsRemoveDuplicatesByAttributeAlgorithm::tags()
 const 
   34   return QObject::tr( 
"drop,remove,field,value,same,filter" ).split( 
',' );
 
   37 QString QgsRemoveDuplicatesByAttributeAlgorithm::group()
 const 
   39   return QObject::tr( 
"Vector general" );
 
   42 QString QgsRemoveDuplicatesByAttributeAlgorithm::groupId()
 const 
   44   return QStringLiteral( 
"vectorgeneral" );
 
   // Declares parameters and outputs for the algorithm. The QVariantMap
   // argument is unnamed and is not used by any statement visible here.
   // NOTE(review): this listing is an extract with gaps - the braces and the
   // statements between the signature and addParameter( failOutput ) are not
   // shown, so the construction of `failOutput` (and any other parameters)
   // must be confirmed against the complete file.
   47 void QgsRemoveDuplicatesByAttributeAlgorithm::initAlgorithm( 
const QVariantMap & )
 
   // Registers `failOutput` as a parameter; its definition is not visible in this extract.
   57   addParameter( failOutput );
 
   // Numeric output "RETAINED_COUNT", described as the count of retained records.
   59   addOutput( 
new QgsProcessingOutputNumber( QStringLiteral( 
"RETAINED_COUNT" ), QObject::tr( 
"Count of retained records" ) ) );
 
   // Numeric output "DUPLICATE_COUNT", described as the count of discarded duplicate records.
   60   addOutput( 
new QgsProcessingOutputNumber( QStringLiteral( 
"DUPLICATE_COUNT" ), QObject::tr( 
"Count of discarded duplicate records" ) ) );
 
   63 QString QgsRemoveDuplicatesByAttributeAlgorithm::shortHelpString()
 const 
   65   return QObject::tr( 
"Removes duplicate rows by a field value (or multiple field values). The first matching row will be retained, and duplicates will be discarded.\n\n" 
   66                       "Optionally, these duplicate records can be saved to a separate output for analysis." );
 
   69 QString QgsRemoveDuplicatesByAttributeAlgorithm::shortDescription()
 const 
   71   return QObject::tr( 
"Removes duplicate rows by a field value (or multiple field values)." );
 
   74 QgsRemoveDuplicatesByAttributeAlgorithm *QgsRemoveDuplicatesByAttributeAlgorithm::createInstance()
 const 
   76   return new QgsRemoveDuplicatesByAttributeAlgorithm();
 
   // NOTE(review): the enclosing function signature, all braces and a number
   // of statements are missing from this extract (presumably this is the body
   // of QgsRemoveDuplicatesByAttributeAlgorithm::processAlgorithm - confirm).
   // The comments below describe only the statements that are visible.

   // Resolve the "INPUT" parameter into a feature source.
   81   std::unique_ptr< QgsProcessingFeatureSource > source( parameterAsSource( parameters, QStringLiteral( 
"INPUT" ), context ) );
 
   // Field names selected through the "FIELDS" parameter.
   85   const QStringList fieldNames = parameterAsFields( parameters, QStringLiteral( 
"FIELDS" ), context );
 
   // For each requested field name, look up its index in the source's fields.
   88   for ( 
const QString &
field : fieldNames )
 
   90     const int index = source->fields().lookupField( 
field );
 
   // Reports a "not found ... skipping" message for the field. The condition
   // guarding this call is not visible (presumably a failed lookup - confirm).
   92       feedback->
reportError( QObject::tr( 
"Field %1 not found in INPUT layer, skipping" ).arg( 
field ) );
 
   // Otherwise (branch structure not visible) the index is collected in `attributes`.
   94       attributes.append( index );
 
   // Check for an empty attribute list; the action taken is not visible in this extract.
   96   if ( attributes.isEmpty() )
 
   // Sink for "OUTPUT", created with the source's fields, WKB type and CRS;
   // its identifier is written to noDupeSinkId.
  100   QString noDupeSinkId;
 
  101   std::unique_ptr< QgsFeatureSink > noDupeSink( parameterAsSink( parameters, QStringLiteral( 
"OUTPUT" ), context, noDupeSinkId, source->fields(),
 
  102       source->wkbType(), source->sourceCrs() ) );
 
   // Sink for "DUPLICATES", created with the same fields, WKB type and CRS;
   // the declaration of dupeSinkId is not visible in this extract.
  107   std::unique_ptr< QgsFeatureSink > dupesSink( parameterAsSink( parameters, QStringLiteral( 
"DUPLICATES" ), context, dupeSinkId, source->fields(),
 
  108       source->wkbType(), source->sourceCrs() ) );
 
   // NOTE(review): the feature count is stored in a `long`; if featureCount()
   // returns a wider type this narrows on platforms where long is 32 bits - confirm.
  110   const long count = source->featureCount();
 
   // Percentage covered by one feature; falls back to 1 when count is not positive,
   // which avoids dividing by zero.
  111   double step = count > 0 ? 100.0 / count : 1;
 
   // Counters that are reported below as RETAINED_COUNT and DUPLICATE_COUNT.
  114   long long keptCount = 0;
 
  115   long long discardedCount = 0;
 
   // Set of key value lists; queried with contains() and extended with insert() below.
  117   QSet< QVariantList > matched;
 
   // Key buffer pre-filled with one null QVariant per entry in `attributes`.
  122   QVariantList dupeKey;
 
  123   dupeKey.reserve( attributes.size() );
 
  124   for ( 
int i : attributes )
 
  127     dupeKey.append( QVariant() );
 
   // Loop over the selected attribute indexes; the loop body (and the enclosing
   // feature iteration, if any) is not visible in this extract.
  138     for ( 
int attr : attributes )
 
   // Tests whether the current key is already in `matched`; the branch bodies are
   // not visible apart from the insert below.
  141     if ( matched.contains( dupeKey ) )
 
   // Records the current key in `matched`.
  152       matched.insert( dupeKey );
 
   // Populate the result map with both counters and the OUTPUT sink identifier.
  161   outputs.insert( QStringLiteral( 
"RETAINED_COUNT" ), keptCount );
 
  162   outputs.insert( QStringLiteral( 
"DUPLICATE_COUNT" ), discardedCount );
 
  163   outputs.insert( QStringLiteral( 
"OUTPUT" ), noDupeSinkId );
 
   // The deeper indentation suggests this insert is conditional; the condition
   // is not visible in this extract.
  165     outputs.insert( QStringLiteral( 
"DUPLICATES" ), dupeSinkId );
 
Wrapper for iterator of features from vector data provider or vector layer.
bool nextFeature(QgsFeature &f)
This class wraps a request for features to a vector layer (or directly its vector data provider).
@ FastInsert
Use faster inserts, at the cost of updating the passed features to reflect changes made at the provider.
The feature class encapsulates a single feature including its unique ID, geometry and a list of field/values attributes.
QVariant attribute(const QString &name) const
Lookup attribute value by attribute name.
bool isCanceled() const SIP_HOLDGIL
Tells whether the operation has been canceled already.
void setProgress(double progress)
Sets the current progress for the feedback object.
Contains information about the context in which a processing algorithm is executed.
void setCreateByDefault(bool createByDefault)
Sets whether the destination should be created by default.
Custom exception class for processing related exceptions.
@ FlagSkipGeometryValidityChecks
Invalid geometry checks should always be skipped. This flag can be useful for algorithms which always...
Base class for providing feedback from a processing algorithm.
virtual void reportError(const QString &error, bool fatalError=false)
Reports that the algorithm encountered an error while executing.
A numeric output for processing algorithms.
A feature sink output for processing algorithms.
An input feature source (such as vector layers) parameter for processing algorithms.
A vector layer or feature source field parameter for processing algorithms.
@ TypeVector
Tables (i.e. vector layers with or without geometry). When used for a sink this indicates the sink has no geometry.
@ TypeVectorAnyGeometry
Any vector layer with geometry.
QList< int > QgsAttributeList