skipHiveColumnLineageHive20633InputsThreshold=atlasProperties.getInt(HOOK_SKIP_HIVE_COLUMN_LINEAGE_HIVE_20633_INPUTS_THRESHOLD,15);// skip if avg # of inputs is > 15
largeMessageProcessingTimeThresholdMs=applicationProperties.getInt("atlas.notification.consumer.large.message.processing.time.threshold.ms",60*1000);// 60 sec by default
// check whether all hive_column_lineage entities have the same number of inputs; this is likely caused by HIVE-20633, which results in incorrect lineage in some cases
@@ -777,11 +880,38 @@ public class NotificationHookConsumer implements Service, ActiveStateChangeHandl
}
if(numRemovedEntities>0){
LOG.warn("removed {} hive_column_lineage entities. Average # of inputs={}, threshold={}, total # of inputs={}. topic-offset={}, partition={}",numRemovedEntities,avgInputsCount,skipHiveColumnLineageHive20633InputsThreshold,lineageInputsCount,kafkaMessage.getOffset(),kafkaMessage.getPartition());
LOG.warn("removed {} hive_column_lineage entities. Average # of inputs={}, threshold={}, total # of inputs={}. topic-offset={}, partition={}",numRemovedEntities,avgInputsCount,skipHiveColumnLineageHive20633InputsThreshold,lineageInputsCount,context.getKafkaMessageOffset(),context.getKafkaPartition());