// Initializes the HIVE-20633 column-lineage input threshold from atlasProperties, keyed by
// HOOK_SKIP_HIVE_COLUMN_LINEAGE_HIVE_20633_INPUTS_THRESHOLD; the second argument (5, then 15) is
// presumably the fallback used when the property is not configured - TODO confirm against getInt().
// NOTE(review): the same field is assigned twice in a row, so the first value (default 5) is
// immediately overwritten by the second (default 15). These look like the before/after lines of a
// patch; confirm which single assignment is meant to remain.
skipHiveColumnLineageHive20633InputsThreshold=atlasProperties.getInt(HOOK_SKIP_HIVE_COLUMN_LINEAGE_HIVE_20633_INPUTS_THRESHOLD,5);// skip greater-than 5 inputs by default
skipHiveColumnLineageHive20633InputsThreshold=atlasProperties.getInt(HOOK_SKIP_HIVE_COLUMN_LINEAGE_HIVE_20633_INPUTS_THRESHOLD,15);// skip if avg # of inputs is > 15
// Warns that hive_column_lineage entities were skipped. The first message reports the entity count
// and a single per-entity input size (lineageInputsSize); the second reports the entity count, the
// average input count, the configured threshold read from the context, and the total input count.
// NOTE(review): both statements describe the same event with different arguments, and
// avgInputsCount / lineageInputsCount are not defined in the visible code. These look like the
// before/after lines of a patch; confirm which single warning is meant to remain.
LOG.warn("skipping {} hive_column_lineage entities, each having {} inputs",columnLineages.size(),lineageInputsSize);
LOG.warn("skipped {} hive_column_lineage entities. Average # of inputs={}, threshold={}, total # of inputs={}",columnLineages.size(),avgInputsCount,context.getSkipHiveColumnLineageHive20633InputsThreshold(),lineageInputsCount);
// Initializes the consumer-side HIVE-20633 column-lineage input threshold from applicationProperties,
// keyed by CONSUMER_SKIP_HIVE_COLUMN_LINEAGE_HIVE_20633_INPUTS_THRESHOLD; the second argument
// (5, then 15) is presumably the fallback used when the property is not configured - TODO confirm.
// NOTE(review): the same field is assigned twice in a row, so the first value (default 5) is
// immediately overwritten by the second (default 15). These look like the before/after lines of a
// patch; confirm which single assignment is meant to remain.
skipHiveColumnLineageHive20633InputsThreshold=applicationProperties.getInt(CONSUMER_SKIP_HIVE_COLUMN_LINEAGE_HIVE_20633_INPUTS_THRESHOLD,5);// skip greater-than 5 inputs by default
skipHiveColumnLineageHive20633InputsThreshold=applicationProperties.getInt(CONSUMER_SKIP_HIVE_COLUMN_LINEAGE_HIVE_20633_INPUTS_THRESHOLD,15);// skip if avg # of inputs is > 15
@@ -685,34 +685,29 @@ public class NotificationHookConsumer implements Service, ActiveStateChangeHandl
...
@@ -685,34 +685,29 @@ public class NotificationHookConsumer implements Service, ActiveStateChangeHandl
}
}
if(entities!=null&&entities.getEntities()!=null){
if(entities!=null&&entities.getEntities()!=null){
booleanisSameInputsSize=true;
intlineageCount=0;
intlineageInputsSize=-1;
intlineageInputsCount=0;
intlineageCount=0;
// find if all hive_column_lineage entities have same number of inputs, which is likely to be caused by HIVE-20633 that results in incorrect lineage in some cases
// find if all hive_column_lineage entities have same number of inputs, which is likely to be caused by HIVE-20633 that results in incorrect lineage in some cases
@@ -726,7 +721,7 @@ public class NotificationHookConsumer implements Service, ActiveStateChangeHandl
...
@@ -726,7 +721,7 @@ public class NotificationHookConsumer implements Service, ActiveStateChangeHandl
}
}
if(numRemovedEntities>0){
if(numRemovedEntities>0){
// Warns that hive_column_lineage entities were removed from the message, including the Kafka
// offset and partition of the message being processed. The first form reports a single per-entity
// input size (lineageInputsSize); the second reports the average input count, the configured
// threshold, and the total input count.
// NOTE(review): both statements log the same removal, and avgInputsCount is not declared in the
// visible code. These look like the before/after lines of a patch; confirm which single warning
// is meant to remain.
LOG.warn("removed {} hive_column_lineage entities, each having {} inputs. offset={}, partition={}",numRemovedEntities,lineageInputsSize,kafkaMessage.getOffset(),kafkaMessage.getPartition());
LOG.warn("removed {} hive_column_lineage entities. Average # of inputs={}, threshold={}, total # of inputs={}. topic-offset={}, partition={}",numRemovedEntities,avgInputsCount,skipHiveColumnLineageHive20633InputsThreshold,lineageInputsCount,kafkaMessage.getOffset(),kafkaMessage.getPartition());