Skip to content

Commit 4b1b209

Browse files
HIVE-29389: HiveProtoLoggingHook populates duplicate entries in TablesRead metrics for tables with multiple partitions (#6253)
1 parent 26ea12b commit 4b1b209

File tree

1 file changed: 3 additions and 2 deletions.

ql/src/java/org/apache/hadoop/hive/ql/hooks/HiveProtoLoggingHook.java

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -92,6 +92,7 @@
9292
import java.util.ArrayList;
9393
import java.util.Arrays;
9494
import java.util.HashMap;
95+
import java.util.HashSet;
9596
import java.util.List;
9697
import java.util.Map;
9798
import java.util.Set;
@@ -489,13 +490,13 @@ private String getQueueName(ExecutionMode mode, HiveConf conf) {
489490
}
490491

491492
/**
 * Builds the list of "dbName.tableName" strings for every entity in {@code entities}
 * whose type is TABLE or PARTITION; entities of any other type are ignored.
 *
 * <p>This hunk switches the accumulator from an ArrayList to a HashSet, so a table that
 * is reached through several entities (for example the table entity plus each of its
 * partition entities, all of which resolve to the same db/table name) is reported once
 * instead of once per entity.
 *
 * <p>NOTE(review): HashSet does not guarantee any iteration order, so the order of the
 * returned list is no longer the encounter order of {@code entities}. If any consumer
 * relies on a stable order, a LinkedHashSet would deduplicate while keeping first-seen
 * order -- confirm against callers.
 *
 * @param entities the read or write entities to scan
 * @return a new mutable list of distinct qualified table names
 */
private List<String> getTablesFromEntitySet(Set<? extends Entity> entities) {
492-
// Removed line: the list accumulator kept one entry per matching entity, duplicates included.
List<String> tableNames = new ArrayList<>();
493+
// Added line: the set accumulator drops repeated "db.table" strings on insert.
Set<String> tableNames = new HashSet<>();
493494
for (Entity entity : entities) {
494495
if (entity.getType() == TABLE || entity.getType() == PARTITION) {
495496
// Both entity kinds are keyed by their owning table, so partitions collapse onto the table name.
tableNames.add(entity.getTable().getDbName() + "." + entity.getTable().getTableName());
496497
}
497498
}
498-
return tableNames;
499+
// Copy into a List to keep the method's declared return type unchanged for callers.
return new ArrayList<>(tableNames);
499500
}
500501

501502
private ExecutionMode getExecutionMode(QueryPlan plan, List<ExecDriver> mrTasks,

0 commit comments

Comments
 (0)