Skip to content

Commit

Permalink
Include S3 counters in heuristics (linkedin#670)
Browse files Browse the repository at this point in the history
The Tez heuristics assume that all of the S3-related counters are
prefixed with either "S3A_" or "S3N_". In our case, it's simply "S3_",
so our Mapper heuristics all show 0 bytes read per task.

This updates the heuristics to include the "S3_*" counters (the
MapReduce heuristics already do this).
  • Loading branch information
astahlman authored Apr 8, 2020
1 parent cbdf629 commit 48b2a2f
Show file tree
Hide file tree
Showing 7 changed files with 12 additions and 1 deletion.
7 changes: 6 additions & 1 deletion app/com/linkedin/drelephant/tez/data/TezCounterData.java
Original file line number Diff line number Diff line change
Expand Up @@ -100,11 +100,16 @@ public static enum CounterName {
HDFS_READ_OPS(GroupName.FileSystemCounters, "HDFS_READ_OPS", "HDFS_READ_OPS"),
HDFS_LARGE_READ_OPS(GroupName.FileSystemCounters, "HDFS_LARGE_READ_OPS", "HDFS_LARGE_READ_OPS"),
HDFS_WRITE_OPS(GroupName.FileSystemCounters, "HDFS_WRITE_OPS", "HDFS_WRITE_OPS"),
S3_BYTES_READ(GroupName.FileSystemCounters, "S3_BYTES_READ", "S3_BYTES_READ"),
S3_BYTES_WRITTEN(GroupName.FileSystemCounters, "S3_BYTES_WRITTEN", "S3_BYTES_WRITTEN"),
S3_READ_OPS(GroupName.FileSystemCounters, "S3_READ_OPS", "S3_READ_OPS"),
S3_LARGE_READ_OPS(GroupName.FileSystemCounters, "S3_LARGE_READ_OPS", "S3_LARGE_READ_OPS"),
S3_WRITE_OPS(GroupName.FileSystemCounters, "S3_WRITE_OPS", "S3_WRITE_OPS"),
S3A_BYTES_READ(GroupName.FileSystemCounters, "S3A_BYTES_READ", "S3A_BYTES_READ"),
S3A_BYTES_WRITTEN(GroupName.FileSystemCounters, "S3A_BYTES_WRITTEN", "S3A_BYTES_WRITTEN"),
S3A_READ_OPS(GroupName.FileSystemCounters, "S3A_READ_OPS", "S3A_READ_OPS"),
S3A_LARGE_READ_OPS(GroupName.FileSystemCounters, "S3A_LARGE_READ_OPS", "S3A_LARGE_READ_OPS"),
- S3A_WRITE_OPS(GroupName.FileSystemCounters, "S3A_WRITE_OPS", "S3_WRITE_OPS"),
+ S3A_WRITE_OPS(GroupName.FileSystemCounters, "S3A_WRITE_OPS", "S3A_WRITE_OPS"),
S3N_BYTES_READ(GroupName.FileSystemCounters, "S3N_BYTES_READ", "S3N_BYTES_READ"),
S3N_BYTES_WRITTEN(GroupName.FileSystemCounters, "S3N_BYTES_WRITTEN", "S3N_BYTES_WRITTEN"),
S3N_READ_OPS(GroupName.FileSystemCounters, "S3N_READ_OPS", "S3N_READ_OPS"),
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -35,6 +35,7 @@ public class MapperDataSkewHeuristic extends GenericDataSkewHeuristic {
public MapperDataSkewHeuristic(HeuristicConfigurationData heuristicConfData) {
super(Arrays.asList(
TezCounterData.CounterName.HDFS_BYTES_READ,
TezCounterData.CounterName.S3_BYTES_READ,
TezCounterData.CounterName.S3A_BYTES_READ,
TezCounterData.CounterName.S3N_BYTES_READ
), heuristicConfData);
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -53,6 +53,7 @@ public class MapperSpeedHeuristic implements Heuristic<TezApplicationData> {

// Bytes-read counters held by this heuristic: HDFS plus the three S3 variants
// (S3_, S3A_ and S3N_ prefixed), so S3 input is covered whichever prefix is reported.
// NOTE(review): presumably these are summed into the per-task input size — confirm
// against the code that consumes _counterNames.
private List<TezCounterData.CounterName> _counterNames = Arrays.asList(
TezCounterData.CounterName.HDFS_BYTES_READ,
TezCounterData.CounterName.S3_BYTES_READ,
TezCounterData.CounterName.S3A_BYTES_READ,
TezCounterData.CounterName.S3N_BYTES_READ
);
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -51,6 +51,7 @@ public class MapperTimeHeuristic implements Heuristic<TezApplicationData> {

// Bytes-read counters held by this heuristic: HDFS plus the S3_, S3A_ and S3N_
// prefixed S3 counters.
// NOTE(review): how the values are combined is not visible here — verify in the
// code that reads _counterNames.
private List<TezCounterData.CounterName> _counterNames = Arrays.asList(
TezCounterData.CounterName.HDFS_BYTES_READ,
TezCounterData.CounterName.S3_BYTES_READ,
TezCounterData.CounterName.S3A_BYTES_READ,
TezCounterData.CounterName.S3N_BYTES_READ
);
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -35,6 +35,7 @@ public class TezScopeDataSkewHeuristic extends GenericDataSkewHeuristic {
public TezScopeDataSkewHeuristic(HeuristicConfigurationData heuristicConfData) {
super(Arrays.asList(
TezCounterData.CounterName.HDFS_BYTES_READ,
TezCounterData.CounterName.S3_BYTES_READ,
TezCounterData.CounterName.S3A_BYTES_READ,
TezCounterData.CounterName.S3N_BYTES_READ
), heuristicConfData);
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -53,6 +53,7 @@ public class TezScopeSpeedHeuristic implements Heuristic<TezApplicationData> {

// Input-size counters listed for this heuristic: HDFS_BYTES_READ and the three
// S3 bytes-read counters (S3_, S3A_, S3N_ prefixes).
// NOTE(review): assumed to feed the bytes-read figure for each task — confirm
// where _counterNames is iterated.
private List<TezCounterData.CounterName> _counterNames = Arrays.asList(
TezCounterData.CounterName.HDFS_BYTES_READ,
TezCounterData.CounterName.S3_BYTES_READ,
TezCounterData.CounterName.S3A_BYTES_READ,
TezCounterData.CounterName.S3N_BYTES_READ
);
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -51,6 +51,7 @@ public class TezScopeTimeHeuristic implements Heuristic<TezApplicationData> {

// Input-size counters listed for this heuristic: HDFS_BYTES_READ together with
// S3_BYTES_READ, S3A_BYTES_READ and S3N_BYTES_READ.
// NOTE(review): the consumer of _counterNames is outside this excerpt — verify
// how the counter values are aggregated.
private List<TezCounterData.CounterName> _counterNames = Arrays.asList(
TezCounterData.CounterName.HDFS_BYTES_READ,
TezCounterData.CounterName.S3_BYTES_READ,
TezCounterData.CounterName.S3A_BYTES_READ,
TezCounterData.CounterName.S3N_BYTES_READ
);
Expand Down

0 comments on commit 48b2a2f

Please sign in to comment.