The following lists example code showing how the org.apache.hadoop.mapreduce.TaskCompletionEvent API class is used in practice; you can also follow the links to view the source code on GitHub.
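Before the individual examples, here is a minimal sketch of the pattern most of them build on: asking the Job for completion events in batches and advancing the offset until an empty array comes back. The class name and the batch size of 10 are illustrative choices, not taken from any of the projects below.

import java.io.IOException;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.TaskCompletionEvent;

public class TaskEventDump {
    /** Print every completion event of a submitted job, one batch at a time. */
    public static void dumpEvents(Job job) throws IOException, InterruptedException {
        int from = 0;
        TaskCompletionEvent[] batch = job.getTaskCompletionEvents(from, 10);
        while (batch != null && batch.length > 0) {
            for (TaskCompletionEvent event : batch) {
                System.out.println(event.getStatus() + " " + event.getTaskAttemptId());
            }
            from += batch.length;                          // advance by the number of events returned
            batch = job.getTaskCompletionEvents(from, 10); // fetch the next batch
        }
    }
}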
private TaskCompletionEvent getOneTaskFailure(Job job) throws IOException, InterruptedException {
    TaskCompletionEvent lastEvent = null;
    int index = 0;
    int failCount = 0;
    TaskCompletionEvent[] events = job.getTaskCompletionEvents(index);
    // Returns null if there were no task executions or no failures at all; otherwise returns the last
    // failure event within the first batch of completion events that contains a failure.
    if (events == null) {
        return lastEvent;
    }
    while (events.length > 0 && failCount == 0) {
        for (TaskCompletionEvent event : events) {
            if (event.getStatus().equals(TaskCompletionEvent.Status.FAILED)) {
                failCount++;
                lastEvent = event;
            }
        }
        index += 10;
        events = job.getTaskCompletionEvents(index);
    }
    return lastEvent;
}
private static List<TaskCompletionEvent> getAllTaskCompletionEvent(Job completedJob) {
    List<TaskCompletionEvent> completionEvents = new LinkedList<>();
    while (true) {
        try {
            TaskCompletionEvent[] bunchOfEvents;
            bunchOfEvents = completedJob.getTaskCompletionEvents(completionEvents.size());
            if (bunchOfEvents == null || bunchOfEvents.length == 0) {
                break;
            }
            completionEvents.addAll(Arrays.asList(bunchOfEvents));
        } catch (IOException e) {
            break;
        }
    }
    return completionEvents;
}
/**
 * Get good files.
 * The problem happens when a speculative task attempt is initialized but then killed in the middle of processing.
 * A partial file is generated at {tmp_output}/_temporary/1/_temporary/attempt_xxx_xxx/xxxx (an Avro file
 * might have .avro as its extension) without being committed to its final destination
 * at {tmp_output}/xxxx.
 *
 * @param job Completed MR job
 * @param tmpPath Temporary output path to scan
 * @param fs File system that the output path resides on
 * @param acceptableExtension file extensions acceptable as "good files".
 * @return all successful files that have been committed
 */
public static List<Path> getGoodFiles(Job job, Path tmpPath, FileSystem fs, List<String> acceptableExtension)
        throws IOException {
    List<TaskCompletionEvent> failedEvents = getUnsuccessfulTaskCompletionEvent(job);
    List<Path> allFilePaths = DatasetHelper.getApplicableFilePaths(fs, tmpPath, acceptableExtension);
    List<Path> goodPaths = new ArrayList<>();
    for (Path filePath : allFilePaths) {
        if (isFailedPath(filePath, failedEvents)) {
            fs.delete(filePath, false);
            log.error("{} is a bad path so it was deleted", filePath);
        } else {
            goodPaths.add(filePath);
        }
    }
    return goodPaths;
}
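A hypothetical call site for the getGoodFiles helper above, purely for illustration: the temporary directory and the ".avro" extension are made-up values, and the sketch assumes the helper is visible in the calling class (for example via a static import).

import java.io.IOException;
import java.util.Collections;
import java.util.List;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.mapreduce.Job;

public class GoodFileCleanupExample {
    // Keep only files committed by successful task attempts; partial speculative output gets deleted.
    static List<Path> cleanTmpOutput(Job completedJob, String tmpDir) throws IOException {
        FileSystem fs = FileSystem.get(completedJob.getConfiguration());
        // getGoodFiles(...) is the helper from the snippet above (assumed statically imported here).
        return getGoodFiles(completedJob, new Path(tmpDir), fs, Collections.singletonList(".avro"));
    }
}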
/**
 * List the events for the given job
 * @param job the job whose events are to be listed
 * @param fromEventId the event id to start listing from
 * @param numEvents the maximum number of events to list
 * @throws IOException
 */
private void listEvents(Job job, int fromEventId, int numEvents)
        throws IOException, InterruptedException {
    TaskCompletionEvent[] events = job.getTaskCompletionEvents(fromEventId, numEvents);
    System.out.println("Task completion events for " + job.getJobID());
    System.out.println("Number of events (from " + fromEventId + ") are: "
        + events.length);
    for (TaskCompletionEvent event : events) {
        System.out.println(event.getStatus() + " " +
            event.getTaskAttemptId() + " " +
            getTaskLogURL(event.getTaskAttemptId(), event.getTaskTrackerHttp()));
    }
}
public TaskCompletionEvent[] getTaskCompletionEvents(JobID jobId,
        int fromEventId, int maxEvents)
        throws IOException, InterruptedException {
    // FIXME: the client seems to support querying task-failure related
    // information; however, the API does not make sense for a DAG.
    return new TaskCompletionEvent[0];
}
public void updateJobCounter() {
    try {
        Counters counters = job.getCounters();
        if (counters == null) {
            String errorMsg = "no counters for job " + getMrJobId();
            logger.warn(errorMsg);
            output.append(errorMsg);
        } else {
            this.output.append(counters.toString()).append("\n");
            logger.debug(counters.toString());
            mapInputRecords = String.valueOf(counters.findCounter(TaskCounter.MAP_INPUT_RECORDS).getValue());
            rawInputBytesRead = String.valueOf(counters.findCounter(RawDataCounter.BYTES).getValue());
            String outputFolder = job.getConfiguration().get("mapreduce.output.fileoutputformat.outputdir",
                KylinConfig.getInstanceFromEnv().getHdfsWorkingDirectory());
            logger.debug("outputFolder is " + outputFolder);
            Path outputPath = new Path(outputFolder);
            String fsScheme = outputPath.getFileSystem(job.getConfiguration()).getScheme();
            long bytesWritten = counters.findCounter(fsScheme, FileSystemCounter.BYTES_WRITTEN).getValue();
            if (bytesWritten == 0) {
                logger.debug("Seems no counter found for " + fsScheme);
                bytesWritten = counters.findCounter("FileSystemCounters", "HDFS_BYTES_WRITTEN").getValue();
            }
            hdfsBytesWritten = String.valueOf(bytesWritten);
        }
        JobStatus jobStatus = job.getStatus();
        if (jobStatus.getState() == JobStatus.State.FAILED) {
            logger.warn("Job Diagnostics:" + jobStatus.getFailureInfo());
            output.append("Job Diagnostics:").append(jobStatus.getFailureInfo()).append("\n");
            TaskCompletionEvent taskEvent = getOneTaskFailure(job);
            if (taskEvent != null) {
                String[] fails = job.getTaskDiagnostics(taskEvent.getTaskAttemptId());
                logger.warn("Failure task Diagnostics:");
                output.append("Failure task Diagnostics:").append("\n");
                for (String failure : fails) {
                    logger.warn(failure);
                    output.append(failure).append("\n");
                }
            }
        }
    } catch (Exception e) {
        logger.error(e.getLocalizedMessage(), e);
        output.append(e.getLocalizedMessage());
    }
}
@Override
public TaskCompletionEvent[] getTaskCompletionEvents(JobID arg0, int arg1,
        int arg2) throws IOException, InterruptedException {
    return clientCache.getClient(arg0).getTaskCompletionEvents(arg0, arg1, arg2);
}
public MapTaskCompletionEventsUpdate getMapCompletionEvents(JobID jobId,
        int fromEventId, int maxLocs, TaskAttemptID id) throws IOException {
    return new MapTaskCompletionEventsUpdate(
        org.apache.hadoop.mapred.TaskCompletionEvent.EMPTY_ARRAY, false);
}
public TaskCompletionEvent[] getTaskCompletionEvents(
        org.apache.hadoop.mapreduce.JobID jobid,
        int fromEventId, int maxEvents) throws IOException {
    return TaskCompletionEvent.EMPTY_ARRAY;
}
/** {@inheritDoc} */
@Override public TaskCompletionEvent[] getTaskCompletionEvents(JobID jobid, int fromEventId, int maxEvents)
        throws IOException, InterruptedException {
    return new TaskCompletionEvent[0];
}
private static List<TaskCompletionEvent> getUnsuccessfulTaskCompletionEvent(Job completedJob) {
    return getAllTaskCompletionEvent(completedJob).stream()
        .filter(te -> te.getStatus() != TaskCompletionEvent.Status.SUCCEEDED)
        .collect(Collectors.toList());
}
private static boolean isFailedPath(Path path, List<TaskCompletionEvent> failedEvents) {
    return path.toString().contains("_temporary") || failedEvents.stream()
        .anyMatch(
            event -> path.toString().contains(Path.SEPARATOR + event.getTaskAttemptId().toString() + Path.SEPARATOR));
}
/**
 * Get task completion events for the jobid, starting from fromEventId.
 * Returns empty array if no events are available.
 * @param jobid job id
 * @param fromEventId event id to start from.
 * @param maxEvents the max number of events we want to look at
 * @return array of task completion events.
 * @throws IOException
 */
public TaskCompletionEvent[] getTaskCompletionEvents(JobID jobid,
    int fromEventId, int maxEvents) throws IOException, InterruptedException;