org.apache.hadoop.mapreduce.lib.map.MultithreadedMapper源码实例Demo-ICode联盟

类org.apache.hadoop.mapreduce.lib.map.MultithreadedMapper源码实例Demo

下面列出了 org.apache.hadoop.mapreduce.lib.map.MultithreadedMapper 类的 API 使用示例代码及写法；也可以点击链接到 GitHub 查看完整源代码。

源代码1 项目： hadoop 文件： MultithreadedMapRunner.java

/**
 * Sets up this runner from the supplied job configuration.
 *
 * <p>Reads the thread count from {@code MultithreadedMapper.NUM_THREADS}
 * (falling back to 10 when unset), stores the job, decides whether the
 * processed-record counter should be incremented, instantiates the
 * configured mapper class and builds the executor used to run map calls.
 *
 * @param jobConf the job configuration to read settings from
 */
@SuppressWarnings("unchecked")
public void configure(JobConf jobConf) {
  final int threadCount = jobConf.getInt(MultithreadedMapper.NUM_THREADS, 10);
  if (LOG.isDebugEnabled()) {
    LOG.debug("Configuring jobConf " + jobConf.getJobName() +
              " to use " + threadCount + " threads");
  }

  this.job = jobConf;

  // The processed counter is auto-incremented only when record skipping is
  // enabled; the second lookup is short-circuited otherwise.
  final boolean skippingEnabled =
      SkipBadRecords.getMapperMaxSkipRecords(job) > 0;
  this.incrProcCount =
      skippingEnabled && SkipBadRecords.getAutoIncrMapperProcCount(job);

  this.mapper =
      ReflectionUtils.newInstance(jobConf.getMapperClass(), jobConf);

  // Pool with core size == max size == configured thread count and no
  // keep-alive; the work queue is constructed with the same number
  // (presumably its capacity -- confirm against BlockingArrayQueue).
  final BlockingArrayQueue workQueue = new BlockingArrayQueue(threadCount);
  executorService = new ThreadPoolExecutor(
      threadCount, threadCount, 0L, TimeUnit.MILLISECONDS, workQueue);
}

源代码2 项目： marklogic-contentpump 文件： MultithreadedZipContentLoader.java

/**
 * Command-line entry point that configures and submits the job.
 *
 * <p>After generic Hadoop options have been stripped by
 * {@code GenericOptionsParser}, three positional arguments are required:
 * <ol>
 *   <li>{@code configFile} - name of a configuration resource added to the
 *       job configuration;</li>
 *   <li>{@code inputDir} - input path handed to the input format;</li>
 *   <li>{@code threadCount} - number of threads for
 *       {@code MultithreadedMapper}.</li>
 * </ol>
 * Prints a usage message and exits with status 2 when fewer than three
 * positional arguments are given; otherwise exits with 0 if the job
 * completes successfully and 1 if it does not.
 *
 * @param args raw command-line arguments, possibly including generic options
 * @throws Exception if job setup or execution fails
 */
public static void main(String[] args) throws Exception {
    Configuration conf = new Configuration();
    String[] otherArgs = new GenericOptionsParser(conf, args).getRemainingArgs();
    // All three positional arguments are read below, so require all three;
    // the previous "< 2" check let a missing threadCount through and crashed
    // later with ArrayIndexOutOfBoundsException.
    if (otherArgs.length < 3) {
        System.err.println("Usage: MultithreadedZipContentLoader configFile inputDir threadCount");
        System.exit(2);
    }

    Job job = Job.getInstance(conf);
    job.setJarByClass(MultithreadedZipContentLoader.class);
    job.setInputFormatClass(ZipContentInputFormat.class);
    job.setMapperClass(MultithreadedMapper.class);
    MultithreadedMapper.setMapperClass(job, ZipContentMapper.class);
    // Read the thread count from the parsed remainder, not the raw args:
    // generic options placed in front would otherwise shift the index.
    MultithreadedMapper.setNumberOfThreads(job, Integer.parseInt(otherArgs[2]));
    job.setMapOutputKeyClass(DocumentURI.class);
    job.setMapOutputValueClass(Text.class);
    job.setOutputFormatClass(ContentOutputFormat.class);

    ZipContentInputFormat.setInputPaths(job, new Path(otherArgs[1]));

    // Add the config resource to the job's own configuration object.
    conf = job.getConfiguration();
    conf.addResource(otherArgs[0]);

    System.exit(job.waitForCompletion(true) ? 0 : 1);
}

源代码3 项目： big-c 文件： MultithreadedMapRunner.java

/**
 * Configures this map runner for the given job.
 *
 * <p>The number of worker threads comes from
 * {@code MultithreadedMapper.NUM_THREADS} (10 if not set). The method also
 * records the job, works out whether the processed-record counter is to be
 * incremented, creates the mapper instance reflectively and prepares the
 * thread pool that executes the mapper's map method.
 *
 * @param jobConf the job configuration to read settings from
 */
@SuppressWarnings("unchecked")
public void configure(JobConf jobConf) {
  final int poolSize = jobConf.getInt(MultithreadedMapper.NUM_THREADS, 10);
  if (LOG.isDebugEnabled()) {
    LOG.debug("Configuring jobConf " + jobConf.getJobName() +
              " to use " + poolSize + " threads");
  }

  this.job = jobConf;

  // Only bump the processed counter when the skipping feature is enabled.
  if (SkipBadRecords.getMapperMaxSkipRecords(job) > 0) {
    this.incrProcCount = SkipBadRecords.getAutoIncrMapperProcCount(job);
  } else {
    this.incrProcCount = false;
  }

  this.mapper =
      ReflectionUtils.newInstance(jobConf.getMapperClass(), jobConf);

  // Thread pool whose core and maximum sizes both equal the configured
  // thread count, with a zero keep-alive, used to run map calls in parallel.
  executorService = new ThreadPoolExecutor(
      poolSize,
      poolSize,
      0L,
      TimeUnit.MILLISECONDS,
      new BlockingArrayQueue(poolSize));
}

类所在包

org.apache.hadoop.mapreduce

类方法

同包（含子包）的类

org.apache.hadoop.mapreduce.Job

org.apache.hadoop.mapreduce.lib.input.FileInputFormat

org.apache.hadoop.mapreduce.lib.output.FileOutputFormat

org.apache.hadoop.mapreduce.Mapper

org.apache.hadoop.mapreduce.TaskAttemptContext

org.apache.hadoop.mapreduce.InputSplit

org.apache.hadoop.mapreduce.JobContext

org.apache.hadoop.mapreduce.Reducer

org.apache.hadoop.mapreduce.RecordReader

org.apache.hadoop.mapreduce.RecordWriter

org.apache.hadoop.mapreduce.lib.input.FileSplit

org.apache.hadoop.mapreduce.InputFormat

org.apache.hadoop.mapreduce.lib.input.TextInputFormat

org.apache.hadoop.mapreduce.lib.output.TextOutputFormat

org.apache.hadoop.mapreduce.TaskAttemptID

org.apache.hadoop.mapreduce.OutputCommitter

org.apache.hadoop.mapreduce.OutputFormat

org.apache.hadoop.mapreduce.Partitioner

org.apache.hadoop.mapreduce.JobID

org.apache.hadoop.mapreduce.Counter

org.apache.hadoop.mapreduce.lib.output.SequenceFileOutputFormat

org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFormat

org.apache.hadoop.mapreduce.lib.output.FileOutputCommitter

org.apache.hadoop.mapreduce.task.TaskAttemptContextImpl

org.apache.hadoop.mapreduce.TaskType

org.apache.hadoop.mapreduce.MRJobConfig

org.apache.hadoop.mapreduce.lib.output.NullOutputFormat

org.apache.hadoop.mapreduce.Mapper.Context

org.apache.hadoop.mapreduce.Counters

org.apache.hadoop.mapreduce.JobStatus

org.apache.hadoop.mapreduce.TaskID

org.apache.hadoop.mapreduce.task.JobContextImpl

org.apache.hadoop.mapreduce.TaskInputOutputContext

org.apache.hadoop.mapreduce.lib.input.LineRecordReader

org.apache.hadoop.mapreduce.security.TokenCache

org.apache.hadoop.mapreduce.MapContext

org.apache.hadoop.mapreduce.lib.output.MultipleOutputs

org.apache.hadoop.mapreduce.lib.input.CombineFileSplit

org.apache.hadoop.mapreduce.lib.input.CombineFileInputFormat

org.apache.hadoop.mapreduce.CounterGroup

org.apache.hadoop.mapreduce.Cluster

org.apache.hadoop.mapreduce.lib.partition.HashPartitioner

org.apache.hadoop.mapreduce.lib.map.WrappedMapper

org.apache.hadoop.mapreduce.TaskCounter

org.apache.hadoop.mapreduce.lib.input.SequenceFileRecordReader

org.apache.hadoop.mapreduce.lib.output.LazyOutputFormat

org.apache.hadoop.mapreduce.StatusReporter

org.apache.hadoop.mapreduce.lib.partition.TotalOrderPartitioner

org.apache.hadoop.mapreduce.lib.input.CombineFileRecordReader

org.apache.hadoop.mapreduce.TaskReport

org.apache.hadoop.mapreduce.lib.input.MultipleInputs

org.apache.hadoop.mapreduce.ReduceContext

org.apache.hadoop.mapreduce.lib.input.NLineInputFormat

org.apache.hadoop.mapreduce.security.token.delegation.DelegationTokenIdentifier

org.apache.hadoop.mapreduce.v2.MiniMRYarnCluster

org.apache.hadoop.mapreduce.Reducer.Context

org.apache.hadoop.mapreduce.MRConfig

org.apache.hadoop.mapreduce.filecache.DistributedCache

org.apache.hadoop.mapreduce.JobSubmissionFiles

org.apache.hadoop.mapreduce.lib.reduce.WrappedReducer

org.apache.hadoop.mapreduce.v2.jobhistory.JHAdminConfig

org.apache.hadoop.mapreduce.TaskCompletionEvent

org.apache.hadoop.mapreduce.FileSystemCounter

org.apache.hadoop.mapreduce.lib.output.MapFileOutputFormat

org.apache.hadoop.mapreduce.task.MapContextImpl

org.apache.hadoop.mapreduce.JobPriority

org.apache.hadoop.mapreduce.task.ReduceContextImpl

org.apache.hadoop.mapreduce.JobStatus.State

org.apache.hadoop.mapreduce.lib.input.KeyValueTextInputFormat

org.apache.hadoop.mapreduce.QueueAclsInfo

org.apache.hadoop.mapreduce.lib.reduce.LongSumReducer

org.apache.hadoop.mapreduce.v2.api.records.TaskAttemptId

org.apache.hadoop.mapreduce.protocol.ClientProtocol

org.apache.hadoop.mapreduce.ClusterMetrics

org.apache.hadoop.mapreduce.counters.GenericCounter

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetDelegationTokenRequest

org.apache.hadoop.mapreduce.lib.partition.InputSampler

org.apache.hadoop.mapreduce.v2.api.HSClientProtocol

org.apache.hadoop.mapreduce.v2.jobhistory.JobHistoryUtils

org.apache.hadoop.mapreduce.v2.api.MRClientProtocol

org.apache.hadoop.mapreduce.QueueInfo

org.apache.hadoop.mapreduce.TypeConverter

org.apache.hadoop.mapreduce.TaskTrackerInfo

org.apache.hadoop.mapreduce.split.SplitMetaInfoReader

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetJobReportResponse

org.apache.hadoop.mapreduce.protocol.ClientProtocolProvider

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetTaskReportResponse

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetTaskAttemptReportRequest

org.apache.hadoop.mapreduce.v2.api.protocolrecords.CancelDelegationTokenRequest

org.apache.hadoop.mapreduce.server.jobtracker.JTConfig

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetJobReportRequest

org.apache.hadoop.mapreduce.v2.util.MRApps

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetTaskReportRequest

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetTaskAttemptReportResponse

org.apache.hadoop.mapreduce.v2.LogParams

org.apache.hadoop.mapreduce.lib.join.TupleWritable

org.apache.hadoop.mapreduce.lib.db.DBWritable

org.apache.hadoop.mapreduce.v2.api.records.TaskReport

org.apache.hadoop.mapreduce.v2.api.records.JobReport

org.apache.hadoop.mapreduce.lib.join.CompositeInputFormat

org.apache.hadoop.mapreduce.v2.api.protocolrecords.KillJobResponse

org.apache.hadoop.mapreduce.JobACL

org.apache.hadoop.mapreduce.v2.api.protocolrecords.KillJobRequest

org.apache.hadoop.mapreduce.v2.api.protocolrecords.FailTaskAttemptResponse

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetDiagnosticsResponse

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetCountersRequest

org.apache.hadoop.mapreduce.split.JobSplitWriter

org.apache.hadoop.mapreduce.v2.api.protocolrecords.KillTaskAttemptResponse

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetTaskReportsRequest

org.apache.hadoop.mapreduce.v2.api.records.Counters

org.apache.hadoop.mapreduce.v2.api.records.JobState

org.apache.hadoop.mapreduce.v2.api.records.CounterGroup

org.apache.hadoop.mapreduce.security.token.JobTokenSecretManager

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetTaskAttemptCompletionEventsResponse

org.apache.hadoop.mapreduce.v2.api.records.TaskType

org.apache.hadoop.mapreduce.v2.api.protocolrecords.KillTaskAttemptRequest

org.apache.hadoop.mapreduce.Cluster.JobTrackerStatus

org.apache.hadoop.mapreduce.lib.db.DBOutputFormat

org.apache.hadoop.mapreduce.server.tasktracker.TTConfig

org.apache.hadoop.mapreduce.v2.api.records.TaskId

org.apache.hadoop.mapreduce.jobhistory.EventType

org.apache.hadoop.mapreduce.v2.api.protocolrecords.CancelDelegationTokenResponse

org.apache.hadoop.mapreduce.split.JobSplit.TaskSplitMetaInfo

org.apache.hadoop.mapreduce.v2.api.records.TaskAttemptCompletionEvent

org.apache.hadoop.mapreduce.jobhistory.JobHistoryParser

org.apache.hadoop.mapreduce.v2.api.protocolrecords.KillTaskResponse

org.apache.hadoop.mapreduce.lib.db.DBInputFormat.NullDBWritable

org.apache.hadoop.mapreduce.v2.api.records.TaskState

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetTaskAttemptCompletionEventsRequest

org.apache.hadoop.mapreduce.v2.api.records.JobId

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetDelegationTokenResponse

org.apache.hadoop.mapreduce.v2.api.protocolrecords.KillTaskRequest

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetTaskReportsResponse

org.apache.hadoop.mapreduce.v2.api.protocolrecords.RenewDelegationTokenRequest

org.apache.hadoop.mapreduce.v2.api.protocolrecords.FailTaskAttemptRequest

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetDiagnosticsRequest

org.apache.hadoop.mapreduce.v2.api.protocolrecords.GetCountersResponse

org.apache.hadoop.mapreduce.counters.CounterGroupBase

org.apache.hadoop.mapreduce.split.JobSplit.TaskSplitIndex

org.apache.hadoop.mapreduce.split.JobSplit.SplitMetaInfo

org.apache.hadoop.mapreduce.v2.api.protocolrecords.RenewDelegationTokenResponse

org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob

org.apache.hadoop.mapreduce.v2.api.protocolrecords.impl.pb.KillJobRequestPBImpl

org.apache.hadoop.mapreduce.jobhistory.HistoryViewer

org.apache.hadoop.mapreduce.v2.api.protocolrecords.impl.pb.GetJobReportRequestPBImpl

org.apache.hadoop.mapreduce.lib.reduce.IntSumReducer

org.apache.hadoop.mapreduce.v2.app.AppContext

org.apache.hadoop.mapreduce.v2.app.job.Task

org.apache.hadoop.mapreduce.v2.api.MRDelegationTokenIdentifier

org.apache.hadoop.mapreduce.v2.jobhistory.JobIndexInfo

org.apache.hadoop.mapreduce.jobhistory.JobHistoryParser.TaskAttemptInfo

org.apache.hadoop.mapreduce.task.TaskAttemptContextImpl.DummyReporter

org.apache.hadoop.mapreduce.lib.output.FileOutputFormatCounter

org.apache.hadoop.mapreduce.v2.hs.HistoryContext

org.apache.hadoop.mapreduce.v2.app.job.Job

org.apache.hadoop.mapreduce.lib.map.MultithreadedMapper

org.apache.hadoop.mapreduce.jobhistory.MapAttemptFinishedEvent

org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob.State

org.apache.hadoop.mapreduce.lib.input.InvalidInputException

org.apache.hadoop.mapreduce.filecache.ClientDistributedCacheManager

org.apache.hadoop.mapreduce.v2.hs.HistoryServerStateStoreService.HistoryServerState

org.apache.hadoop.mapreduce.jobhistory.HistoryEvent

org.apache.hadoop.mapreduce.lib.chain.ChainReducer

org.apache.hadoop.mapreduce.lib.chain.ChainMapper

org.apache.hadoop.mapreduce.v2.proto.MRServiceProtos.GetTaskAttemptReportRequestProto

org.apache.hadoop.mapreduce.v2.proto.MRServiceProtos.GetJobReportRequestProto

org.apache.hadoop.mapreduce.lib.input.SplitLineReader

org.apache.hadoop.mapreduce.v2.jobhistory.FileNameIndexUtils

org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl

org.apache.hadoop.mapreduce.lib.db.DBConfiguration

org.apache.hadoop.mapreduce.v2.proto.MRServiceProtos.KillJobRequestProto

org.apache.hadoop.mapreduce.jobhistory.Event

org.apache.hadoop.mapreduce.v2.hs.JobHistoryServer

org.apache.hadoop.mapreduce.split.JobSplit

org.apache.hadoop.mapreduce.counters.AbstractCounters

org.apache.hadoop.mapreduce.v2.app.webapp.App

org.apache.hadoop.mapreduce.v2.proto.MRServiceProtos.GetTaskReportRequestProto

org.apache.hadoop.mapreduce.counters.Limits

org.apache.hadoop.mapreduce.lib.input.CombineTextInputFormat

org.apache.hadoop.mapreduce.v2.api.records.TaskAttemptReport

org.apache.hadoop.mapreduce.jobhistory.ReduceAttemptFinishedEvent

org.apache.hadoop.mapreduce.lib.input.CompressedSplitLineReader

org.apache.hadoop.mapreduce.v2.util.MRBuilderUtils

org.apache.hadoop.mapreduce.jobhistory.NormalizedResourceEvent

org.apache.hadoop.mapreduce.MapReduceTestUtil

org.apache.hadoop.mapreduce.v2.api.protocolrecords.impl.pb.GetTaskAttemptReportRequestPBImpl

org.apache.hadoop.mapreduce.JobCounter

org.apache.hadoop.mapreduce.v2.hs.JHSDelegationTokenSecretManager

org.apache.hadoop.mapreduce.v2.api.protocolrecords.impl.pb.GetTaskReportRequestPBImpl

org.apache.hadoop.mapreduce.v2.app.security.authorize.ClientHSPolicyProvider

org.apache.hadoop.mapreduce.lib.db.DBInputFormat

org.apache.hadoop.mapreduce.jobhistory.JobHistoryParser.JobInfo