org.apache.nutch.util
Class NutchJob

java.lang.Object
  extended by org.apache.hadoop.mapreduce.JobContext
      extended by org.apache.hadoop.mapreduce.Job
          extended by org.apache.nutch.util.NutchJob

public class NutchJob
extends Job

A Hadoop MapReduce Job subclass used to run Nutch jobs; it overrides waitForCompletion.


Nested Class Summary
 
Nested classes/interfaces inherited from class org.apache.hadoop.mapreduce.Job
Job.JobState
 
Field Summary
 
Fields inherited from class org.apache.hadoop.mapreduce.JobContext
CACHE_ARCHIVES_VISIBILITIES, CACHE_FILE_VISIBILITIES, COMBINE_CLASS_ATTR, conf, credentials, INPUT_FORMAT_CLASS_ATTR, JOB_ACL_MODIFY_JOB, JOB_ACL_VIEW_JOB, JOB_CANCEL_DELEGATION_TOKEN, JOB_NAMENODES, MAP_CLASS_ATTR, OUTPUT_FORMAT_CLASS_ATTR, PARTITIONER_CLASS_ATTR, REDUCE_CLASS_ATTR, ugi, USER_LOG_RETAIN_HOURS
 
Constructor Summary
NutchJob(Configuration conf)
           
NutchJob(Configuration conf, String jobName)
           
 
Method Summary
static boolean shouldProcess(org.apache.avro.util.Utf8 mark, org.apache.avro.util.Utf8 batchId)
           
 boolean waitForCompletion(boolean verbose)
           
 
Methods inherited from class org.apache.hadoop.mapreduce.Job
failTask, getCounters, getJar, getTaskCompletionEvents, getTrackingURL, isComplete, isSuccessful, killJob, killTask, mapProgress, reduceProgress, setCancelDelegationTokenUponJobCompletion, setCombinerClass, setGroupingComparatorClass, setInputFormatClass, setJarByClass, setJobName, setMapOutputKeyClass, setMapOutputValueClass, setMapperClass, setMapSpeculativeExecution, setNumReduceTasks, setOutputFormatClass, setOutputKeyClass, setOutputValueClass, setPartitionerClass, setReducerClass, setReduceSpeculativeExecution, setSortComparatorClass, setSpeculativeExecution, setupProgress, setWorkingDirectory, submit
 
Methods inherited from class org.apache.hadoop.mapreduce.JobContext
getCombinerClass, getConfiguration, getCredentials, getGroupingComparator, getInputFormatClass, getJobID, getJobName, getMapOutputKeyClass, getMapOutputValueClass, getMapperClass, getNumReduceTasks, getOutputFormatClass, getOutputKeyClass, getOutputValueClass, getPartitionerClass, getReducerClass, getSortComparator, getWorkingDirectory
 
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
 

Constructor Detail

NutchJob

public NutchJob(Configuration conf)
         throws IOException
Throws:
IOException

NutchJob

public NutchJob(Configuration conf,
                String jobName)
         throws IOException
Throws:
IOException
Method Detail

waitForCompletion

public boolean waitForCompletion(boolean verbose)
                          throws IOException,
                                 InterruptedException,
                                 ClassNotFoundException
Overrides:
waitForCompletion in class Job
Throws:
IOException
InterruptedException
ClassNotFoundException

shouldProcess

public static boolean shouldProcess(org.apache.avro.util.Utf8 mark,
                                    org.apache.avro.util.Utf8 batchId)


Copyright © 2012 The Apache Software Foundation