public class GiraphConfiguration extends org.apache.hadoop.conf.Configuration implements GiraphConstants
ADDITIONAL_EDGE_REQUEST_SIZE, ADDITIONAL_MSG_REQUEST_SIZE, ADDITIONAL_VERTEX_REQUEST_SIZE, AGGREGATOR_WRITER_CLASS, ASYNC_MESSAGE_STORE_THREADS_COUNT, AUTHENTICATE, BASE_ZNODE_KEY, CHANNELS_PER_SERVER, CHECKPOINT_COMPRESSION_CODEC, CHECKPOINT_DIRECTORY, CHECKPOINT_FREQUENCY, CHECKPOINT_SUPPORTED_CHECKER, CLEANUP_CHECKPOINTS_AFTER_SUCCESS, CLIENT_RECEIVE_BUFFER_SIZE, CLIENT_SEND_BUFFER_SIZE, COMPUTATION_CLASS, COMPUTATION_FACTORY_CLASS, COMPUTATION_LANGUAGE, CREATE_EDGE_SOURCE_VERTICES, CREATE_EDGE_SOURCE_VERTICES_CALLBACK, DEFAULT_ZOOKEEPER_MAX_CLIENT_CNXNS, DEFAULT_ZOOKEEPER_SNAP_COUNT, DEFAULT_ZOOKEEPER_TICK_TIME, DISABLE_GIRAPH_CLASS_RESOLVER, DNS_INTERFACE, DNS_NAMESERVER, DO_OUTPUT_DURING_COMPUTATION, EDGE_INPUT_FILTER_CLASS, EDGE_INPUT_FORMAT_CLASS, EDGE_OUTPUT_FORMAT_CLASS, EDGE_OUTPUT_FORMAT_SUBDIR, EDGE_STORE_FACTORY_CLASS, EDGE_TRANSLATION_CLASS, EDGE_VALUE_CLASS, EDGE_VALUE_FACTORY_CLASS, EVENT_WAIT_MSECS, FAIL_FIRST_IPC_PORT_BIND_ATTEMPT, FAIL_ON_EMPTY_INPUT, GC_OBSERVER_CLASSES, GIRAPH_TEXT_OUTPUT_FORMAT_REVERSE, GIRAPH_TEXT_OUTPUT_FORMAT_SEPARATOR, GIRAPH_YARN_CONF_FILE, GIRAPH_YARN_LIBJARS, GIRAPH_YARN_PRIORITY, GIRAPH_YARN_TASK_HEAP_MB, GIRAPH_YARN_TASK_HEAP_MB_DEFAULT, GRAPH_PARTITIONER_FACTORY_CLASS, GRAPH_TYPE_LANGUAGES, GRAPH_TYPES_NEEDS_WRAPPERS, HADOOP_OUTPUT_FORMAT_CLASS, HALT_INSTRUCTIONS_WRITER_CLASS, HDFS_FILE_CREATION_RETRIES, HDFS_FILE_CREATION_RETRY_WAIT_MS, INPUT_SPLIT_MAX_EDGES, INPUT_SPLIT_MAX_VERTICES, INPUT_SPLIT_SAMPLE_PERCENT, INPUT_VERTEX_EDGES_CLASS, INPUT_VERTEX_EDGES_FACTORY_CLASS, IPC_INITIAL_PORT, IS_PURE_YARN_JOB, JMAP_ENABLE, JMAP_LIVE_ONLY, JMAP_PATH, JMAP_PRINT_LINES, JMAP_SLEEP_MILLIS, JOB_OBSERVER_CLASS, JOB_PROGRESS_TRACKER_CLIENT_CLASS, JOB_PROGRESS_TRACKER_SERVICE_CLASS, JOB_RETRY_CHECKER_CLASS, KEEP_ZOOKEEPER_DATA, LB_MAPPINGSTORE_LOWER, LB_MAPPINGSTORE_UPPER, LOCAL_TEST_MODE, LOG_LEVEL, LOG_THREAD_LAYOUT, MAPPER_OBSERVER_CLASSES, MAPPING_INPUT_FORMAT_CLASS, MAPPING_STORE_CLASS, MAPPING_STORE_OPS_CLASS, 
MASTER_COMPUTE_CLASS, MASTER_OBSERVER_CLASSES, MAX_ALLOWED_JOB_TIME_MS, MAX_COUNTER_WAIT_MSECS, MAX_EDGE_REQUEST_SIZE, MAX_IPC_PORT_BIND_ATTEMPTS, MAX_MASTER_SUPERSTEP_WAIT_MSECS, MAX_MSG_REQUEST_SIZE, MAX_MUTATIONS_PER_REQUEST, MAX_NUMBER_OF_SUPERSTEPS, MAX_PARTITIONS_IN_MEMORY, MAX_REQUEST_MILLISECONDS, MAX_RESOLVE_ADDRESS_ATTEMPTS, MAX_TASK_ATTEMPTS, MAX_VERTEX_REQUEST_SIZE, MAX_WORKERS, MESSAGE_COMBINER_CLASS, MESSAGE_ENCODE_AND_STORE_TYPE, MESSAGE_STORE_FACTORY_CLASS, METRICS_DIRECTORY, METRICS_ENABLE, MIN_FREE_MBS_ON_HEAP, MIN_PARTITIONS_PER_COMPUTE_THREAD, MIN_PERCENT_RESPONDED, MIN_WORKERS, MSG_NUM_FLUSH_THREADS, NETTY_CLIENT_EXECUTION_AFTER_HANDLER, NETTY_CLIENT_EXECUTION_THREADS, NETTY_CLIENT_THREADS, NETTY_CLIENT_USE_EXECUTION_HANDLER, NETTY_COMPRESSION_ALGORITHM, NETTY_MAX_CONNECTION_FAILURES, NETTY_REQUEST_ENCODER_BUFFER_SIZE, NETTY_SERVER_EXECUTION_AFTER_HANDLER, NETTY_SERVER_EXECUTION_THREADS, NETTY_SERVER_THREADS, NETTY_SERVER_USE_EXECUTION_HANDLER, NETTY_SIMULATE_FIRST_REQUEST_CLOSED, NETTY_SIMULATE_FIRST_RESPONSE_FAILED, NETTY_USE_DIRECT_MEMORY, NETTY_USE_POOLED_ALLOCATOR, NUM_CHECKPOINT_IO_THREADS, NUM_COMPUTE_THREADS, NUM_INPUT_THREADS, NUM_OUT_OF_CORE_THREADS, NUM_OUTPUT_THREADS, ONE_KB, ONE_MB, OUT_OF_CORE_DATA_ACCESSOR, OUT_OF_CORE_ORACLE, OUTGOING_MESSAGE_VALUE_CLASS, OUTGOING_MESSAGE_VALUE_FACTORY_CLASS, PARTITION_CLASS, PARTITION_COUNT_MULTIPLIER, PARTITION_LONG_TAIL_MIN_PRINT, PARTITION_VERTEX_KEY_SPACE_SIZE, PARTITIONS_DIRECTORY, PREFER_IP_ADDRESSES, REACTIVE_JMAP_ENABLE, REQUEST_SIZE_WARNING_THRESHOLD, RESEND_TIMED_OUT_REQUESTS, RESOLVER_CREATE_VERTEX_ON_MSGS, RESTART_JOB_ID, RESTART_SUPERSTEP, SERVER_RECEIVE_BUFFER_SIZE, SERVER_SEND_BUFFER_SIZE, SPLIT_MASTER_WORKER, STATIC_GRAPH, SUPERSTEP_COUNT, TCP_BACKLOG, TRACK_JOB_PROGRESS_ON_CLIENT, TYPES_HOLDER_CLASS, USE_BIG_DATA_IO_FOR_MESSAGES, USE_INPUT_SPLIT_LOCALITY, USE_MESSAGE_SIZE_ENCODING, USE_OUT_OF_CORE_GRAPH, USE_SUPERSTEP_COUNTERS, USE_UNSAFE_SERIALIZATION, USER_PARTITION_COUNT, 
VERTEX_CLASS, VERTEX_EDGES_CLASS, VERTEX_EDGES_FACTORY_CLASS, VERTEX_ID_CLASS, VERTEX_ID_FACTORY_CLASS, VERTEX_INPUT_FILTER_CLASS, VERTEX_INPUT_FORMAT_CLASS, VERTEX_OUTPUT_FORMAT_CLASS, VERTEX_OUTPUT_FORMAT_SUBDIR, VERTEX_OUTPUT_FORMAT_THREAD_SAFE, VERTEX_RESOLVER_CLASS, VERTEX_VALUE_CLASS, VERTEX_VALUE_COMBINER_CLASS, VERTEX_VALUE_FACTORY_CLASS, VERTICES_TO_UPDATE_PROGRESS, WAIT_FOR_OTHER_WORKERS_TIMEOUT_MSEC, WAIT_TASK_DONE_TIMEOUT_MS, WAIT_TIME_BETWEEN_CONNECTION_RETRIES_MS, WAIT_ZOOKEEPER_TIMEOUT_MSEC, WAITING_REQUEST_MSECS, WORKER_CONTEXT_CLASS, WORKER_OBSERVER_CLASSES, YOURKIT_OUTPUT_DIR, YOURKIT_OUTPUT_DIR_DEFAULT, ZOOKEEPER_BASE_PATH_COUNTER_GROUP, ZOOKEEPER_CONNECTION_ATTEMPTS, ZOOKEEPER_DIR, ZOOKEEPER_FORCE_SYNC, ZOOKEEPER_HALT_NODE_COUNTER_GROUP, ZOOKEEPER_IS_EXTERNAL, ZOOKEEPER_LIST, ZOOKEEPER_MANAGER_DIRECTORY, ZOOKEEPER_MAX_SESSION_TIMEOUT, ZOOKEEPER_MIN_SESSION_TIMEOUT, ZOOKEEPER_OPS_MAX_ATTEMPTS, ZOOKEEPER_OPS_RETRY_WAIT_MSECS, ZOOKEEPER_PURGE_INTERVAL, ZOOKEEPER_SERVER_PORT, ZOOKEEPER_SERVER_PORT_COUNTER_GROUP, ZOOKEEPER_SERVERLIST_POLL_MSECS, ZOOKEEPER_SESSION_TIMEOUT, ZOOKEEPER_SKIP_ACL, ZOOKEEPER_SNAP_RETAIN_COUNT
Constructor and Description |
---|
GiraphConfiguration()
Constructor that creates the configuration
|
GiraphConfiguration(org.apache.hadoop.conf.Configuration conf)
Constructor.
|
Modifier and Type | Method and Description |
---|---|
void |
addGcObserverClass(Class<? extends GcObserver> gcObserverClass)
Add a GcObserver class (optional)
|
void |
addMapperObserverClass(Class<? extends MapperObserver> mapperObserverClass)
Add a MapperObserver class (optional)
|
void |
addMasterObserverClass(Class<? extends MasterObserver> masterObserverClass)
Add a MasterObserver class (optional)
|
void |
addWorkerObserverClass(Class<? extends WorkerObserver> workerObserverClass)
Add a WorkerObserver class (optional)
|
boolean |
authenticate()
Use authentication? (if supported)
|
void |
configureHadoopSecurity()
Check environment for Hadoop security token location in case we are
executing the Giraph job on a MRv1 Hadoop cluster.
|
boolean |
doOutputDuringComputation()
Check if output should be done during computation
|
int |
getCheckpointFrequency()
Get the checkpoint frequency of how many supersteps to wait
before checkpointing
|
Class<? extends Computation> |
getComputationClass()
Get the user's subclassed
Computation |
Class<? extends ComputationFactory> |
getComputationFactoryClass()
Get the user's subclassed
ComputationFactory |
String |
getComputationName()
Get name of computation being run.
|
boolean |
getCreateSourceVertex()
Get option whether to create a source vertex present only in edge input
|
int |
getEventWaitMsecs()
Get the number of milliseconds to wait for an event before continuing on
|
Class<? extends GcObserver>[] |
getGcObserverClasses()
Get array of GcObserver classes set in configuration.
|
int |
getHdfsFileCreationRetries() |
int |
getHdfsFileCreationRetryWaitMs() |
long |
getInputSplitMaxEdges() |
long |
getInputSplitMaxVertices() |
Class<? extends GiraphJobObserver> |
getJobObserverClass()
Get job observer class
|
Class<? extends GiraphJobRetryChecker> |
getJobRetryCheckerClass()
Get job retry checker class
|
String |
getLocalHostname()
Get the local hostname on the given interface.
|
String |
getLocalHostOrIp()
Return local host name by default.
|
String |
getLocalLevel() |
boolean |
getLocalTestMode()
Is this job run as a local test?
|
Class<? extends MapperObserver>[] |
getMapperObserverClasses()
Get array of MapperObserver classes set in configuration.
|
int |
getMapTasks()
Get the number of map tasks in this job
|
Class<? extends MasterObserver>[] |
getMasterObserverClasses()
Get array of MasterObserver classes set in the configuration.
|
int |
getMaxCounterWaitMsecs() |
int |
getMaxMappers()
How many mappers is job asking for, taking into account whether master
is running on the same mapper as worker or not
|
int |
getMaxMasterSuperstepWaitMsecs()
Get the maximum milliseconds to wait before giving up trying to get the
minimum number of workers before a superstep.
|
int |
getMaxNumberOfSupersteps()
Get the maximum number of supersteps of this application.
|
int |
getMaxTaskAttempts()
Get the max task attempts
|
int |
getMaxWorkers() |
float |
getMinPercentResponded() |
int |
getMinWorkers() |
io.netty.buffer.ByteBufAllocator |
getNettyAllocator()
Used by netty client and server to create ByteBufAllocator
|
int |
getNettyServerExecutionConcurrency()
Get the netty server execution concurrency.
|
int |
getNettyServerExecutionThreads() |
int |
getNettyServerThreads() |
boolean |
getNettyServerUseExecutionHandler() |
int |
getNumComputeThreads() |
int |
getNumInputSplitsThreads() |
int |
getNumOutputThreads()
Get the number of threads to use for writing output in the end of the
application.
|
Class<? extends OutEdges> |
getOutEdgesClass()
Get the vertex edges class
|
Class<? extends Partition> |
getPartitionClass()
Get Partition class used
|
boolean |
getResolverCreateVertexOnMessages()
Whether to create a vertex that doesn't exist when it receives messages.
|
boolean |
getSplitMasterWorker()
Getter for SPLIT_MASTER_WORKER flag.
|
String |
getStringVars(String key,
org.apache.hadoop.mapreduce.Mapper.Context context)
Get string, replacing variables in the output.
|
String |
getStringVars(String key,
String defaultValue,
org.apache.hadoop.mapreduce.Mapper.Context context)
Get string, replacing variables in the output.
|
int |
getTaskPartition()
Get the task partition
|
int |
getWaitTaskDoneTimeoutMs()
Get the maximum timeout (in milliseconds) for waiting for all tasks
to complete after the job is done.
|
Class<? extends WorkerObserver>[] |
getWorkerObserverClasses()
Get array of WorkerObserver classes set in configuration.
|
String |
getYarnLibJars()
Jars required in "Pure YARN" jobs (names only, no paths) should
be listed here in full, including Giraph framework jar(s).
|
int |
getYarnTaskHeapMb()
Get heap size (in MB) for each task in our Giraph job run,
assuming this job will run on the "pure YARN" profile.
|
String |
getYourKitOutputDir(org.apache.hadoop.mapreduce.Mapper.Context context)
Get the output directory to write YourKit snapshots to
|
int |
getZookeeperConnectionAttempts() |
String |
getZookeeperList()
Get the ZooKeeper list.
|
int |
getZooKeeperMaxSessionTimeout() |
int |
getZooKeeperMinSessionTimeout() |
int |
getZookeeperOpsMaxAttempts() |
int |
getZookeeperOpsRetryWaitMsecs() |
int |
getZooKeeperSessionTimeout() |
boolean |
hasEdgeInputFormat()
Does the job have an
EdgeInputFormat? |
boolean |
hasEdgeOutputFormat()
Does the job have an
EdgeOutputFormat? |
boolean |
hasEdgeOutputFormatSubdir()
Does the job have an
EdgeOutputFormat subdir? |
boolean |
hasVertexInputFormat()
Does the job have a
VertexInputFormat ? |
boolean |
hasVertexOutputFormat()
Does the job have a
VertexOutputFormat ? |
boolean |
hasVertexOutputFormatSubdir()
Does the job have a
VertexOutputFormat subdir? |
boolean |
isJMapHistogramDumpEnabled()
Check whether to enable jmap dumping thread.
|
boolean |
isPureYarnJob()
Is this a "pure YARN" Giraph job, or is a MapReduce layer (v1 or v2)
actually managing our cluster nodes, i.e.
|
boolean |
isReactiveJmapHistogramDumpEnabled()
Check whether to enable heap memory supervisor thread
|
boolean |
isZookeeperExternal()
Was ZooKeeper provided externally?
|
boolean |
metricsEnabled()
Whether to track, print, and aggregate metrics.
|
boolean |
reuseEdgeObjects()
True if the
OutEdges implementation
copies the passed edges to its own data structure,
i.e. |
boolean |
reuseVertexObjects()
True if the
Partition implementation copies the passed vertices
to its own data structure, i.e. |
void |
setAggregatorWriterClass(Class<? extends AggregatorWriter> aggregatorWriterClass)
Set the aggregator writer class (optional)
|
void |
setCheckpointFrequency(int checkpointFrequency)
Set the checkpoint frequency of how many supersteps to wait before
checkpointing
|
void |
setCheckpointSupportedChecker(Class<? extends CheckpointSupportedChecker> clazz)
Set runtime checkpoint support checker.
|
void |
setClasses(String name,
Class<?> xface,
Class<?>... klasses)
Set mapping from a key name to a list of classes.
|
void |
setComputationClass(Class<? extends Computation> computationClass)
Set the computation class (required)
|
void |
setCreateSourceVertex(boolean createVertex)
Set option whether to create a source vertex present only in edge input
|
void |
setDoOutputDuringComputation(boolean doOutputDuringComputation)
Set whether or not we should do output during computation
|
void |
setEdgeInputFilterClass(Class<? extends EdgeInputFilter> edgeFilterClass)
Set the edge input filter class
|
void |
setEdgeInputFormatClass(Class<? extends EdgeInputFormat> edgeInputFormatClass)
Set the edge input format class (required)
|
void |
setEdgeOutputFormatClass(Class<? extends EdgeOutputFormat> edgeOutputFormatClass)
Set the edge output format class (optional)
|
void |
setEdgeOutputFormatSubdir(String path)
Set the edge output format path
|
void |
setEventWaitMsecs(int eventWaitMsecs)
Set the number of milliseconds to wait for an event before continuing on
|
void |
setGraphPartitionerFactoryClass(Class<? extends GraphPartitionerFactory> graphPartitionerFactoryClass)
Set the graph partitioner class (optional)
|
void |
setInputOutEdgesClass(Class<? extends OutEdges> inputOutEdgesClass)
Set the vertex edges class used during edge-based input (if different
from the one used during computation)
|
void |
setJobObserverClass(Class<? extends GiraphJobObserver> klass)
Set job observer class
|
void |
setJobRetryCheckerClass(Class<? extends GiraphJobRetryChecker> klass)
Set job retry checker class
|
void |
setLocalTestMode(boolean flag)
Flag this job as a local test run.
|
void |
setMappingInputFormatClass(Class<? extends MappingInputFormat> mappingInputFormatClass)
Set the mapping input format class (optional)
|
void |
setMasterComputeClass(Class<? extends MasterCompute> masterComputeClass)
Set the master class (optional)
|
void |
setMaxMasterSuperstepWaitMsecs(int maxMasterSuperstepWaitMsecs)
Set the maximum milliseconds to wait before giving up trying to get the
minimum number of workers before a superstep.
|
void |
setMaxNumberOfSupersteps(int maxNumberOfSupersteps)
Set the maximum number of supersteps of this application.
|
void |
setMaxTaskAttempts(int maxTaskAttempts)
Set the max task attempts
|
void |
setMessageCombinerClass(Class<? extends MessageCombiner> messageCombinerClass)
Set the message combiner class (optional)
|
void |
setNumComputeThreads(int numComputeThreads)
Set the number of compute threads
|
void |
setNumInputSplitsThreads(int numInputSplitsThreads)
Set the number of input split threads
|
void |
setNumOutputThreads(int numOutputThreads)
Set the number of threads to use for writing output in the end of the
application.
|
void |
setOutEdgesClass(Class<? extends OutEdges> outEdgesClass)
Set the vertex edges class
|
void |
setPartitionClass(Class<? extends Partition> partitionClass)
Set the partition class (optional)
|
void |
setResolverCreateVertexOnMessages(boolean v)
Set whether to create non existent vertices when they receive messages.
|
void |
setVertexClass(Class<? extends Vertex> vertexClass)
Set the vertex implementation class
|
void |
setVertexInputFilterClass(Class<? extends VertexInputFilter> vertexFilterClass)
Set the vertex input filter class
|
void |
setVertexInputFormatClass(Class<? extends VertexInputFormat> vertexInputFormatClass)
Set the vertex input format class (required)
|
void |
setVertexOutputFormatClass(Class<? extends VertexOutputFormat> vertexOutputFormatClass)
Set the vertex output format class (optional)
|
void |
setVertexOutputFormatSubdir(String path)
Set the vertex output format path
|
void |
setVertexOutputFormatThreadSafe(boolean vertexOutputFormatThreadSafe)
Set whether or not selected VertexOutputFormat is thread-safe
|
void |
setVertexResolverClass(Class<? extends VertexResolver> vertexResolverClass)
Set the vertex resolver class (optional)
|
void |
setVertexValueCombinerClass(Class<? extends VertexValueCombiner> vertexValueCombinerClass)
Set the vertex value combiner class (optional)
|
void |
setVertexValueFactoryClass(Class<? extends VertexValueFactory> vertexValueFactoryClass)
Set the vertex value factory class
|
void |
setWaitTaskDoneTimeoutMs(int ms)
Set the maximum timeout (in milliseconds) for waiting for all tasks
to complete after the job is done.
|
void |
setWorkerConfiguration(int minWorkers,
int maxWorkers,
float minPercentResponded)
Set worker configuration for determining what is required for
a superstep.
|
void |
setWorkerContextClass(Class<? extends WorkerContext> workerContextClass)
Set the worker context class (optional)
|
void |
setYarnLibJars(String jarList)
Populate jar list for Pure YARN jobs.
|
void |
setYarnTaskHeapMb(int heapMb)
Set heap size for Giraph tasks in our job run, assuming
the job will run on the "pure YARN" profile.
|
void |
setZooKeeperConfiguration(String serverList)
Utilize an existing ZooKeeper service.
|
void |
setZookeeperList(String zkList)
Set the ZooKeeper list to the provided list.
|
boolean |
trackJobProgressOnClient()
Check whether to track job progress on client or not
|
boolean |
useCheckpointing()
Check if checkpointing is used
|
boolean |
useInputSplitLocality()
Check if we want to prioritize input splits which reside on the host.
|
boolean |
useLogThreadLayout()
Use the log thread layout option?
|
void |
useUnsafeSerialization(boolean useUnsafeSerialization)
Set whether to use unsafe serialization
|
boolean |
vertexOutputFormatThreadSafe()
Check if VertexOutputFormat is thread-safe
|
addDefaultResource, addDeprecation, addDeprecation, addDeprecation, addDeprecation, addDeprecations, addResource, addResource, addResource, addResource, addResource, addResource, clear, dumpConfiguration, dumpDeprecatedKeys, get, get, getBoolean, getClass, getClass, getClassByName, getClassByNameOrNull, getClasses, getClassLoader, getConfResourceAsInputStream, getConfResourceAsReader, getDouble, getEnum, getFile, getFinalParameters, getFloat, getInstances, getInt, getInts, getLocalPath, getLong, getLongBytes, getPattern, getPropertySources, getProps, getRange, getRaw, getResource, getSocketAddr, getStringCollection, getStrings, getStrings, getTimeDuration, getTrimmed, getTrimmed, getTrimmedStringCollection, getTrimmedStrings, getTrimmedStrings, getValByRegex, hasWarnedDeprecation, isDeprecated, iterator, main, readFields, reloadConfiguration, set, set, setBoolean, setBooleanIfUnset, setClass, setClassLoader, setDouble, setEnum, setFloat, setIfUnset, setInt, setLong, setPattern, setQuietMode, setSocketAddr, setStrings, setTimeDuration, size, toString, unset, updateConnectAddr, write, writeXml, writeXml
clone, equals, finalize, getClass, hashCode, notify, notifyAll, wait, wait, wait
forEach, spliterator
public GiraphConfiguration()
public GiraphConfiguration(org.apache.hadoop.conf.Configuration conf)
conf
- Configurationpublic String getComputationName()
ComputationFactory
to decide what to return.public Class<? extends ComputationFactory> getComputationFactoryClass()
ComputationFactory
public Class<? extends Computation> getComputationClass()
Computation
public void setComputationClass(Class<? extends Computation> computationClass)
computationClass
- Runs vertex computationpublic final void setVertexValueFactoryClass(Class<? extends VertexValueFactory> vertexValueFactoryClass)
vertexValueFactoryClass
- Creates default vertex valuespublic void setEdgeInputFilterClass(Class<? extends EdgeInputFilter> edgeFilterClass)
edgeFilterClass
- class to usepublic void setVertexInputFilterClass(Class<? extends VertexInputFilter> vertexFilterClass)
vertexFilterClass
- class to usepublic Class<? extends OutEdges> getOutEdgesClass()
public final void setOutEdgesClass(Class<? extends OutEdges> outEdgesClass)
outEdgesClass
- Determines the way edges are storedpublic final void setVertexClass(Class<? extends Vertex> vertexClass)
vertexClass
- class of the vertex implementationpublic final void setInputOutEdgesClass(Class<? extends OutEdges> inputOutEdgesClass)
inputOutEdgesClass
- Determines the way edges are storedpublic boolean reuseEdgeObjects()
OutEdges
implementation
copies the passed edges to its own data structure,
i.e. it doesn't keep references to Edge objects, target vertex ids or edge
values passed to add() or initialize().
This makes it possible to reuse edge objects passed to the data
structure, to minimize object instantiation (see for example
EdgeStore#addPartitionEdges()).public boolean reuseVertexObjects()
Partition
implementation copies the passed vertices
to its own data structure, i.e. it doesn't keep references to Vertex
objects passed to it.
This makes it possible to reuse vertex objects passed to the data
structure, to minimize object instantiation.public Class<? extends Partition> getPartitionClass()
public boolean hasVertexInputFormat()
VertexInputFormat
?VertexInputFormat
has been specified.public void setVertexInputFormatClass(Class<? extends VertexInputFormat> vertexInputFormatClass)
vertexInputFormatClass
- Determines how graph is inputpublic boolean hasEdgeInputFormat()
EdgeInputFormat
?EdgeInputFormat
has been specified.public void setEdgeInputFormatClass(Class<? extends EdgeInputFormat> edgeInputFormatClass)
edgeInputFormatClass
- Determines how graph is inputpublic void setMappingInputFormatClass(Class<? extends MappingInputFormat> mappingInputFormatClass)
mappingInputFormatClass
- Determines how mappings are inputpublic final void setMasterComputeClass(Class<? extends MasterCompute> masterComputeClass)
masterComputeClass
- Runs master computationpublic final void addMasterObserverClass(Class<? extends MasterObserver> masterObserverClass)
masterObserverClass
- MasterObserver class to add.public final void addWorkerObserverClass(Class<? extends WorkerObserver> workerObserverClass)
workerObserverClass
- WorkerObserver class to add.public final void addMapperObserverClass(Class<? extends MapperObserver> mapperObserverClass)
mapperObserverClass
- MapperObserver class to add.public final void addGcObserverClass(Class<? extends GcObserver> gcObserverClass)
gcObserverClass
- GcObserver class to add.public Class<? extends GiraphJobObserver> getJobObserverClass()
public void setJobObserverClass(Class<? extends GiraphJobObserver> klass)
klass
- GiraphJobObserver class to set.public Class<? extends GiraphJobRetryChecker> getJobRetryCheckerClass()
public void setJobRetryCheckerClass(Class<? extends GiraphJobRetryChecker> klass)
klass
- GiraphJobRetryChecker class to set.public boolean isJMapHistogramDumpEnabled()
public boolean isReactiveJmapHistogramDumpEnabled()
public final void setClasses(String name, Class<?> xface, Class<?>... klasses)
name
- String key name to use.xface
- interface of the classes being set.klasses
- Classes to set.public boolean hasVertexOutputFormat()
VertexOutputFormat
?VertexOutputFormat
has been specified.public final void setVertexOutputFormatClass(Class<? extends VertexOutputFormat> vertexOutputFormatClass)
vertexOutputFormatClass
- Determines how graph is outputpublic boolean hasVertexOutputFormatSubdir()
VertexOutputFormat
subdir? VertexOutputFormat
subdir has been specified.public final void setVertexOutputFormatSubdir(String path)
path
- path where the vertices will be written
public final boolean doOutputDuringComputation()
public final void setDoOutputDuringComputation(boolean doOutputDuringComputation)
doOutputDuringComputation
- True iff we want output to happen
during computationpublic final boolean vertexOutputFormatThreadSafe()
public final void setVertexOutputFormatThreadSafe(boolean vertexOutputFormatThreadSafe)
vertexOutputFormatThreadSafe
- True iff selected VertexOutputFormat
is thread-safepublic boolean hasEdgeOutputFormat()
EdgeOutputFormat
?EdgeOutputFormat
has been specified.public final void setEdgeOutputFormatClass(Class<? extends EdgeOutputFormat> edgeOutputFormatClass)
edgeOutputFormatClass
- Determines how graph is outputpublic boolean hasEdgeOutputFormatSubdir()
EdgeOutputFormat
subdir?EdgeOutputFormat
subdir has been specified.public final void setEdgeOutputFormatSubdir(String path)
path
- path where the edges will be writtenpublic final int getNumOutputThreads()
public void setNumOutputThreads(int numOutputThreads)
numOutputThreads
- Number of output threadspublic void setMessageCombinerClass(Class<? extends MessageCombiner> messageCombinerClass)
messageCombinerClass
- Determines how vertex messages are combinedpublic final void setGraphPartitionerFactoryClass(Class<? extends GraphPartitionerFactory> graphPartitionerFactoryClass)
graphPartitionerFactoryClass
- Determines how the graph is partitionedpublic final void setVertexResolverClass(Class<? extends VertexResolver> vertexResolverClass)
vertexResolverClass
- Determines how vertex mutations are resolvedpublic final boolean getResolverCreateVertexOnMessages()
public final void setResolverCreateVertexOnMessages(boolean v)
v
- true if we should create vertices when they get messages.public final void setVertexValueCombinerClass(Class<? extends VertexValueCombiner> vertexValueCombinerClass)
vertexValueCombinerClass
- Determines how vertices are combinedpublic final void setWorkerContextClass(Class<? extends WorkerContext> workerContextClass)
workerContextClass
- Determines what code is executed on each
worker before and after each superstep and computation
public final void setAggregatorWriterClass(Class<? extends AggregatorWriter> aggregatorWriterClass)
aggregatorWriterClass
- Determines how the aggregators are
written to file at the end of the jobpublic final void setPartitionClass(Class<? extends Partition> partitionClass)
partitionClass
- Determines the way partitions are stored
public final void setWorkerConfiguration(int minWorkers, int maxWorkers, float minPercentResponded)
minWorkers
- Minimum workers to do a superstepmaxWorkers
- Maximum workers to do a superstep
(max map tasks in job)minPercentResponded
- 0 - 100 % of the workers required to
have responded before continuing the supersteppublic final int getMinWorkers()
public final int getMaxWorkers()
public final float getMinPercentResponded()
public final int getMaxMappers()
public final void setZooKeeperConfiguration(String serverList)
serverList
- Comma-separated list of servers and ports
(e.g. zk1:2221,zk2:2221)
public final boolean getSplitMasterWorker()
public Class<? extends MasterObserver>[] getMasterObserverClasses()
public Class<? extends WorkerObserver>[] getWorkerObserverClasses()
public Class<? extends MapperObserver>[] getMapperObserverClasses()
public Class<? extends GcObserver>[] getGcObserverClasses()
public boolean metricsEnabled()
public int getTaskPartition()
public boolean isPureYarnJob()
public String getYarnLibJars()
public void setYarnLibJars(String jarList)
jarList
- a comma-separated list of jar namespublic int getYarnTaskHeapMb()
public void setYarnTaskHeapMb(int heapMb)
heapMb
- the heap size for all taskspublic String getZookeeperList()
public void setZookeeperList(String zkList)
zkList
- comma-separated list of ZooKeeper servers
public boolean isZookeeperExternal()
public String getLocalLevel()
public boolean useLogThreadLayout()
public boolean getLocalTestMode()
public void setLocalTestMode(boolean flag)
flag
- the test status for this jobpublic int getZooKeeperSessionTimeout()
public int getZookeeperOpsMaxAttempts()
public int getZookeeperOpsRetryWaitMsecs()
public boolean getNettyServerUseExecutionHandler()
public int getNettyServerThreads()
public int getNettyServerExecutionThreads()
public int getNettyServerExecutionConcurrency()
public io.netty.buffer.ByteBufAllocator getNettyAllocator()
public int getZookeeperConnectionAttempts()
public int getZooKeeperMinSessionTimeout()
public int getZooKeeperMaxSessionTimeout()
public int getMapTasks()
public boolean authenticate()
public void setNumComputeThreads(int numComputeThreads)
numComputeThreads
- Number of compute threads to usepublic int getNumComputeThreads()
public void setNumInputSplitsThreads(int numInputSplitsThreads)
numInputSplitsThreads
- Number of input split threads to usepublic int getNumInputSplitsThreads()
public long getInputSplitMaxVertices()
public long getInputSplitMaxEdges()
public void useUnsafeSerialization(boolean useUnsafeSerialization)
useUnsafeSerialization
- If true, use unsafe serializationpublic void setCheckpointFrequency(int checkpointFrequency)
checkpointFrequency
- How often to checkpoint (0 means never)public int getCheckpointFrequency()
public boolean useCheckpointing()
public void setCheckpointSupportedChecker(Class<? extends CheckpointSupportedChecker> clazz)
clazz
- checkpoint supported checker classpublic void setMaxTaskAttempts(int maxTaskAttempts)
maxTaskAttempts
- Max task attempts to usepublic int getMaxTaskAttempts()
public int getEventWaitMsecs()
public void setEventWaitMsecs(int eventWaitMsecs)
eventWaitMsecs
- Number of milliseconds to wait for an event before
continuing onpublic int getMaxMasterSuperstepWaitMsecs()
public int getMaxCounterWaitMsecs()
public void setMaxMasterSuperstepWaitMsecs(int maxMasterSuperstepWaitMsecs)
maxMasterSuperstepWaitMsecs
- Maximum milliseconds to wait before
giving up trying to get the minimum
number of workers before a supersteppublic void configureHadoopSecurity()
public boolean useInputSplitLocality()
public String getLocalHostname() throws UnknownHostException
UnknownHostException
- IP address of a host could not be determinedpublic String getLocalHostOrIp() throws UnknownHostException
UnknownHostException
- IP address of a host could not be determinedpublic void setMaxNumberOfSupersteps(int maxNumberOfSupersteps)
maxNumberOfSupersteps
- Maximum number of superstepspublic int getMaxNumberOfSupersteps()
public String getYourKitOutputDir(org.apache.hadoop.mapreduce.Mapper.Context context)
context
- Map contextpublic String getStringVars(String key, org.apache.hadoop.mapreduce.Mapper.Context context)
key
- name of key to lookupcontext
- mapper contextpublic String getStringVars(String key, String defaultValue, org.apache.hadoop.mapreduce.Mapper.Context context)
key
- name of key to lookupdefaultValue
- value to return if no mapping exists. This can also
have variables, which will be substituted.context
- mapper contextpublic boolean getCreateSourceVertex()
public void setCreateSourceVertex(boolean createVertex)
createVertex
- create source vertex optionpublic int getWaitTaskDoneTimeoutMs()
public void setWaitTaskDoneTimeoutMs(int ms)
ms
- Milliseconds to setpublic boolean trackJobProgressOnClient()
public int getHdfsFileCreationRetries()
public int getHdfsFileCreationRetryWaitMs()
Copyright © 2011-2020 The Apache Software Foundation. All Rights Reserved.