object SparkDistCP extends Logging
Spark-based DistCp application. `SparkDistCP.main` is the command-line entry point to the application, and `SparkDistCP.run` is the programmatic API entry point.
- Alphabetic
- By Inheritance
- SparkDistCP
- Logging
- AnyRef
- Any
- Hide All
- Show All
- Public
- All
Type Members
- type KeyedCopyDefinition = (URI, CopyDefinitionWithDependencies)
Value Members
-
final
def
!=(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
##(): Int
- Definition Classes
- AnyRef → Any
-
final
def
==(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
asInstanceOf[T0]: T0
- Definition Classes
- Any
-
def
clone(): AnyRef
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()
-
final
def
eq(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
def
equals(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
def
finalize(): Unit
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( classOf[java.lang.Throwable] )
-
final
def
getClass(): Class[_]
- Definition Classes
- AnyRef → Any
- Annotations
- @native()
-
def
hashCode(): Int
- Definition Classes
- AnyRef → Any
- Annotations
- @native()
-
final
def
isInstanceOf[T0]: Boolean
- Definition Classes
- Any
-
def
isTraceEnabled: Boolean
- Attributes
- protected
- Definition Classes
- Logging
-
def
logDebug(msg: ⇒ String, throwable: Throwable): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logDebug(msg: ⇒ String): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logError(msg: ⇒ String, throwable: Throwable): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logError(msg: ⇒ String): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logInfo(msg: ⇒ String, throwable: Throwable): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logInfo(msg: ⇒ String): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logName: String
- Attributes
- protected
- Definition Classes
- Logging
-
def
logTrace(msg: ⇒ String, throwable: Throwable): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logTrace(msg: ⇒ String): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logWarning(msg: ⇒ String, throwable: Throwable): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logWarning(msg: ⇒ String): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
main(args: Array[String]): Unit
Main entry point for the command line.
Main entry point for the command line. Arguments are currently:
Usage: SparkDistCP [options] [source_path...] <target_path>
- `--i`: Ignore failures
- `--log <value>`: Write logs to a URI
- `--dryrun`: Perform a trial run with no changes made
- `--verbose`: Run in verbose mode
- `--overwrite`: Overwrite destination
- `--update`: Overwrite if source and destination differ in size, or checksum
- `--filters <value>`: The path to a file containing a list of pattern strings, one string per line, such that paths matching the pattern will be excluded from the copy.
- `--delete`: Delete the files existing in the dst but not in src
- `--numListstatusThreads <value>`: Number of threads to use for building file listing
- `--consistentPathBehaviour`: Revert the path behaviour when using overwrite or update to the path behaviour of non-overwrite/non-update
- `--maxFilesPerTask <value>`: Maximum number of files to copy in a single Spark task
- `--maxBytesPerTask <value>`: Maximum number of bytes to copy in a single Spark task
- `--help`: prints this usage text
- `[source_path...] <target_path>`
-
final
def
ne(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
final
def
notify(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native()
-
final
def
notifyAll(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native()
-
def
run(sparkSession: SparkSession, sourcePaths: Seq[Path], destinationPath: Path, options: SparkDistCPOptions): Unit
Main entry point for programmatic access to the application.
Main entry point for programmatic access to the application.
- sparkSession
Active Spark Session
- sourcePaths
Source paths to copy from
- destinationPath
Destination path to copy to
- options
Options to use in the application
-
def
setLogLevel(level: Level): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
final
def
synchronized[T0](arg0: ⇒ T0): T0
- Definition Classes
- AnyRef
-
def
toString(): String
- Definition Classes
- AnyRef → Any
-
final
def
wait(): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )
-
final
def
wait(arg0: Long, arg1: Int): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )
-
final
def
wait(arg0: Long): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()