TextDelimitedIndexedDatasetReader

Instance Constructors

new TextDelimitedIndexedDatasetReader(readSchema: Schema)(implicit mc: DistributedContext)

readSchema
describes the delimiters and positions of values in the text delimited file to be read.
mc
Spark context for reading files

Value Members

final def !=(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def !=(arg0: Any): Boolean

Definition Classes
Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def ==(arg0: Any): Boolean

Definition Classes
Any
final def asInstanceOf[T0]: T0

Definition Classes
Any
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
def elementReader(mc: DistributedContext, readSchema: Schema, source: String, existingRowIDs: Option[BiDictionary] = None): IndexedDatasetSpark

Read in text-delimited elements from all URIs in the comma-delimited source String and return the DRM of all elements, updating the row and column dictionaries.
Read in text-delimited elements from all URIs in the comma-delimited source String and return the DRM of all elements, updating the row and column dictionaries. If there is no strength value in the element, assume its presence means a strength of 1.
mc
context for the Spark job
readSchema
describes the delimiters and positions of values in the text delimited file.
source
comma delimited URIs of text files to be read from
returns
a new org.apache.mahout.sparkbindings.indexeddataset.IndexedDatasetSpark

Attributes
protected
Definition Classes
TDIndexedDatasetReader → Reader
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
def hashCode(): Int

Definition Classes
AnyRef → Any
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
implicit val mc: DistributedContext

Spark context for reading files
Spark context for reading files

Definition Classes
TextDelimitedIndexedDatasetReader → Reader
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
def readElementsFrom(source: String, existingRowIDs: Option[BiDictionary]): IndexedDatasetSpark

Definition Classes
Reader
def readRowsFrom(source: String, existingRowIDs: Option[BiDictionary]): IndexedDatasetSpark

Definition Classes
Reader
val readSchema: Schema

describes the delimiters and positions of values in the text delimited file to be read.
describes the delimiters and positions of values in the text delimited file to be read.

Definition Classes
TextDelimitedIndexedDatasetReader → Reader
def rowReader(mc: DistributedContext, readSchema: Schema, source: String, existingRowIDs: Option[BiDictionary] = None): IndexedDatasetSpark

Read in text-delimited rows from all URIs in this comma-delimited source String and return the DRM of all elements, updating the row and column dictionaries.
Read in text-delimited rows from all URIs in this comma-delimited source String and return the DRM of all elements, updating the row and column dictionaries. If there is no strength value in the element, assume its presence means a strength of 1. Note: if the input file has a strength delimiter but none is seen in the rows, we assume there is none and give the strength as 1 in the input DRM.
mc
context for the Spark job
readSchema
describes the delimiters and positions of values in the text delimited file.
source
comma delimited URIs of text files to be read into the IndexedDatasetSpark
returns
a new org.apache.mahout.sparkbindings.indexeddataset.IndexedDatasetSpark

Attributes
protected
Definition Classes
TDIndexedDatasetReader → Reader
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def toString(): String

Definition Classes
AnyRef → Any
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )

class TextDelimitedIndexedDatasetReader extends TDIndexedDatasetReader

Instance Constructors

new TextDelimitedIndexedDatasetReader(readSchema: Schema)(implicit mc: DistributedContext)

Value Members

final def !=(arg0: AnyRef): Boolean

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: AnyRef): Boolean

final def ==(arg0: Any): Boolean

final def asInstanceOf[T0]: T0

def clone(): AnyRef

def elementReader(mc: DistributedContext, readSchema: Schema, source: String, existingRowIDs: Option[BiDictionary] = None): IndexedDatasetSpark

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def finalize(): Unit

final def getClass(): Class[_]

def hashCode(): Int

final def isInstanceOf[T0]: Boolean

implicit val mc: DistributedContext

final def ne(arg0: AnyRef): Boolean

final def notify(): Unit

final def notifyAll(): Unit

def readElementsFrom(source: String, existingRowIDs: Option[BiDictionary]): IndexedDatasetSpark

def readRowsFrom(source: String, existingRowIDs: Option[BiDictionary]): IndexedDatasetSpark

val readSchema: Schema

def rowReader(mc: DistributedContext, readSchema: Schema, source: String, existingRowIDs: Option[BiDictionary] = None): IndexedDatasetSpark

final def synchronized[T0](arg0: ⇒ T0): T0

def toString(): String

final def wait(): Unit

final def wait(arg0: Long, arg1: Int): Unit

final def wait(arg0: Long): Unit

Inherited from TDIndexedDatasetReader

Inherited from Reader[IndexedDatasetSpark]

Inherited from AnyRef

Inherited from Any

Ungrouped