RDD<T>
persist(storageType?: StorageType): CachedRDD<T>
cache(): CachedRDD<T>
getNumPartitions(): Promise<number>
> rdd = sc.parallelize([1, 2, 3, 4], 2)
> rdd.getNumPartitions()
2
collect(): Promise<T[]>
take(count: number): Promise<T[]>
count(): Promise<number>
max(): Promise<T | null>
min(): Promise<T | null>
mapPartitions<T1>(func: (v: T[]) => T1[] | Promise<T1[]>, env?: FunctionEnv): RDD<T1>
glom(): RDD<T[]>
map<T1>(func: ((v: T) => T1), env?: FunctionEnv): RDD<T1>
reduce(func: ((a: T, b: T) => T), env?: FunctionEnv): Promise<T | null>
flatMap<T1>(func: ((v: T) => T1[]), env?: FunctionEnv): RDD<T1>
filter(func: (v: T) => boolean, env?: FunctionEnv): RDD<T>
distinct(numPartitions?: number): RDD<T>
repartition(numPartitions: number): RDD<T>
partitionBy(numPartitions: number, partitionFunc: (v: T) => number, env?: FunctionEnv): GeneratedRDD<T>
coalesce(numPartitions: number): GeneratedRDD<T>
reduceByKey<K, V>(this: RDD<[K, V]>, func: ((a: V, b: V) => V), numPartitions?: number, partitionFunc?: (v: K) => number, env?: FunctionEnv, ): RDD<[K, V]>
combineByKey<K, V, C>( this: RDD<[K, V]>, createCombiner: ((a: V) => C), mergeValue: ((a: C, b: V) => C), mergeCombiners: ((a: C, b: C) => C), numPartitions?: number, partitionFunc?: (v: K) => number, env?: FunctionEnv, ): RDD<[K, C]>
union(...others: RDD<T>[]): RDD<T>
saveAsTextFile(baseUrl: string, options?: Options): Promise<void>
Options
groupWith<K, V, ...V1>(this: RDD<[K, V]>, ...others: RDD<[K, ...V1]>): RDD<[K, [V[], ...V1[]]]>
cogroup<K, V, V1>(this: RDD<[K, V]>, other: RDD<[K, V1]>, numPartitions?: number): RDD<[K, [V[], V1[]]]>
join<K, V, V1>(this: RDD<[K, V]>, other: RDD<[K, V1]>, numPartitions?: number): RDD<[K, [V, V1]]>
leftOuterJoin<K, V, V1>(this: RDD<[K, V]>, other: RDD<[K, V1]>, numPartitions?: number): RDD<[K, [V, V1]]>
rightOuterJoin<K, V, V1>(this: RDD<[K, V]>, other: RDD<[K, V1]>, numPartitions?: number): RDD<[K, [V, V1]]>
fullOuterJoin<K, V, V1>(this: RDD<[K, V]>, other: RDD<[K, V1]>, numPartitions?: number): RDD<[K, [V, V1]]>
sort(ascending?: boolean, numPartitions?: number): RDD<T>
sortBy<K>(keyFunc: (data: T) => K, ascending?: boolean, numPartitions?: number, env?: FunctionEnv): RDD<T>
CachedRDD<T> extends RDD<T>
unpersist(): Promise<void>
Last updated