1
|
// Generic form of map: apply `func` to every element of `a`.
val b = a.map(func)
|
1
|
// Append the "_NEW" marker to every element of `lines`.
// The lambda parameter is named `line` so it does not shadow the outer `lines`.
val linesNew = lines.map { line =>
  line + "_NEW"
}
|
1
|
// Generic form of flatMap: `func` yields zero or more results per element of `a`,
// and all results are flattened into `b`.
val b = a.flatMap(func)
|
1
|
// Break every line on single spaces and flatten the pieces into one collection of words.
val words = lines.flatMap { line =>
  line.split(" ")
}
|
1
|
// Generic form of filter: keep only the elements of `a` for which `func` returns true.
val b = a.filter(func)
|
1
2
3
4
5
6
7
|
// Build two tagged copies of `words`, then merge them with union.
val wordsOne = words.map(word => word + "_one")
val wordsTwo = words.map(word => word + "_two")
val unionWords = wordsOne.union(wordsTwo)

// Print both inputs and the merged result so they can be compared.
wordsOne.print()
wordsTwo.print()
unionWords.print()
|
1
|
// Count the elements of `words`.
// NOTE(review): presumably `words` is a DStream, in which case this is a
// stream of per-batch counts rather than a single number — confirm.
val wordsCount = words.count()
|
1
|
// Fold all words together pairwise, joining each pair with a "-" separator.
val reduceWords = words.reduce { (left, right) =>
  left + "-" + right
}
|
1
|
// Count how many times each distinct value occurs in `words`.
val countByValueWords = words.countByValue()
|
1
2
|
// Classic word count: pair every word with 1, then sum the 1s per word.
val pairs = words.map { word => (word, 1) }
val wordCounts = pairs.reduceByKey { (total, next) => total + next }
|
1
2
3
|
// Key both collections by the original word so they can be joined on it.
val wordsOne = words.map { w => (w, w + "_one") }
val wordsTwo = words.map { w => (w, w + "_two") }

// Join on the shared key: each result pairs the word with its two tagged forms.
val joinWords = wordsOne.join(wordsTwo)
|
1
|
// Window over `words`: first argument is Seconds(3), second is Seconds(1).
// NOTE(review): presumably (window length, slide interval) of DStream.window — confirm.
val windowWords = {
  val windowLength = Seconds(3)
  val slideInterval = Seconds(1)
  words.window(windowLength, slideInterval)
}
|
1
|
// Count the elements of `words` per window, called with Seconds(3) and Seconds(1).
// NOTE(review): presumably (window length, slide interval) — confirm.
val windowWords = {
  val windowLength = Seconds(3)
  val slideInterval = Seconds(1)
  words.countByWindow(windowLength, slideInterval)
}
|
1
|
// Reduce the words per window, joining them pairwise with "-".
// Called with Seconds(3) and Seconds(1) — presumably (window length, slide interval); confirm.
val windowWords = words.reduceByWindow(
  (left, right) => left + "-" + right,
  Seconds(3),
  Seconds(1)
)
|
1
|
// Sum the Int values of `pairs` per key over a window.
// The lambda keeps explicit Int parameter types, as in the original call.
val windowWords = pairs.reduceByKeyAndWindow(
  (x: Int, y: Int) => x + y,
  Seconds(3),
  Seconds(1)
)
|
1
|
// Windowed per-key sum using two functions: the first adds two values,
// the second subtracts one from the other.
// NOTE(review): this looks like Spark's incremental (inverse-function) variant of
// reduceByKeyAndWindow, which per the Spark docs needs checkpointing enabled —
// confirm the surrounding program sets a checkpoint directory.
val windowWords = pairs.reduceByKeyAndWindow(
  (x: Int, y: Int) => x + y,
  (x: Int, y: Int) => x - y,
  Seconds(3),
  Seconds(1)
)
|
1
|
// Count the occurrences of each distinct value of `words` per window,
// called with Seconds(3) and Seconds(1).
// NOTE(review): presumably (window length, slide interval) — confirm.
// Fix: a stray "[/align]" forum-markup tag was fused to the end of this statement
// and made it invalid Scala; it has been removed.
val windowWords = words.countByValueAndWindow(Seconds(3), Seconds(1))
|
1
2
|
// Split every line on single spaces into words, then print the result.
val words = lines.flatMap { line =>
  line.split(" ")
}
words.print()
|
1
|
// Write `lines` out as text files, passing "satf" and ".txt" as the two arguments.
// Fix: the stray "[/align][align=left]" forum-markup residue that was fused to the
// end of this statement (and made it invalid Scala) has been removed.
// NOTE(review): if this is Spark's DStream.saveAsTextFiles(prefix, suffix), output is
// named "prefix-TIME_IN_MS.suffix", so a suffix of ".txt" would presumably give a
// double dot ("satf-<time>..txt") — confirm whether "txt" was intended.
lines.saveAsTextFiles("satf", ".txt")
|