# Prerequisite (run in a shell, not in Python):
#     pip install dpark
#
# Example: read "data.txt", keep the records that start with "A", and count
# how many times each such record occurs.
import dpark

# Entry point for building dpark datasets.
context = dpark.DparkContext()

# Dataset backed by the text file; presumably one record per line
# (see the dpark documentation for textFile).
data = context.textFile("data.txt")

# Keep records starting with "A", pair each with a count of 1, then sum the
# counts per distinct record.
result = (
    data.filter(lambda x: x.startswith("A"))
    .map(lambda x: (x, 1))
    .reduceByKey(lambda x, y: x + y)
)

# collect() gathers the (record, count) pairs so they can be printed.
print(result.collect())