PySpark 读取本地 txt 文件构建 RDD
#!/usr/bin/env python3 # -*- coding: utf-8 -*- """Created on Fri Mar 8 18:51:51 2019 @author: lg""" from pyspark import SparkContext, SparkConf conf=SparkConf().setAppName("miniProject")…
·
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
Created on Fri Mar 8 18:51:51 2019
@author: lg
"""
from pyspark import SparkContext ,SparkConf
# Driver script: load a local text file as an RDD, print its lines, and
# compute the total number of characters across all lines.

# "local[1]" runs Spark in-process with a single worker thread.
conf = SparkConf().setAppName("miniProject").setMaster("local[1]")
# Alternative configuration: connect to a standalone cluster master instead.
#conf=SparkConf().setAppName("lg").setMaster("spark://192.168.10.182:7077")
sc = SparkContext(conf=conf)
try:
    # One RDD element per line of the file (path is relative to the
    # working directory of the driver).
    lines = sc.textFile("data.txt")
    # Lazy transformation: nothing is read until an action runs.
    lineLengths = lines.map(len)
    print(lines.collect())
    # fold() with a zero value returns 0 for an empty file, whereas
    # reduce() raises ValueError on an empty RDD.
    totalLength = lineLengths.fold(0, lambda a, b: a + b)
finally:
    # Always release the SparkContext, even if reading or an action fails.
    sc.stop()
更多推荐
所有评论(0)