from pyspark import SparkContext
import random
# Generate a "people age" data set and save it as text through Spark.
#
# Each record is the string "<id> <age>": id runs from 1 to 1000 and age is
# the value returned by random.randint(1, 100) for that record.

# Destination passed to saveAsTextFile (file:// URI).
OutputFile = "file:///usr/local/spark/mycode/exercise/people"

# Master is 'local'; the second argument is the application name.
# Plain ASCII quotes are required here: typographic quotes are not valid
# string delimiters in Python and make the whole file fail to parse.
sc = SparkContext('local', 'createPeopleAgeData')

# One "<id> <age>" line per person, ids in ascending order.
peopleAge = [
    str(i) + " " + str(random.randint(1, 100))
    for i in range(1, 1001)
]

# Hand the in-memory list to Spark and write it out as text.
RDD = sc.parallelize(peopleAge)
RDD.saveAsTextFile(OutputFile)