// Read the input file as an RDD with one element per line of text.
val rawData = sc.textFile("/user/zhaoja/test/input/xxt.txt")

// Convert every comma-separated line into a LabeledPoint:
//   - all columns except the last form the dense feature vector;
//   - the last column, decremented by one, becomes the label.
// Every field must parse as a Double, otherwise `toDouble` throws.
val data = rawData.map { row =>
  val columns = row.split(',').map(field => field.toDouble)

  // Features are built first, from everything but the trailing column.
  val features = Vectors.dense(columns.init)

  // Pair the shifted label (last column minus one) with its features.
  LabeledPoint(columns.last - 1, features)
}

 

scala> data.take(1)
res70: Array[org.apache.spark.mllib.regression.LabeledPoint] = Array((0.0,[9.0,21.0,3.0,4.0,5.0]))

 

posted on 2017-08-16 15:41  充实自己  阅读(90)  评论(0)  编辑  收藏  举报