Don't clone records for text files

This commit is contained in:
Patrick Wendell 2014-01-14 11:57:53 -08:00
parent b07bc02a00
commit 6f965a46a9

View file

@ -340,8 +340,8 @@ class SparkContext(
* Hadoop-supported file system URI, and return it as an RDD of Strings.
*/
def textFile(path: String, minSplits: Int = defaultMinSplits): RDD[String] = {
  // Issue a single hadoopFile call. The earlier rendering of this method also contained a
  // leftover `hadoopFile(...).map(...)` expression whose result was discarded, which built
  // an extra, unused RDD before the one actually returned.
  //
  // Each (key, value) record is reduced to the value's toString, so only the resulting
  // String is carried forward from a record.
  // NOTE(review): the trailing `false` is presumably hadoopFile's record-cloning switch
  // (per the commit subject "Don't clone records for text files") -- confirm against
  // hadoopFile's signature, and prefer a named argument there once the name is verified.
  hadoopFile(path, classOf[TextInputFormat], classOf[LongWritable], classOf[Text],
    minSplits, false).map(pair => pair._2.toString)
}
/**