我有data.txt如下文件。
12, 345, 6789
Run Code Online (Sandbox Code Playgroud)
现在,我想在参数文件或标准输入的指定字段中使用指定的位数执行前导零填充。自变量文件的指定字段中指定的位数为 8 位数。我该怎么办?
这是我的代码:
import org.apache.spark.sql.types._
import org.apache.spark.sql.types._
import org.apache.spark.SparkConf
import org.apache.spark.SparkContext
import org.apache.spark.SparkContext._
import org.apache.spark.sql._
//Convert textfile to DF
val conf = new SparkConf().setAppName("ct").setMaster("local").set("spark.driver.allowMultipleContexts", "true")
val sc = SparkContext(conf)
val sparkSess = SparkSession.builder().appName("SparkSessionZipsExample").config(conf).getOrCreate()
val path = "data.txt"
val data = sc.textFile(path)
val colNum = data.first().split(",").size
var schemaString = "key"
for( i <- 1 to colNum - 1) {
schemaString += " value" + i
}
val fields = schemaString.split(" ").map(fieldName => StructField(fieldName, StringType, …Run Code Online (Sandbox Code Playgroud)