利用 Spark 将表中数据拆分

# coding:utf-8
from pyspark.sql import SparkSession

import os

if __name__ == '__main__':
    # Script entry point: read a CSV file with a header row, register it as
    # the temp view "movies", and print the rows with the '#'-separated
    # `category` column exploded into one row per value (column `type1`).

    # Point PySpark at the JDK it should use to launch the JVM. A raw string
    # keeps the Windows backslashes from being read as escape sequences.
    os.environ['JAVA_HOME'] = r'C:\Program Files\Java\jdk1.8.0_211'
    # Debug output: prints the repr of the os.path module in use.
    print(os.path)

    # Parentheses allow the fluent builder chain to span several lines.
    spark = (
        SparkSession
        .builder
        .appName("Python Spark SQL basic example")
        .config("spark.some.config.option", "some-value")
        .getOrCreate()
    )
    try:
        path = "C:/Users/Administrator/Desktop/vedios.txt"
        # header=True: take the column names from the first line of the file.
        df = spark.read.csv(path, header=True)
        df.createOrReplaceTempView("movies")
        # split() turns `category` into an array on '#'; LATERAL VIEW explode
        # joins each array element back to its source row as `type1`.
        df = spark.sql("select * from movies lateral view explode(split(category,'#')) as type1")
        df.show()
    finally:
        # Always release the session, even if reading or querying fails.
        spark.stop()
 
---------------------

原文地址:https://www.cnblogs.com/ly570/p/11357420.html