Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- >>> from pyspark.sql import functions as F
- >>> df1 = spark.read.format("csv").option("inferSchema", "true").option("header","true").load('file:///info_new2.txt')
- WARN util.SizeEstimator: Failed to check whether UseCompressedOops is set; assuming yes
- >>> df1.show()
- +---+-------+--------+-------+----+------+-----+
- | id| circle|operator|   info|prio| info1|prio1|
- +---+-------+--------+-------+----+------+-----+
- |  1|  delhi|  airtel|   1234|1.05|   212|  1.8|
- |  2|lucknow|vodafone|  23412|1.01|  2321|  1.5|
- |  3|gurgaon|    idea|     21|1.05|123123|  1.0|
- |  4|chennai|  airtel|   1232| 1.1|    12|  1.1|
- |  2|lucknow|vodafone|3432423| 1.6|123213|  1.1|
- |  3|    ggn|   ideas|  34324| 1.4| 23213|  1.9|
- +---+-------+--------+-------+----+------+-----+
- >>> df3 = df1.groupBy('id').agg(F.min('prio').alias('prio'),F.min('prio1').alias('prio1'),F.min('circle').alias('circle'),F.min('operator').alias('operator')).sort('id')
- >>> df3 = df1.groupBy('id').agg(F.min('prio').alias('prio'),F.min('prio1').alias('prio1'),F.min('circle').alias('circle'),F.min('operator').alias('operator')).sort('id')
- >>> df3.show()
- +---+----+-----+-------+--------+
- | id|prio|prio1| circle|operator|
- +---+----+-----+-------+--------+
- |  1|1.05|  1.8|  delhi|  airtel|
- |  2|1.01|  1.1|lucknow|vodafone|
- |  3|1.05|  1.0|    ggn|    idea|
- |  4| 1.1|  1.1|chennai|  airtel|
- +---+----+-----+-------+--------+
- >>> df4=df3.join(df1, ["id", "prio"]).select(["id","prio","info"])
- >>> df5=df3.join(df1, ["id", "prio1"]).select(["id","prio1","info1"])
- >>>
- >>> df6=df4.join(df5, ["id"])
- >>> df4.show()
- +---+----+-----+
- | id|prio| info|
- +---+----+-----+
- |  1|1.05| 1234|
- |  2|1.01|23412|
- |  3|1.05|   21|
- |  4| 1.1| 1232|
- +---+----+-----+
- >>> df5.show()
- +---+-----+------+
- | id|prio1| info1|
- +---+-----+------+
- |  1|  1.8|   212|
- |  2|  1.1|123213|
- |  3|  1.0|123123|
- |  4|  1.1|    12|
- +---+-----+------+
- >>> df6.show()
- +---+----+-----+-----+------+
- | id|prio| info|prio1| info1|
- +---+----+-----+-----+------+
- |  1|1.05| 1234|  1.8|   212|
- |  2|1.01|23412|  1.1|123213|
- |  3|1.05|   21|  1.0|123123|
- |  4| 1.1| 1232|  1.1|    12|
- +---+----+-----+-----+------+
Add Comment
Please, Sign In to add comment