V2 SQL Final Document
csv")
df.show()
df1.show()
cust.show()
prod.show()
df.createOrReplaceTempView("df")
df1.createOrReplaceTempView("df1")
cust.createOrReplaceTempView("cust")
prod.createOrReplaceTempView("prod")
sc.setLogLevel("ERROR")
spark.sql("select * from df order by id").show()
spark.sql("select * from df1 order by id").show()
====================================
Validate data
====================================
====================================
Select two columns
====================================
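A minimal example, assuming the id and tdate columns used elsewhere in df:
spark.sql("select id,tdate from df").show()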
====================================
Multi Column filter
====================================
spark.sql("select id,tdate,category,spendby from df where category='Exercise'
and spendby='cash' ").show()
====================================
Multi Value Filter
====================================
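A likely example, reusing the category values from the other filters:
spark.sql("select * from df where category in ('Exercise','Gymnastics')").show()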
====================================
Like Filter
====================================
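A sketch of a like filter; the 'Gym%' pattern is an assumed illustration:
spark.sql("select * from df where category like 'Gym%'").show()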
====================================
Not Filters
====================================
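A sketch of a not-equal filter, reusing the Exercise category value:
spark.sql("select * from df where category != 'Exercise'").show()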
====================================
Not In Filters
====================================
spark.sql("select * from df where category not in
('Exercise','Gymnastics')").show()
====================================
Null Filters
====================================
spark.sql("select * from df where product is null").show()
====================================
Not Null Filters
====================================
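The complement of the null filter above:
spark.sql("select * from df where product is not null").show()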
====================================
Max Function
====================================
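The max counterpart of the min query below:
spark.sql("select max(id) from df").show()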
====================================
Min Function
====================================
spark.sql("select min(id) from df ").show()
====================================
Count
====================================
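A minimal row count over df:
spark.sql("select count(*) from df").show()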
====================================
Condition statement
====================================
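A sketch with case when; the cash/credit coding is an assumed illustration:
spark.sql("select category,spendby,case when spendby='cash' then 0 else 1 end as status from df").show()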
====================================
Concat data
====================================
spark.sql("select id,category,concat(id,'-',category) as condata from df").show()
====================================
Concat_ws data
====================================
spark.sql("select
id,category,product,concat_ws('-',id,cate
gory,product) as condata from df").show()
====================================
Lower Case data
====================================
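A minimal lower() example on the category column:
spark.sql("select category,lower(category) as lower_category from df").show()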
====================================
Ceil data
====================================
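A minimal ceil() example, assuming the numeric amount column:
spark.sql("select amount,ceil(amount) as ceil_amount from df").show()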
====================================
Replace Nulls
====================================
spark.sql("select
product,coalesce(product,'NA') as nullrep
from df").show()
====================================
Trim the space
====================================
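A minimal trim() example, assuming stray spaces around product values:
spark.sql("select trim(product) as trimmed from df").show()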
spark.sql("select substring(product,1,10)
as sub from df").show()
====================================
Substring/Split operation
====================================
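A split counterpart, assuming tdate's MM-dd-yyyy format so index 2 is the year:
spark.sql("select split(tdate,'-')[2] as year from df").show()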
====================================
Aggregate Sum
====================================
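A sketch of a grouped sum, assuming the amount column:
spark.sql("select category,sum(amount) as total from df group by category").show()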
====================================
Aggregate Count
====================================
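A grouped count per category:
spark.sql("select category,count(*) as cnt from df group by category").show()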
====================================
Aggregate with Order Descending
====================================
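The same grouped sum, ordered descending by the total:
spark.sql("select category,sum(amount) as total from df group by category order by total desc").show()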
====================================
Window Dense_rank Number
====================================
spark.sql("SELECT category,amount, dense_rank() OVER ( partition by category
order by amount desc ) AS dense_rank FROM df").show()
====================================
Window rank Number
====================================
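The rank() counterpart of the dense_rank query above:
spark.sql("SELECT category,amount, rank() OVER ( partition by category order by amount desc ) AS rank FROM df").show()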
====================================
Having function
====================================
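A sketch of having on a grouped count; the threshold of 1 is an assumption:
spark.sql("select category,count(*) as cnt from df group by category having count(*) > 1").show()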
====================================
Left Join
====================================
spark.sql("select a.id,a.name,b.product from cust a left join prod b on
a.id=b.id").show()
====================================
Right Join
====================================
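The right-join counterpart of the left join above:
spark.sql("select a.id,a.name,b.product from cust a right join prod b on a.id=b.id").show()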
====================================
Full Join
====================================
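The full-join counterpart, keeping unmatched rows from both views:
spark.sql("select a.id,a.name,b.product from cust a full join prod b on a.id=b.id").show()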
spark.sql("select id,tdate,from_unixtime(unix_timestamp(tdate,'MM-dd-
yyyy'),'yyyy-MM-dd') as con_date from df").show()
====================================
Sub query
====================================
spark.sql("""
group by con_date
""").show()
====================================
Total Eclipse Code
====================================
package pack

import org.apache.spark.{SparkConf, SparkContext}
import org.apache.spark.sql.SparkSession

object obj {
  def main(args: Array[String]): Unit = {

    val conf = new SparkConf().setAppName("Revision").setMaster("local[*]")
    val sc = new SparkContext(conf)
    sc.setLogLevel("ERROR")

    val spark = SparkSession.builder().enableHiveSupport()
      .config("spark.sql.warehouse.dir", "file:///C:/hivewarehou/")
      .config("spark.sql.catalogImplementation", "hive")
      .getOrCreate()

    import spark.implicits._

    val df = spark.read.option("header", "true").csv("file:///C:/data/df.csv")
    val df1 = spark.read.option("header", "true").csv("file:///C:/data/df1.csv")
    val cust = spark.read.option("header", "true").csv("file:///C:/data/cust.csv")
    val prod = spark.read.option("header", "true").csv("file:///C:/data/prod.csv")

    df.show()
    df1.show()
    cust.show()
    prod.show()

    df.createOrReplaceTempView("df")
    df1.createOrReplaceTempView("df1")
    cust.createOrReplaceTempView("cust")
    prod.createOrReplaceTempView("prod")

    spark.sql("select id,tdate,from_unixtime(unix_timestamp(tdate,'MM-dd-yyyy'),'yyyy-MM-dd') as con_date from df").show()

    spark.sql("""
      select con_date, sum(amount) as total from (
        -- outer select assumed: daily total of amount per converted date
        select id, tdate, from_unixtime(unix_timestamp(tdate,'MM-dd-yyyy'),'yyyy-MM-dd') as con_date,
               amount, category, product, spendby from df
      )
      group by con_date
    """).show()
  }
}