SQL SCRIPTS

AWS REDSHIFT: A COMPREHENSIVE GUIDE


Demo: Creating Cluster
-- Find total sales on a given calendar date.
SELECT sum(qtysold)
FROM sales, date
WHERE sales.dateid = date.dateid
AND caldate = '2008-01-06';

-- Find top 10 buyers by quantity.
SELECT firstname, lastname, total_quantity
FROM (SELECT buyerid, sum(qtysold) total_quantity
FROM sales
GROUP BY buyerid
ORDER BY total_quantity desc limit 10) Q, users
WHERE Q.buyerid = userid
ORDER BY Q.total_quantity desc;
Demo: Uploading External File

--create schema
create schema ext_file_demo;

--create table: sales
create table ext_file_demo.sales(
salesid integer not null,
listid integer not null distkey,
sellerid integer not null,
buyerid integer not null,
eventid integer not null,
dateid smallint not null sortkey,
qtysold smallint not null,
pricepaid decimal(8,2),
commission decimal(8,2),
saletime timestamp);

--load data from external file


COPY ext_file_demo.sales from
's3://test-redshift-demo/demo-2/sales_tab.txt'
credentials
'aws_iam_role=arn:aws:iam::$account_id:role/test-redshift-role-s3'
delimiter '\t'
timeformat 'MM/DD/YYYY HH:MI:SS'
region 'us-west-2';
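
If the COPY fails or loads fewer rows than expected, the STL_LOAD_ERRORS system table records each rejected row and the reason it was rejected. A minimal diagnostic sketch (the column list shown is illustrative):

--check recent load errors
SELECT starttime, filename, line_number, colname, err_reason
FROM stl_load_errors
ORDER BY starttime DESC
LIMIT 10;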

--validation query: get total count of sales records
SELECT count(*) from ext_file_demo.sales;

--validation query: find total sales on a given calendar date
SELECT sum(qtysold)
FROM ext_file_demo.sales s, date
WHERE s.dateid = date.dateid
AND caldate = '2008-01-05';
Demo: Accessing Redshift Externally

--create user
CREATE USER test_user_1 WITH PASSWORD 'test_USER_1' VALID UNTIL '2022-01-01';

-- assign permissions to user
GRANT ALL PRIVILEGES ON ALL TABLES IN SCHEMA public TO test_user_1;
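
The grant can be verified from SQL before handing out the credentials; HAS_TABLE_PRIVILEGE returns true if the user holds the named privilege (a sketch against one of the demo tables):

-- confirm test_user_1 can select from public.sales
SELECT has_table_privilege('test_user_1', 'public.sales', 'select');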
Demo: Loading & Unloading Data

--create schema
create schema loading_data_demo;

--setting search path
SET search_path = loading_data_demo,public;

--create table: sales
create table sales(
salesid integer not null,
listid integer not null distkey,
sellerid integer not null,
buyerid integer not null,
eventid integer not null,
dateid smallint not null sortkey,
qtysold smallint not null,
pricepaid decimal(8,2),
commission decimal(8,2),
saletime timestamp);

--load data from s3
copy sales from 's3://test-redshift-demo/demo-4/sales_'
credentials
'aws_iam_role=arn:aws:iam::$account_id:role/test-redshift-role-s3'
delimiter '\t'
timeformat 'MM/DD/YYYY HH:MI:SS'
region 'us-west-2';
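
A quick way to confirm how many rows the COPY just loaded in this session is the PG_LAST_COPY_COUNT function:

-- rows loaded by the most recent COPY in this session
select pg_last_copy_count();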

-- create table sales_update with source as sales
create table sales_update as
select * from sales;

-- change every fifth seller, so we have updates in sales_update table
update sales_update
set qtysold = qtysold*2,
pricepaid = pricepaid*0.8,
commission = commission*1.1
where saletime > '2008-11-30'
and mod(sellerid, 5) = 0;

-- Add some new rows so we have sample insert data. The query creates a
-- duplicate of every fourth seller id.
insert into sales_update
select (salesid + 172456) as salesid, listid, sellerid, buyerid, eventid,
dateid, qtysold, pricepaid, commission, getdate() as saletime
from sales
where saletime > '2008-11-30'
and mod(sellerid, 4) = 0;

-- Create a staging table and populate it with updated rows from sales_update
create temp table stagesales as
select * from sales_update
where sales_update.saletime > '2008-11-30'
and sales_update.salesid = (select sales.salesid from sales
where sales.salesid = sales_update.salesid
and sales.listid = sales_update.listid
and (sales_update.qtysold != sales.qtysold
or sales_update.pricepaid != sales.pricepaid));

-- insert the new records into the stage table
insert into stagesales
select su.salesid, su.listid, su.sellerid, su.buyerid, su.eventid, su.dateid,
       su.qtysold, su.pricepaid, su.commission, su.saletime
from sales_update su left join sales on su.salesid = sales.salesid
where sales.salesid is null;

-- Start a new transaction
begin transaction;

delete from sales
using stagesales
where sales.salesid = stagesales.salesid
and sales.listid = stagesales.listid
and sales.saletime > '2008-11-30';

-- Insert all the rows from the staging table into the target table
insert into sales
select * from stagesales;

-- End transaction and commit
end transaction;

-- Drop the staging table
drop table stagesales;
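
Newer Redshift releases also offer a native MERGE statement that collapses this delete-then-insert pattern into a single command; a sketch of the equivalent merge (not part of the original demo):

MERGE INTO sales
USING stagesales s
ON sales.salesid = s.salesid AND sales.listid = s.listid
WHEN MATCHED THEN UPDATE SET
  qtysold = s.qtysold, pricepaid = s.pricepaid, commission = s.commission
WHEN NOT MATCHED THEN INSERT VALUES
  (s.salesid, s.listid, s.sellerid, s.buyerid, s.eventid, s.dateid,
   s.qtysold, s.pricepaid, s.commission, s.saletime);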

-- validating results
select count(*) from sales;

select count(*) from sales_update;

select count(*) from sales_update
where sales_update.saletime > '2008-11-30'
and sales_update.salesid = (select sales.salesid from sales
where sales.salesid = sales_update.salesid
and sales.listid = sales_update.listid
and (sales_update.qtysold != sales.qtysold
or sales_update.pricepaid != sales.pricepaid));

-- unload
unload ('select * from sales')
to 's3://test-redshift-demo/demo-4/unload/sales_'
iam_role 'arn:aws:iam::$account_id:role/test-redshift-role-s3';
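
By default UNLOAD writes one file per slice in parallel; options such as PARALLEL OFF, HEADER, and DELIMITER change that behavior (a sketch; the modified prefix is illustrative):

-- unload serially with a header row and comma delimiter
unload ('select * from sales')
to 's3://test-redshift-demo/demo-4/unload/sales_single_'
iam_role 'arn:aws:iam::$account_id:role/test-redshift-role-s3'
parallel off
header
delimiter ',';
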
Demo: Materialized View

-- create schema
create schema mat_view_demo;

-- set search path
SET search_path = mat_view_demo,public;

-- sales table contains eventids
-- event table contains eventname
-- query to get the event (eventname) and the total sales associated with it
SELECT e.eventname eventname,
       sum(s.pricepaid) total_sales
FROM event e, sales s
WHERE e.eventid = s.eventid
GROUP BY e.eventname
order by e.eventname;

-- create materialized view
CREATE MATERIALIZED VIEW tickets_mv
AS (SELECT e.eventname eventname,
sum(s.pricepaid) total_sales
FROM event e, sales s
WHERE e.eventid = s.eventid
GROUP BY e.eventname);

-- check the view data
select * from mat_view_demo.tickets_mv order by eventname;

-- update the underlying sales data so the view becomes stale
update sales s set pricepaid = pricepaid*2 where eventid in (select eventid
from event where eventname = '.38 Special');

-- refresh the view data
refresh materialized view mat_view_demo.tickets_mv;

-- auto refresh
CREATE MATERIALIZED VIEW tickets_mv_2 AUTO REFRESH YES
AS (SELECT e.eventname eventname,
sum(s.pricepaid) total_sales
FROM event e, sales s
WHERE e.eventid = s.eventid
GROUP BY e.eventname);
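
Whether a view is stale and whether auto refresh is active can be checked from the STV_MV_INFO system table (a sketch; see the Redshift docs for the full column list):

-- check materialized view state
select schema, name, is_stale, autorefresh, state
from stv_mv_info
where schema = 'mat_view_demo';
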
Demo: Table Design - Distribution Style
-- create schema
create schema table_design_demo;

-- setting search path
SET search_path = table_design_demo,public;

-- checking the distkey for users
select "column", type, distkey
from pg_table_def where tablename = 'users' and schemaname='public';

select * from svv_table_info s where s.schema='public' and s.table ='users';

-- checking the disk usage, distribution
select slice, col, num_values as rows, minvalue, maxvalue
from svv_diskusage
where name='users'
and tbl = (select table_id from svv_table_info s
           where s.schema='public' and s.table ='users')
and col=0
and num_values>0
order by slice, col;

-- state as the dist key
create table userskey distkey(state) as select * from users;

-- checking the disk usage with state as distkey
select slice, col, num_values as rows, minvalue, maxvalue
from svv_diskusage
where name='userskey'
and tbl = (select table_id from svv_table_info s
           where s.schema='table_design_demo' and s.table ='userskey')
and col=0
and num_values>0;

-- even example
create table userseven diststyle even as
select * from users;

select slice, col, num_values as rows, minvalue, maxvalue
from svv_diskusage
where name='userseven'
and tbl = (select table_id from svv_table_info s
           where s.schema='table_design_demo' and s.table ='userseven')
and col=0
and num_values>0;

-- all example
create table usersall diststyle all as
select * from users;

select slice, col, num_values as rows, minvalue, maxvalue
from svv_diskusage
where name='usersall'
and tbl = (select table_id from svv_table_info s
           where s.schema='table_design_demo' and s.table ='usersall')
and col=0
and num_values>0;

-- auto example
create table usersauto as
select * from users;

select slice, col, num_values as rows, minvalue, maxvalue
from svv_diskusage
where name='usersauto'
and tbl = (select table_id from svv_table_info s
           where s.schema='table_design_demo' and s.table ='usersauto')
and col=0
and num_values>0;

select * from svv_table_info s
where s.schema='table_design_demo' and s.table ='usersauto';
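
To compare how evenly each style distributed the rows, the skew_rows column of SVV_TABLE_INFO reports the ratio of the largest slice to the smallest (a sketch):

-- compare distribution skew across the demo tables
select "table", diststyle, skew_rows
from svv_table_info
where schema = 'table_design_demo'
order by "table";
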
Demo: Table Design - Sort Key

-- check sortkey
select "column", type, sortkey
from pg_table_def where tablename = 'usersauto';

-- update the sort key
create table users_custom_sort sortkey (firstname, lastname) as
select * from users;

-- check sortkey
select "column", type, sortkey
from pg_table_def where tablename = 'users_custom_sort';

-- explain functions
explain SELECT firstname, lastname, total_quantity
FROM (SELECT buyerid, sum(qtysold) total_quantity
FROM sales
GROUP BY buyerid
ORDER BY total_quantity desc limit 10) Q,
table_design_demo.users_custom_sort U
WHERE Q.buyerid = U.userid
ORDER BY Q.total_quantity desc;
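
How well the physical sort order is being maintained can be read from the unsorted column of SVV_TABLE_INFO, which gives the percentage of rows not yet in sort key order (a sketch):

-- check sort key and unsorted percentage
select "table", sortkey1, unsorted
from svv_table_info
where schema = 'table_design_demo' and "table" = 'users_custom_sort';
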
Demo: Table Design - Compression
-- compression
select "column", type, encoding
from pg_table_def where tablename = 'usersauto' and
schemaname='table_design_demo';

-- Analyze command
ANALYZE COMPRESSION usersauto;

-- create user table with custom compression
create table users_custom_compression(
userid integer not null distkey sortkey,
username char(8) encode zstd,
firstname varchar(30) encode zstd,
lastname varchar(30) encode zstd,
city varchar(30),
state char(2),
email varchar(100),
phone char(14),
likesports boolean,
liketheatre boolean,
likeconcerts boolean,
likejazz boolean,
likeclassical boolean,
likeopera boolean,
likerock boolean,
likevegas boolean,
likebroadway boolean,
likemusicals boolean);

-- inserting records from users
insert into users_custom_compression
select * from users;

-- checking compression style
select "column", type, encoding
from pg_table_def where tablename = 'users_custom_compression' and
schemaname='table_design_demo';

-- analyze command
ANALYZE COMPRESSION users_custom_compression;
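
The space saved by the custom encodings can be compared via the size column of SVV_TABLE_INFO (size in 1 MB blocks; a sketch):

-- compare on-disk size of the two tables
select "table", size, pct_used
from svv_table_info
where schema = 'table_design_demo'
and "table" in ('usersauto', 'users_custom_compression');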
Demo: Redshift ML

-- create schema
create schema redshift_ml_demo;

-- setting search path
SET search_path = redshift_ml_demo,public;

-- create table: customer_activity
CREATE TABLE customer_activity (
state varchar(2),
account_length int,
area_code int,
phone varchar(8),
intl_plan varchar(3),
vMail_plan varchar(3),
vMail_message int,
day_mins float,
day_calls int,
day_charge float,
total_charge float,
eve_mins float,
eve_calls int,
eve_charge float,
night_mins float,
night_calls int,
night_charge float,
intl_mins float,
intl_calls int,
intl_charge float,
cust_serv_calls int,
churn varchar(6),
record_date date);

-- load data
COPY customer_activity
FROM 's3://test-redshift-demo/demo-15/input/customer_activity.csv'
REGION 'us-west-2' IAM_ROLE 'arn:aws:iam::$account_id:role/test-redshift-ml'
DELIMITER ','
IGNOREHEADER 1;

-- create ML model
CREATE MODEL customer_churn_auto_model FROM (SELECT state,
account_length,
area_code,
total_charge/account_length AS average_daily_spend,
cust_serv_calls/account_length AS average_daily_cases,
churn
FROM customer_activity
WHERE record_date < '2020-01-01'
)
TARGET churn FUNCTION ml_fn_customer_churn_auto
IAM_ROLE 'arn:aws:iam::$account_id:role/test-redshift-ml' SETTINGS (
S3_BUCKET 'test-redshift-demo'
);
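
Model training runs asynchronously; SHOW MODEL reports its status and, once training finishes, the selected model type and validation metrics:

-- check training status and model metadata
SHOW MODEL customer_churn_auto_model;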

-- view model details
select schema_name, model_name, model_state from stv_ml_model_info;

-- use ML model to predict active customers
SELECT phone,
ml_fn_customer_churn_auto(
state,
account_length,
area_code,
total_charge/account_length,
cust_serv_calls/account_length )
AS active FROM customer_activity WHERE record_date > '2020-01-01';

-- using ML model: finding churners and non-churners state-wise
WITH inferred AS (SELECT state,
ml_fn_customer_churn_auto(
state,
account_length,
area_code,
total_charge/account_length,
cust_serv_calls/account_length )::varchar(6)
AS active FROM customer_activity
WHERE record_date > '2020-01-01' )
SELECT state, SUM(CASE WHEN active = 'True.' THEN 1 ELSE 0 END) AS churners,
SUM(CASE WHEN active = 'False.' THEN 1 ELSE 0 END) AS nonchurners,
COUNT(*) AS total_per_state
FROM inferred
GROUP BY state
ORDER BY state;
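
Because rows after the 2020-01-01 training cutoff still carry the ground-truth churn label, a rough accuracy estimate can be computed by comparing the model's output with the stored column (a sketch; assumes the labels use the same 'True.'/'False.' encoding as the predictions):

-- estimate prediction accuracy on post-cutoff rows
SELECT sum(CASE WHEN predicted = churn THEN 1 ELSE 0 END)::float
       / count(*) AS accuracy
FROM (SELECT churn,
             ml_fn_customer_churn_auto(
               state,
               account_length,
               area_code,
               total_charge/account_length,
               cust_serv_calls/account_length )::varchar(6) AS predicted
      FROM customer_activity
      WHERE record_date > '2020-01-01') t;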
