PostgreSQL - queries by examples
Basic queries
-- select
select first_name, last_name, email
from customer;
-- distinct: both the following two forms work
select distinct rating
from film;
select distinct(rating)
from film;
-- count
select count(distinct first_name )
from actor;
-- readable
select count(distinct(first_name))
from actor;
-- this doesn't work, parentheses are required
-- select count distinct first_name
-- from actor;
-- where
select email
from customer
where first_name = 'Nancy' and last_name = 'Thomas';
-- limit
select customer_id
from payment
order by payment_date ASC
limit 10;
-- between and
--- both inclusive
--- not between and
--- when used for timestamp, it includes the time part
select count(*)
from payment
where amount between 5 and 6;
select count(*)
from payment
where amount not between 5 and 6;
select *
from payment
where payment_date between '2007-05-12' and '2007-05-15'
order by payment_date asc;
-- in, not in
select *
from city
where city in ('Hoshiarpur', 'Hino');
information_schema
select *
from city
where city not in ('Hoshiarpur', 'Hino');
-- like, ilike
--- like: case sensitive
--- ilike: case insensitive
--- like: match any characters
--- _: match only one character
select *
from customer
where first_name like 'M%' and last_name ilike 's%';
select *
from customer
where first_name like '_her%';
Date time
-- PostgreSQL time data types
--- TIME: contains only time
--- DATE: contains only date
--- TIMESTAMP: contains date and time
--- TIMESTAMPTZ: contains date, time and timezone
--- related functions and operators: TIMEZONE, NOW, TIMEOFDAY, CURRENT_TIME, CURRENT_DATE
--- show the values of all configuration parameters, with descriptions
SHOW ALL;
--- display the current setting of run-time parameters
SHOW TIMEZONE;
--- date and time functions
SELECT now(), timeofday(), CURRENT_TIME, CURRENT_DATE, CURRENT_TIMESTAMP;
------------------------------------------------------------------------------------------
-- extract information from a time based data type using
--- EXTRACT(): retrieves subfields such as year/month/hour from date/time values
--- AGE(): subtract argument from current_date
--- TO_CHAR(): convert various data types (date/time, numeric) to formatted strings, and convert from formatted strings to specific data types.
SELECT extract(year from payment_date) as payment_year,
extract(quarter from payment_date) as payment_quarter,
extract(month from payment_date) as payment_month,
extract(day from payment_date) as payment_day,
extract(hour from payment_date) as payment_hour,
extract(minute from payment_date) as payment_minute,
extract(second from payment_date) as payment_second,
extract(century from payment_date) as payment_century,
extract(dow from payment_date) as payment_dow
FROM payment;
--- example result: 16 years 4 mons 22 days 1 hours 34 mins 13.003423 secs
SELECT age(payment_date)
FROM payment;
--- example result: 02-15-2007,THURSDAY /FEBRUARY /2007, 7.99
SELECT to_char(payment_date, 'mm-dd-YYYY'),
to_char(payment_date, 'DAY/MONTH/YYYY'),
to_char(amount, '999D00')
FROM payment;
--- During which months did payments occur? Format your answer to return back the full month name.
SELECT distinct to_char(payment_date, 'MONTH')
FROM payment;
--- How many payments occurred on a Monday using extract()
SELECT count(*)
FROM payment
WHERE extract(dow from payment_date) = 1; -- The day of the week as Monday (1) to Sunday (7)
--- How many payments occurred on a Monday using to_char()
SELECT count(*)
FROM payment
WHERE to_char(payment_date, 'D') = '2'; -- day of the week, Sunday (1) to Saturday (7)
-- date()
select b.starttime, f.name
from bookings as b inner join facilities f on f.facid = b.facid
where f.name like 'Tennis Court%'
and date(b.starttime) = '2012-09-21';
Group By
-- most common aggregate functions
--- COUNT(): simply returns the number of rows
--- AVG(): returns a floating point, you can use ROUND() to specify precision after the decimal
--- MAX(): returns the maximum element
--- MIN(): returns the minimum element
--- SUM(): returns the sum
--- aggregate functions can appear in SELECT, HAVING and ORDER BY clauses, but not WHERE statements
select min(replacement_cost), max(replacement_cost), round(avg(replacement_cost), 2), sum(replacement_cost)
from film;
-- group by: aggregate on one or more columns
--- in the SELECT statement, columns must either have an aggregate function or be in the GROUP BY call
--- WHERE statements should not refer to the aggregation result, should use HAVING to filter on aggregation result
--- can use ORDER BY to sort results based on the aggregate, but make sure to reference the entire aggregate function
-- the total amount per customer per staff
select customer_id, staff_id, sum(amount)
from payment
group by customer_id, staff_id
order by customer_id, staff_id, sum(amount);
select date(payment_date), sum(amount)
from payment
group by date(payment_date)
order by date(payment_date), sum(amount) desc;
select staff_id, count(*)
from payment
group by staff_id
order by count(*) desc;
select rating, round(avg(replacement_cost), 2)
from film
group by rating;
select customer_id, sum(amount)
from payment
group by customer_id
order by sum(amount) desc
limit 5;
-- HAVING: filter on the aggregate
--- we can use filter on non-aggregate columns in WHERE because they're valid before GROUP BY
--- we can NOT use filter on aggregate columns in WHERE because they're valid AFTER GROUP BY
select customer_id, sum(amount)
from payment
where customer_id not in (184, 477, 550)
group by customer_id
having sum(amount) > 100
order by sum(amount) desc;
select customer_id, count(*)
from payment
group by customer_id
having count(*) >= 40;
select customer_id, sum(amount)
from payment
where staff_id = 2
group by customer_id
having sum(amount) > 110;
Join
-- AS
--- it's an alias of a column or an aggregate
--- it's executed at the very end of a query, so we cannot use the alias inside a WHERE operator
select count(*) as num_transactions
from payment;
select customer_id, sum(amount) as total_spent
from payment
group by customer_id
having sum(amount) > 100; -- cannot use 'total_spent' here because it doesn't exist yet
-- INNER JOIN
--- results with a set of records that match in both tables
--- the order of the tables to INNER JOIN doesn't matter
--- if you use just JOIN without the INNER, PostgreSQL will treat it as an INNER JOIN
select payment_id, customer.customer_id, first_name, last_name -- we need to prefix the table if the join column appears in SELECT
from customer inner join payment on customer.customer_id = payment.customer_id;
---------------------------------------------------------------------------------------------------------------------
-- FULL [OUTER] JOIN
--- OUTER is optional
--- grab everything in both tables, columns that don't match will be filled with NULL
---- if table A has 200 records, table B has 300 records, and the matched records is 150, then the result will be:
---- 150 + (200 - 150) + (300 - 150) = 350
--- the table order doesn't matter
--- use WHERE to get rows unique to either table (rows not found in both tables), this is opposite to INNER JOIN
--- get everything from customer and payment
--- rows in both tables, rows in only one table and the value for the other table fields are null
select *
from customer full outer join payment
on customer.customer_id = payment.customer_id;
--- do we have any customer without payment, or any payment without customer?
--- this is opposite to INNER JOIN
select *
from customer full outer join payment
on customer.customer_id = payment.customer_id
where customer.customer_id is null or payment.payment_id is null;
---------------------------------------------------------------------------------------------------------------------
-- A LEFT [OUTER] JOIN B
--- OUTER is optional
--- return records in table A, if there is no match with table B, the the column values are null
--- the table order does matter
--- use WHERE to get rows unique to table A
--- get all films and their inventory (even the films don't have inventory)
select film.film_id, film.title, inventory.inventory_id, inventory.store_id
from film left join inventory on film.film_id = inventory.film_id;
--- do we have any film that are not linked to inventory?
select film.film_id, film.title, inventory.inventory_id, inventory.store_id
from film left join inventory on film.film_id = inventory.film_id
where inventory.film_id is null;
---------------------------------------------------------------------------------------------------------------------
-- A RIGHT [OUTER] JOIN B
--- OUTER is optional
--- essentially the same as LEFT JOIN, except the tables are switched
--- return records in table B, if there is no match with table A, the the column values are null
--- do we have any film that are not linked to inventory?
select film.film_id, film.title, inventory.inventory_id, inventory.store_id
from inventory right join film on film.film_id = inventory.film_id
where inventory.film_id is null;
---------------------------------------------------------------------------------------------------------------------
-- UNION
--- combine the result-set of two or more SELECT statements
--- directly concatenate two results together
--- the columns in SELECT statements MUST be exactly the same
select customer_id
from payment
union
select customer_id
from customer;
---------------------------------------------------------------------------------------------------------------------
-- self join is using standard join to join two copies of the same table on different columns.
--- find the film pair whose film length is the same
select f1.title, f2.title
from film as f1
inner join film as f2
on f1.film_id != f2.film_id -- if f1.film_id = f2.film_id, then the same film will be mapped to itself
and f1.length = f2.length;