This walkalong consists of medium questions and their solutions from sql-practice.com, written in both SQL and django
ORM, They query results are also compared for equality.
Insert, Update and Delete queries are not included to keep database consistent.
The notebook (Django Shell-plus) is located in here
First cd into the notebook directory cd server/notebook
Then open the notebook using python ../manage.py shell_plus --notebook
import os
os.environ["DJANGO_ALLOW_ASYNC_UNSAFE"] = "true"
from utils import *
from sqlparse import format
from django.db.models import (
Q,
F,
Case,
When,
Count,
Func,
Min,
Max,
Sum,
Avg,
Value,
OuterRef,
Subquery,
CharField,
)
from django.db.models.functions import Concat, Cast, Round, Length, Upper, Lower
from django.db import connection
from customer_db.models import Provinces, Patients, Doctors, Admissions
def print_sql(queryset):
formatted = format(str(queryset.query), reindent=True)
print(formatted)
admission_fields = [
"id",
"patient_id",
"admission_date",
"discharge_date",
"diagnosis",
"attending_doctor_id",
]
class NonAggrCount(Count):
"""
This aggregation will not trigger a group by
"""
contains_aggregate = False
class NonAggrSum(Sum):
contains_aggregate = False
Show unique birth years from patients and order them by ascending.
# Use YEAR(birth_date) for most databases
qstr = """
SELECT
DISTINCT strftime('%Y', birth_date) birth_year
FROM patients
ORDER BY birth_year;
"""
sqlq = sql_raw(qstr)
ormq = (
Patients.objects.annotate(birth_year=Cast(F("birth_date__year"), CharField()))
.distinct()
.order_by("birth_year")
.values("birth_year")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT DISTINCT CAST(django_date_extract(year, "patients"."birth_date") AS text) AS "birth_year"
FROM "patients"
ORDER BY 1 ASC
orm_to_df(ormq[:3])
| | birth_year |
|---:|-------------:|
| 0 | 1975 |
| 1 | 1976 |
| 2 | 1977 |
Show unique first names from the patients table which only occurs once in the list.
For example, if two or more people are named 'John' in the first_name column then don't include their name in the output list. If only 1 person is named 'Leo' then include them in the output.
qstr = """
SELECT first_name
FROM patients
GROUP BY first_name
HAVING COUNT(first_name) = 1
"""
sqlq = sql_raw(qstr)
ormq = (
Patients.objects.values("first_name")
.annotate(occurance=Count("first_name"))
.filter(occurance=1)
.values("first_name")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."first_name"
FROM "patients"
GROUP BY "patients"."first_name"
HAVING COUNT("patients"."first_name") = 1
orm_to_df(ormq[:3])
| | first_name |
|---:|:-------------|
| 0 | Abigail |
| 1 | Alicia |
| 2 | Allison |
Show patient_id and first_name from patients where their first_name start and ends with 's' and is at least 6 characters long. We will do start and ends with 'n' and is at least 6 characters long.
qstr = """
SELECT
patient_id,
first_name
FROM patients
WHERE first_name LIKe "n____%n"
"""
sqlq = sql_raw(qstr)
ormq = Patients.objects.filter(first_name__regex=r"(?i)^n\w{4,}n$").values(
"first_name", patient_id=F("id")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."first_name",
"patients"."patient_id" AS "patient_id"
FROM "patients"
WHERE "patients"."first_name" REGEXP (?i)^n\w{4,}n$
orm_to_df(ormq[:3])
| | first_name | patient_id |
|---:|:-------------|-------------:|
| 0 | Nathan | 54 |
| 1 | Nathan | 100 |
Show patient_id, first_name, last_name from patients whos diagnosis is 'Dementia'. We will do Diabetes. Primary diagnosis is stored in the admissions table.
qstr = """
SELECT
p.patient_id,
first_name,
last_name
FROM patients p
INNER JOIN admissions a ON p.patient_id = a.patient_id
WHERE diagnosis = 'Diabetes'
"""
sqlq = sql_raw(qstr)
ormq = Admissions.objects.filter(diagnosis="Diabetes").values(
"patient_id", first_name=F("patient__first_name"), last_name=F("patient__last_name")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "admissions"."patient_id",
"patients"."first_name" AS "first_name",
"patients"."last_name" AS "last_name"
FROM "admissions"
INNER JOIN "patients" ON ("admissions"."patient_id" = "patients"."patient_id")
WHERE "admissions"."diagnosis" = Diabetes
# Note the result of the ORM query in the next cell is equivalent to that of the last cell,
# except for the ordering.
qstr = """
SELECT
p.patient_id,
first_name,
last_name
FROM patients p
INNER JOIN admissions a ON p.patient_id = a.patient_id
WHERE diagnosis = 'Diabetes'
ORDER BY p.patient_id
"""
sqlq = sql_raw(qstr)
diabetic_patients = (
Admissions.objects.filter(diagnosis="Diabetes").values_list("patient_id").distinct()
)
ormq1 = (
Patients.objects.filter(id__in=diabetic_patients)
.values("first_name", "last_name", patient_id=F("id"))
.order_by("patient_id")
.values("patient_id", "first_name", "last_name")
)
equal(sqlq, ormq1)
print_sql(ormq1)
Equal ✔️
SELECT "patients"."first_name",
"patients"."last_name",
"patients"."patient_id" AS "patient_id"
FROM "patients"
WHERE "patients"."patient_id" IN
(SELECT DISTINCT U0."patient_id"
FROM "admissions" U0
WHERE U0."diagnosis" = Diabetes)
ORDER BY 3 ASC
orm_to_df(ormq[:3])
| | patient_id | first_name | last_name |
|---:|-------------:|:-------------|:------------|
| 0 | 6 | Gavin | Bryant |
| 1 | 17 | Emily | Tran |
| 2 | 27 | Allison | Rogers |
Display every patient's first_name. Order the list by the length of each name and then by alphbetically
qstr = """
SELECT
first_name
FROM patients p
ORDER BY
LENGTH(first_name),
first_name;
"""
sqlq = sql_raw(qstr)
ormq = Patients.objects.order_by(Length("first_name"), "first_name").values(
"first_name"
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."first_name"
FROM "patients"
ORDER BY LENGTH("patients"."first_name") ASC, "patients"."first_name" ASC
orm_to_df(ormq[:3])
| | first_name |
|---:|:-------------|
| 0 | Eli |
| 1 | Eli |
| 2 | Eli |
Show the total amount of male patients and the total amount of female patients in the patients table. Display the two results in the same row.
qstr = """
SELECT (
SELECT COUNT(gender)
FROM patients
WHERE gender = 'M'
) AS male, (
SELECT COUNT(gender)
FROM patients
WHERE gender = 'F'
) AS female;
"""
sqlq = sql_raw(qstr)
male_subquery, female_subquery = [
Patients.objects.filter(gender=g)
.annotate(**{f"{g}_count": Func(F("gender"), function="COUNT")})
.values(f"{g}_count")
for g in ["M", "F"]
]
ormq = Patients.objects.annotate(
male=Subquery(male_subquery), female=Subquery(female_subquery)
).values("male", "female")[:1]
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT
(SELECT COUNT(U0."gender") AS "M_count"
FROM "patients" U0
WHERE U0."gender" = M) AS "male",
(SELECT COUNT(U0."gender") AS "F_count"
FROM "patients" U0
WHERE U0."gender" = F) AS "female"
FROM "patients"
LIMIT 1
ormq = Patients.objects.annotate(
male=NonAggrSum(Case(When(gender="M", then=1))),
female=NonAggrSum(Case(When(gender="F", then=1))),
).values("male", "female")
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT SUM(CASE
WHEN "patients"."gender" = M THEN 1
ELSE NULL
END) AS "male",
SUM(CASE
WHEN "patients"."gender" = F THEN 1
ELSE NULL
END) AS "female"
FROM "patients"
orm_to_df(ormq)
| | male | female |
|---:|-------:|---------:|
| 0 | 50 | 51 |
Show first and last name, allergies from patients which have allergies to either 'Penicillin' or 'Morphine'. Show results ordered ascending by allergies then by first_name then by last_name.
qstr = """
SELECT
first_name,
last_name,
allergies
FROM patients
WHERE
allergies IN ('Penicillin', 'Morphine')
ORDER BY
allergies,
first_name,
last_name;
"""
sqlq = sql_raw(qstr)
ormq = (
Patients.objects.filter(allergies__in=["Penicillin", "Morphine"])
.values("first_name", "last_name", "allergies")
.order_by("allergies", "first_name", "last_name")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."first_name",
"patients"."last_name",
"patients"."allergies"
FROM "patients"
WHERE "patients"."allergies" IN (Penicillin,
Morphine)
ORDER BY "patients"."allergies" ASC,
"patients"."first_name" ASC,
"patients"."last_name" ASC
orm_to_df(ormq)
| | first_name | last_name | allergies |
|---:|:-------------|:------------|:------------|
| 0 | Gavin | Bryant | Penicillin |
| 1 | Jeremy | Kim | Penicillin |
| 2 | Trevor | Baker | Penicillin |
Show patient_id, diagnosis from admissions. Find patients admitted multiple times for the same diagnosis.
qstr = """
SELECT
patient_id,
diagnosis
FROM admissions
GROUP BY
patient_id,
diagnosis
HAVING COUNT(*) > 1
"""
sqlq = sql_raw(qstr)
ormq = (
Admissions.objects.values("patient_id", "diagnosis")
.annotate(count=Count("patient_id"))
.filter(count__gt=1)
.values("patient_id", "diagnosis")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "admissions"."patient_id",
"admissions"."diagnosis"
FROM "admissions"
GROUP BY "admissions"."patient_id",
"admissions"."diagnosis"
HAVING COUNT("admissions"."patient_id") > 1
orm_to_df(ormq)
| | patient_id | diagnosis |
|---:|-------------:|:------------|
| 0 | 5 | Meningitis |
Show the city and the total number of patients in the city. Order from most to least patients and then by city name ascending.
qstr = """
SELECT
city,
COUNT(*) population
FROM patients
GROUP BY city
ORDER BY population DESC, city
"""
sqlq = sql_raw(qstr)
ormq = (
Patients.objects.values("city")
.annotate(population=Count("id"))
.order_by("-population", "city")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."city",
COUNT("patients"."patient_id") AS "population"
FROM "patients"
GROUP BY "patients"."city"
ORDER BY 2 DESC,
"patients"."city" ASC
orm_to_df(ormq)
| | city | population |
|---:|:----------|-------------:|
| 0 | Montreal | 14 |
| 1 | Calgary | 13 |
| 2 | Toronto | 13 |
| 3 | Vancouver | 13 |
| 4 | Halifax | 12 |
| 5 | Ottawa | 12 |
| 6 | Victoria | 12 |
| 7 | Winnipeg | 12 |
Show first name, last name and role of every person that is either patient or doctor. The roles are either "Patient" or "Doctor"
qstr = """
SELECT
first_name,
last_name,
'patient' AS Role
FROM patients
UNION ALL
SELECT
first_name,
last_name,
'doctor' AS Role
FROM doctors;
"""
sqlq = sql_raw(qstr)
ormq = (
Patients.objects.annotate(role=Value("patient", output_field=CharField()))
.values("first_name", "last_name", "role")
.union(
Doctors.objects.annotate(role=Value("doctor", output_field=CharField())).values(
"first_name", "last_name", "role"
),
all=True,
)
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."first_name" AS "col1",
"patients"."last_name" AS "col2",
patient AS "role"
FROM "patients"
UNION ALL
SELECT "doctors"."first_name" AS "col1",
"doctors"."last_name" AS "col2",
doctor AS "role"
FROM "doctors"
orm_to_df(ormq[:3])
| | first_name | last_name | role |
|---:|:-------------|:------------|:--------|
| 0 | Cheryl | Mason | patient |
| 1 | Jason | Fleming | patient |
| 2 | Tiffany | McDonald | patient |
Show all allergies and their occurance ordered by occurance. Remove NULL values from query.
qstr = """
SELECT
allergies,
COUNT (*) AS total_occurance
FROM patients
WHERE allergies IS NOT null
GROUP BY allergies
ORDER BY total_occurance DESC
"""
sqlq = sql_raw(qstr)
ormq = (
Patients.objects.values("allergies")
.filter(allergies__isnull=False)
.annotate(total_occurance=Count("allergies"))
.order_by("-total_occurance")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."allergies",
COUNT("patients"."allergies") AS "total_occurance"
FROM "patients"
WHERE "patients"."allergies" IS NOT NULL
GROUP BY "patients"."allergies"
ORDER BY 2 DESC
orm_to_df(ormq[:3])
| | allergies | total_occurance |
|---:|:------------|------------------:|
| 0 | Pollen | 15 |
| 1 | Lactose | 13 |
| 2 | Sulfa drugs | 8 |
Show all patient's first_name, last_name, and birth_date who were born in the 1970s decade. Sort the list starting from the earliest birth_date.
# use YEAR(birth_date) if year function is available
qstr = """
SELECT
first_name,
last_name,
birth_date
FROM patients
WHERE CAST(strftime('%Y', birth_date) AS INT) BETWEEN 1970 AND 1979
ORDER BY birth_date
"""
sqlq = sql_raw(qstr)
ormq = (
Patients.objects.filter(birth_date__year__gte=1970, birth_date__year__lte=1979)
.order_by("birth_date")
.values("first_name", "last_name", "birth_date")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."first_name",
"patients"."last_name",
"patients"."birth_date"
FROM "patients"
WHERE ("patients"."birth_date" >= 1970-01-01
AND "patients"."birth_date" <= 1979-12-31)
ORDER BY "patients"."birth_date" ASC
orm_to_df(ormq[:3])
| | first_name | last_name | birth_date |
|---:|:-------------|:------------|:-------------|
| 0 | Jeremy | Kim | 1975-07-19 |
| 1 | Samantha | Garcia | 1975-11-30 |
| 2 | Olivia | Li | 1976-03-11 |
We want to display each patient's full name in a single column. Their last_name in all upper letters must appear first, then first_name in all lower case letters. Separate the last_name and first_name with a comma. Order the list by the first_name in decending order EX: SMITH,jane
qstr = """
SELECT
UPPER(last_name) || ',' || LOWER(first_name) AS full_name
FROM patients
ORDER BY first_name DESC
"""
sqlq = sql_raw(qstr)
ormq = Patients.objects.values(
full_name=Concat(Upper("last_name"), Value(","), Lower("first_name"))
).order_by("-first_name")
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT COALESCE(UPPER("patients"."last_name"),) || COALESCE(COALESCE(,,) || COALESCE(LOWER("patients"."first_name"),),) AS "full_name"
FROM "patients"
ORDER BY "patients"."first_name" DESC
orm_to_df(ormq[:3])
| | full_name |
|---:|:---------------|
| 0 | NGUYEN,william |
| 1 | LIU,victor |
| 2 | BAKER,trevor |
Show the province_id(s), sum of height; where the total sum of its patient's height is greater than or equal to 7,000. We will do 3000
qstr = """
SELECT
province_id,
SUM(height) AS sum_height
FROM patients
GROUP BY province_id
HAVING SUM(height) > 3000;
"""
sqlq = sql_raw(qstr)
ormq = (
Patients.objects.values("province_id")
.annotate(sum_height=Sum("height"))
.filter(sum_height__gt=3000)
.values("province_id", "sum_height")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."province_id",
SUM("patients"."height") AS "sum_height"
FROM "patients"
GROUP BY "patients"."province_id"
HAVING SUM("patients"."height") > 3000
orm_to_df(ormq[:3])
| | province_id | sum_height |
|---:|:--------------|-------------:|
| 0 | BC | 4357 |
| 1 | ON | 4331 |
Show the difference between the largest weight and smallest weight for patients with the last name 'Maroni'. We will do Lee.
qstr = """
SELECT
(MAX(weight) - MIN(weight)) AS weight_dif
FROM patients
WHERE last_name = 'Lee';
"""
sqlq = sql_raw(qstr)
ormq = Patients.objects.filter(last_name="Lee").aggregate(
weight_dif=Max("weight") - Min("weight")
)
equal(sqlq, ormq)
# print_sql(ormq)
Equal ✔️
ormq = (
Patients.objects.filter(last_name="Lee")
.annotate(
weight_dif=Func(F("weight"), function="MAX") - Func(F("weight"), function="MIN")
)
.values("weight_dif")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT (MAX("patients"."weight") - MIN("patients"."weight")) AS "weight_dif"
FROM "patients"
WHERE "patients"."last_name" = Lee
orm_to_df(ormq)
| | weight_dif |
|---:|-------------:|
| 0 | 23 |
Show all of the days of the month (1-31) and how many admission_dates occurred on that day. Sort by the day with most admissions to least admissions.
qstr = """
SELECT
CAST(strftime('%d', admission_date) as INT) AS month_day,
COUNT(patient_id) AS daily_admission
FROM admissions
GROUP BY strftime('%d', admission_date)
ORDER BY daily_admission DESC;
"""
sqlq = sql_raw(qstr)
ormq = (
Admissions.objects.values(month_day=F("admission_date__day"))
.annotate(daily_admission=Count("id"))
.order_by("-daily_admission")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT django_date_extract(day, "admissions"."admission_date") AS "month_day",
COUNT("admissions"."id") AS "daily_admission"
FROM "admissions"
GROUP BY 1
ORDER BY 2 DESC
orm_to_df(ormq[:3])
| | month_day | daily_admission |
|---:|------------:|------------------:|
| 0 | 28 | 6 |
| 1 | 18 | 6 |
| 2 | 17 | 6 |
Show all columns for patient_id 54's most recent admission_date.
qstr = """
SELECT *
FROM admissions
WHERE patient_id = 54 AND admission_date = (
SELECT max(admission_date)
FROM admissions
WHERE patient_id = 54
)
"""
sqlq = sql_raw(qstr)
ormq = Admissions.objects.filter(
patient_id=54,
admission_date=Admissions.objects.filter(patient_id=54).aggregate(
max_admission=Max("admission_date")
)["max_admission"],
).values(*admission_fields)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "admissions"."id",
"admissions"."patient_id",
"admissions"."admission_date",
"admissions"."discharge_date",
"admissions"."diagnosis",
"admissions"."attending_doctor_id"
FROM "admissions"
WHERE ("admissions"."admission_date" = 2022-06-02
AND "admissions"."patient_id" = 54)
ormq = Admissions.objects.filter(
patient_id=54,
admission_date=Subquery(
Admissions.objects.filter(patient_id=54)
.annotate(max_admission=Func(F("admission_date"), function="Max"))
.values("max_admission")
),
).values(*admission_fields)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "admissions"."id",
"admissions"."patient_id",
"admissions"."admission_date",
"admissions"."discharge_date",
"admissions"."diagnosis",
"admissions"."attending_doctor_id"
FROM "admissions"
WHERE ("admissions"."admission_date" =
(SELECT Max(U0."admission_date") AS "max_admission"
FROM "admissions" U0
WHERE U0."patient_id" = 54)
AND "admissions"."patient_id" = 54)
ormq = (
Admissions.objects.filter(patient_id=54)
.order_by("-admission_date")[:1]
.values(*admission_fields)
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "admissions"."id",
"admissions"."patient_id",
"admissions"."admission_date",
"admissions"."discharge_date",
"admissions"."diagnosis",
"admissions"."attending_doctor_id"
FROM "admissions"
WHERE "admissions"."patient_id" = 54
ORDER BY "admissions"."admission_date" DESC
LIMIT 1
orm_to_df(ormq[:3])
| | id | patient_id | admission_date | discharge_date | diagnosis | attending_doctor_id |
|---:|-----:|-------------:|:-----------------|:-----------------|:------------|----------------------:|
| 0 | 154 | 54 | 2022-06-02 | 2022-06-06 | Migraine | 11 |
Show patient_id, attending_doctor_id, and diagnosis for admissions that match one of the two criteria: 1. patient_id is an odd number and attending_doctor_id is either 1, 5, or 19. 2. attending_doctor_id contains a 2 and the length of patient_id is 3 characters.
qstr = """
SELECT
patient_id,
attending_doctor_id,
diagnosis
FROM admissions
WHERE
(
patient_id % 2 = 1
and attending_doctor_id IN (1, 5, 19)
)
OR (
CAST(attending_doctor_id AS varchar) LIKE "%2%"
AND length(CAST(patient_id AS VARCHAR)) = 2
)
"""
sqlq = sql_raw(qstr)
f1 = Q(attending_doctor_id__in=[1, 5, 19], pi_mod=1)
f2 = Q(adi_str__icontains="2", pi_len=2)
ormq = (
Admissions.objects.annotate(
pi_mod=F("patient_id") % 2,
adi_str=Cast(F("attending_doctor_id"), CharField()),
pi_len=Length(Cast(F("patient_id"), CharField())),
)
.filter(f1 | f2)
.values("patient_id", "attending_doctor_id", "diagnosis")
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "admissions"."patient_id",
"admissions"."attending_doctor_id",
"admissions"."diagnosis"
FROM "admissions"
WHERE (("admissions"."attending_doctor_id" IN (1,
5,
19)
AND ("admissions"."patient_id" % 2) = 1)
OR (CAST("admissions"."attending_doctor_id" AS text) LIKE %2% ESCAPE '\'
AND LENGTH(CAST("admissions"."patient_id" AS text)) = 2))
orm_to_df(ormq[:3])
| | patient_id | attending_doctor_id | diagnosis |
|---:|-------------:|----------------------:|:------------|
| 0 | 14 | 20 | Arthritis |
| 1 | 15 | 2 | Bronchitis |
| 2 | 25 | 20 | Asthma |
Show first_name, last_name, and the total number of admissions attended for each doctor.
Every admission has been attended by a doctor.
qstr = """
SELECT
first_name,
last_name,
COUNT(*) AS patient_count
FROM admissions
JOIN doctors ON attending_doctor_id = doctor_id
GROUP BY attending_doctor_id
"""
sqlq = sql_raw(qstr)
ormq = (
Admissions.objects.values("attending_doctor_id")
.annotate(patient_count=Count("attending_doctor_id"))
.values(
"patient_count",
first_name=F("attending_doctor_id__first_name"),
last_name=F("attending_doctor_id__last_name"),
)
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT COUNT("admissions"."attending_doctor_id") AS "patient_count",
"doctors"."first_name" AS "first_name",
"doctors"."last_name" AS "last_name"
FROM "admissions"
INNER JOIN "doctors" ON ("admissions"."attending_doctor_id" = "doctors"."doctor_id")
GROUP BY "admissions"."attending_doctor_id",
2,
3
orm_to_df(ormq[:3])
| | patient_count | first_name | last_name |
|---:|----------------:|:-------------|:------------|
| 0 | 8 | Maggie | Chen |
| 1 | 8 | Karen | Wong |
| 2 | 7 | Samuel | Nguyen |
For each doctor, display their id, full name, and the first and last admission date they attended.
qstr = """
SELECT
doctor_id,
first_name || ' ' || last_name AS full_name,
MIN(admission_date) AS min_admission,
MAX(admission_date) AS max_admission
FROM doctors
JOIN admissions ON attending_doctor_id = doctor_id
GROUP BY doctor_id
"""
sqlq = sql_raw(qstr)
ormq = (
Admissions.objects.values("attending_doctor_id")
.annotate(
min_admission=Cast(Min("admission_date"), CharField()),
max_admission=Cast(Max("admission_date"), CharField()),
)
.values(
"min_admission",
"max_admission",
doctor_id=F("attending_doctor_id"),
full_name=Concat(
F("attending_doctor_id__first_name"),
Value(" "),
F("attending_doctor_id__last_name"),
),
)
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT CAST(MIN("admissions"."admission_date") AS text) AS "min_admission",
CAST(MAX("admissions"."admission_date") AS text) AS "max_admission",
"admissions"."attending_doctor_id" AS "doctor_id",
COALESCE("doctors"."first_name",) || COALESCE(COALESCE(,) || COALESCE("doctors"."last_name",),) AS "full_name"
FROM "admissions"
INNER JOIN "doctors" ON ("admissions"."attending_doctor_id" = "doctors"."doctor_id")
GROUP BY 3,
4
orm_to_df(ormq[:3])
| | min_admission | max_admission | doctor_id | full_name |
|---:|:----------------|:----------------|------------:|:--------------|
| 0 | 2022-01-08 | 2022-06-11 | 1 | Maggie Chen |
| 1 | 2022-01-15 | 2022-06-18 | 2 | Karen Wong |
| 2 | 2022-01-01 | 2022-05-27 | 3 | Samuel Nguyen |
Display the total amount of patients for each province. Order by descending.
qstr = """
SELECT
pn.province_name,
count(patient_id) population
FROM patients p
JOIN province_names pn ON p.province_id = pn.province_id
GROUP BY pn.province_id
ORDER BY population desc
"""
sqlq = sql_raw(qstr)
ormq = (
Patients.objects.values("province")
.annotate(population=Count("province"))
.filter(province__name__isnull=False)
.order_by("-population")
.values("population", province_name=F("province__name"))
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT COUNT("patients"."province_id") AS "population",
"province_names"."province_name" AS "province_name"
FROM "patients"
INNER JOIN "province_names" ON ("patients"."province_id" = "province_names"."province_id")
WHERE "province_names"."province_name" IS NOT NULL
GROUP BY "patients"."province_id",
2
ORDER BY 1 DESC
orm_to_df(ormq)
| | population | province_name |
|---:|-------------:|:-----------------|
| 0 | 25 | British Columbia |
| 1 | 25 | Ontario |
| 2 | 14 | Quebec |
| 3 | 13 | Alberta |
| 4 | 12 | Manitoba |
| 5 | 12 | Nova Scotia |
For every admission, display the patient's full name, their admission diagnosis, and their doctor's full name who diagnosed their problem.
qstr = """
SELECT
p.first_name || ' ' || p.last_name AS patient_name,
diagnosis,
d.first_name || ' ' || d.last_name AS doctor_name
FROM patients p
JOIN admissions a ON p.patient_id = a.patient_id
JOIN doctors d ON a.attending_doctor_id = d.doctor_id
"""
sqlq = sql_raw(qstr)
ormq = Admissions.objects.values(
"diagnosis",
patient_name=Concat(F("patient__first_name"), Value(" "), F("patient__last_name")),
doctor_name=Concat(
F("attending_doctor__first_name"), Value(" "), F("attending_doctor__last_name")
),
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "admissions"."diagnosis",
COALESCE("patients"."first_name",) || COALESCE(COALESCE(,) || COALESCE("patients"."last_name",),) AS "patient_name",
COALESCE("doctors"."first_name",) || COALESCE(COALESCE(,) || COALESCE("doctors"."last_name",),) AS "doctor_name"
FROM "admissions"
INNER JOIN "patients" ON ("admissions"."patient_id" = "patients"."patient_id")
INNER JOIN "doctors" ON ("admissions"."attending_doctor_id" = "doctors"."doctor_id")
orm_to_df(ormq[:3])
| | diagnosis | patient_name | doctor_name |
|---:|:------------|:-----------------|:----------------|
| 0 | Bronchitis | Cheryl Mason | Samuel Nguyen |
| 1 | Migraine | Jason Fleming | Lisa Tran |
| 2 | Pneumonia | Tiffany McDonald | Catherine Cheng |
display the number of duplicate patients based on their first_name and last_name.
# use YEAR(birth_date) if year function is available
qstr = """
SELECT
first_name,
last_name,
count(*) duplicates
FROM patients
GROUP BY
first_name,
last_name
HAVING COUNT(*) > 1
"""
sqlq = sql_raw(qstr)
ormq = (
Patients.objects.values("first_name", "last_name")
.annotate(duplicates=Count("id"))
.filter(duplicates__gt=1)
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."first_name",
"patients"."last_name",
COUNT("patients"."patient_id") AS "duplicates"
FROM "patients"
GROUP BY "patients"."first_name",
"patients"."last_name"
HAVING COUNT("patients"."patient_id") > 1
orm_to_df(ormq[:3])
| | first_name | last_name | duplicates |
|---:|:-------------|:------------|-------------:|
| 0 | Emma | Gagnon | 2 |
| 1 | Isaac | Nguyen | 2 |
| 2 | Nora | Singh | 2 |
Display patient's full name, height in the units feet rounded to 1 decimal, weight in the unit pounds rounded to 0 decimals, birth_date, gender non abbreviated.
Convert CM to feet by dividing by 30.48. Convert KG to pounds by multiplying by 2.205.
qstr = """
SELECT
first_name || ' ' || last_name AS full_name,
ROUND(height / 30.48, 1) AS height_inc,
ROUND(weight * 2.205, 0) AS weight_pound,
birth_date,
CASE
WHEN gender = 'M' THEN 'Male'
WHEN gender = 'F' THEN 'Female'
END AS gender_full
FROM patients
"""
sqlq = sql_raw(qstr)
ormq = Patients.objects.values(
"birth_date",
full_name=Concat(F("first_name"), Value(" "), F("last_name")),
height_inc=Round(F("height") / 30.48, 1),
weight_pound=Round(F("weight") * 2.205, 0),
gender_full=Case(
When(gender="M", then=Value("Male")), When(gender="F", then=Value("Female"))
),
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."birth_date",
COALESCE("patients"."first_name",) || COALESCE(COALESCE(,) || COALESCE("patients"."last_name",),) AS "full_name",
ROUND(("patients"."height" / 30.48), 1) AS "height_inc",
ROUND(("patients"."weight" * 2.205), 0) AS "weight_pound",
CASE
WHEN "patients"."gender" = M THEN Male
WHEN "patients"."gender" = F THEN Female
ELSE NULL
END AS "gender_full"
FROM "patients"
orm_to_df(ormq[:3])
| | birth_date | full_name | height_inc | weight_pound | gender_full |
|---:|:-------------|:-----------------|-------------:|---------------:|:--------------|
| 0 | 1978-05-14 | Cheryl Mason | 5.6 | 143 | Female |
| 1 | 1990-08-02 | Jason Fleming | 6.1 | 176 | Male |
| 2 | 1985-03-27 | Tiffany McDonald | 5.1 | 128 | Female |
Show patient_id, first_name, last_name from patients whose does not have any records in the admissions table. (Their patient_id does not exist in any admissions.patient_id rows.)
qstr = """
SELECT
patient_id,
first_name,
last_name
FROM patients
WHERE patient_id NOT IN (
SELECT patient_id
FROM admissions
)
"""
sqlq = sql_raw(qstr)
ormq = Patients.objects.filter(
~Q(id__in=Subquery(Admissions.objects.values("patient_id")))
).values(
"first_name",
"last_name",
patient_id=F("id"),
)
equal(sqlq, ormq)
print_sql(ormq)
Equal ✔️
SELECT "patients"."first_name",
"patients"."last_name",
"patients"."patient_id" AS "patient_id"
FROM "patients"
WHERE NOT ("patients"."patient_id" IN
(SELECT U0."patient_id"
FROM "admissions" U0))
orm_to_df(sqlq)
| | patient_id | first_name | last_name |
|---:|-------------:|:-------------|:------------|
| 0 | 101 | Edward | Kenway |