See the model guide dbt and erd for schema and column details.
-- find me what cases should be preformed for WGS analysis from the weekly sequencing?
select
*
from lims
where
sequencing_run_id in ('250509_A01052_0262_BHFGJWDSXF')
and type = 'WGS'
and workflow in ('clinical', 'research')
and phenotype in ('tumor', 'normal')
order by internal_subject_id;
-- find me what cases should be preformed for WTS analysis from the weekly sequencing?
select
*
from lims
where
sequencing_run_id in ('250509_A01052_0262_BHFGJWDSXF')
and type = 'WTS'
and workflow in ('clinical', 'research')
and phenotype in ('tumor')
order by internal_subject_id;
-- find me what cases should be preformed for ctTSO analysis from the weekly sequencing?
select
*
from lims
where
sequencing_run_id in ('250417_A01052_0261_AHFHG7DSXF')
and assay in ('ctTSO', 'ctTSOv2')
and workflow in ('clinical', 'research')
and phenotype in ('tumor')
order by internal_subject_id;
-- list all ctTSO assay samples sorted by recent sequencing
select
*
from lims
where
assay in ('ctTSO', 'ctTSOv2')
order by sequencing_run_id desc;
-- find all libraries from the project owned by PI on the specified date range
select
*
from lims
where
sequencing_run_date between cast('2025-03-27' as date) and cast('2025-03-31' as date)
and project_id = 'CUP'
and owner_id = 'Tothill';
-- find all LIMS entries and FASTQ locations for given SequencingRunID and Owner
select
lims.*,
fastq.*
from lims
join fastq on fastq.sequencing_run_id = lims.sequencing_run_id and fastq.library_id = lims.library_id
where
lims.sequencing_run_id in ('250328_A01052_0257_BHFFVFDSXF', '250328_A01052_0258_AHFGM7DSXF')
and lims.owner_id = 'Tothill';
-- list all PI/Owner sorted alphabetically and null entries to the last
select distinct owner_id from lims order by owner_id nulls last;
NOTE:
-- find me WGS tumor normal pair based on the Centre InternalSubjectID
select
*
from lims
where
type = 'WGS'
and workflow in ('clinical', 'research')
and phenotype in ('tumor', 'normal')
and internal_subject_id = 'SBJ06470';
-- find me WGS tumor normal pair along with FASTQ in ORA format based on the Centre InternalSubjectID
select
*
from lims
join fastq on fastq.sequencing_run_id = lims.sequencing_run_id and fastq.library_id = lims.library_id
where
fastq.format = 'ora'
and lims.type = 'WGS'
and lims.workflow in ('clinical', 'research')
and lims.phenotype in ('tumor', 'normal')
and lims.internal_subject_id = 'SBJ06470';
-- find me WGS tumor normal pair along with FASTQ in ORA format based on the Centre LibraryID that I have chosen
select
*
from lims
join fastq on fastq.sequencing_run_id = lims.sequencing_run_id and fastq.library_id = lims.library_id
where
fastq.format = 'ora'
and lims.type = 'WGS'
and lims.workflow in ('clinical', 'research')
and lims.phenotype in ('tumor', 'normal')
-- and lims.internal_subject_id = 'SBJ06464'
and lims.library_id in ('L2500458', 'L2500267');
-- find me the latest sequencing done by "PO"
select distinct
sequencing_run_id,
sequencing_run_date
from lims
where
sequencing_run_id like '%A01052%'
order by sequencing_run_date desc;
-- find me the latest sequencing done by "Baymax"
select distinct
sequencing_run_id,
sequencing_run_date
from lims
where
sequencing_run_id like '%A00130%'
order by sequencing_run_date desc;
-- list all successful sequencing done by "PO" in 2025 sorted the latest first
select distinct
sequencing_run_id
from lims
where
sequencing_run_id like '%A01052%'
and year(sequencing_run_date) = 2025
order by sequencing_run_id desc;
-- give me the successful sequencing run count for each year by "PO"
select
year(sequencing_run_date) as YEAR,
count(distinct sequencing_run_id) as RUN_COUNT
from lims
where
sequencing_run_id like '%A01052%'
group by year(sequencing_run_date)
order by year(sequencing_run_date) desc;
-- give me the successful sequencing run count for each year by "Baymax"
select
year(sequencing_run_date) as YEAR,
count(distinct sequencing_run_id) as RUN_COUNT
from lims
where
sequencing_run_id like '%A00130%'
group by year(sequencing_run_date)
order by year(sequencing_run_date) desc;
-- list OWNER, PROJECT unique combination count sorted by highest row count
select distinct
owner_id,
project_id,
count(1) as row_count
from lims
group by owner_id, project_id
order by count(1) desc;
-- find OWNER, PROJECT unique combination counts all matches to specific owner or project
select distinct
owner_id,
project_id,
count(1) as row_count
from lims
where
owner_id = 'Tothill' or lower(project_id) like '%tothill%'
group by owner_id, project_id
order by count(1) desc;
-- find WTS library count group by sample TYPE, ASSAY sorted by assay
select
type,
assay,
count(1) as library_count
from lims
where
type = 'WTS'
group by type, assay
order by assay;
-- find WGS sample unique TYPE, ASSAY combination
select distinct
type,
assay,
count(1) as row_count
from lims
where
type = 'WGS'
group by type, assay
order by type, assay nulls last;
-- find all unique TYPE, ASSAY combination
select distinct
type,
assay,
count(1) as row_count
from lims
group by type, assay
order by type, assay nulls last;