Skip to content

Instantly share code, notes, and snippets.

View lfy79001's full-sized avatar

Fangyu Lei lfy79001

View GitHub Profile
SELECT
wx.date,
MAX(prcp) AS prcp,
MAX(tmin) AS tmin,
MAX(tmax) AS tmax,
IF(MAX(haswx) = 'True', 'True', 'False') AS haswx
FROM (
SELECT
wx.date,
IF (wx.element = 'PRCP', wx.value/10, NULL) AS prcp,
SELECT
name,
value/10 AS min_temperature,
latitude,
longitude
FROM
`bigquery-public-data.ghcn_d.ghcnd_stations` AS stn
JOIN
`bigquery-public-data.ghcn_d.ghcnd_2016` AS wx
ON
SELECT
state_code,
evaluation_group,
evaluation_description,
state_name,
sum(macroplot_acres) + sum(subplot_acres) as total_acres,
latest
FROM (SELECT
state_code,
evaluation_group,
SELECT
`isb-cgc.TARGET_hg38_data_v0.RNAseq_Gene_Expression`.case_barcode,
`isb-cgc.TARGET_hg38_data_v0.RNAseq_Gene_Expression`.HTSeq__FPKM_UQ,
`isb-cgc.TARGET_hg38_data_v0.RNAseq_Gene_Expression`.Ensembl_gene_id,
`isb-cgc.TARGET_hg38_data_v0.RNAseq_Gene_Expression`.gene_name,
`isb-cgc.TARGET_bioclin_v0.Clinical`.CR_status_at_end_of_course_1,
`isb-cgc.TARGET_bioclin_v0.Clinical`.CR_status_at_end_of_course_2
FROM
`isb-cgc.TARGET_hg38_data_v0.RNAseq_Gene_Expression`
JOIN
SELECT
file.project_short_name,
file.data_category,
file.data_type,
file.data_format,
COUNT(file.file_gdc_id) as n
FROM
`isb-cgc-bq.GDC_case_file_metadata.fileData_active_current` AS file
WHERE
associated_entities__case_gdc_id IN ('{case_ids}')
SELECT
c.case_id,
c.exp__years_smoked,
r.fpkm_unstranded
FROM
`isb-cgc-bq.TCGA_versioned.clinical_gdc_r37` AS c
JOIN
`isb-cgc-bq.TCGA_versioned.RNAseq_hg38_gdc_r35` AS r
ON
c.case_id = r.case_gdc_id
WITH
select_on_annotations AS (
SELECT
case_barcode,
category AS categoryName,
classification AS classificationName
FROM
`isb-cgc.TCGA_bioclin_v0.Annotations`
WHERE
( entity_type="Patient"
WITH
mutCounts AS (
SELECT
COUNT(DISTINCT( Tumor_SampleBarcode )) AS CaseCount,
Hugo_Symbol,
HGVSc
FROM
`isb-cgc-bq.pancancer_atlas.Filtered_MC3_MAF_V5_one_per_tumor_sample`
GROUP BY
Hugo_Symbol,
SELECT
*
FROM (
SELECT
reference_name,
COUNT(reference_name) / r.length AS variant_density,
COUNT(reference_name) AS variant_count,
r.length AS reference_length
FROM
`bigquery-public-data.genomics_cannabis.MNPR01_201703` v,
SELECT
A.state,
drug_name,
total_claim_count,
day_supply,
ROUND(total_cost_millions) AS total_cost_millions
FROM (
SELECT
generic_name AS drug_name,
nppes_provider_state AS state,