Skip to content

Instantly share code, notes, and snippets.

@alex-wilmer
Created January 29, 2018 15:47
Show Gist options
  • Save alex-wilmer/3dc9c4c5f7944a5ce2a0b1d884fcd921 to your computer and use it in GitHub Desktop.
PUT case_centric
{
"mappings": {
"case_centric": {
"_all": {
"enabled": false
},
"_source": {
"excludes": [
"gene.*"
]
},
"properties": {
"available_variation_data": {
"type": "keyword"
},
"case_autocomplete": {
"type": "keyword",
"fields": {
"analyzed": {
"type": "text",
"analyzer": "autocomplete_analyzed",
"search_analyzer": "lowercase_keyword"
},
"lowercase": {
"type": "text",
"analyzer": "lowercase_keyword"
},
"prefix": {
"type": "text",
"analyzer": "autocomplete_prefix",
"search_analyzer": "lowercase_keyword"
}
}
},
"case_id": {
"type": "keyword",
"copy_to": [
"case_autocomplete"
]
},
"created_datetime": {
"type": "date"
},
"days_to_index": {
"type": "long"
},
"demographic": {
"properties": {
"created_datetime": {
"type": "date"
},
"demographic_id": {
"type": "keyword"
},
"ethnicity": {
"type": "keyword"
},
"gender": {
"type": "keyword"
},
"race": {
"type": "keyword"
},
"state": {
"type": "keyword"
},
"submitter_id": {
"type": "keyword"
},
"updated_datetime": {
"type": "date"
},
"year_of_birth": {
"type": "long"
},
"year_of_death": {
"type": "long"
}
}
},
"diagnoses": {
"type": "nested",
"properties": {
"age_at_diagnosis": {
"type": "long"
},
"ajcc_clinical_m": {
"type": "keyword"
},
"ajcc_clinical_n": {
"type": "keyword"
},
"ajcc_clinical_stage": {
"type": "keyword"
},
"ajcc_clinical_t": {
"type": "keyword"
},
"ajcc_pathologic_m": {
"type": "keyword"
},
"ajcc_pathologic_n": {
"type": "keyword"
},
"ajcc_pathologic_stage": {
"type": "keyword"
},
"ajcc_pathologic_t": {
"type": "keyword"
},
"ann_arbor_b_symptoms": {
"type": "keyword"
},
"ann_arbor_clinical_stage": {
"type": "keyword"
},
"ann_arbor_extranodal_involvement": {
"type": "keyword"
},
"ann_arbor_pathologic_stage": {
"type": "keyword"
},
"burkitt_lymphoma_clinical_variant": {
"type": "keyword"
},
"cause_of_death": {
"type": "keyword"
},
"circumferential_resection_margin": {
"type": "long"
},
"classification_of_tumor": {
"type": "keyword"
},
"colon_polyps_history": {
"type": "keyword"
},
"created_datetime": {
"type": "date"
},
"days_to_birth": {
"type": "long"
},
"days_to_death": {
"type": "long"
},
"days_to_hiv_diagnosis": {
"type": "long"
},
"days_to_last_follow_up": {
"type": "long"
},
"days_to_last_known_disease_status": {
"type": "long"
},
"days_to_new_event": {
"type": "long"
},
"days_to_recurrence": {
"type": "long"
},
"diagnosis_id": {
"type": "keyword"
},
"figo_stage": {
"type": "keyword"
},
"hiv_positive": {
"type": "keyword"
},
"hpv_positive_type": {
"type": "keyword"
},
"hpv_status": {
"type": "keyword"
},
"last_known_disease_status": {
"type": "keyword"
},
"laterality": {
"type": "keyword"
},
"ldh_level_at_diagnosis": {
"type": "long"
},
"ldh_normal_range_upper": {
"type": "long"
},
"lymph_nodes_positive": {
"type": "long"
},
"lymphatic_invasion_present": {
"type": "keyword"
},
"method_of_diagnosis": {
"type": "keyword"
},
"morphology": {
"type": "keyword"
},
"new_event_anatomic_site": {
"type": "keyword"
},
"new_event_type": {
"type": "keyword"
},
"perineural_invasion_present": {
"type": "keyword"
},
"primary_diagnosis": {
"type": "keyword"
},
"prior_malignancy": {
"type": "keyword"
},
"prior_treatment": {
"type": "keyword"
},
"progression_or_recurrence": {
"type": "keyword"
},
"residual_disease": {
"type": "keyword"
},
"site_of_resection_or_biopsy": {
"type": "keyword"
},
"state": {
"type": "keyword"
},
"submitter_id": {
"type": "keyword"
},
"tissue_or_organ_of_origin": {
"type": "keyword"
},
"treatments": {
"type": "nested",
"properties": {
"created_datetime": {
"type": "date"
},
"days_to_treatment": {
"type": "long"
},
"days_to_treatment_end": {
"type": "long"
},
"days_to_treatment_start": {
"type": "long"
},
"state": {
"type": "keyword"
},
"submitter_id": {
"type": "keyword"
},
"therapeutic_agents": {
"type": "keyword"
},
"treatment_anatomic_site": {
"type": "keyword"
},
"treatment_id": {
"type": "keyword"
},
"treatment_intent_type": {
"type": "keyword"
},
"treatment_or_therapy": {
"type": "keyword"
},
"treatment_outcome": {
"type": "keyword"
},
"treatment_type": {
"type": "keyword"
},
"updated_datetime": {
"type": "date"
}
}
},
"tumor_grade": {
"type": "keyword"
},
"tumor_stage": {
"type": "keyword"
},
"updated_datetime": {
"type": "date"
},
"vascular_invasion_present": {
"type": "keyword"
},
"vital_status": {
"type": "keyword"
},
"year_of_diagnosis": {
"type": "long"
}
}
},
"disease_type": {
"type": "keyword",
"copy_to": [
"case_autocomplete"
]
},
"exposures": {
"type": "nested",
"properties": {
"alcohol_history": {
"type": "keyword"
},
"alcohol_intensity": {
"type": "keyword"
},
"bmi": {
"type": "float"
},
"cigarettes_per_day": {
"type": "float"
},
"created_datetime": {
"type": "date"
},
"exposure_id": {
"type": "keyword"
},
"height": {
"type": "float"
},
"pack_years_smoked": {
"type": "long"
},
"state": {
"type": "keyword"
},
"submitter_id": {
"type": "keyword"
},
"tobacco_smoking_onset_year": {
"type": "long"
},
"tobacco_smoking_quit_year": {
"type": "long"
},
"tobacco_smoking_status": {
"type": "keyword"
},
"updated_datetime": {
"type": "date"
},
"weight": {
"type": "float"
},
"years_smoked": {
"type": "float"
}
}
},
"family_histories": {
"type": "nested",
"properties": {
"created_datetime": {
"type": "date"
},
"family_history_id": {
"type": "keyword"
},
"relationship_age_at_diagnosis": {
"type": "long"
},
"relationship_gender": {
"type": "keyword"
},
"relationship_primary_diagnosis": {
"type": "keyword"
},
"relationship_type": {
"type": "keyword"
},
"relative_with_cancer_history": {
"type": "keyword"
},
"state": {
"type": "keyword"
},
"submitter_id": {
"type": "keyword"
},
"updated_datetime": {
"type": "date"
}
}
},
"gene": {
"type": "nested",
"properties": {
"biotype": {
"type": "keyword"
},
"canonical_transcript_id": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"cytoband": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"description": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"external_db_ids": {
"properties": {
"entrez_gene": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"hgnc": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"omim_gene": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"uniprotkb_swissprot": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
}
}
},
"gene_chromosome": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"gene_end": {
"type": "long"
},
"gene_id": {
"type": "keyword"
},
"gene_start": {
"type": "long"
},
"gene_strand": {
"type": "long"
},
"is_cancer_gene_census": {
"type": "boolean"
},
"name": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"ssm": {
"type": "nested",
"properties": {
"chromosome": {
"type": "keyword"
},
"consequence": {
"type": "nested",
"properties": {
"consequence_id": {
"type": "keyword"
},
"transcript": {
"properties": {
"aa_change": {
"type": "keyword"
},
"annotation": {
"properties": {
"amino_acids": {
"type": "keyword"
},
"ccds": {
"type": "keyword"
},
"cdna_position": {
"type": "keyword"
},
"cds_end": {
"type": "long"
},
"cds_length": {
"type": "long"
},
"cds_position": {
"type": "keyword"
},
"cds_start": {
"type": "long"
},
"clin_sig": {
"type": "keyword"
},
"codons": {
"type": "keyword"
},
"dbsnp_rs": {
"type": "keyword"
},
"dbsnp_val_status": {
"type": "keyword"
},
"domains": {
"type": "keyword"
},
"ensp": {
"type": "keyword"
},
"existing_variation": {
"type": "keyword"
},
"hgvsc": {
"type": "keyword"
},
"hgvsp": {
"type": "keyword"
},
"hgvsp_short": {
"type": "keyword"
},
"impact": {
"type": "keyword"
},
"polyphen": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"polyphen_impact": {
"type": "keyword"
},
"polyphen_score": {
"type": "float"
},
"protein_position": {
"type": "keyword"
},
"pubmed": {
"type": "keyword"
},
"sift": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"sift_impact": {
"type": "keyword"
},
"sift_score": {
"type": "float"
},
"swissprot": {
"type": "keyword"
},
"transcript_id": {
"type": "keyword"
},
"trembl": {
"type": "keyword"
},
"uniparc": {
"type": "keyword"
}
}
},
"consequence_type": {
"type": "keyword"
},
"ref_seq_accession": {
"type": "keyword"
},
"transcript_id": {
"type": "keyword"
}
}
}
}
},
"cosmic_id": {
"type": "keyword"
},
"end_position": {
"type": "long"
},
"genomic_dna_change": {
"type": "keyword"
},
"mutation_subtype": {
"type": "keyword"
},
"mutation_type": {
"type": "keyword"
},
"ncbi_build": {
"type": "keyword"
},
"observation": {
"type": "nested",
"properties": {
"acl": {
"type": "keyword"
},
"center": {
"type": "keyword"
},
"input_bam_file": {
"properties": {
"normal_bam_uuid": {
"type": "keyword"
},
"tumor_bam_uuid": {
"type": "keyword"
}
}
},
"mutation_status": {
"type": "keyword"
},
"normal_genotype": {
"properties": {
"match_norm_seq_allele1": {
"type": "keyword"
},
"match_norm_seq_allele2": {
"type": "keyword"
}
}
},
"observation_id": {
"type": "keyword"
},
"read_depth": {
"properties": {
"n_depth": {
"type": "long"
},
"t_alt_count": {
"type": "long"
},
"t_depth": {
"type": "long"
},
"t_ref_count": {
"type": "long"
}
}
},
"sample": {
"properties": {
"matched_norm_sample_barcode": {
"type": "keyword"
},
"matched_norm_sample_uuid": {
"type": "keyword"
},
"tumor_sample_barcode": {
"type": "keyword"
},
"tumor_sample_uuid": {
"type": "keyword"
}
}
},
"src_vcf_id": {
"type": "keyword"
},
"tumor_genotype": {
"properties": {
"tumor_seq_allele1": {
"type": "keyword"
},
"tumor_seq_allele2": {
"type": "keyword"
}
}
},
"validation": {
"properties": {
"tumor_validation_allele1": {
"type": "keyword"
},
"tumor_validation_allele2": {
"type": "keyword"
},
"validation_method": {
"type": "keyword"
}
}
},
"variant_calling": {
"properties": {
"variant_caller": {
"type": "keyword"
},
"variant_process": {
"type": "keyword"
}
}
}
}
},
"reference_allele": {
"type": "keyword"
},
"ssm_id": {
"type": "keyword"
},
"start_position": {
"type": "long"
},
"tumor_allele": {
"type": "keyword"
}
}
},
"symbol": {
"type": "keyword"
},
"synonyms": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"transcripts": {
"properties": {
"biotype": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"cdna_coding_end": {
"type": "long"
},
"cdna_coding_start": {
"type": "long"
},
"coding_region_end": {
"type": "long"
},
"coding_region_start": {
"type": "long"
},
"domains": {
"properties": {
"description": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"end": {
"type": "long"
},
"gff_source": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"hit_name": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"interpro_id": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"start": {
"type": "long"
}
}
},
"end": {
"type": "long"
},
"end_exon": {
"type": "long"
},
"exons": {
"properties": {
"cdna_coding_end": {
"type": "long"
},
"cdna_coding_start": {
"type": "long"
},
"cdna_end": {
"type": "long"
},
"cdna_start": {
"type": "long"
},
"end": {
"type": "long"
},
"end_phase": {
"type": "long"
},
"genomic_coding_end": {
"type": "long"
},
"genomic_coding_start": {
"type": "long"
},
"start": {
"type": "long"
},
"start_phase": {
"type": "long"
}
}
},
"is_canonical": {
"type": "boolean"
},
"length": {
"type": "long"
},
"length_amino_acid": {
"type": "long"
},
"length_cds": {
"type": "long"
},
"name": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"number_of_exons": {
"type": "long"
},
"seq_exon_end": {
"type": "long"
},
"seq_exon_start": {
"type": "long"
},
"start": {
"type": "long"
},
"start_exon": {
"type": "long"
},
"transcript_id": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
},
"translation_id": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256
}
}
}
}
}
}
},
"primary_site": {
"type": "keyword",
"copy_to": [
"case_autocomplete"
]
},
"project": {
"properties": {
"dbgap_accession_number": {
"type": "keyword"
},
"disease_type": {
"type": "keyword",
"copy_to": [
"case_autocomplete"
]
},
"intended_release_date": {
"type": "keyword"
},
"name": {
"type": "keyword",
"copy_to": [
"case_autocomplete"
]
},
"primary_site": {
"type": "keyword",
"copy_to": [
"case_autocomplete"
]
},
"program": {
"properties": {
"dbgap_accession_number": {
"type": "keyword"
},
"name": {
"type": "keyword"
},
"program_id": {
"type": "keyword"
}
}
},
"project_id": {
"type": "keyword",
"copy_to": [
"case_autocomplete"
]
},
"releasable": {
"type": "keyword"
},
"released": {
"type": "boolean"
},
"state": {
"type": "keyword"
}
}
},
"state": {
"type": "keyword"
},
"submitter_id": {
"type": "keyword",
"copy_to": [
"case_autocomplete"
]
},
"summary": {
"properties": {
"data_categories": {
"type": "nested",
"properties": {
"data_category": {
"type": "keyword"
},
"file_count": {
"type": "long"
}
}
},
"experimental_strategies": {
"type": "nested",
"properties": {
"experimental_strategy": {
"type": "keyword"
},
"file_count": {
"type": "long"
}
}
},
"file_count": {
"type": "long"
},
"file_size": {
"type": "long"
}
}
},
"tissue_source_site": {
"properties": {
"bcr_id": {
"type": "keyword"
},
"code": {
"type": "keyword"
},
"name": {
"type": "keyword"
},
"project": {
"type": "keyword"
},
"tissue_source_site_id": {
"type": "keyword"
}
}
},
"updated_datetime": {
"type": "date"
}
}
}
}
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment