Skip to content

Instantly share code, notes, and snippets.

@cyclecycle
Created November 30, 2018 10:45
Show Gist options
  • Save cyclecycle/66b6c7e1eb80fe0e434c13dfc33bffe2 to your computer and use it in GitHub Desktop.
Save cyclecycle/66b6c7e1eb80fe0e434c13dfc33bffe2 to your computer and use it in GitHub Desktop.
parse tree data structure example
{
"sent_i": 3,
"start_idx": 273,
"text": "Overstimulation of mTOR by its ligands, amino acids, sugars, and/or growth factors leads to physiological disorders, including cancer and neurodegenerative diseases",
"tokens": [
{
"dep_": "nsubj",
"dep_i": 12,
"i": 0,
"idx": 0,
"lemma_": "overstimulation",
"pos_": "NOUN",
"tag_": "NN",
"text": "Overstimulation",
"text_with_ws": "Overstimulation "
},
{
"dep_": "prep",
"dep_i": 0,
"i": 1,
"idx": 16,
"lemma_": "of",
"pos_": "ADP",
"tag_": "IN",
"text": "of",
"text_with_ws": "of "
},
{
"dep_": "pobj",
"dep_i": 1,
"i": 2,
"idx": 19,
"lemma_": "mtor",
"pos_": "NOUN",
"tag_": "NN",
"text": "mTOR",
"text_with_ws": "mTOR "
},
{
"dep_": "prep",
"dep_i": 0,
"i": 3,
"idx": 24,
"lemma_": "by",
"pos_": "ADP",
"tag_": "IN",
"text": "by",
"text_with_ws": "by "
},
{
"dep_": "pobj",
"dep_i": 3,
"i": 4,
"idx": 27,
"lemma_": "it",
"pos_": "NOUN",
"tag_": "NNS",
"text": "its ligands",
"text_with_ws": "its ligands"
},
{
"dep_": "punct",
"dep_i": 0,
"i": 5,
"idx": 38,
"lemma_": ",",
"pos_": "PUNCT",
"tag_": ",",
"text": ",",
"text_with_ws": ", "
},
{
"dep_": "conj",
"dep_i": 0,
"i": 6,
"idx": 40,
"lemma_": "amino",
"pos_": "NOUN",
"tag_": "NNS",
"text": "amino acids",
"text_with_ws": "amino acids"
},
{
"dep_": "punct",
"dep_i": 6,
"i": 7,
"idx": 51,
"lemma_": ",",
"pos_": "PUNCT",
"tag_": ",",
"text": ",",
"text_with_ws": ", "
},
{
"dep_": "conj",
"dep_i": 6,
"i": 8,
"idx": 53,
"lemma_": "sugar",
"pos_": "NOUN",
"tag_": "NNS",
"text": "sugars",
"text_with_ws": "sugars"
},
{
"dep_": "punct",
"dep_i": 8,
"i": 9,
"idx": 59,
"lemma_": ",",
"pos_": "PUNCT",
"tag_": ",",
"text": ",",
"text_with_ws": ", "
},
{
"dep_": "cc",
"dep_i": 8,
"i": 10,
"idx": 61,
"lemma_": "and/or",
"pos_": "CCONJ",
"tag_": "CC",
"text": "and/or",
"text_with_ws": "and/or "
},
{
"dep_": "conj",
"dep_i": 8,
"i": 11,
"idx": 68,
"lemma_": "growth",
"pos_": "NOUN",
"tag_": "NNS",
"text": "growth factors",
"text_with_ws": "growth factors "
},
{
"dep_": "ROOT",
"dep_i": 12,
"i": 12,
"idx": 83,
"lemma_": "lead",
"pos_": "VERB",
"tag_": "VBZ",
"text": "leads",
"text_with_ws": "leads "
},
{
"dep_": "prep",
"dep_i": 12,
"i": 13,
"idx": 89,
"lemma_": "to",
"pos_": "ADP",
"tag_": "IN",
"text": "to",
"text_with_ws": "to "
},
{
"dep_": "pobj",
"dep_i": 13,
"i": 14,
"idx": 92,
"lemma_": "physiological",
"pos_": "NOUN",
"tag_": "NNS",
"text": "physiological disorders",
"text_with_ws": "physiological disorders"
},
{
"dep_": "punct",
"dep_i": 14,
"i": 15,
"idx": 115,
"lemma_": ",",
"pos_": "PUNCT",
"tag_": ",",
"text": ",",
"text_with_ws": ", "
},
{
"dep_": "prep",
"dep_i": 14,
"i": 16,
"idx": 117,
"lemma_": "include",
"pos_": "VERB",
"tag_": "VBG",
"text": "including",
"text_with_ws": "including "
},
{
"dep_": "pobj",
"dep_i": 16,
"i": 17,
"idx": 127,
"lemma_": "cancer",
"pos_": "NOUN",
"tag_": "NN",
"text": "cancer",
"text_with_ws": "cancer "
},
{
"dep_": "cc",
"dep_i": 17,
"i": 18,
"idx": 134,
"lemma_": "and",
"pos_": "CCONJ",
"tag_": "CC",
"text": "and",
"text_with_ws": "and "
},
{
"dep_": "conj",
"dep_i": 17,
"i": 19,
"idx": 138,
"lemma_": "neurodegenerative",
"pos_": "NOUN",
"tag_": "NNS",
"text": "neurodegenerative diseases",
"text_with_ws": "neurodegenerative diseases"
}
],
"tree_i": 3
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment