Skip to content

Instantly share code, notes, and snippets.

@proycon
Created October 4, 2017 22:01
Show Gist options
  • Star 1 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save proycon/ad6d51c8500281266f8e4aea4801e05d to your computer and use it in GitHub Desktop.
Save proycon/ad6d51c8500281266f8e4aea4801e05d to your computer and use it in GitHub Desktop.
#!/usr/bin/env python3
import json
from frog import Frog, FrogOptions
from pynlpl.formats import folia
# Set up Frog with the dependency parser switched off and FoLiA XML output
# requested; the result of process() is then used as a FoLiA document below
# (NOTE(review): relies on xmlout=True yielding a document object -- confirm
# against the installed python-frog version).
frog = Frog(FrogOptions(parser=False, xmlout=True))
doc = frog.process("Dit is een test op een heel document.")
# doc.json() yields a plain dict, so printing it directly emits a Python repr
# (single quotes, True/False) that JSON parsers reject. Serialise it with
# json.dumps instead; ensure_ascii=False keeps any non-ASCII text readable.
print(json.dumps(doc.json(), ensure_ascii=False))
@proycon
Copy link
Author

proycon commented Oct 4, 2017

Output of `print(doc.json())` (very verbose; this is the Python dict repr, not strict JSON):

{'id': 'untitled', 'children': [{'type': 'text', 'id': 'untitled.text', 'auth': True, 'children': [{'type': 'p', 'id': 'untitled.p.1', 'auth': True, 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['Dit is een test op een heel document.'], 'text': 'Dit is een test op een heel document.'}, {'type': 's', 'id': 'untitled.p.1.s.1', 'auth': True, 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['Dit is een test op een heel document.'], 'text': 'Dit is een test op een heel document.'}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.1', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['Dit'], 'text': 'Dit'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'VNW(aanw,pron,stan,vol,3o,ev)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.777085, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'VNW'}, {'type': 'feat', 'subset': 'vwtype', 'class': 'aanw'}, {'type': 'feat', 'subset': 'pdtype', 'class': 'pron'}, {'type': 'feat', 'subset': 'naamval', 'class': 'stan'}, {'type': 'feat', 'subset': 'status', 'class': 'vol'}, {'type': 'feat', 'subset': 'persoon', 'class': '3o'}, {'type': 'feat', 'subset': 'getal', 'class': 'ev'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'dit', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 
'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['dit'], 'text': 'dit'}]}]}]}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.2', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['is'], 'text': 'is'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'WW(pv,tgw,ev)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.999891, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'WW'}, {'type': 'feat', 'subset': 'wvorm', 'class': 'pv'}, {'type': 'feat', 'subset': 'pvtijd', 'class': 'tgw'}, {'type': 'feat', 'subset': 'pvagr', 'class': 'ev'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'zijn', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['zijn'], 'text': 'zijn'}]}]}]}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.3', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['een'], 'text': 'een'}, {'type': 'pos', 'set': 
'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'LID(onbep,stan,agr)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.999113, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'LID'}, {'type': 'feat', 'subset': 'lwtype', 'class': 'onbep'}, {'type': 'feat', 'subset': 'naamval', 'class': 'stan'}, {'type': 'feat', 'subset': 'npagr', 'class': 'agr'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'een', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['een'], 'text': 'een'}]}]}]}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.4', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['test'], 'text': 'test'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'N(soort,ev,basis,zijd,stan)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.824786, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'N'}, {'type': 'feat', 'subset': 'ntype', 'class': 'soort'}, {'type': 'feat', 'subset': 'getal', 'class': 'ev'}, {'type': 'feat', 'subset': 'graad', 'class': 'basis'}, {'type': 'feat', 'subset': 'genus', 'class': 'zijd'}, {'type': 'feat', 'subset': 'naamval', 
'class': 'stan'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'test', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['test'], 'text': 'test'}]}]}]}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.5', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['op'], 'text': 'op'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'VZ(init)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.996161, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'VZ'}, {'type': 'feat', 'subset': 'vztype', 'class': 'init'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'op', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 
'current', 'auth': True, 'children': ['op'], 'text': 'op'}]}]}]}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.6', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['een'], 'text': 'een'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'LID(onbep,stan,agr)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.999654, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'LID'}, {'type': 'feat', 'subset': 'lwtype', 'class': 'onbep'}, {'type': 'feat', 'subset': 'naamval', 'class': 'stan'}, {'type': 'feat', 'subset': 'npagr', 'class': 'agr'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'een', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['een'], 'text': 'een'}]}]}]}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.7', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['heel'], 'text': 'heel'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'ADJ(prenom,basis,zonder)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 
'confidence': 0.966292, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'ADJ'}, {'type': 'feat', 'subset': 'positie', 'class': 'prenom'}, {'type': 'feat', 'subset': 'graad', 'class': 'basis'}, {'type': 'feat', 'subset': 'buiging', 'class': 'zonder'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'heel', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['heel'], 'text': 'heel'}]}]}]}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.8', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['document'], 'text': 'document'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'N(soort,ev,basis,onz,stan)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.999409, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'N'}, {'type': 'feat', 'subset': 'ntype', 'class': 'soort'}, {'type': 'feat', 'subset': 'getal', 'class': 'ev'}, {'type': 'feat', 'subset': 'graad', 'class': 'basis'}, {'type': 'feat', 'subset': 'genus', 'class': 'onz'}, {'type': 'feat', 'subset': 'naamval', 'class': 'stan'}], 'space': {'space': 'no'}}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 
'class': 'document', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [], 'space': {'space': 'no'}}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['document'], 'text': 'document'}], 'space': {'space': 'no'}}], 'space': {'space': 'no'}}], 'space': {'space': 'no'}}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.9', 'set': 'tokconfig-nld', 'class': 'PUNCTUATION', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['.'], 'text': '.'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'LET()', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 1.0, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'LET'}]}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['.'], 'text': '.'}]}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': '.', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': 
'2017-10-05T00:01:22', 'children': []}]}, {'type': 'chunking', 'id': 'untitled.p.1.s.1.chunking.1', 'set': 'http://ilk.uvt.nl/folia/sets/frog-chunker-nl', 'annotator': 'frog-chunker-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'chunk', 'id': 'untitled.p.1.s.1.chunking.1.chunk.1', 'set': 'http://ilk.uvt.nl/folia/sets/frog-chunker-nl', 'class': 'NP', 'annotator': 'frog-chunker-1.0', 'annotatortype': 'auto', 'confidence': 0.992424, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'w', 'id': 'untitled.p.1.s.1.w.1', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['Dit'], 'text': 'Dit'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'VNW(aanw,pron,stan,vol,3o,ev)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.777085, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'VNW'}, {'type': 'feat', 'subset': 'vwtype', 'class': 'aanw'}, {'type': 'feat', 'subset': 'pdtype', 'class': 'pron'}, {'type': 'feat', 'subset': 'naamval', 'class': 'stan'}, {'type': 'feat', 'subset': 'status', 'class': 'vol'}, {'type': 'feat', 'subset': 'persoon', 'class': '3o'}, {'type': 'feat', 'subset': 'getal', 'class': 'ev'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'dit', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 
'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['dit'], 'text': 'dit'}]}]}]}]}, {'type': 'chunk', 'id': 'untitled.p.1.s.1.chunking.1.chunk.2', 'set': 'http://ilk.uvt.nl/folia/sets/frog-chunker-nl', 'class': 'VP', 'annotator': 'frog-chunker-1.0', 'annotatortype': 'auto', 'confidence': 0.972459, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'w', 'id': 'untitled.p.1.s.1.w.2', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['is'], 'text': 'is'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'WW(pv,tgw,ev)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.999891, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'WW'}, {'type': 'feat', 'subset': 'wvorm', 'class': 'pv'}, {'type': 'feat', 'subset': 'pvtijd', 'class': 'tgw'}, {'type': 'feat', 'subset': 'pvagr', 'class': 'ev'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'zijn', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['zijn'], 'text': 'zijn'}]}]}]}]}, {'type': 'chunk', 'id': 'untitled.p.1.s.1.chunking.1.chunk.3', 'set': 
'http://ilk.uvt.nl/folia/sets/frog-chunker-nl', 'class': 'NP', 'annotator': 'frog-chunker-1.0', 'annotatortype': 'auto', 'confidence': 0.746566, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'w', 'id': 'untitled.p.1.s.1.w.3', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['een'], 'text': 'een'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'LID(onbep,stan,agr)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.999113, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'LID'}, {'type': 'feat', 'subset': 'lwtype', 'class': 'onbep'}, {'type': 'feat', 'subset': 'naamval', 'class': 'stan'}, {'type': 'feat', 'subset': 'npagr', 'class': 'agr'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'een', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['een'], 'text': 'een'}]}]}]}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.4', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['test'], 'text': 'test'}, {'type': 'pos', 'set': 
'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'N(soort,ev,basis,zijd,stan)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.824786, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'N'}, {'type': 'feat', 'subset': 'ntype', 'class': 'soort'}, {'type': 'feat', 'subset': 'getal', 'class': 'ev'}, {'type': 'feat', 'subset': 'graad', 'class': 'basis'}, {'type': 'feat', 'subset': 'genus', 'class': 'zijd'}, {'type': 'feat', 'subset': 'naamval', 'class': 'stan'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'test', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['test'], 'text': 'test'}]}]}]}]}, {'type': 'chunk', 'id': 'untitled.p.1.s.1.chunking.1.chunk.4', 'set': 'http://ilk.uvt.nl/folia/sets/frog-chunker-nl', 'class': 'PP', 'annotator': 'frog-chunker-1.0', 'annotatortype': 'auto', 'confidence': 0.953216, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'w', 'id': 'untitled.p.1.s.1.w.5', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['op'], 'text': 'op'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'VZ(init)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 
0.996161, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'VZ'}, {'type': 'feat', 'subset': 'vztype', 'class': 'init'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'op', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['op'], 'text': 'op'}]}]}]}]}, {'type': 'chunk', 'id': 'untitled.p.1.s.1.chunking.1.chunk.5', 'set': 'http://ilk.uvt.nl/folia/sets/frog-chunker-nl', 'class': 'NP', 'annotator': 'frog-chunker-1.0', 'annotatortype': 'auto', 'confidence': 0.964902, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'w', 'id': 'untitled.p.1.s.1.w.6', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['een'], 'text': 'een'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'LID(onbep,stan,agr)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.999654, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'LID'}, {'type': 'feat', 'subset': 'lwtype', 'class': 'onbep'}, {'type': 'feat', 'subset': 'naamval', 'class': 'stan'}, {'type': 'feat', 'subset': 'npagr', 'class': 'agr'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 
'een', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['een'], 'text': 'een'}]}]}]}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.7', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['heel'], 'text': 'heel'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'ADJ(prenom,basis,zonder)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.966292, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'ADJ'}, {'type': 'feat', 'subset': 'positie', 'class': 'prenom'}, {'type': 'feat', 'subset': 'graad', 'class': 'basis'}, {'type': 'feat', 'subset': 'buiging', 'class': 'zonder'}]}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'heel', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': []}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 
't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['heel'], 'text': 'heel'}]}]}]}, {'type': 'w', 'id': 'untitled.p.1.s.1.w.8', 'set': 'tokconfig-nld', 'class': 'WORD', 'annotator': 'ucto', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['document'], 'text': 'document'}, {'type': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'class': 'N(soort,ev,basis,onz,stan)', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'confidence': 0.999409, 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'feat', 'subset': 'head', 'class': 'N'}, {'type': 'feat', 'subset': 'ntype', 'class': 'soort'}, {'type': 'feat', 'subset': 'getal', 'class': 'ev'}, {'type': 'feat', 'subset': 'graad', 'class': 'basis'}, {'type': 'feat', 'subset': 'genus', 'class': 'onz'}, {'type': 'feat', 'subset': 'naamval', 'class': 'stan'}], 'space': {'space': 'no'}}, {'type': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'class': 'document', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [], 'space': {'space': 'no'}}, {'type': 'morphology', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 'morpheme', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'auth': True, 'datetime': '2017-10-05T00:01:22', 'children': [{'type': 't', 'set': 'undefined', 'class': 'current', 'auth': True, 'children': ['document'], 'text': 'document'}], 'space': {'space': 'no'}}], 'space': {'space': 'no'}}], 'space': {'space': 'no'}}]}]}]}]}]}], 'declarations': [{'annotationtype': 'token', 'set': 'tokconfig-nld', 'annotator': 'ucto', 'annotatortype': 'auto', 'datetime': '2017-10-05T00:01:22'}, 
{'annotationtype': 'pos', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbpos-cgn', 'annotator': 'frog-mbpos-1.0', 'annotatortype': 'auto', 'datetime': '2017-10-05T00:01:22'}, {'annotationtype': 'lemma', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mblem-nl', 'annotator': 'frog-mblem-1.1', 'annotatortype': 'auto', 'datetime': '2017-10-05T00:01:22'}, {'annotationtype': 'morphological', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mbma-nl', 'annotator': 'frog-mbma-1.0', 'annotatortype': 'auto', 'datetime': '2017-10-05T00:01:22'}, {'annotationtype': 'chunking', 'set': 'http://ilk.uvt.nl/folia/sets/frog-chunker-nl', 'annotator': 'frog-chunker-1.0', 'annotatortype': 'auto', 'datetime': '2017-10-05T00:01:22'}, {'annotationtype': 'entity', 'set': 'http://ilk.uvt.nl/folia/sets/frog-ner-nl', 'annotator': 'frog-ner-1.0', 'annotatortype': 'auto', 'datetime': '2017-10-05T00:01:22'}, {'annotationtype': 'entity', 'set': 'http://ilk.uvt.nl/folia/sets/frog-mwu-nl', 'annotator': 'frog-mwu-1.0', 'annotatortype': 'auto', 'datetime': '2017-10-05T00:01:22'}], 'version': '1.4.3', 'generator': 'pynlpl.formats.folia-v1.5.0.87'}

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment