Skip to content

Instantly share code, notes, and snippets.

@douglasgoodwin
Created May 7, 2019 05:37
Show Gist options
  • Save douglasgoodwin/0742f3ba83c419a92ed8b6efb22defc2 to your computer and use it in GitHub Desktop.
Save douglasgoodwin/0742f3ba83c419a92ed8b6efb22defc2 to your computer and use it in GitHub Desktop.
NLTK analysis of Jane Austen
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [],
"source": [
"import os\n",
"import nltk\n",
"from nltk.parse.malt import MaltParser\n",
"\n",
"# Location of the MaltParser install directory and of the pre-trained model file.\n",
"# Both can be overridden through the MALT_PARSER / MALT_MODEL environment variables\n",
"# so the notebook is not tied to a single machine; when the variables are unset the\n",
"# original author's local values are used, exactly as before.\n",
"MALT_PARSER_DIR = os.environ.get('MALT_PARSER', '/Users/dgoodwin/janeausten/maltparser-1.9.2')\n",
"MALT_MODEL_FILE = os.environ.get('MALT_MODEL', 'engmalt.linear-1.7.mco')\n",
"\n",
"# Parser instance shared by the parsing cells below.\n",
"mp = MaltParser(MALT_PARSER_DIR, MALT_MODEL_FILE)"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAbcAAACMCAIAAABwP3BmAAAJMmlDQ1BkZWZhdWx0X3JnYi5pY2MAAEiJlZVnUJNZF8fv8zzphUASQodQQ5EqJYCUEFoo0quoQOidUEVsiLgCK4qINEWQRQEXXJUia0UUC4uCAhZ0gywCyrpxFVFBWXDfGZ33HT+8/5l7z2/+c+bec8/5cAEgiINlwct7YlK6wNvJjhkYFMwE3yiMn5bC8fR0A9/VuxEArcR7ut/P+a4IEZFp/OW4uLxy+SmCdACg7GXWzEpPWeGjy0wPj//CZ1dYsFzgMt9Y4eh/eexLzr8s+pLj681dfhUKABwp+hsO/4b/c++KVDiC9NioyGymT3JUelaYIJKZttIJHpfL9BQkR8UmRH5T8P+V/B2lR2anr0RucsomQWx0TDrzfw41MjA0BF9n8cbrS48hRv9/z2dFX73kegDYcwAg+7564ZUAdO4CQPrRV09tua+UfAA67vAzBJn/eqiVDQ0IgALoQAYoAlWgCXSBETADlsAWOAAX4AF8QRDYAPggBiQCAcgCuWAHKABFYB84CKpALWgATaAVnAad4Dy4Aq6D2+AuGAaPgRBMgpdABN6BBQiCsBAZokEykBKkDulARhAbsoYcIDfIGwqCQqFoKAnKgHKhnVARVApVQXVQE/QLdA66At2EBqGH0Dg0A/0NfYQRmATTYQVYA9aH2TAHdoV94fVwNJwK58D58F64Aq6HT8Id8BX4NjwMC+GX8BwCECLCQJQRXYSNcBEPJBiJQgTIVqQQKUfqkVakG+lD7iFCZBb5gMKgaCgmShdliXJG+aH4qFTUVlQxqgp1AtWB6kXdQ42jRKjPaDJaHq2DtkDz0IHoaHQWugBdjm5Et6OvoYfRk+h3GAyGgWFhzDDOmCBMHGYzphhzGNOGuYwZxExg5rBYrAxWB2uF9cCGYdOxBdhK7EnsJewQdhL7HkfEKeGMcI64YFwSLg9XjmvGXcQN4aZwC3hxvDreAu+Bj8BvwpfgG/Dd+Dv4SfwCQYLAIlgRfAlxhB2ECkIr4RphjPCGSCSqEM2JXsRY4nZiBfEU8QZxnPiBRCVpk7ikEFIGaS/pOOky6SHpDZlM1iDbkoPJ6eS95CbyVfJT8nsxmpieGE8sQmybWLVYh9iQ2CsKnqJO4VA2UHIo5ZQzlDuUWXG8uIY4VzxMfKt4tfg58VHxOQmahKGEh0SiRLFEs8RNiWkqlqpBdaBGUPOpx6hXqRM0hKZK49L4tJ20Bto12iQdQ2fRefQ4ehH9Z/oAXSRJlTSW9JfMlqyWvCApZCAMDQaPkcAoYZxmjDA+SilIcaQipfZItUoNSc1Ly0nbSkdKF0q3SQ9Lf5RhyjjIxMvsl+mUeSKLktWW9ZLNkj0ie012Vo4uZynHlyuUOy33SB6W15b3lt8sf0y+X35OQVHBSSFFoVLhqsKsIkPRVjFOsUzxouKMEk3JWilWqUzpktILpiSTw0xgVjB7mSJleWVn5QzlOuUB5QUVloqfSp5Km8oTVYIqWzVKtUy1R1WkpqTmrpar1qL2SB2vzlaPUT+k3qc+r8HSCNDYrdGpMc2SZvFYOawW1pgmWdNGM1WzXvO+FkaLrRWvdVjrrjasbaIdo12tfUcH1jHVidU5rDO4Cr3KfFXSqvpVo7okXY5upm6L7rgeQ89NL0+vU++Vvpp+sP5+/T79zwYmBgkGDQaPDamGLoZ5ht2GfxtpG/GNqo3uryavdly9bXXX6tfGOsaRxkeMH5jQTNxNdpv0mHwyNTMVmLaazpipmYWa1ZiNsulsT3Yx+4Y52tzOfJv5efMPFqYW6RanLf6y1LWMt2y2nF7DWhO5pmHNhJWKVZhVnZXQmmkdan3UWmijbBNmU2/zzFbVNsK20XaKo8WJ45zkvLIzsBPYtdvNcy24W7iX7RF7J/tC+wEHqoOfQ5XDU0cVx2jHFkeRk4nTZqfLzmhnV+f9zqM8BR6f18
QTuZi5bHHpdSW5+rhWuT5z03YTuHW7w+4u7gfcx9aqr01a2+kBPHgeBzyeeLI8Uz1/9cJ4eXpVez33NvTO9e7zofls9Gn2eedr51vi+9hP0y/Dr8ef4h/i3+Q/H2AfUBogDNQP3BJ4O0g2KDaoKxgb7B/cGDy3zmHdwXWTISYhBSEj61nrs9ff3CC7IWHDhY2UjWEbz4SiQwNCm0MXwzzC6sPmwnnhNeEiPpd/iP8ywjaiLGIm0iqyNHIqyiqqNGo62ir6QPRMjE1MecxsLDe2KvZ1nHNcbdx8vEf88filhICEtkRcYmjiuSRqUnxSb7JicnbyYIpOSkGKMNUi9WCqSOAqaEyD0tandaXTlz/F/gzNjF0Z45nWmdWZ77P8s85kS2QnZfdv0t60Z9NUjmPOT5tRm/mbe3KVc3fkjm/hbKnbCm0N39qzTXVb/rbJ7U7bT+wg7Ijf8VueQV5p3tudATu78xXyt+dP7HLa1VIgViAoGN1tubv2B9QPsT8M7Fm9p3LP58KIwltFBkXlRYvF/OJbPxr+WPHj0t6ovQMlpiVH9mH2Je0b2W+z/0SpRGlO6cQB9wMdZcyywrK3BzcevFluXF57iHAo45Cwwq2iq1Ktcl/lYlVM1XC1XXVbjXzNnpr5wxGHh47YHmmtVagtqv14NPbogzqnuo56jfryY5hjmceeN/g39P3E/qmpUbaxqPHT8aTjwhPeJ3qbzJqamuWbS1rgloyWmZMhJ+/+bP9zV6tua10bo63oFDiVcerFL6G/jJx2Pd1zhn2m9az62Zp2WnthB9SxqUPUGdMp7ArqGjzncq6n27K7/Ve9X4+fVz5ffUHyQslFwsX8i0uXci7NXU65PHsl+spEz8aex1cDr97v9eoduOZ67cZ1x+tX+zh9l25Y3Th/0+LmuVvsW523TW939Jv0t/9m8lv7gOlAxx2zO113ze92D64ZvDhkM3Tlnv296/d5928Prx0eHPEbeTAaMip8EPFg+mHCw9ePMh8tPN4+hh4rfCL+pPyp/NP637V+bxOaCi+M24/3P/N59niCP/Hyj7Q/Fifzn5Ofl08pTTVNG02fn3Gcufti3YvJlykvF2YL/pT4s+aV5quzf9n+1S8KFE2+Frxe+rv4jcyb42+N3/bMec49fZf4bmG+8L3M+xMf2B/6PgZ8nFrIWsQuVnzS+tT92fXz2FLi0tI/QiyQvpTNDAsAAAAJcEhZcwAADdcAAA3XAUIom3gAAAAddEVYdFNvZnR3YXJlAEdQTCBHaG9zdHNjcmlwdCA5LjI2WJButwAAFopJREFUeJzt3U9s49h9B/A3iwGSeLaouYEmQIBW1nPTg+awgWj3VGAMiDrsDNKT6evMRVSBHJsVBfSwuzdqNugtAci9zOZQIOJcdxaB3gL2qcFYXKAF5FNES91DAakQXWTlAEER9fDrvmX050nWf1vfz2EgkRTfo0T/5vf+kLzX7/cZAACM8da6KwAAsNEQJQEAVBAlAQBU7q+7AltKCOG6bhRFjDFd18vl8rprBACjIUquQRiGtm37vs85D8OQYiUAbCZEyTUIw9AwDM45Y4z+BYCNdQ8zgZZBCOE4ThRFURRRg5qiYRiGlmXRchkfhRBrrSwAqCBKLl4QBJZlUYOaMSaEsCwrCAJN02gDIUS1WkVfJMCtgDHuxXMcRyaPjDHDMEqlkud5660VAMwGUXLxhBCGYcSXcM6r1eq66gMA80CUXDxd18MwjC+h3sl11QcA5oEouXiFQsG2bfk2iiLXdQuFwhqrBAAzw0ygxTNNk5JHwzCiKAqCoFQqUTdlEAS2bdMYdxAEDFPKATYexriXRcbBgT5KALhdECUBAFTQLwkAoIIoCQCggigJAKCCKAkAoIKZQKsQttv//tVX//Kb36R/+EPz8FB78EDf21t3pQBgKhjjXgpRrwetVvfrr4NW699+97vrP/5xeJvdnR19b48nEtrOzv7DhzyR0Pf2tAcPVl9bAFBAlFyAoN
kMO53a5WXY6QSt1mWnI1fdf+ut//3Tn75z/342nf6HH//4H3/1q795+PCn2ex/XV1F19dhpxM0m1fX1/G9ZZJJ7cEDPZlkjOUePULiCbBeiJI3FvV6QbNZrdcpzH1xcSFXpRKJv3rnnXuM/We3S7Hy+OAg9+iRdXREG3inp4VPP80/fuw9fx7fp6jXGWPVep0xFrRaUa/3ZasV3yCeeB6kUtrODhJPgNVAlJxM1Othp9Not4NWK576UeTSk8l33n5bTyaj6+vKmzevajXGWCqRKBwdmQcH/OHDgb1ZL19+cnbmPnsmQ+c4YbsddjpUdNjpRNfXw4lnNp1mjMk6IPEEWDhEyUFhux20WtR8DjudeE6XSSZ5IsETidyjRzyRoAgYNJuVN2+8s7Or6+vdnR3z8LBwdKQIVVGvZ3z8cdjpiPffny2iTUw8U4kE1ROJJ8D8tj1KUvM5aLUoXxtoPvNEQk8m9x8+1Pf2BiJa1Ot5Z2eVN28oQg20rNWCZtP4+GOeSIj3319U8BpOPOPHQpB4Asxg66Jk0GwGzSY1n8NOJz7Skk2nZQRRJF/++fk0LWs16qA8Pjjwf/rTeQ5nIlGvR9fXtctLxtjwIbPYfwaMMUo8jUePllolgNvljkdJyrCq9bqi+XyQSunJ5MQwd9OW9UR2pfLi888d07SfPJl5J7Ohr4XmKikST21nhycS9N+G7GEA2DZ3LUrGJyrG//LlSAvNTJw+XZqnZT2R/uGHX7ZatQ8+2JCWLxJPgGG3O0rKiYojm888kdh/+FDdfFZYSMtaLWy39Y8+YoyFL15s7OhKPPEMWi3GGBJP2Cq3KUrK5jPNiYk3n1OJBP1xHqRSdBHLzKUsvGWtJur13M9/nk2nxfvvL6mIZaBRL0o8ad7ocOI5MD2eMYbEE26jjY6SEycq3rT5rLDUlrUadVAW33uvfHKyguKWKmg2o15PkXjSb0eJJ/18SDxhw21QlFRc55ehVvPOTnyi4qKsoGU9kfHxx19cXFR/9rM7mW0h8YRbbW1RcpqJivM3nxVW3LJWi3o9XiwyxoIPPtiexIoSz4nXZcYTT0yPh9VbXZQc13xmfz5RcdkZxBpb1mpBs3nw0UeZZDL48MN112Wd6L9POlVwQxDYBMuKkje9zm8FNqFlrVZ+/brk+3ejg3Lhpkw8cSc6WLjFREnZfB6eqKi+zm8FNqplPZH5i1+8qtWmuRcGMCSesBIzRkn1dX5zTlRciI1tWavNfy8MYLgTHSzUjaMkXS4i3970Or/V8M/PT375S7apLWs1uheGkU4v+xLvbTPlnehu18RVWIEbR0m7UmGMLXCi4jKE7bbz+vUmt6zV/PNzI51GarMaA4knoiQM2KD5kgAAGwhPmgUAUPn2SbNCiOHVmqbpui6EcBxH1/VyubzAsoUQrutGUcQYi+/csqwwDBlj5XJZ1/UFlsgYMwyjVCoZhrHY3Q5Y6iEAwCp9GyVzuVw2m2WMhWGoaZqmaVEUaZomhDC+scCCwzC0bdv3fc55GIYUK4nneYwx27bjCxdF13VN0xa+2wFLPQQAWKX78TeUTtq2ncvlDMOgFHJJBYdhaBgG55wxRv+uxmLTYQC4877tl2w0GgPrDMOgnEiybVvXdV3XDcOIZ0mUElLUsyxLnUBRfKREcoYsleowsqwgCGhvQRBQlTjn8hAsy5Jrh4/Utm1qHY/cxrZteYAyuaY29QzGHQLV0DRNXddN0/Q8T9d1znkQBLZt088Rr4nv+/Hdyl9B13XLsmzbnq16d4DneQO/4/ASxUmrPpFudLbDXdAfUiwWq9Xq8HLGmOM49Np13ePjY/k6n893u116W6lUstns8McHVKvVYrGo2GBcNeILHceRVZKy2Wwmk6EqdbvdgQ0URyfrU6lU5NHRR+QBdrvdTCYz8ntbyCEwxlzX7ff7+XyevsZGo0GVKRaLu7u7tJaWZzKZSqUiP5tKpRqNhjyEaX6FOyybzdJP1mg06IXruvInnu
akHXkizXa2w612gyiZyWTib+XJkUql5Ekj9yD/mMeZOUr2+/1arVb9xvBOstmsYs9THt3u7q58nUql4qso6VbUfGJZ/fGHIPcc/yx91RSsB2oS/xNNpVKu68pAWavVpqnkXVUsFum/kEwmQ99w/Cud5qQdeSLNdrbDrXZflWf+uXGDHlEUmaY5sHB/f3+WzHaSIAhM0+Sc08AxNX6HN8vlcjfd88DRXV1dydcD3aZz9qJOeQjTVJJzHm/u0ZyBarUaRVEURaVSaZuH13O5XLVapcYydbgLIWSv9JQn7fCJtMqzHTbEDaLkONRBtoKBY8aYZVm+78s/fiFEtVpddqE0BC8PcLhb80bmOYSBooUQMmRTuJRRgDp/DcNYze+ygQzDoLHHXC5Xq9UG+nBnPmlXebbDhljArPKTk5OBgQIhxMjZl/OLoigeF1zXXUYpA8rlshyrEULMOSoyzyEEQSCHC4QQlmWVSiVa5ThOfFf0Z7zlAwtRFPm+b5pmoVCg4S+5auaTdpVnO2yIP7tCsVwuV6tVOV+yUChQ44LGWGngz/d9anQEQUATzhljtm3LliMlOJ7njfv/lvZGrUKKF/Ep5Z7nVSoVFpu2yWJzsz3PcxzHNM0oimR95Fg8VTIIAs45fVAegmK3YRhaliX3xhgzTfPVq1fFYlHWSk6A55yXSqX9/f3++Cs7Zz4Ey7I++eSTfD5PY9lCCBrm1jTNsiza+f7+Pu2caiIDbrlcpuU0/SAIgkKhID+1neg0o3ODc14ul+ONZcVJqziR1B+EO2mR13FTxFz2tG0KAXRR0PJKUaMp9zN/fLZDoBRGPd+T9swYW/bFRXfGzCftas522AS428WNTROt7lK5AFsOd7uYCrWd7927R4mD7A1cGdu2X7x48eLFi3v37g0MRADAUiGXBABQQS4JAKCCKAkAoLKAWeUAd0DQbIqLi3/97W/f/s53/v5HP9rwZ5bAKqFfEraXqNer9XrQasUfE/aX3/ve//zhD3Kb+KOSETe3E6IkbJGw3Q5ardrlpbi4kI8C/evvf393Z+c/vvrqL7773X/+yU/sJ08YY/SY79rlZdjpBK1W/FnK8eeG8kTilj6BDqaHKAl3HDWla5eX8WCXTaf1ZPIglbr/1lv/9OtfX3Y6xwcHZdNUPJFY1Ov0lNrhZ9Ajbt5tiJJw10S9XtBsUlP6i4sLWri7s2Ok0zyRyD16RK3mqNdzPvvsxeef7+7seM+fm4eHNy0oHjcHHu2dTad5IqHt7OQePeKJxC16HDwMQ5SEuyBst8XFRa3ZDJpN2ZTOJJP63t7B3p6+tzeQ34l63fr0U0ohvefPF/Loc4rOQavV/fprddzU9/bwsPVbBFESbitRr8tORhmPZFPaSKdHRqKo17NevnxVq82cQk5Pxs1Gux12OjKxZYzt7uzoe3t6MvnO22/rySTi5iZDlIRbI+r1ZA/jQFP6IJXSk8mJA9D++bn18uXV9XXxvfdKT5+uPjCF7XbY6VTr9ej6elzcxGD6pkGUhI0WNJtBs1lrNsXFhRwwySSTRjq9//ChkU5P2eUnU8hUIuE9e7Y5MUjGzbDTCTsd2V3AMAlpYyBKwsahaYxhpzPclJ6tU887PbV9f40p5I3EJyGNi5sYTF8lRElYPzmNMd6UTiUSMmGcORyE7bb16adfXFxsWgp5I5RQYxLSuiBKwnrQNMZGuz3clKZOxvlnz5Rfv3Y++4xSyPLJydxV3iDqyZv63h4mIS0QoiSsSHwao5wlI4cs5DTGhZApZCaZ9J4/34YMi0b8J05CQtycAaIkLBFNY6SEUfavUVN65DTGhbArFe/s7E6mkNObOHkTk5CmhygJC6a+InDcNMZFFW29fPllq5VNp8umuQ0p5PSmmYSEuDkSoiTMSzGNMX5F4LLZlQpdblh6+pTuWAFqmLw5JURJmIX6isDppzEuRDyF9J49Q7/bzKaZhLSFcRNREqY12xWBSxW/YwVSyGXAHeQYoiQojG
xKp76Z1TzPNMaFiN+xQn3TM1igLbyDHKIkjMWLRfobmOGKwBXgxWLU6y37jhUw0bg7yLnPnllHR2ut2mIgSsJY3ukpZQSbOeIZNJs8kdjMum0zOQnJPDjYnP9T54EoCQCggifNAgCoIErCXWAYhhBi3bXYanf4J0CUhLtA13VN09Zdi612h38C9EsCAKggl4QRbNvWdd0wDM65ZVlRFE3zqSAITNPUv2Hbtu/70+wzCALDMAzDCILA933OOefc8zz1KmJZltzgpgdi2zbnnNYKIWg/YRgyxqism34D20nxExiGYdt2uVymX2Hcz7Tp+gBDqtWqfO04juM4Ez/SaDRSqVStVpNvM5lMsVicfp/ZbDaTyeTz+W632+124xsoVpFisRjf/zSFFotF2mG/3+92u5lMRv45uK4rV/X7/Uqlks1mJ34DW27cT8AYk6dBpVI5Pj5ebb0WAC1uGC0IAplAVavVcrms3t627f39fcuy5BLf9zVNMwxjyn0ahqHr+siCFKtk6blcLl7WxEI555Q2kjAM9/f36c+Bcx4EQbyXbfjoYMC4n0DX9Xj+qGnarUvM76+7ArBxqOHMOdd1nTFGTdFpPpXL5eJLTNO86T4H9jDlKkWVFIVyzuMbx99GURSvPNnf379pBYAxNjCkc3V1ta6azAxREgZZluX7PkUWxpgQolqtTvwU51yRI8y2zzmpCw3DMIoi+Tccz3c455QIL7uGcCtg9AYGRVEkE6soilzXneZTJycnjuPEA6UQwrbtefY5J3Wh5XJZjtXEq8oYOzk5ib+lDe7qZECYCLkkDCqVSrqum6YZRRENMfu+H0VRfGR5mGEYhUKBhjI1TRNCxHsS1fu0bTsIgiAIbNumDK5QKFCbV7GKMeZ5XqVSYYyFYSiEoA1oRHVioaZpappm2zYFU8/zZJvatm05OM4YE0IMDKyDpPgJwjC0LIv6PWi2g/xNJ3ZzbxSM3sAIFFY0TZPN1elRzjU8x3iefc7sRoUODyyMOxbYKoiSAIwxRk3s25XjwGqgXxK2VxiGmqbdu3ePUsVSqbTuGsEmQi4JAKCCXBIAQAVREgBABTOBAGDBRL3uvH7937///d9xXnry5LY/1wH9kgCwMN7pqfP69WWns7uz87c/+MGby0vGWDadLj15cnsf4Y0oCQDzogej+7XaZaeTSiTMg4PS06fagwdhu+2ennpnZ1fX16lEovTkyW18qiKiJADMLmy3ndev/fPzq+vrTDJZODoajoNRr+ednbmnp5RjWo8fUwxdR31ngSgJALMQ9bp7evqqVmOMHR8cFI6OJrapvdNT9/T0y1Zrd2fHPDy8LV2WiJIAcDPe6Wnl/PyLiwvGWP7x45sGuxnC63ohSgLAVBbbcJ6mqb4hECUBYILlDcLQsI/cc+HoyHr8eNO6LBElAWCsoNl0T08/OTtjS57QE59CZD1+XDg62pwuS0RJABjBPz93T09n7nycDU1Hl4WeHB5uQpcloiQAfCvq9fzz8/WmddRlKRPYk8PD9XZZIkoCAGOjOh/Nw8M1dhEOdFmusT6IkgDbbiB3KxwdmYeH667U/9uE3BZREmB7bWY/4EgD/aSFoyN9b281RSNKAmyjTR5TVljZmHscoiTAFrkV8xMnWvFNNBAlAbbCpg0cz29lN9FAlAS4427dddM3Ned15RMhSgLcWf75ufPZZ7fuHjyzEfV65fx8GV2WiJIAd5b18qW4uJD3xF13dVZB3kSj9PSp/eTJQvaJKAlwZ4Xt9h1OHhWiXo8xtqj/GBAlAQBU8KRZAAAVREmAxTAMQwixlqItyzIMIwiC9VaJqjGyJsuwsqNDlARYDF3XNU1bS9Ge5+m6HkXR/FUyDGOeagghRtZkGVb2hd9fQRkA26BcLq+7CoM2sEoLtLKjQy4JMK9xLU1abpqmruumaVLGxzkPgkCxSn7c933OuWEYnHPLsgYSNLlW1/XheKFo/Nq2rev68G6FELS9ETOu0JFVGknuUF
bStm1aMnJ7z/NorWVZjLEoimRl5LEojm5cDeVu5UeGl4zVB4BFKBaL1Wp1YCFjzHXdfr+fz+ez2Wy/3280GsfHx+pV/X7fdd18Pt/tdultpVKhbUauzefzqVRquPSRVYovcRzHcZz42ngpA9RVUhRarVbz+fxAKY1GY1xB1WpVfg8kk8nIchUFqWuYzWZpVaPRoBeu6xaLxXHVkJBLAiwX5USappVKJcYY51wmOIpVjuOUy2XZ70ZZp+d5I9d6njd9Dx1lT0II6kPsdrtTflBdJXWJYRiGYUhvhRCcc865YvsoiuT2lPRNc4DqGuq6TqM9pmk6jsMYazQauVxu4m7RLwmwiaIoMk1zYOH+/j694JwPRI0pR12CIDBNk3Ou6zr7ppW9kCqplUolx3EoYMkXCicnJ3KzSqUyTSyeWMNcLletVilAU7gUQkzTuYkoCbCJOOe+749LoGSeJQkhpkmLLMvyfZ9CJH2qWq0upEpqhmE4jkOxSZ1Iyno6jhNFURAE02w/TQ2pDoyxXC5Xq9V835+y8mhxA2yik5MT27bjS6iNTK9N04yv9TxvOG6OFEWRjDhRFLmuO7CBpmnx0Yz4btVVmojSSdd1pxybltsXCoUpi5hYwyiKfN83TbNQKNAg0sAegiDQNC3e9cEYRm8A5uO6bjabzWazqVQqk8nQ61qt1u/38/k8Y4wGLorFYiaToeW7u7vvvvvuuFVyPIGWF4tFenF8fBwfwZBrj4+P8/k8vaXhIEWVXNdNpVLFYjGfz9PHU6lUfGilVqvRBupCh9cqCpWy2ew0oyWk2+2mUqnhASJ1QRO/NHmwqVSqUqkM7Jwy693d3fjgEq7jBtholAqNnEFNQyLTN0gJNWM1TZPt7pEbjCtUXSU1mvO0gqngM9eQxdJJuQRREgBWwff9Wq12Gye6Y/QGAJYoDENd16+uruSSWxcokUsCAKhgjBsAQAVREgBABVESAEAFURIAQAVREgBA5f8AFuWEHFAKW2oAAAAASUVORK5CYII=",
"text/plain": [
"Tree('of', ['The', 'flaring', 'lamps', Tree('were', ['a', 'carriage', Tree('in', ['immediately', 'view.'])])])"
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Full Jane Austen passage, kept for reference under its own name so that it is not\n",
"# silently overwritten by the single sentence that is actually parsed below.\n",
"passage = \"\"\"The flaring lamps of a carriage were immediately in view. \n",
"By their uncertain light she thought she could discern it to be drawn by four horses; \n",
"and this, while it told the excess of her poor mother’s alarm, \n",
"gave some explanation to such unexpected rapidity.\"\"\"\n",
"\n",
"# Only the first sentence is parsed here.\n",
"# NOTE(review): str.split() leaves the period attached to the last word ('view.' in\n",
"# the output); nltk.word_tokenize would separate it -- confirm which is intended.\n",
"quote = \"The flaring lamps of a carriage were immediately in view.\"\n",
"mp.parse_one(quote.split()).tree()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"| Abbreviation | Part of speech |\n",
"|--|--|\n",
"| NN | singular noun |\n",
"| NNS | plural noun |\n",
"| NNP | proper noun |\n",
"| VBD | past tense verb |\n",
"| VBZ | 3rd person singular present tense verb |\n",
"| VBP | non-3rd person singular present tense verb |\n",
"| VBN | past participle |\n",
"| PRP | pronoun |\n",
"| PRP$ | possessive pronoun |\n",
"| JJ | adjective |\n",
"| IN | preposition / complementizer |\n",
"| DT | determiner |\n",
"\n",
"| Abbreviation | Phrase type |\n",
"|--|--|\n",
"| NP | noun phrase |\n",
"| VP | verb phrase |\n",
"| PP | prepositional phrase |\n",
"| S | sentence |\n"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"[('The', 'DT'),\n",
" ('flaring', 'VBG'),\n",
" ('lamps', 'NNS'),\n",
" ('of', 'IN'),\n",
" ('a', 'DT'),\n",
" ('carriage', 'NN'),\n",
" ('were', 'VBD'),\n",
" ('immediately', 'RB'),\n",
" ('in', 'IN'),\n",
" ('view', 'NN'),\n",
" ('.', '.')]"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"tokens = nltk.word_tokenize(quote)\n",
"tagged = nltk.pos_tag(tokens)\n",
"\n",
"tagged"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAOsAAACzCAIAAADntXwYAAAJMmlDQ1BkZWZhdWx0X3JnYi5pY2MAAEiJlZVnUJNZF8fv8zzphUASQodQQ5EqJYCUEFoo0quoQOidUEVsiLgCK4qINEWQRQEXXJUia0UUC4uCAhZ0gywCyrpxFVFBWXDfGZ33HT+8/5l7z2/+c+bec8/5cAEgiINlwct7YlK6wNvJjhkYFMwE3yiMn5bC8fR0A9/VuxEArcR7ut/P+a4IEZFp/OW4uLxy+SmCdACg7GXWzEpPWeGjy0wPj//CZ1dYsFzgMt9Y4eh/eexLzr8s+pLj681dfhUKABwp+hsO/4b/c++KVDiC9NioyGymT3JUelaYIJKZttIJHpfL9BQkR8UmRH5T8P+V/B2lR2anr0RucsomQWx0TDrzfw41MjA0BF9n8cbrS48hRv9/z2dFX73kegDYcwAg+7564ZUAdO4CQPrRV09tua+UfAA67vAzBJn/eqiVDQ0IgALoQAYoAlWgCXSBETADlsAWOAAX4AF8QRDYAPggBiQCAcgCuWAHKABFYB84CKpALWgATaAVnAad4Dy4Aq6D2+AuGAaPgRBMgpdABN6BBQiCsBAZokEykBKkDulARhAbsoYcIDfIGwqCQqFoKAnKgHKhnVARVApVQXVQE/QLdA66At2EBqGH0Dg0A/0NfYQRmATTYQVYA9aH2TAHdoV94fVwNJwK58D58F64Aq6HT8Id8BX4NjwMC+GX8BwCECLCQJQRXYSNcBEPJBiJQgTIVqQQKUfqkVakG+lD7iFCZBb5gMKgaCgmShdliXJG+aH4qFTUVlQxqgp1AtWB6kXdQ42jRKjPaDJaHq2DtkDz0IHoaHQWugBdjm5Et6OvoYfRk+h3GAyGgWFhzDDOmCBMHGYzphhzGNOGuYwZxExg5rBYrAxWB2uF9cCGYdOxBdhK7EnsJewQdhL7HkfEKeGMcI64YFwSLg9XjmvGXcQN4aZwC3hxvDreAu+Bj8BvwpfgG/Dd+Dv4SfwCQYLAIlgRfAlxhB2ECkIr4RphjPCGSCSqEM2JXsRY4nZiBfEU8QZxnPiBRCVpk7ikEFIGaS/pOOky6SHpDZlM1iDbkoPJ6eS95CbyVfJT8nsxmpieGE8sQmybWLVYh9iQ2CsKnqJO4VA2UHIo5ZQzlDuUWXG8uIY4VzxMfKt4tfg58VHxOQmahKGEh0SiRLFEs8RNiWkqlqpBdaBGUPOpx6hXqRM0hKZK49L4tJ20Bto12iQdQ2fRefQ4ehH9Z/oAXSRJlTSW9JfMlqyWvCApZCAMDQaPkcAoYZxmjDA+SilIcaQipfZItUoNSc1Ly0nbSkdKF0q3SQ9Lf5RhyjjIxMvsl+mUeSKLktWW9ZLNkj0ie012Vo4uZynHlyuUOy33SB6W15b3lt8sf0y+X35OQVHBSSFFoVLhqsKsIkPRVjFOsUzxouKMEk3JWilWqUzpktILpiSTw0xgVjB7mSJleWVn5QzlOuUB5QUVloqfSp5Km8oTVYIqWzVKtUy1R1WkpqTmrpar1qL2SB2vzlaPUT+k3qc+r8HSCNDYrdGpMc2SZvFYOawW1pgmWdNGM1WzXvO+FkaLrRWvdVjrrjasbaIdo12tfUcH1jHVidU5rDO4Cr3KfFXSqvpVo7okXY5upm6L7rgeQ89NL0+vU++Vvpp+sP5+/T79zwYmBgkGDQaPDamGLoZ5ht2GfxtpG/GNqo3uryavdly9bXXX6tfGOsaRxkeMH5jQTNxNdpv0mHwyNTMVmLaazpipmYWa1ZiNsulsT3Yx+4Y52tzOfJv5efMPFqYW6RanLf6y1LWMt2y2nF7DWhO5pmHNhJWKVZhVnZXQmmkdan3UWmijbBNmU2/zzFbVNsK20XaKo8WJ45zkvLIzsBPYtdvNcy24W7iX7RF7J/tC+wEHqoOfQ5XDU0cVx2jHFkeRk4nTZqfLzmhnV+f9zqM8BR6f18
QTuZi5bHHpdSW5+rhWuT5z03YTuHW7w+4u7gfcx9aqr01a2+kBPHgeBzyeeLI8Uz1/9cJ4eXpVez33NvTO9e7zofls9Gn2eedr51vi+9hP0y/Dr8ef4h/i3+Q/H2AfUBogDNQP3BJ4O0g2KDaoKxgb7B/cGDy3zmHdwXWTISYhBSEj61nrs9ff3CC7IWHDhY2UjWEbz4SiQwNCm0MXwzzC6sPmwnnhNeEiPpd/iP8ywjaiLGIm0iqyNHIqyiqqNGo62ir6QPRMjE1MecxsLDe2KvZ1nHNcbdx8vEf88filhICEtkRcYmjiuSRqUnxSb7JicnbyYIpOSkGKMNUi9WCqSOAqaEyD0tandaXTlz/F/gzNjF0Z45nWmdWZ77P8s85kS2QnZfdv0t60Z9NUjmPOT5tRm/mbe3KVc3fkjm/hbKnbCm0N39qzTXVb/rbJ7U7bT+wg7Ijf8VueQV5p3tudATu78xXyt+dP7HLa1VIgViAoGN1tubv2B9QPsT8M7Fm9p3LP58KIwltFBkXlRYvF/OJbPxr+WPHj0t6ovQMlpiVH9mH2Je0b2W+z/0SpRGlO6cQB9wMdZcyywrK3BzcevFluXF57iHAo45Cwwq2iq1Ktcl/lYlVM1XC1XXVbjXzNnpr5wxGHh47YHmmtVagtqv14NPbogzqnuo56jfryY5hjmceeN/g39P3E/qmpUbaxqPHT8aTjwhPeJ3qbzJqamuWbS1rgloyWmZMhJ+/+bP9zV6tua10bo63oFDiVcerFL6G/jJx2Pd1zhn2m9az62Zp2WnthB9SxqUPUGdMp7ArqGjzncq6n27K7/Ve9X4+fVz5ffUHyQslFwsX8i0uXci7NXU65PHsl+spEz8aex1cDr97v9eoduOZ67cZ1x+tX+zh9l25Y3Th/0+LmuVvsW523TW939Jv0t/9m8lv7gOlAxx2zO113ze92D64ZvDhkM3Tlnv296/d5928Prx0eHPEbeTAaMip8EPFg+mHCw9ePMh8tPN4+hh4rfCL+pPyp/NP637V+bxOaCi+M24/3P/N59niCP/Hyj7Q/Fifzn5Ofl08pTTVNG02fn3Gcufti3YvJlykvF2YL/pT4s+aV5quzf9n+1S8KFE2+Frxe+rv4jcyb42+N3/bMec49fZf4bmG+8L3M+xMf2B/6PgZ8nFrIWsQuVnzS+tT92fXz2FLi0tI/QiyQvpTNDAsAAAAJcEhZcwAADdcAAA3XAUIom3gAAAAddEVYdFNvZnR3YXJlAEdQTCBHaG9zdHNjcmlwdCA5LjI2WJButwAAEQZJREFUeJztnT9s49i1xu9s0sQBAmkAb/GKeMgBUniaB9Ke7sEGRBeZbUW1M40oIEmZkOp2p6N2UgVJAHKLnSmXTJNinEJ3EU07JpNK7kRrWxsRBw9jL15S6BVn5y6XlChKIiVe6vwqmf/uNfXx8NxL6nz3ptMpQRBu+WjbHUCQtUAFI3yDCkb4BhWM8E3FFUwpVRTFMIztdkPTNEVRfN/fbjcqScUVrCgKpXTr0rFtW5blMAy3241KUnEFI5WnOgr2fV9VVfkDhmG4rsvWGoYByxVFicVCWKUoiiiKmqbF1rquK4qioiiyLGuaFk1I2KqFO/Z6vWL+aYSQaSUYjUaCIHiex/6UJEnXdfiTEGKaJny2LKvZbEb37ff77LNpmmxLQBCE0WgEnx3HaTQa7DjtdnsymSRXJde2221BEKINIXlREQXrum5ZVnSJ4zhMMZIkRVdFpQZ4ntf/ANM9IAiCZVlMxOwiEQSBCTTZh+RaSZJQwUXw423fA/LB9/2zs7PoElVV2ed6vZ6yo6qqoijKskw+zF1EN6CUWpbV7/fDMAzDsNvtwpZhGEabAB4+fAgfRFGMNRo7LJIXFVGwKIqrjfQ1TXNdF0RJCKGU9vt9thaOybLYIAgURVEUpV6vi6Louu68ayMIgtgSSmnsGkNyoSIjuVarZZpmVMSU0izTwGEYiqLIPluWFV1rmm
Z0CegVWmm1WrHjU0oppfBZVdXoWtu2k5pGcuHetCrvptm2bZomBEhKKcwABEFgGIbv+4qiuK4Lt37f92VZBrXBXqqqhmHINlMUxbZtQkiv13MchxACMxi+73c6HU3ToEXDMFjWQSkVRdG2bRaV2dogCOr1OvQqujuSC9VRMAC6lGU5JfeNAdKs1+ssl5i5AZmTy6a0GARBEASiKLIwj+RO1RSM7BoVyYORnQUVjPANKhjhG1TwbP45Hoe3t9vuBbKYijzRyAv34qI/HLoXFz/66KN/vX8vHRy0Hj9Wj47Ejz/edteQ2eBcBAlvb0G4f/E8WNI8Ovrvn//8f7/91vW8q5sbQoiwv68eHbUeP5YfPNhmX5EEu6vg4Pra9Tzn7dt/fPMNIaS2t6ceH589eqQcHtZ/+lO2mT8e08vL5Gbq8fHWuo5E2DkF++Ox8/ZtLLiePXqkPHqUvmNwfU0vL2OhGqQcVTyyYXZFwZAn0MtLEC4kuMrh4QpZQXh7C1J2Ly7e3d0RQhqHh2ePHmG6vBWqrGCW4NLLS5Ba8+joSBBylJp7ceFdXbGILh0cKIeHmC5vkgoqGBLc/nD49eUl+ZC5Hj14UOjtHpITenkJ6bKwv69AYMZ0uWCqo+CkhlSIuJvVEFw/3tUVpMubuX52Ge4VXNr7OOQw3njM0uXccxiEcKrgpDhKPpZKjiNLcplVAJ4UnLxBs1yTlxt0SVKdKsGBgmPPFKoxSJo53Ew+T0EWUl4F0+GwPxxW/rnuzGfaIOVyZkRlo1wKTj4s2Kl3a9h7RdH/fbXHLrtDKRQ8Lw5xlODmy8xH39W7/+TCNhU8790arhPcfMFTtJAtKBgDzArgbWoem1MwJnm5sONDhSSFKzi4vjZcFwfaRZCcrumcnhpPnmy7XxtlEzFY1HWYwcXJzoJgU+atx49RwQjCE/hbZYRvUMEcAz43GTcuia1T7qCCOWZegcOZFQpLYuuUO1gvgmPQYIasPJLTNA3K4kJ10bOzM8uywjCM1kOHArqwjaIovV4PAgbY+9y/f99xHFjS6/XmVT7dQWzbhqLF7LQkl8D5J4lTRyk1TRMKJLOF0VrzcPIh96jX6yll6LlhZQcOQggYn7TbbfBWGY1GUZugFI8gQggzXHEcJ2YuhDQaDTCSGY1G8MGyrJhFzXQ61XV9prtM0uqGQVJtnXhkrTwYypHX6/Vut0sSZhbgwwq1+WVZnkwmbJUkSewOqKpq9uHIjsDCpKqqpmkSQkajUS42HJIkscFc0gOPR4rKg9M9gmJ3rnfv3hXUDU45Ozvr9/tQ/B2kTCnNJevlPmdIUJSC0z2CkHQURYHQe3Z25nle1JwUiVHUbFq6RxCyEBgWq6ra6XQMw1jKjq5er0dnzSpuo7Ra+txutwkh7XZ7Op3qui5JEphd1mo1GHBYliUIgq7r7XYbDGIFQWi326PRqNFo1Go1NoZoNpskMrBDADh18FkQBMdx2CrLshqNRqPREARBkiT4zMxGp9Op53lw8uGraTabk8nE87zomZ9MJvBnyrCPCwp8L2KhRxBSHMx/aSlbJx7BN3sQvsGnygjfoIIRvkEFI3yDCkb4pnAF0+GQDodFt4IQQuhw2Hv9Ori+3nZHNkqxcxGG43z+t78RQhqHh/bTp/jrzoKgw6F5fv715eW9e/em02nj8LB1fKydnm67X5ugKAX747H28uU/vvmmeXT0X7XaHyit7e11P/lk136HWDT2YGCen1/d3PzsJz/5v//8539+8Qvp4MB+8+bd3V1tb087Oal8IY5CFNw7PzdfvyaE9FQVIgETNAbjXAhvb+03b6zB4OrmBn5k/+2///38r3/t//a3YMpkDwasPIp0cNA5Pa1qbZScFRze3movX/7F86SDA/dXv4opFZKK2t6e/ewZ1k1ajfD21nz9GqKssL/fffIEYoSo64SQ4PPPoxsH19fWYAAFJaBiVef0tGIhOU8F0+FQ/fOf393d6b/8Za/VmrlNNLuwnz
2rZFQoiOD62jw//+LNG0JI4/Cw++QJ88CzB4POq1fW06fzcl/34sJ5+7aSITk3BUN8Ffb37adP090FIYpgMM4OHQ6diwvQbvvkpHV8HDvDyosX/ngc/ulP6cdJhuTkobgjBwWvFlbpcKi9enV1c4PBOAU2yUAIaZ+cdJ88SQ4h/PH46PnzlPteEqhhB5cEpNHayQmnX8G6Ck4O2rLDgnGWyL1rsEkGmFLofvLJPIVpL19+8ebNqNdbdnwcHQ6SOdG9/Kyu4PRBW3ai2XPK97QjJCcZ0qNjeHt7/ze/aZ+c2M+erdxoNEvhLiSvqOAsg7bssIthl4PxvEmGdGD4wSbR1uxANCQ3j45ajx+Xf5SyioKzD9qWwr240F6+zOuq4IiUSYaFiLpe39vzP/ssx/7447E1GEB9YqhP3jk9Le0U/nIKLnouLJqZ2M+eVWzmMsnCSYZ0Fk6irQNUjbcGAzBAKG1IXkLB6wzalsIeDAzXrXYwzjLJsBD5s8/Cu7vYU4zcKXlIzqTgvAZt2Qmur7VXr76+vKxeMM4+yZAOHQ7Pfv/7jV3ksZBcnpeHFis430HbUkDUf3d3Z6oq768ELTvJsBCYRJv88Y8bnjSAxyLRl4e2G5IXKLigQVt2WDDm95Wg1SYZ0gmurx8axpqTaGtiDwbOxQUkQlsMyXMVXKoXGNgrQXy9n7nOJEM6cEK8Tz/den6VDMkbfp9ztoI3NmjLDl/vZ645ybCQ+q9/LT94QH/3uxyPuSbbep9zhoJ75+dd193YoG0pWDBe+BbLFmG/TFl5kiGdQifR1iT28pD/6aeFSyhZxmfy/r3+1VdFFgpaC+/qyvr737fdizS8qyv9q68m798X2kRxB88F5+3b9pdfbqAhrNmD8A3+2h7hm+8VTD9QtmKdS3lOISsA1V1t2952R1bhOwW7rmuapmEYrOx9eah89cUcWarMMAPsZEajUe792QDf1XBXVVVVVbAbMk0zDMPyiAY9p5AUfpAHO44DRcNLckPRNE1RFHCUiS4Hb0qIHDM32BaGYUCXRFFc2WcFLEjkDxiGEXUhmNcEOJX4vq9EWLYDcHAgmrmxw/q+77ouGHxERQKty7IsiqKqqrFEdOZa+HLhP1VV1bZt2GDpr5LNSnieB0XDJ5OJJEkbmAfJyEzPKVJKP68UA7KMjEYjQRBYQfbRaAQV8DM2sXJBdl3Xa7UaOxq0GzvtjUZDkqR2uz2ZTCaTCdvY8zxJkkajEeuhIAhgIpa+liwydMvC9wput9us1H2z2YxWtd8uMxUcu8ZqtdoGe5SG53n9D6xgraDrOnypDMdxYv9+ShPrKJiZHgD9fj8mpkajMfM/ajabsR5alsX0nbKWBdDoV7zsv/B9FuG6rmVZ7GZRcu+WEvp5+b4viqJhGKCt1Ty44SDRJaqqsvFZLk3MI3ZKFUVJzkrN9LSLWa0RQkRRZNZV6WvX57uRnG3bmqZFx0yyLJdqPFd+cjEgi7lKFtFERsB1OMuWsiyDOTFbEoYh62T62vX5Lgb3+/1OpxNdoSgK2pgtRS4GZK1WC+aC2BJKKYu1C5tYx4fLtu3ovoZhxCQxD/ALY39Cx9i+6WsXAmZCaRf29IMfVqPRYBkYWGiBo9NSSUmOzPOcKq2f1zwDstWO0263wUsLRk4Zm5jpw7WwRTiOruuNRqPZbMKf0TEirKrVauyLiLqDQcegP9CxLGsXGroBcJOp1WpsLBgD34vIkxwNyGAyK/k0Z2ETa/pw+b4Pd/ll92Xtznyqkr52YZcgDM9ciwpG+Abf7EH4BhWM8A0qGOEbVDDCN6hgpED88bjoJvhTsPLihfLixbZ7gSzGcJyj58+LboU/BSNIFFQwUhQPP/6YFJ9IoIKRohD39wkh4e1toa2gghG+QQUjfIMKRvgGFYzwDSoY4RtUMFIs4d1docdHBSNFASWTvaurQltBBSN8gwpG+AYVjPANKhjhG1QwwjeoYIRvUMFIgQj7+8HNTaFN/LjQox
eBfHCw7S4gWRH39+Edy+LAiicI32AWgfANKhjhm5IqOFk2GUFmUlIF51L+EdkFcCSH8E2eMZhZQxqGIYoiOEbFCsGn+1X1er2omVTMFGzmvllMndIbBXspsIvSNC1fc4rdJBdXsqwsLPC9FGDqxGrBg6lTtKJ3dr+qpFHPvH3JIlOn9EYFQWD1wR3HWdkOCGGs70qWnfyfaKiqqmkafIYYrGmaqqqwBIyS4KKUZXkpI5OUfaHFer3e7XZJwk9lYaMwcAS/vnm1wpHsrPMtL0v+Co5Vr4+KCdwqRVGEUdpSEw4r77twR0qpZVn9fj8MwzAMu90uDiLXYZ1veQXyV3DMVZRSyqLaOmZSK++bviNcXcyGLAgCSMHRhmxlNmkZRoqYTfN9nyXvlFJN0+DOTtbzq1p53/QdTdOMLgHhFjvyqDq5uJJlJ/8YrGnaw4cPIfEVRTEag+EGraoqONuAZV0YhlmMyOftyxqFgxiGAdMRvu+De3h6o/fv33ccBwbOsEG328VUeB3W+ZZXIOf5YJiKinqDxsjuV+W6rud50UOt7HWV3cEKHwTmQo6uZAvZtIIzEoahpmmdTgclhSwgx5k5XdfZYWOujsseIeYpiSDzwKfKCN+U9M0eBMkIKhjhG/4U7I/HG/B4QniBPwUbrmv88H03ZJfhT8EIEgUVjPANKhjhG1QwwjeoYIRvUMEI36CCEb5BBSN8gwpG+AYVjPANKhjhG1QwwjeoYIRvUMEI36CCEb5BBSN8gwpG+IY/N67W8fG2u4CUCPy1PcI3mEUgfIMKRvimLAqGOslZPCwURaGUbqBLCBeURcGgy1j17JnIsozlqREGf3MR6xfGRKpEWWIwA4ycWEnq6Cow3gKXkdhe6Ki1u2y7eOYPIISwoquWZUUdtRi6rkfNngB01NpZyhWDJUli4XNZJz1KaRAEhBBVVTHT2B3KpeCVh2iU0tFoBKaisiyDlJFdgL+RXBJ01NplyhWDVwMdtXaZssRgMM8CO0gwb1JVFbyc4PmFbduO4xBCgiCglIJMe72eLMvoqLXLVOfNHnTU2k2qo2BkN6lCHozsMqhghG9QwQjfoIIRvkEFI3yDCkb4BhWM8M3/A7r8m2WLL2CWAAAAAElFTkSuQmCC",
"text/plain": [
"Tree('chased', [Tree('man', ['A', Tree('in', [Tree('pajamas', ['his'])])]), Tree('with', ['a', 'cat', Tree('broom.', ['a'])])])"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"quote = \"A man in his pajamas chased a cat with a broom.\"\n",
"mp.parse_one(quote.split()).tree()\n",
"\n",
"# Does the cat have a broom?"
]
},
{
"cell_type": "code",
"execution_count": 20,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAQMAAACzCAIAAAACDu5dAAAJMmlDQ1BkZWZhdWx0X3JnYi5pY2MAAEiJlZVnUJNZF8fv8zzphUASQodQQ5EqJYCUEFoo0quoQOidUEVsiLgCK4qINEWQRQEXXJUia0UUC4uCAhZ0gywCyrpxFVFBWXDfGZ33HT+8/5l7z2/+c+bec8/5cAEgiINlwct7YlK6wNvJjhkYFMwE3yiMn5bC8fR0A9/VuxEArcR7ut/P+a4IEZFp/OW4uLxy+SmCdACg7GXWzEpPWeGjy0wPj//CZ1dYsFzgMt9Y4eh/eexLzr8s+pLj681dfhUKABwp+hsO/4b/c++KVDiC9NioyGymT3JUelaYIJKZttIJHpfL9BQkR8UmRH5T8P+V/B2lR2anr0RucsomQWx0TDrzfw41MjA0BF9n8cbrS48hRv9/z2dFX73kegDYcwAg+7564ZUAdO4CQPrRV09tua+UfAA67vAzBJn/eqiVDQ0IgALoQAYoAlWgCXSBETADlsAWOAAX4AF8QRDYAPggBiQCAcgCuWAHKABFYB84CKpALWgATaAVnAad4Dy4Aq6D2+AuGAaPgRBMgpdABN6BBQiCsBAZokEykBKkDulARhAbsoYcIDfIGwqCQqFoKAnKgHKhnVARVApVQXVQE/QLdA66At2EBqGH0Dg0A/0NfYQRmATTYQVYA9aH2TAHdoV94fVwNJwK58D58F64Aq6HT8Id8BX4NjwMC+GX8BwCECLCQJQRXYSNcBEPJBiJQgTIVqQQKUfqkVakG+lD7iFCZBb5gMKgaCgmShdliXJG+aH4qFTUVlQxqgp1AtWB6kXdQ42jRKjPaDJaHq2DtkDz0IHoaHQWugBdjm5Et6OvoYfRk+h3GAyGgWFhzDDOmCBMHGYzphhzGNOGuYwZxExg5rBYrAxWB2uF9cCGYdOxBdhK7EnsJewQdhL7HkfEKeGMcI64YFwSLg9XjmvGXcQN4aZwC3hxvDreAu+Bj8BvwpfgG/Dd+Dv4SfwCQYLAIlgRfAlxhB2ECkIr4RphjPCGSCSqEM2JXsRY4nZiBfEU8QZxnPiBRCVpk7ikEFIGaS/pOOky6SHpDZlM1iDbkoPJ6eS95CbyVfJT8nsxmpieGE8sQmybWLVYh9iQ2CsKnqJO4VA2UHIo5ZQzlDuUWXG8uIY4VzxMfKt4tfg58VHxOQmahKGEh0SiRLFEs8RNiWkqlqpBdaBGUPOpx6hXqRM0hKZK49L4tJ20Bto12iQdQ2fRefQ4ehH9Z/oAXSRJlTSW9JfMlqyWvCApZCAMDQaPkcAoYZxmjDA+SilIcaQipfZItUoNSc1Ly0nbSkdKF0q3SQ9Lf5RhyjjIxMvsl+mUeSKLktWW9ZLNkj0ie012Vo4uZynHlyuUOy33SB6W15b3lt8sf0y+X35OQVHBSSFFoVLhqsKsIkPRVjFOsUzxouKMEk3JWilWqUzpktILpiSTw0xgVjB7mSJleWVn5QzlOuUB5QUVloqfSp5Km8oTVYIqWzVKtUy1R1WkpqTmrpar1qL2SB2vzlaPUT+k3qc+r8HSCNDYrdGpMc2SZvFYOawW1pgmWdNGM1WzXvO+FkaLrRWvdVjrrjasbaIdo12tfUcH1jHVidU5rDO4Cr3KfFXSqvpVo7okXY5upm6L7rgeQ89NL0+vU++Vvpp+sP5+/T79zwYmBgkGDQaPDamGLoZ5ht2GfxtpG/GNqo3uryavdly9bXXX6tfGOsaRxkeMH5jQTNxNdpv0mHwyNTMVmLaazpipmYWa1ZiNsulsT3Yx+4Y52tzOfJv5efMPFqYW6RanLf6y1LWMt2y2nF7DWhO5pmHNhJWKVZhVnZXQmmkdan3UWmijbBNmU2/zzFbVNsK20XaKo8WJ45zkvLIzsBPYtdvNcy24W7iX7RF7J/tC+wEHqoOfQ5XDU0cVx2jHFkeRk4nTZqfLzmhnV+f9zqM8BR6f18
QTuZi5bHHpdSW5+rhWuT5z03YTuHW7w+4u7gfcx9aqr01a2+kBPHgeBzyeeLI8Uz1/9cJ4eXpVez33NvTO9e7zofls9Gn2eedr51vi+9hP0y/Dr8ef4h/i3+Q/H2AfUBogDNQP3BJ4O0g2KDaoKxgb7B/cGDy3zmHdwXWTISYhBSEj61nrs9ff3CC7IWHDhY2UjWEbz4SiQwNCm0MXwzzC6sPmwnnhNeEiPpd/iP8ywjaiLGIm0iqyNHIqyiqqNGo62ir6QPRMjE1MecxsLDe2KvZ1nHNcbdx8vEf88filhICEtkRcYmjiuSRqUnxSb7JicnbyYIpOSkGKMNUi9WCqSOAqaEyD0tandaXTlz/F/gzNjF0Z45nWmdWZ77P8s85kS2QnZfdv0t60Z9NUjmPOT5tRm/mbe3KVc3fkjm/hbKnbCm0N39qzTXVb/rbJ7U7bT+wg7Ijf8VueQV5p3tudATu78xXyt+dP7HLa1VIgViAoGN1tubv2B9QPsT8M7Fm9p3LP58KIwltFBkXlRYvF/OJbPxr+WPHj0t6ovQMlpiVH9mH2Je0b2W+z/0SpRGlO6cQB9wMdZcyywrK3BzcevFluXF57iHAo45Cwwq2iq1Ktcl/lYlVM1XC1XXVbjXzNnpr5wxGHh47YHmmtVagtqv14NPbogzqnuo56jfryY5hjmceeN/g39P3E/qmpUbaxqPHT8aTjwhPeJ3qbzJqamuWbS1rgloyWmZMhJ+/+bP9zV6tua10bo63oFDiVcerFL6G/jJx2Pd1zhn2m9az62Zp2WnthB9SxqUPUGdMp7ArqGjzncq6n27K7/Ve9X4+fVz5ffUHyQslFwsX8i0uXci7NXU65PHsl+spEz8aex1cDr97v9eoduOZ67cZ1x+tX+zh9l25Y3Th/0+LmuVvsW523TW939Jv0t/9m8lv7gOlAxx2zO113ze92D64ZvDhkM3Tlnv296/d5928Prx0eHPEbeTAaMip8EPFg+mHCw9ePMh8tPN4+hh4rfCL+pPyp/NP637V+bxOaCi+M24/3P/N59niCP/Hyj7Q/Fifzn5Ofl08pTTVNG02fn3Gcufti3YvJlykvF2YL/pT4s+aV5quzf9n+1S8KFE2+Frxe+rv4jcyb42+N3/bMec49fZf4bmG+8L3M+xMf2B/6PgZ8nFrIWsQuVnzS+tT92fXz2FLi0tI/QiyQvpTNDAsAAAAJcEhZcwAADdcAAA3XAUIom3gAAAAddEVYdFNvZnR3YXJlAEdQTCBHaG9zdHNjcmlwdCA5LjI2WJButwAAD7JJREFUeJztnT9s22Yaxt+0d0CQ4g5SAHvpIJPenBsK0g5uSwHRQ5ebRM8pcKKHrAXpMaPUdDwEoJZ2uoG86YZ2EA/XWw5FQraTXRSoGHm1ATM4wEXRRTe8yVeWkiiKEkVKen4TzX/fK4qPvvf9SH/PndFoRABsPe+UHQAAlQBKAIAISgCAgRIAIFp3JWia5nlexp09z9M0zbKsQkMCa8p6K0FV1Xq9Pr5e07SJKz3PC4Kg+LjA+vG7sgNYiG63W3YIYEOoYp/Q6/U0TdM0Tfx+j68xDCOxhuEUKAgCLUYURfF9LMtSVVVV1fFNYHsZVZJms3lzczMajQaDAS/Ytm2aZmI30zT7/f7Ew6edmYg6nQ4v27bdarWWFjRYZ6rYJxCRqqpcCuu63ul0iGgwGBwfHy9+ZkVRRNFsGAb6BMBUVAnHx8e+7wdBIMsyS4LTnsXPPLHCBqCiFbOmadwVsCRc1y07IrDhVFQJRBRFkeu6QRCoqqrruq7r2Y+t1+t8IP8ZhqEsy8WECTaE6iqBB3bq9Trf0IeHh2JTr9dzHIeIwjD0PI8Tnm63K279s7MzIR7P82RZ7vV6YRhalhUEga7rrutGUaTrOo8yZX88BzaVO6MNfSs7iiIeYJ329A2AOBurBADmoqJjRwCsGCgBACIoAQBmo5QQ3d7++/vvo9vbsgMB60d1R1GzE15dub
7/z++++++PP/7x7t3//fyz0mioe3v7u7tqo6E9eFB2gGANWOOxI+/8vH9+7vr+q+trInrnzp3fv/tu8+DgT++/H1xeBsPh659+4j2bBwdqo7G/u6vu7al7e2UGDarKmikhur11X770h0P35Uu+0ZVG4w937/7nhx+URqP3+HH8Rg+Gw2A4HFxdBZeX/7q4EOtZGIeSpDYa8u7u6j8FqCDroQTOf/rn53xD1+7d0w4Ojh88OJKkv37++beXl+1Hj7q6Xn/vvZSTBMOhd3ExuLoKhsNvLy95JZ9K3tk5fvBA3dtLPwPYYCqthET+I+3s6IeHh5KkHx0RkfvypfHFF0TU1XXjww/znTy8vg4uL/n83IR2cIACYwupnBIm5j8nDx9qBwfxzMdynE+/+mo8I8rdqHdx4b96lSgwlEbjjTBQYGw6VVHCtPxHPzpKZCzh1ZX+/HnGjCh3MG/yKBQYW0PJSkjPf8ZZMCPKB1fe/nCYKDDUvT210UCBsRmUoISM+c84y82IcuOdnweXl5xKxQsM0V2gwFhHVqeE7PnPxGOLzojyEd3eBsNh//x8vMDgR3sz5Q0qQuFKmDf/GaeUjCgf4dWV6C7GCwwWBgqMalKIEnLnP+NUJCPKh3i0511cjBcYh5KkHRxUp3/bcpaphEXyn4lnq2ZGlBsuMFgYiQKDH+2hwCiRJShh8fxnnDXKiPIhCozw+tq7uBgvMFB5r5icSlhi/jPOWmdE+YgXGHh3sBTmU8Jy85+J59+wjCgfE98djBcYeLS3dDIpoYj8Z5yNz4hyIwqM+KO9eIGBR3uLM1UJheY/42xhRpSPeIGBdweXyAQleOfnnS+/LCj/mYj69CkyonykvzvYPTkpN7w1YoISguFQf/68iPxnGpbj7O/uIiNanPi7g9HtbfD0adkRrQ1VeRcVgHLZqLktAMjNr0rw3hKGYYkBgQQVsQxlO68N9mt8kx25rmvbdhRFYRjqut7r9coODPyGKkzobVnW8fHxUvxcKsibPkHXdc/zTk5Out2u53nwXALbxm9m/nIch2XQ6/UW7I4NwwjDsF6vs4vH8fEx9zmu67LLgWVZbH0QhqGmad1uV8ztrmmaqqr37993HGfcG2FTCYKg0+mI1FTTtMPDw7h/Cl8xIqrX667risuVciWJyHVdy7JkWY6iiCfQj1v3iq0zjz3Z+AFZ4T3o+3673R6NRjc3N4qiLG5mSES2bY9Go3a7zWaYg8FAeF3GPTM7nY7wwxTHCqdNx3E23iFzMBhIkuT7vvhTUZS41yhNtwxNv5KSJA0GA152HCfuSmrbdrvdZmvTmVvb7bYkSROdTjeDX5XQbrcdx+HlVqslvpX8p34rs7hXbPxa+77ff0vCYTYhxVqttmAwFcc0Tf7VEDiOE7/tEhckYbObciUlSbJtW4gh/rVKkiRu9PEwxrcqirLBSvg1O3JdNwxD27aJiBeKq5vZ4kmWZc55xn01Ey44r1+/LiiSihAEQcJjN+ErN80WaOaV9DzPtu1+vx9FURRFZ2dnIs9kf63ECff393lBluVEo5taKzNvlNDr9QzDiGeQqqqyzVkRrRqGIQoGIvI8r9/vF9HQusC5eI4D068kn1N8rVwMaJrGX6ssy/F6I8H4YLrneUuxxK4mb8aO+v3+6elpfIOmacV5v0ZRJMwwoyjijmibOTk56XQ6cTF4npdl0CL9SnY6nfgavulFKycnJ4km+IESL+u6Ht/Klo1zfag1YzQatVotImo2myJHbLfbiqJIkpRIOrPTbreJiEtw0zQVReEMtVarcTLKJ+eGTNOUJIl3HgwGzWazVquJopDDyx3JusDXpN1u8+US1arv+/ELcnNzw39yqZByJUejUafTURSF1/MOiWqE2zJNkxdarVa8NhBbW62WCCxxho2htPeO2BtTmMwChn+S5/ILnXklhQ3ptEQ/pdEwDHkcfOMNrfEGHgBEeAMPAAZKAIAISgCAgRIAINoM702QgGdj+OmXX/
7ywQeYDCYjGDvaHFgA/fPzf/i+WMn/2n/y8CFmDEkHSlh7EgKo3bunHx39/Ztv/izL6t6emJyYZ6mCJKYBJawrEwXA8/GEV1f7lmV+9BHP8sIzFzovXrAk4nuW/BmqBJSwZqQIQOzjvnx58vx5/5NPElOATTz2cG+v0Mms1gUoYT1I/K6npzo8oeDN3/427f4en+CwdXhY9PxuFQdKqDRzCUCgPXsWXl+Hn36apQnuJRJzfuqHh9s26AQlVJF8AhDUnzzRDg7cJ0/majQYDp0XL8Q80Ns26AQlVIgFBSBOEi+Xc8CS2LZBJyihfJYiAMG0cnnxwDZ70AlKKI3lCkAws1zOwTYMOkEJq6YgAQjmKpfnZYMHnaCEFREMh97FhRBAcfVovnI5Bxs26AQlFMv4gEyht8vi5XIONmPQCUoohBULQLDEcjkHaz3oBCUsk7IEICiiXM7BOg46QQlLoHQBCAotl3OwRoNOUEJ+qiMAwcrK5Xmp/qATlDA3FRQAU0q5nINqDjpBCfMhm2bVBCDwzs+PP/usrHI5B4nflPajR73Hj8sKBkqYDzbMrU6fniAYDuWdnWrGlgJLolwnYigBACLM8gIAsy1KsCxL0zR4ilaKKhiKCrZFCexZOBgMyg6kHKpphzPXlOBFg5m/QGnEPZxKZ1v6BIFlWepbRNccBAHbLgVB4Lou2wXEUyn2L1NVVZZlXdcT7jLTtrKvva7rqqqy3zvvk8/pni3VRPCWZcVNj/hzaZomy7JhGMI4h2MTH5Ap3W+brwwHFl+vaZplWdyBT9yhQFboWlIypmnWajVh0spOr3EzyWazKcxsbm5uxJ6+7yuKIuwr+/1+3JcyfSulWvFmZ6ZNbboXbcKrsyLETVkFVJIB8XYpQdguMf1+P36hm83mRA+rVquV+MJs2xa3WvpWmmXFmz34dJvaUaoX7RopoSwD4u3KjsZtVRN5zkRvyXFrV1mWhcVl+tZlEQRBwt9J13XRLm+1LItlkMWqsLKUZUC81RVzGIZZxi5UVWWvMbEmiiJhapa+dVmk29TC1XdxtqtP6PV68QrMsqyE9+5ETk9P47+ybPYqDkzfuizSbWpnuvrW6/X4B99wP9l8rCYJKx22ZzVNs9lstlot/lNk87y+VqspitJsNpvNpuM48cNt2457uWbcmm7FO+9HmGZTO5rlRTsajXzf5x0mus2uGNu2+SJLkiQuuO/75RoQb+N7R0EQcAIz12OddC/XmU6vy2KaY2x2L9pKPc+qDtuoBADG2a46AYBpQAkAEEEJADBQAgBEUMK8hFdX4dVV2VGA5QMlzMe+Zdlff112FFO58/HHluOUHUVOtGfPtGfPymodSgCACEoAgIESACCCEgBgoAQAiKCEeVEajeDysuwowPKBEuZj7SZaBBmBEgAgghIAYKAEAIigBAAYKAEAIihhXur37oXX12VHAZYPlDAf8s7OKyhhE4ESACCCEgBgoAQAiLZ8XtR8SDs7ZYcwlebBwX5lXHHnRW00SmwdM38BQITsCAAGSgCACEoARTPutFJNoARQLCnTd1cKVMwAEKFPyM40m9eKsNzwLMvSNK3X61mWJcsynzZuejuzxW63G/e9jVv6Tjs2i2lveqPsIMyOwIZhzOc3twK3ks0g3ea1dJYeHpv2CsNP9r2Nmwllb3HcC3TasTTLtDe9UUmShB2w4zhzOY7iyVpW2CWbf4RUVa2apV8R4em6bhgGL3OfYBiGruuLt5hyLLdYr9fPzs5ozGpxZqNcoLNFfMKtNB0oIRNBEPCV5eKvauMhBYWXMKGK35SLtJj72JkHep5n23a/34+iKIqis7Oz7MU6lJCJitu8FhRePEHn04pf2UVazH1s+oGs0m63y3+GYcglSkZTOVTMmZhp81ouBYUXBIGoSj3PMwyDM5YFW8x9bPqBnU4nvoYFkCip2ZRxork1+oRMcD+r6zo7WGqa5rpuFEWJIZGyKCg8wzD29/e5MJBlOd4nLNLitG
NFo3wSy7J4+CgIAsuyut1ueqP37993HIdHlniHs7OzRKkQRdHr1695IdFX4HlCVmbavJbL0sPjIUiRbCzSouu6vu/HT5U72uxmu9NqD9EtJNZDCWAyM5WQkSiKDMM4PT2t1BjDBLIPuILtwTRNcYfEnyHkOIMkSVV79jIR9AkAEGHsCAAGSgCACEoA1SEYDoPhsKzWoQRQFSzXtX77uusqgRIAIIISAGCgBACIoAQAGCgBACIoAQAGSgCACEoAgIESACCCEgBgoAQAiKAEABgoAQAiKAEABkoAgAhKAICBEgAgwhx4oDqcHB2V2DpmeQGACNkRAAyUAAARlACKhv0+ZlqeaZrmed5qQpoIlACKhW/xhCnJOKqqZrT8KAiMHYFKsPik3AuCPgGsCDaQFU4fYj2bz7KV4PhRCxnLzkXZk3WDrYCIxNzxtm3HjWUZ0zTjDrOCRYxl5wJ9AlgFiqKIn/N5jdM9zwvDkIh0XS8uiYISwCrIXQ17njcYDCzL4gSJJVEEqJhBdVnQWHYu0CeA6pLFWHZZoE8AxcIeskEQ6LrOprG6rrOHrOd5vV7PcRwiCsPQ8zy+17vdLltrZjGWXRZ4Aw9UnZnGsksBSgCACHUCAAyUAAARlAAAAyUAQAQlAMBACQAQQQkAMP8HPnF/iq0DgxoAAAAASUVORK5CYII=",
"text/plain": [
"Tree('with', ['A', 'man', Tree('chased', [Tree('broom', ['a']), Tree('cat', ['a']), Tree('in', [Tree('pajamas.', ['his'])])])])"
]
},
"execution_count": 20,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"quote = \"A man with a broom chased a cat in his pajamas.\"\n",
"mp.parse_one(quote.split()).tree()\n",
"\n",
"# Cats don't wear pajamas."
]
},
{
"cell_type": "code",
"execution_count": 21,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAQ8AAACzCAIAAAAYMg7TAAAJMmlDQ1BkZWZhdWx0X3JnYi5pY2MAAEiJlZVnUJNZF8fv8zzphUASQodQQ5EqJYCUEFoo0quoQOidUEVsiLgCK4qINEWQRQEXXJUia0UUC4uCAhZ0gywCyrpxFVFBWXDfGZ33HT+8/5l7z2/+c+bec8/5cAEgiINlwct7YlK6wNvJjhkYFMwE3yiMn5bC8fR0A9/VuxEArcR7ut/P+a4IEZFp/OW4uLxy+SmCdACg7GXWzEpPWeGjy0wPj//CZ1dYsFzgMt9Y4eh/eexLzr8s+pLj681dfhUKABwp+hsO/4b/c++KVDiC9NioyGymT3JUelaYIJKZttIJHpfL9BQkR8UmRH5T8P+V/B2lR2anr0RucsomQWx0TDrzfw41MjA0BF9n8cbrS48hRv9/z2dFX73kegDYcwAg+7564ZUAdO4CQPrRV09tua+UfAA67vAzBJn/eqiVDQ0IgALoQAYoAlWgCXSBETADlsAWOAAX4AF8QRDYAPggBiQCAcgCuWAHKABFYB84CKpALWgATaAVnAad4Dy4Aq6D2+AuGAaPgRBMgpdABN6BBQiCsBAZokEykBKkDulARhAbsoYcIDfIGwqCQqFoKAnKgHKhnVARVApVQXVQE/QLdA66At2EBqGH0Dg0A/0NfYQRmATTYQVYA9aH2TAHdoV94fVwNJwK58D58F64Aq6HT8Id8BX4NjwMC+GX8BwCECLCQJQRXYSNcBEPJBiJQgTIVqQQKUfqkVakG+lD7iFCZBb5gMKgaCgmShdliXJG+aH4qFTUVlQxqgp1AtWB6kXdQ42jRKjPaDJaHq2DtkDz0IHoaHQWugBdjm5Et6OvoYfRk+h3GAyGgWFhzDDOmCBMHGYzphhzGNOGuYwZxExg5rBYrAxWB2uF9cCGYdOxBdhK7EnsJewQdhL7HkfEKeGMcI64YFwSLg9XjmvGXcQN4aZwC3hxvDreAu+Bj8BvwpfgG/Dd+Dv4SfwCQYLAIlgRfAlxhB2ECkIr4RphjPCGSCSqEM2JXsRY4nZiBfEU8QZxnPiBRCVpk7ikEFIGaS/pOOky6SHpDZlM1iDbkoPJ6eS95CbyVfJT8nsxmpieGE8sQmybWLVYh9iQ2CsKnqJO4VA2UHIo5ZQzlDuUWXG8uIY4VzxMfKt4tfg58VHxOQmahKGEh0SiRLFEs8RNiWkqlqpBdaBGUPOpx6hXqRM0hKZK49L4tJ20Bto12iQdQ2fRefQ4ehH9Z/oAXSRJlTSW9JfMlqyWvCApZCAMDQaPkcAoYZxmjDA+SilIcaQipfZItUoNSc1Ly0nbSkdKF0q3SQ9Lf5RhyjjIxMvsl+mUeSKLktWW9ZLNkj0ie012Vo4uZynHlyuUOy33SB6W15b3lt8sf0y+X35OQVHBSSFFoVLhqsKsIkPRVjFOsUzxouKMEk3JWilWqUzpktILpiSTw0xgVjB7mSJleWVn5QzlOuUB5QUVloqfSp5Km8oTVYIqWzVKtUy1R1WkpqTmrpar1qL2SB2vzlaPUT+k3qc+r8HSCNDYrdGpMc2SZvFYOawW1pgmWdNGM1WzXvO+FkaLrRWvdVjrrjasbaIdo12tfUcH1jHVidU5rDO4Cr3KfFXSqvpVo7okXY5upm6L7rgeQ89NL0+vU++Vvpp+sP5+/T79zwYmBgkGDQaPDamGLoZ5ht2GfxtpG/GNqo3uryavdly9bXXX6tfGOsaRxkeMH5jQTNxNdpv0mHwyNTMVmLaazpipmYWa1ZiNsulsT3Yx+4Y52tzOfJv5efMPFqYW6RanLf6y1LWMt2y2nF7DWhO5pmHNhJWKVZhVnZXQmmkdan3UWmijbBNmU2/zzFbVNsK20XaKo8WJ45zkvLIzsBPYtdvNcy24W7iX7RF7J/tC+wEHqoOfQ5XDU0cVx2jHFkeRk4nTZqfLzmhnV+f9zqM8BR6f18
QTuZi5bHHpdSW5+rhWuT5z03YTuHW7w+4u7gfcx9aqr01a2+kBPHgeBzyeeLI8Uz1/9cJ4eXpVez33NvTO9e7zofls9Gn2eedr51vi+9hP0y/Dr8ef4h/i3+Q/H2AfUBogDNQP3BJ4O0g2KDaoKxgb7B/cGDy3zmHdwXWTISYhBSEj61nrs9ff3CC7IWHDhY2UjWEbz4SiQwNCm0MXwzzC6sPmwnnhNeEiPpd/iP8ywjaiLGIm0iqyNHIqyiqqNGo62ir6QPRMjE1MecxsLDe2KvZ1nHNcbdx8vEf88filhICEtkRcYmjiuSRqUnxSb7JicnbyYIpOSkGKMNUi9WCqSOAqaEyD0tandaXTlz/F/gzNjF0Z45nWmdWZ77P8s85kS2QnZfdv0t60Z9NUjmPOT5tRm/mbe3KVc3fkjm/hbKnbCm0N39qzTXVb/rbJ7U7bT+wg7Ijf8VueQV5p3tudATu78xXyt+dP7HLa1VIgViAoGN1tubv2B9QPsT8M7Fm9p3LP58KIwltFBkXlRYvF/OJbPxr+WPHj0t6ovQMlpiVH9mH2Je0b2W+z/0SpRGlO6cQB9wMdZcyywrK3BzcevFluXF57iHAo45Cwwq2iq1Ktcl/lYlVM1XC1XXVbjXzNnpr5wxGHh47YHmmtVagtqv14NPbogzqnuo56jfryY5hjmceeN/g39P3E/qmpUbaxqPHT8aTjwhPeJ3qbzJqamuWbS1rgloyWmZMhJ+/+bP9zV6tua10bo63oFDiVcerFL6G/jJx2Pd1zhn2m9az62Zp2WnthB9SxqUPUGdMp7ArqGjzncq6n27K7/Ve9X4+fVz5ffUHyQslFwsX8i0uXci7NXU65PHsl+spEz8aex1cDr97v9eoduOZ67cZ1x+tX+zh9l25Y3Th/0+LmuVvsW523TW939Jv0t/9m8lv7gOlAxx2zO113ze92D64ZvDhkM3Tlnv296/d5928Prx0eHPEbeTAaMip8EPFg+mHCw9ePMh8tPN4+hh4rfCL+pPyp/NP637V+bxOaCi+M24/3P/N59niCP/Hyj7Q/Fifzn5Ofl08pTTVNG02fn3Gcufti3YvJlykvF2YL/pT4s+aV5quzf9n+1S8KFE2+Frxe+rv4jcyb42+N3/bMec49fZf4bmG+8L3M+xMf2B/6PgZ8nFrIWsQuVnzS+tT92fXz2FLi0tI/QiyQvpTNDAsAAAAJcEhZcwAADdcAAA3XAUIom3gAAAAddEVYdFNvZnR3YXJlAEdQTCBHaG9zdHNjcmlwdCA5LjI2WJButwAAELtJREFUeJzt3T9s48i9B/DxwyEJvAhgLeBFOps0AgRyE5DabXcBUcUFrzTd3qYQDeTSrqgum07ypkxDprjdltz6LoAYwNeuySsCSHkNabkK4AXEBQIdkocAfsXvPOGjZHpE/aEofT+VLIriUOJXwxnR+u3c3t4yABDwX0U3AKA0kBYAUUgLgCikBUBUudPieZ6maaZpFtsMwzA0TQuCoNhmwLKVOy2apnmeV/hhatu2qqpxHBfbDFi2cqcFYJXKkZYgCHRdV++Ypum6bvIBpmnSIk3TUp/xtEjTNFmWDcNILXVdV5ZlTdNUVTUMI3lSxxc9uGK3213CTsP6uV17YRhKkuT7Pv9TUZRWq8UfwBjrdDp027Ksk5OT5Oq9Xo/f7nQ6/JFEkqQwDOm24zj1ep0/T7PZHI1Gk4smlzabTUmSkhuCjVSCtLRaLcuykvc4jpM8NBVFSS5NHtbE9/3enWTMbm9vJUmyLIsHhmdSkiQehslmTC5VFAVp2XifFd23PSwIgkajkbxH1/Xkn5VKJWNdXddlWVZVld3NoSUf4HmeZVm9Xi+O4ziO2+02PTKO49RWGGNHR0d0Q5bl1EZTTwsbqQRpkWU593STYRiu61IAGGOe5/V6Pb6UnpaPOqIo0jRN07RKpSLLsuu69+UwiqLUPZ7npSINm6cEo/zT09NOp5MMjOd5gt+xxHEsyz
K/bVlWcmmn00neQ9mgDZ2enqY24Xme53l0W9f15FLbtifzA5tn57YM1yDbtt3pdOhT3/M8moaqVCpBEJimGQSBpmmu69LpUxAEqqrSkU0r6roexzF/mKZptm0zxrrdruM4jDGaSQuC4OzszDAM2qhpmvzMzfM8WZZt2+a9DV8aRVGlUqGGJVeHzVOOtBAKgKqqGQOVSRSDSqXCz8emPoDdM/bI2GgURVEUybLMuy/YbGVKC0CxSjBuAVgTSAuAKKQFQNQ2piUejy/+9rd4PC66IVAyJfh2clGimxvX9/2rq/e+/9Mf//gf//qXtL+vVau1w0P18FA9PCy6gbDuNn9OzL289K+uXN+/+viRMfbTn/zkH//85zNJevGLXwTX138ZDPgj69WqenDQOD5WDw8rjx4V12RYU5uZlujmxhsMev2+Nxh8+v57xphycPDfv/yl8+HD//z9783nz+2XL/mDg+HQGwzCmxtvMKBEMcbQ7cCkjUpLMBw6Hz54g8F319eMsb3dXf3p09rhof70KWNMe/Pmu+tr64svjBcv7nuGeDz2BgP/6grdDkwqfVri8di9vPSHQ/fykncjWrV6+uwZ7xPi8VgkKpPQ7UBSWdMy2Y1o1Wrj+FirVuUnT1KPNN6+zRGVFHQ7UKa00PFKoxH6pJf29/VarXF8rB0fT10lGA61N28YY11dnycqU58Z3c62KUFaaOa31+/zT/STWq0mSXqtlupGUnhUvFevlnrsotvZEuubltTML31sN46Pacj+oJVFZeqm0e1spPVKC5/5fe/7dE/9bjQy0xFmX1yYrsuKiEoKup1NshZp8fp9Go1MzvzmOJLsi4uzd++UgwP75ct1+xRHt1NqhaVFZOY3Bx4V79WrNf/MRrdTOqtOy30zv/m6kZQSRWUSup31t4q08JnfVDeSMfObg/H27Z++/bakUUlBt7OelpgW+rDMMfObA0Wl+fx5V9c37zBCt7MmFp+WyZlfnUIiNvObA49K8lrJTYVup0CLSUvyX0fonnwzv7OKx2PTdbcnKpPQ7azSXGmZOvNLIVnBxxu/VnJro5KCbmfZ8qQlurkxXTf5ryPzz/zmoL5+Pf+1khsso9vZyNHdCuTsW+RWi/r6hcz85tP9+uvK7i6iIiLV7dx+9VXRLSqltfguH6AUtvE3XwDyQVo2H9WyLboVm2DT0oKqQ5Nm/Z11uM8W/Z7Y1kIR2UX5zyjfMAwqRUJVFhqNhmVZcRwna2tR0RJ6jKZpVESFMUalfR8/fuw4Dt3T7XbvqwAhIgiCTqfDSwhpmlar1Xhpu6nN8Dyv0+lQ8Rb+PBn1vbYBvads4u1Y+Pu1LZJFKBljVIi02WxSrdMwDJMlgjPqAzPGeAFUx3FShYVn8mAR44xmTJZohVarNVlBdoHv1/ZIn4lRaatKpdJut9lEzUdN04IgoHtUVU3WcFQUhff4uq7PUyLLsixeLZXa0G63k11ERjNA0ALfr+0xw7gluz5w6oTn06dPuduUXcT4wTLFIGKB79f2mCEt2fWBFyi7iPHKmgGQMsMMcnZ94AXKLmKc3Qwq3cr/RKlhWCQ+gmk2m4yxZrN5e3vbarUURaFx9t7eHg0HLcuSJKnVajWbTRp2S5LUbDbDMKzX63t7e3ykeHJywhKDyBxoW81mk1rSbDZHo1Fy0WQzaKnv+7SUVjw5OeErbhvLsur1er1elyRJURS67fv+Mt6vLTHbdWIP1gderPvqCWc3g9coxrdysFi4qhJA1KZd+QKwPEgLgCikBUAU0gIgCmkBEJUnLfbFBRV7KBAVnAiGw2KbUUam45iOU3QrSinP/7eENzfJH+ApRDwe/2UwiMfjYptRRsH1ddFNKCuciQGIQloARCEtAKKQFgBRSAuAKKQFQBTSAiAKaQEQhbQAiEJaAEQhLQCikBYAUUgLgCikBUAU0gIgCmkBEIW0AIjCr+8BiELfAiAKaQEQNVtavDuo9FAiM1UAp+pRvP4HJM3wmy+u61
Ld1iiKdF23bXt5zYIFmlpr4L4IaXdW0rSSmSEtuq7ruk4FhKkaEeo9lAIqgC/KzOMWx3F0XT87OyuwbzFNU1VVTdNkWTYMI6Ps3gazbZs6AV4LbfIewzBS97C7c60gCLSEydeQXmR6nbfzFZ5iptpIvu9TFa7RaKQoyhKqLwnJqAC+Ver1OlU+C8OQbliWNVnia2oF8OxS6Ywx/qpaloX64GS2vsWyLKo2XKlUZFlOfmKtEn000nyDqqqj0aiQZhROVVUae+i63ul0GGNhGKbKQeejKAof6G9t7z1ptl92dV03iiIqjEo3Vn8+hgrgXKPR6PV6sizLskyx8TxvIaMUjEinmiEttm0bhpF8M1RVXf1YHxXAOU3TqEtpNBq+77uuW3SLNtwMZ2K9Xu/s7Cx5j6Zpq3+HVlaIvBTiOHZdl+ZdTNMU72ZRKj0PwfENFYmu1+uWZdE9VICbym0vbVg1RXYF8G1DrwPdliTJcRy+6L4K4LT0vlLpvu8n64OPRiP6M3tWYEuU8qrKFRci31QolT6rUqYFoBC4qhJAFNICIAppARCFtACIylOlFUoqurlxff/Pf/3rz3/2s9rhoVatyk+eFN2oMsGc2Obz+v1ev+8NBt/dVTP+0Wef/e+//80Yk/b39VqtJklatVp59KjQZpYA0rKZopsbbzCgkHz6/nvGmHJwoFWrjx89ar9/7/zmN5Xd3V6/H1xf82Lu9IDG8bF2fFxo29cX0rJRUt3I3u6u/vRp7fBQf/qUug7j7ds/ffvt7VdfJddyLy/9q6tk51OvVtWDg9Nnz9TDw5XvxPpCWkovHo/dy8vJbmTqsS63WvL+vvfq1X1PxXukq48fGWN7u7tatUqnakgO0lJWwXDofPiQ7EZ+OI+6f+we3dwcmWbr88+7p6cPPj+dy/nDoXt5SSGU9ve1anWbpweQljKhbiR5BM802LAvLs7evfN/97tZe4lgOPQGAzpb48nZwukBzCCXQI5uZKpev7+3u5vjhEo9PORr0dAouL4+/+Ybumd7pgfQt6wpPoRIngjptdo8B2Xlyy+1atX98stFNXLbpgeQlvVC5zy9fp9P7J7UajVJ0mu1OYcKwXBY+/3vO7pu/upXi2jp/7Ml0wNIS/EmDzU+KtCfPl3UVrpff9123bDbXfYAfYOnB5CWwiyvG5lKe/Mm+vgxOj9f+DNn2LDpAaRl1ehc3/V93o3QEHmB3chUO7/+dfP5c/vly6VuJQOfHijv1QNIyyrQ5Yz+1dV736d76neTWqs5p/f6/cYf/mB98YXx4sUKNvegkk4PIC1LdF83svqTENNxzr/5ZvTHP67byU+5pgeQlgUrvBuZSn39mjEWvH5dVANErP/0ANKyGA9ezligeDx+/NvfCl7wsibWc3oA3+XnN/Wq+Nbnn6/bybc3GDDGapJUdENmsJ5XD6Bvmdk6dyNTTb1Kv6SKnR5AWmZDFyayzKvi143x9m308eN9V+mX1OT0wApm/JCW2dBVwGsy6ARCp8Qr6NuRFgBR+IUkAFFIyww1r2cqpb1KJSr5RGUzSloQG2n5IQMiVQHX9rfoS1RuoNvtqqoahmHRDckD37fMYG1LaVPx4aJbsfnQt/xHRs3rqaW0Odd1ZVnWNE1VVcMwRE7q+BbptMQ0TXoGWZaT5daya513u91kFe/U6c1969K+6Lquqqqu67Ztq6qarLmbvdHcOzu57+qd5PktL00eBAFtS5Zlvmt0zkkN1nU9VdLsvqUP7rKoldZWWmNMoOb11FLat7e3kiSFYUi3HceZqYxWq9Xa29vjFdfCMFQUhZf4Eq913uv1UkXaMtZljNEWm80mtTYMQ77L2RudZ2cJ7TJ/Wtrl1Atbr9cVRWk2m6PRaDQa0YN931cUhW+91+tJkkQlzR5cmr3LgpCWHyiKkvxz6kGQkRbLsvj7xKvViUiWwiNhGCa37vt+705G0cKpS+9bl39KJvdIcKPz7CzfaGqXe71e6sCt1+uTu3Nycp
J6/S3L4qnLXvrgLovAmdgP5hm+e54XhiGdVqmqOmvF09SmZVmmk58gCGRZNk2TjtqZznlyr/vginPuLEntsqZpk8/TaDQmN52a+pNlmVe0zl66EBjlz4uObD4BEEURnXaLxy919ux5HhVtnqfWee51s1ecf2eniqJI5BkonLyiNbWHNzV76UKgb5lXp9NJViGndz01Ms4WBAEfTHueZxhGu91m89U6z71u9orz7yyxbTv5GWGaZqq4/FRU5TzZVMuy+IrZS0VQ6V/et09C38KCIDBNMwgCXddd143jWNd1mpmhuRrbth3HYYxFUeR5Hh0i9L0BY+zx48eO4/CZtCAI2u128hPuQYZhHB0d6brOGJNlmfct7Xab5nDoaTVNo+aJfLWXsa5hGLRReh7TNGmOiF6H7I3Ov7OmabquS5NpdGi6rnt2dka7Tw8IgoAaQy81X0qtum/rGUuzd5l3lXEcf/r0iW5M7etwndhi8Gras36nTh+H932TI17r3HVd3/eTz5O7TvqDK+be2ZQgCOj4nulELnvrc7aNdy9TlyItBctOi6A4jg3DODs7K8v1LyWFcUuRTNM8Pz8/Pz/f2dlJfikpvvrOzs7Ozo6qqrVaDVFZNvQtAKLQtwCIQloARCEtsAnsiwuv31/2VpAW2ARn7971kBaA9YG0AIhCWgBEIS0AopAW2AT1ajW4+63X5UFaAEQhLQCikBYAUUgLgCikBUAU0gIgCmmBTSDv7wfD4bK3grTAJqjs7lLpz6VCWgBEIS0AopAWAFFIC4AopAU2wdGTJ83nz5e9FfxCEoAo9C0AopAWAFFIC4AopAVAFNICIAppgXLLrle+WEgLlFuj0QiCwPO8KIqOjo5ECqflhkp6UG6aplGNMcaYqqqLLWKcgrRAiVG1UFmWqejfZBHwxUJaoMTmKZKeA8YtUGLzFEnPAX0LlNg8RdJzwFWVUG65C53ngLQAiMK4BUAU0gIgCmkBEIW0AIhCWgBEIS0AopAWAFH/B8hsYEUMdBvOAAAAAElFTkSuQmCC",
"text/plain": [
"Tree('chased', [Tree('man', ['A']), Tree('cat', ['a']), Tree('in', [Tree('with', ['his', 'pajamas', Tree('broom.', ['a'])])])])"
]
},
"execution_count": 21,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"quote = \"A man chased a cat in his pajamas with a broom.\"\n",
"mp.parse_one(quote.split()).tree()\n",
"\n",
"# Does the man have a cat in his pajamas?"
]
},
{
"cell_type": "code",
"execution_count": 17,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"original: 14862748245026736845 A\n",
"lowercased: 11901859001352538922 a\n",
"lemma: 14862748245026736845 A\n",
"shape: 101 X\n",
"prefix: 14862748245026736845 A\n",
"suffix: 14862748245026736845 A\n",
"log probability: -20.0\n",
"Brown cluster id: 0\n",
" — — — — — — — — — — — — — — — — — — — — \n",
"original: 3104811030673030468 man\n",
"lowercased: 3104811030673030468 man\n",
"lemma: 3104811030673030468 man\n",
"shape: 4088098365541558500 xxx\n",
"prefix: 646772771845179972 m\n",
"suffix: 3104811030673030468 man\n",
"log probability: -20.0\n",
"Brown cluster id: 0\n",
" — — — — — — — — — — — — — — — — — — — — \n",
"original: 3002984154512732771 in\n",
"lowercased: 3002984154512732771 in\n",
"lemma: 3002984154512732771 in\n",
"shape: 4370460163704169311 xx\n",
"prefix: 5097672513440128799 i\n",
"suffix: 3002984154512732771 in\n",
"log probability: -20.0\n",
"Brown cluster id: 0\n",
" — — — — — — — — — — — — — — — — — — — — \n",
"original: 2661093235354845946 his\n",
"lowercased: 2661093235354845946 his\n",
"lemma: 2661093235354845946 his\n",
"shape: 4088098365541558500 xxx\n",
"prefix: 15817570140490810055 h\n",
"suffix: 2661093235354845946 his\n",
"log probability: -20.0\n",
"Brown cluster id: 0\n",
" — — — — — — — — — — — — — — — — — — — — \n"
]
}
],
"source": [
"# from spacy.en import English\n",
"from spacy.lang.en import English\n",
"\n",
"parser = English()\n",
"parsedData = parser(quote)\n",
"\n",
"for i, token in enumerate(parsedData):\n",
" print(\"original:\", token.orth, token.orth_)\n",
" print(\"lowercased:\", token.lower, token.lower_)\n",
" print(\"lemma:\", token.lemma, token.lemma_)\n",
" print(\"shape:\", token.shape, token.shape_)\n",
" print(\"prefix:\", token.prefix, token.prefix_)\n",
" print(\"suffix:\", token.suffix, token.suffix_)\n",
" print(\"log probability:\", token.prob)\n",
" print(\"Brown cluster id:\", token.cluster)\n",
" print(\" — — — — — — — — — — — — — — — — — — — — \")\n",
" if i > 2:\n",
" break"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.7.3"
}
},
"nbformat": 4,
"nbformat_minor": 2
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment