Created
February 7, 2017 19:44
-
-
Save jivens/8383dcabb71857d1d4605d430aed6e24 to your computer and use it in GitHub Desktop.
New pandas dataframe load
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| { | |
| "cells": [ | |
| { | |
| "cell_type": "code", | |
| "execution_count": 2, | |
| "metadata": { | |
| "collapsed": true | |
| }, | |
| "outputs": [], | |
| "source": [ | |
| "import pandas as pd" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 3, | |
| "metadata": { | |
| "collapsed": true | |
| }, | |
| "outputs": [], | |
| "source": [ | |
| "import numpy as np" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 4, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "name": "stderr", | |
| "output_type": "stream", | |
| "text": [ | |
| "/Users/amyfou/anaconda3/envs/ml/lib/python3.6/site-packages/matplotlib/font_manager.py:280: UserWarning: Matplotlib is building the font cache using fc-list. This may take a moment.\n", | |
| " 'Matplotlib is building the font cache using fc-list. '\n" | |
| ] | |
| } | |
| ], | |
| "source": [ | |
| "import matplotlib.pyplot as plt" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 5, | |
| "metadata": { | |
| "collapsed": true | |
| }, | |
| "outputs": [], | |
| "source": [ | |
| "data = np.zeros((2,), dtype=[('A', 'i4'),('B', 'f4'),('C', 'a10')])" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 6, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "data": { | |
| "text/plain": [ | |
| "array([(0, 0.0, b''), (0, 0.0, b'')], \n", | |
| " dtype=[('A', '<i4'), ('B', '<f4'), ('C', 'S10')])" | |
| ] | |
| }, | |
| "execution_count": 6, | |
| "metadata": {}, | |
| "output_type": "execute_result" | |
| } | |
| ], | |
| "source": [ | |
| "data" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 7, | |
| "metadata": { | |
| "collapsed": true | |
| }, | |
| "outputs": [], | |
| "source": [ | |
| "data[:] = [(1,2.,'Hello'), (2,3.,\"World\")]" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 8, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "data": { | |
| "text/plain": [ | |
| "array([(1, 2.0, b'Hello'), (2, 3.0, b'World')], \n", | |
| " dtype=[('A', '<i4'), ('B', '<f4'), ('C', 'S10')])" | |
| ] | |
| }, | |
| "execution_count": 8, | |
| "metadata": {}, | |
| "output_type": "execute_result" | |
| } | |
| ], | |
| "source": [ | |
| "data" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 9, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "ename": "AttributeError", | |
| "evalue": "module 'pandas' has no attribute 'dataFrame'", | |
| "output_type": "error", | |
| "traceback": [ | |
| "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", | |
| "\u001b[0;31mAttributeError\u001b[0m Traceback (most recent call last)", | |
| "\u001b[0;32m<ipython-input-9-2a28ea12b996>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mpd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdataFrame\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m", | |
| "\u001b[0;31mAttributeError\u001b[0m: module 'pandas' has no attribute 'dataFrame'" | |
| ] | |
| } | |
| ], | |
| "source": [ | |
| "pd.dataFrame(data)" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 10, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "data": { | |
| "text/html": [ | |
| "<div>\n", | |
| "<table border=\"1\" class=\"dataframe\">\n", | |
| " <thead>\n", | |
| " <tr style=\"text-align: right;\">\n", | |
| " <th></th>\n", | |
| " <th>A</th>\n", | |
| " <th>B</th>\n", | |
| " <th>C</th>\n", | |
| " </tr>\n", | |
| " </thead>\n", | |
| " <tbody>\n", | |
| " <tr>\n", | |
| " <th>0</th>\n", | |
| " <td>1</td>\n", | |
| " <td>2.0</td>\n", | |
| " <td>b'Hello'</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>1</th>\n", | |
| " <td>2</td>\n", | |
| " <td>3.0</td>\n", | |
| " <td>b'World'</td>\n", | |
| " </tr>\n", | |
| " </tbody>\n", | |
| "</table>\n", | |
| "</div>" | |
| ], | |
| "text/plain": [ | |
| " A B C\n", | |
| "0 1 2.0 b'Hello'\n", | |
| "1 2 3.0 b'World'" | |
| ] | |
| }, | |
| "execution_count": 10, | |
| "metadata": {}, | |
| "output_type": "execute_result" | |
| } | |
| ], | |
| "source": [ | |
| "pd.DataFrame(data)" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 11, | |
| "metadata": { | |
| "collapsed": true | |
| }, | |
| "outputs": [], | |
| "source": [ | |
| "data2 = [{'a': 1, 'b': 2}, {'a': 5, 'b': 10, 'c': 20}]" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 12, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "data": { | |
| "text/plain": [ | |
| "[{'a': 1, 'b': 2}, {'a': 5, 'b': 10, 'c': 20}]" | |
| ] | |
| }, | |
| "execution_count": 12, | |
| "metadata": {}, | |
| "output_type": "execute_result" | |
| } | |
| ], | |
| "source": [ | |
| "data2" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 13, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "data": { | |
| "text/html": [ | |
| "<div>\n", | |
| "<table border=\"1\" class=\"dataframe\">\n", | |
| " <thead>\n", | |
| " <tr style=\"text-align: right;\">\n", | |
| " <th></th>\n", | |
| " <th>a</th>\n", | |
| " <th>b</th>\n", | |
| " <th>c</th>\n", | |
| " </tr>\n", | |
| " </thead>\n", | |
| " <tbody>\n", | |
| " <tr>\n", | |
| " <th>0</th>\n", | |
| " <td>1</td>\n", | |
| " <td>2</td>\n", | |
| " <td>NaN</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>1</th>\n", | |
| " <td>5</td>\n", | |
| " <td>10</td>\n", | |
| " <td>20.0</td>\n", | |
| " </tr>\n", | |
| " </tbody>\n", | |
| "</table>\n", | |
| "</div>" | |
| ], | |
| "text/plain": [ | |
| " a b c\n", | |
| "0 1 2 NaN\n", | |
| "1 5 10 20.0" | |
| ] | |
| }, | |
| "execution_count": 13, | |
| "metadata": {}, | |
| "output_type": "execute_result" | |
| } | |
| ], | |
| "source": [ | |
| "pd.DataFrame(data2)" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 14, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "ename": "AttributeError", | |
| "evalue": "module 'pandas' has no attribute 'read_tsv'", | |
| "output_type": "error", | |
| "traceback": [ | |
| "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", | |
| "\u001b[0;31mAttributeError\u001b[0m Traceback (most recent call last)", | |
| "\u001b[0;32m<ipython-input-14-84545df27fd2>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mdata3\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread_tsv\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'/Users/amyfou/Downloads/path_data.tsv'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m", | |
| "\u001b[0;31mAttributeError\u001b[0m: module 'pandas' has no attribute 'read_tsv'" | |
| ] | |
| } | |
| ], | |
| "source": [ | |
| "data3 = pd.read_tsv('/Users/amyfou/Downloads/path_data.tsv')" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 15, | |
| "metadata": { | |
| "collapsed": true | |
| }, | |
| "outputs": [], | |
| "source": [ | |
| "data3 = pd.read_table('/Users/amyfou/Downloads/path_data.tsv',sep='\\t')" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 16, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "data": { | |
| "text/html": [ | |
| "<div>\n", | |
| "<table border=\"1\" class=\"dataframe\">\n", | |
| " <thead>\n", | |
| " <tr style=\"text-align: right;\">\n", | |
| " <th></th>\n", | |
| " <th>Event</th>\n", | |
| " <th>Trigger</th>\n", | |
| " <th>Trigger Tags</th>\n", | |
| " <th>Argument</th>\n", | |
| " <th>Argument Type</th>\n", | |
| " <th>Path</th>\n", | |
| " <th>Path Length</th>\n", | |
| " <th>Pattern Frequency</th>\n", | |
| " </tr>\n", | |
| " </thead>\n", | |
| " <tbody>\n", | |
| " <tr>\n", | |
| " <th>0</th>\n", | |
| " <td>Gene_expression</td>\n", | |
| " <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>nn</td>\n", | |
| " <td>1</td>\n", | |
| " <td>382</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>1</th>\n", | |
| " <td>Gene_expression</td>\n", | |
| " <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of</td>\n", | |
| " <td>1</td>\n", | |
| " <td>201</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>2</th>\n", | |
| " <td>Gene_expression</td>\n", | |
| " <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of >nn</td>\n", | |
| " <td>2</td>\n", | |
| " <td>122</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>3</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>nn</td>\n", | |
| " <td>1</td>\n", | |
| " <td>121</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>4</th>\n", | |
| " <td>Gene_expression</td>\n", | |
| " <td>trigger = [lemma='production' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>nn</td>\n", | |
| " <td>1</td>\n", | |
| " <td>91</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5</th>\n", | |
| " <td>Phosphorylation</td>\n", | |
| " <td>trigger = [lemma='phosphorylation' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of</td>\n", | |
| " <td>1</td>\n", | |
| " <td>46</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>6</th>\n", | |
| " <td>Phosphorylation</td>\n", | |
| " <td>trigger = [lemma='phosphorylation' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Site</td>\n", | |
| " <td>Entity</td>\n", | |
| " <td>>nn</td>\n", | |
| " <td>1</td>\n", | |
| " <td>45</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>7</th>\n", | |
| " <td>Positive_regulation</td>\n", | |
| " <td>trigger = [lemma='induce' & tag='VBD']</td>\n", | |
| " <td>'VBD'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Gene_expression</td>\n", | |
| " <td>>dobj</td>\n", | |
| " <td>1</td>\n", | |
| " <td>41</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>8</th>\n", | |
| " <td>Positive_regulation</td>\n", | |
| " <td>trigger = [lemma='induction' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of</td>\n", | |
| " <td>1</td>\n", | |
| " <td>39</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>9</th>\n", | |
| " <td>Positive_regulation</td>\n", | |
| " <td>trigger = [lemma='activation' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of >nn</td>\n", | |
| " <td>2</td>\n", | |
| " <td>37</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>10</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of >nn</td>\n", | |
| " <td>2</td>\n", | |
| " <td>37</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>11</th>\n", | |
| " <td>Positive_regulation</td>\n", | |
| " <td>trigger = [lemma='induction' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>nn</td>\n", | |
| " <td>1</td>\n", | |
| " <td>35</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>12</th>\n", | |
| " <td>Binding</td>\n", | |
| " <td>trigger = [lemma='binding' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of</td>\n", | |
| " <td>1</td>\n", | |
| " <td>33</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>13</th>\n", | |
| " <td>Localization</td>\n", | |
| " <td>trigger = [lemma='secretion' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>nn</td>\n", | |
| " <td>1</td>\n", | |
| " <td>33</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>14</th>\n", | |
| " <td>Gene_expression</td>\n", | |
| " <td>trigger = [lemma='express' & tag='VBN']</td>\n", | |
| " <td>'VBN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>nsubjpass</td>\n", | |
| " <td>1</td>\n", | |
| " <td>32</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>15</th>\n", | |
| " <td>Positive_regulation</td>\n", | |
| " <td>trigger = [lemma='activation' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>nn</td>\n", | |
| " <td>1</td>\n", | |
| " <td>32</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>16</th>\n", | |
| " <td>Regulation</td>\n", | |
| " <td>trigger = [lemma='regulation' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Gene_expression</td>\n", | |
| " <td>>prep_of</td>\n", | |
| " <td>1</td>\n", | |
| " <td>31</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>17</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>nn</td>\n", | |
| " <td>1</td>\n", | |
| " <td>31</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>18</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of >nn</td>\n", | |
| " <td>2</td>\n", | |
| " <td>31</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>19</th>\n", | |
| " <td>Localization</td>\n", | |
| " <td>trigger = [lemma='translocation' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>ToLoc</td>\n", | |
| " <td>Entity</td>\n", | |
| " <td>>amod</td>\n", | |
| " <td>1</td>\n", | |
| " <td>30</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>20</th>\n", | |
| " <td>Phosphorylation</td>\n", | |
| " <td>trigger = [lemma='phosphorylation' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>nn</td>\n", | |
| " <td>1</td>\n", | |
| " <td>30</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>21</th>\n", | |
| " <td>Positive_regulation</td>\n", | |
| " <td>trigger = [lemma='induction' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of >nn</td>\n", | |
| " <td>2</td>\n", | |
| " <td>30</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>22</th>\n", | |
| " <td>Positive_regulation</td>\n", | |
| " <td>trigger = [lemma='activation' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of</td>\n", | |
| " <td>1</td>\n", | |
| " <td>30</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>23</th>\n", | |
| " <td>Gene_expression</td>\n", | |
| " <td>trigger = [lemma='production' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of</td>\n", | |
| " <td>1</td>\n", | |
| " <td>26</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>24</th>\n", | |
| " <td>Positive_regulation</td>\n", | |
| " <td>trigger = [lemma='induce' & tag='VBD']</td>\n", | |
| " <td>'VBD'</td>\n", | |
| " <td>Cause</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>nsubj</td>\n", | |
| " <td>1</td>\n", | |
| " <td>26</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>25</th>\n", | |
| " <td>Regulation</td>\n", | |
| " <td>trigger = [lemma='regulate' & tag='VBN']</td>\n", | |
| " <td>'VBN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Gene_expression</td>\n", | |
| " <td>>nsubjpass</td>\n", | |
| " <td>1</td>\n", | |
| " <td>25</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>26</th>\n", | |
| " <td>Positive_regulation</td>\n", | |
| " <td>trigger = [lemma='induction' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Gene_expression</td>\n", | |
| " <td>>prep_of</td>\n", | |
| " <td>1</td>\n", | |
| " <td>24</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>27</th>\n", | |
| " <td>Negative_regulation</td>\n", | |
| " <td>trigger = [lemma='inhibit' & tag='VBD']</td>\n", | |
| " <td>'VBD'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Positive_regulation</td>\n", | |
| " <td>>dobj</td>\n", | |
| " <td>1</td>\n", | |
| " <td>23</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>28</th>\n", | |
| " <td>Gene_expression</td>\n", | |
| " <td>trigger = [lemma='overexpression' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of</td>\n", | |
| " <td>1</td>\n", | |
| " <td>22</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>29</th>\n", | |
| " <td>Protein_catabolism</td>\n", | |
| " <td>trigger = [lemma='degradation' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of</td>\n", | |
| " <td>1</td>\n", | |
| " <td>22</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>...</th>\n", | |
| " <td>...</td>\n", | |
| " <td>...</td>\n", | |
| " <td>...</td>\n", | |
| " <td>...</td>\n", | |
| " <td>...</td>\n", | |
| " <td>...</td>\n", | |
| " <td>...</td>\n", | |
| " <td>...</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>4996</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of >dep</td>\n", | |
| " <td>2</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>4997</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='mrna' & tag='NN'] [lemma='le...</td>\n", | |
| " <td>'NN' 'NNS'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_for >nn</td>\n", | |
| " <td>2</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>4998</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><prep_with >nsubjpass >prep_of >prep_on >nn</td>\n", | |
| " <td>5</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>4999</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcriptional' & tag='JJ']...</td>\n", | |
| " <td>'JJ' 'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><prep_at >nsubjpass >dep >nn</td>\n", | |
| " <td>4</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5000</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcriptional' & tag='JJ']</td>\n", | |
| " <td>'JJ'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><amod >appos</td>\n", | |
| " <td>2</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5001</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><prep_of <dobj <xcomp >prep_including >nn</td>\n", | |
| " <td>5</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5002</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='at' & tag='IN'] [lemma='the'...</td>\n", | |
| " <td>'IN' 'DT' 'NN' 'IN' 'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><prep_at >nsubj >nn</td>\n", | |
| " <td>3</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5003</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><dobj >prep_together_with >nn</td>\n", | |
| " <td>3</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5004</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcript' & tag='NN'] [lem...</td>\n", | |
| " <td>'NN' 'NNS'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of >nn</td>\n", | |
| " <td>2</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5005</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='production' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><prep_in <appos <nsubj</td>\n", | |
| " <td>3</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5006</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='production' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><dep >amod >dep</td>\n", | |
| " <td>3</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5007</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><conj_and >amod >prepc_without >xcomp</td>\n", | |
| " <td>4</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5008</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='mrna' & tag='NN'] [lemma='ex...</td>\n", | |
| " <td>'NN' 'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><prep_of >prep_of >appos</td>\n", | |
| " <td>3</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5009</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><appos</td>\n", | |
| " <td>1</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5010</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcript' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><nn <prep_with >nsubjpass</td>\n", | |
| " <td>3</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5011</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcriptional' & tag='JJ']</td>\n", | |
| " <td>'JJ'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><amod <prep_at >prep_on</td>\n", | |
| " <td>3</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5012</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>conj_negcc >nn</td>\n", | |
| " <td>2</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5013</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcript' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>nn</td>\n", | |
| " <td>1</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5014</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of >prep_of >dep >appos</td>\n", | |
| " <td>4</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5015</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><dobj >iobj >appos</td>\n", | |
| " <td>3</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5016</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>conj_negcc >prep_of</td>\n", | |
| " <td>2</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5017</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='concentration' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of >nn</td>\n", | |
| " <td>2</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5018</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><conj_and >dep >xcomp</td>\n", | |
| " <td>3</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5019</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='level' & tag='NNS']</td>\n", | |
| " <td>'NNS'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><conj_and</td>\n", | |
| " <td>1</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5020</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='expression' & tag='NN'] [lem...</td>\n", | |
| " <td>'NN' 'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>prep_of >nn</td>\n", | |
| " <td>2</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5021</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><prep_to >nsubj >nn</td>\n", | |
| " <td>3</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5022</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='induction' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><dep</td>\n", | |
| " <td>1</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5023</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='level' & tag='NNS']</td>\n", | |
| " <td>'NNS'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><prep_in <prep_than <amod</td>\n", | |
| " <td>3</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5024</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
| " <td>'NN'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td><nn</td>\n", | |
| " <td>1</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>5025</th>\n", | |
| " <td>Transcription</td>\n", | |
| " <td>trigger = [lemma='level' & tag='NNS']</td>\n", | |
| " <td>'NNS'</td>\n", | |
| " <td>Theme</td>\n", | |
| " <td>Protein</td>\n", | |
| " <td>>conj_or >nn</td>\n", | |
| " <td>2</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " </tbody>\n", | |
| "</table>\n", | |
| "<p>5026 rows × 8 columns</p>\n", | |
| "</div>" | |
| ], | |
| "text/plain": [ | |
| " Event Trigger \\\n", | |
| "0 Gene_expression trigger = [lemma='expression' & tag='NN'] \n", | |
| "1 Gene_expression trigger = [lemma='expression' & tag='NN'] \n", | |
| "2 Gene_expression trigger = [lemma='expression' & tag='NN'] \n", | |
| "3 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
| "4 Gene_expression trigger = [lemma='production' & tag='NN'] \n", | |
| "5 Phosphorylation trigger = [lemma='phosphorylation' & tag='NN'] \n", | |
| "6 Phosphorylation trigger = [lemma='phosphorylation' & tag='NN'] \n", | |
| "7 Positive_regulation trigger = [lemma='induce' & tag='VBD'] \n", | |
| "8 Positive_regulation trigger = [lemma='induction' & tag='NN'] \n", | |
| "9 Positive_regulation trigger = [lemma='activation' & tag='NN'] \n", | |
| "10 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
| "11 Positive_regulation trigger = [lemma='induction' & tag='NN'] \n", | |
| "12 Binding trigger = [lemma='binding' & tag='NN'] \n", | |
| "13 Localization trigger = [lemma='secretion' & tag='NN'] \n", | |
| "14 Gene_expression trigger = [lemma='express' & tag='VBN'] \n", | |
| "15 Positive_regulation trigger = [lemma='activation' & tag='NN'] \n", | |
| "16 Regulation trigger = [lemma='regulation' & tag='NN'] \n", | |
| "17 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
| "18 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
| "19 Localization trigger = [lemma='translocation' & tag='NN'] \n", | |
| "20 Phosphorylation trigger = [lemma='phosphorylation' & tag='NN'] \n", | |
| "21 Positive_regulation trigger = [lemma='induction' & tag='NN'] \n", | |
| "22 Positive_regulation trigger = [lemma='activation' & tag='NN'] \n", | |
| "23 Gene_expression trigger = [lemma='production' & tag='NN'] \n", | |
| "24 Positive_regulation trigger = [lemma='induce' & tag='VBD'] \n", | |
| "25 Regulation trigger = [lemma='regulate' & tag='VBN'] \n", | |
| "26 Positive_regulation trigger = [lemma='induction' & tag='NN'] \n", | |
| "27 Negative_regulation trigger = [lemma='inhibit' & tag='VBD'] \n", | |
| "28 Gene_expression trigger = [lemma='overexpression' & tag='NN'] \n", | |
| "29 Protein_catabolism trigger = [lemma='degradation' & tag='NN'] \n", | |
| "... ... ... \n", | |
| "4996 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
| "4997 Transcription trigger = [lemma='mrna' & tag='NN'] [lemma='le... \n", | |
| "4998 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
| "4999 Transcription trigger = [lemma='transcriptional' & tag='JJ']... \n", | |
| "5000 Transcription trigger = [lemma='transcriptional' & tag='JJ'] \n", | |
| "5001 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
| "5002 Transcription trigger = [lemma='at' & tag='IN'] [lemma='the'... \n", | |
| "5003 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
| "5004 Transcription trigger = [lemma='transcript' & tag='NN'] [lem... \n", | |
| "5005 Transcription trigger = [lemma='production' & tag='NN'] \n", | |
| "5006 Transcription trigger = [lemma='production' & tag='NN'] \n", | |
| "5007 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
| "5008 Transcription trigger = [lemma='mrna' & tag='NN'] [lemma='ex... \n", | |
| "5009 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
| "5010 Transcription trigger = [lemma='transcript' & tag='NN'] \n", | |
| "5011 Transcription trigger = [lemma='transcriptional' & tag='JJ'] \n", | |
| "5012 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
| "5013 Transcription trigger = [lemma='transcript' & tag='NN'] \n", | |
| "5014 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
| "5015 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
| "5016 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
| "5017 Transcription trigger = [lemma='concentration' & tag='NN'] \n", | |
| "5018 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
| "5019 Transcription trigger = [lemma='level' & tag='NNS'] \n", | |
| "5020 Transcription trigger = [lemma='expression' & tag='NN'] [lem... \n", | |
| "5021 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
| "5022 Transcription trigger = [lemma='induction' & tag='NN'] \n", | |
| "5023 Transcription trigger = [lemma='level' & tag='NNS'] \n", | |
| "5024 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
| "5025 Transcription trigger = [lemma='level' & tag='NNS'] \n", | |
| "\n", | |
| " Trigger Tags Argument Argument Type \\\n", | |
| "0 'NN' Theme Protein \n", | |
| "1 'NN' Theme Protein \n", | |
| "2 'NN' Theme Protein \n", | |
| "3 'NN' Theme Protein \n", | |
| "4 'NN' Theme Protein \n", | |
| "5 'NN' Theme Protein \n", | |
| "6 'NN' Site Entity \n", | |
| "7 'VBD' Theme Gene_expression \n", | |
| "8 'NN' Theme Protein \n", | |
| "9 'NN' Theme Protein \n", | |
| "10 'NN' Theme Protein \n", | |
| "11 'NN' Theme Protein \n", | |
| "12 'NN' Theme Protein \n", | |
| "13 'NN' Theme Protein \n", | |
| "14 'VBN' Theme Protein \n", | |
| "15 'NN' Theme Protein \n", | |
| "16 'NN' Theme Gene_expression \n", | |
| "17 'NN' Theme Protein \n", | |
| "18 'NN' Theme Protein \n", | |
| "19 'NN' ToLoc Entity \n", | |
| "20 'NN' Theme Protein \n", | |
| "21 'NN' Theme Protein \n", | |
| "22 'NN' Theme Protein \n", | |
| "23 'NN' Theme Protein \n", | |
| "24 'VBD' Cause Protein \n", | |
| "25 'VBN' Theme Gene_expression \n", | |
| "26 'NN' Theme Gene_expression \n", | |
| "27 'VBD' Theme Positive_regulation \n", | |
| "28 'NN' Theme Protein \n", | |
| "29 'NN' Theme Protein \n", | |
| "... ... ... ... \n", | |
| "4996 'NN' Theme Protein \n", | |
| "4997 'NN' 'NNS' Theme Protein \n", | |
| "4998 'NN' Theme Protein \n", | |
| "4999 'JJ' 'NN' Theme Protein \n", | |
| "5000 'JJ' Theme Protein \n", | |
| "5001 'NN' Theme Protein \n", | |
| "5002 'IN' 'DT' 'NN' 'IN' 'NN' Theme Protein \n", | |
| "5003 'NN' Theme Protein \n", | |
| "5004 'NN' 'NNS' Theme Protein \n", | |
| "5005 'NN' Theme Protein \n", | |
| "5006 'NN' Theme Protein \n", | |
| "5007 'NN' Theme Protein \n", | |
| "5008 'NN' 'NN' Theme Protein \n", | |
| "5009 'NN' Theme Protein \n", | |
| "5010 'NN' Theme Protein \n", | |
| "5011 'JJ' Theme Protein \n", | |
| "5012 'NN' Theme Protein \n", | |
| "5013 'NN' Theme Protein \n", | |
| "5014 'NN' Theme Protein \n", | |
| "5015 'NN' Theme Protein \n", | |
| "5016 'NN' Theme Protein \n", | |
| "5017 'NN' Theme Protein \n", | |
| "5018 'NN' Theme Protein \n", | |
| "5019 'NNS' Theme Protein \n", | |
| "5020 'NN' 'NN' Theme Protein \n", | |
| "5021 'NN' Theme Protein \n", | |
| "5022 'NN' Theme Protein \n", | |
| "5023 'NNS' Theme Protein \n", | |
| "5024 'NN' Theme Protein \n", | |
| "5025 'NNS' Theme Protein \n", | |
| "\n", | |
| " Path Path Length \\\n", | |
| "0 >nn 1 \n", | |
| "1 >prep_of 1 \n", | |
| "2 >prep_of >nn 2 \n", | |
| "3 >nn 1 \n", | |
| "4 >nn 1 \n", | |
| "5 >prep_of 1 \n", | |
| "6 >nn 1 \n", | |
| "7 >dobj 1 \n", | |
| "8 >prep_of 1 \n", | |
| "9 >prep_of >nn 2 \n", | |
| "10 >prep_of >nn 2 \n", | |
| "11 >nn 1 \n", | |
| "12 >prep_of 1 \n", | |
| "13 >nn 1 \n", | |
| "14 >nsubjpass 1 \n", | |
| "15 >nn 1 \n", | |
| "16 >prep_of 1 \n", | |
| "17 >nn 1 \n", | |
| "18 >prep_of >nn 2 \n", | |
| "19 >amod 1 \n", | |
| "20 >nn 1 \n", | |
| "21 >prep_of >nn 2 \n", | |
| "22 >prep_of 1 \n", | |
| "23 >prep_of 1 \n", | |
| "24 >nsubj 1 \n", | |
| "25 >nsubjpass 1 \n", | |
| "26 >prep_of 1 \n", | |
| "27 >dobj 1 \n", | |
| "28 >prep_of 1 \n", | |
| "29 >prep_of 1 \n", | |
| "... ... ... \n", | |
| "4996 >prep_of >dep 2 \n", | |
| "4997 >prep_for >nn 2 \n", | |
| "4998 <prep_with >nsubjpass >prep_of >prep_on >nn 5 \n", | |
| "4999 <prep_at >nsubjpass >dep >nn 4 \n", | |
| "5000 <amod >appos 2 \n", | |
| "5001 <prep_of <dobj <xcomp >prep_including >nn 5 \n", | |
| "5002 <prep_at >nsubj >nn 3 \n", | |
| "5003 <dobj >prep_together_with >nn 3 \n", | |
| "5004 >prep_of >nn 2 \n", | |
| "5005 <prep_in <appos <nsubj 3 \n", | |
| "5006 <dep >amod >dep 3 \n", | |
| "5007 <conj_and >amod >prepc_without >xcomp 4 \n", | |
| "5008 <prep_of >prep_of >appos 3 \n", | |
| "5009 <appos 1 \n", | |
| "5010 <nn <prep_with >nsubjpass 3 \n", | |
| "5011 <amod <prep_at >prep_on 3 \n", | |
| "5012 >conj_negcc >nn 2 \n", | |
| "5013 >nn 1 \n", | |
| "5014 >prep_of >prep_of >dep >appos 4 \n", | |
| "5015 <dobj >iobj >appos 3 \n", | |
| "5016 >conj_negcc >prep_of 2 \n", | |
| "5017 >prep_of >nn 2 \n", | |
| "5018 <conj_and >dep >xcomp 3 \n", | |
| "5019 <conj_and 1 \n", | |
| "5020 >prep_of >nn 2 \n", | |
| "5021 <prep_to >nsubj >nn 3 \n", | |
| "5022 <dep 1 \n", | |
| "5023 <prep_in <prep_than <amod 3 \n", | |
| "5024 <nn 1 \n", | |
| "5025 >conj_or >nn 2 \n", | |
| "\n", | |
| " Pattern Frequency \n", | |
| "0 382 \n", | |
| "1 201 \n", | |
| "2 122 \n", | |
| "3 121 \n", | |
| "4 91 \n", | |
| "5 46 \n", | |
| "6 45 \n", | |
| "7 41 \n", | |
| "8 39 \n", | |
| "9 37 \n", | |
| "10 37 \n", | |
| "11 35 \n", | |
| "12 33 \n", | |
| "13 33 \n", | |
| "14 32 \n", | |
| "15 32 \n", | |
| "16 31 \n", | |
| "17 31 \n", | |
| "18 31 \n", | |
| "19 30 \n", | |
| "20 30 \n", | |
| "21 30 \n", | |
| "22 30 \n", | |
| "23 26 \n", | |
| "24 26 \n", | |
| "25 25 \n", | |
| "26 24 \n", | |
| "27 23 \n", | |
| "28 22 \n", | |
| "29 22 \n", | |
| "... ... \n", | |
| "4996 1 \n", | |
| "4997 1 \n", | |
| "4998 1 \n", | |
| "4999 1 \n", | |
| "5000 1 \n", | |
| "5001 1 \n", | |
| "5002 1 \n", | |
| "5003 1 \n", | |
| "5004 1 \n", | |
| "5005 1 \n", | |
| "5006 1 \n", | |
| "5007 1 \n", | |
| "5008 1 \n", | |
| "5009 1 \n", | |
| "5010 1 \n", | |
| "5011 1 \n", | |
| "5012 1 \n", | |
| "5013 1 \n", | |
| "5014 1 \n", | |
| "5015 1 \n", | |
| "5016 1 \n", | |
| "5017 1 \n", | |
| "5018 1 \n", | |
| "5019 1 \n", | |
| "5020 1 \n", | |
| "5021 1 \n", | |
| "5022 1 \n", | |
| "5023 1 \n", | |
| "5024 1 \n", | |
| "5025 1 \n", | |
| "\n", | |
| "[5026 rows x 8 columns]" | |
| ] | |
| }, | |
| "execution_count": 16, | |
| "metadata": {}, | |
| "output_type": "execute_result" | |
| } | |
| ], | |
| "source": [ | |
| "data3" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 19, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [], | |
| "source": [ | |
| "s1 = pd.Series(np.arange(5,10))" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 20, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "data": { | |
| "text/plain": [ | |
| "0 5\n", | |
| "1 6\n", | |
| "2 7\n", | |
| "3 8\n", | |
| "4 9\n", | |
| "dtype: int64" | |
| ] | |
| }, | |
| "execution_count": 20, | |
| "metadata": {}, | |
| "output_type": "execute_result" | |
| } | |
| ], | |
| "source": [ | |
| "s1" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 21, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "data": { | |
| "text/plain": [ | |
| "255" | |
| ] | |
| }, | |
| "execution_count": 21, | |
| "metadata": {}, | |
| "output_type": "execute_result" | |
| } | |
| ], | |
| "source": [ | |
| "s1.dot(s1)" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 22, | |
| "metadata": { | |
| "collapsed": true | |
| }, | |
| "outputs": [], | |
| "source": [ | |
| "midx = pd.MultiIndex(levels=[['one', 'two'], ['x','y']], labels=[[1,1,0,0],[1,0,1,0]])" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 23, | |
| "metadata": { | |
| "collapsed": true | |
| }, | |
| "outputs": [], | |
| "source": [ | |
| "df = pd.DataFrame({'A' : [1, 2, 3, 4], 'B': [5, 6, 7, 8]}, index=midx)" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 24, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "data": { | |
| "text/html": [ | |
| "<div>\n", | |
| "<table border=\"1\" class=\"dataframe\">\n", | |
| " <thead>\n", | |
| " <tr style=\"text-align: right;\">\n", | |
| " <th></th>\n", | |
| " <th></th>\n", | |
| " <th>A</th>\n", | |
| " <th>B</th>\n", | |
| " </tr>\n", | |
| " </thead>\n", | |
| " <tbody>\n", | |
| " <tr>\n", | |
| " <th rowspan=\"2\" valign=\"top\">two</th>\n", | |
| " <th>y</th>\n", | |
| " <td>1</td>\n", | |
| " <td>5</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>x</th>\n", | |
| " <td>2</td>\n", | |
| " <td>6</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th rowspan=\"2\" valign=\"top\">one</th>\n", | |
| " <th>y</th>\n", | |
| " <td>3</td>\n", | |
| " <td>7</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>x</th>\n", | |
| " <td>4</td>\n", | |
| " <td>8</td>\n", | |
| " </tr>\n", | |
| " </tbody>\n", | |
| "</table>\n", | |
| "</div>" | |
| ], | |
| "text/plain": [ | |
| " A B\n", | |
| "two y 1 5\n", | |
| " x 2 6\n", | |
| "one y 3 7\n", | |
| " x 4 8" | |
| ] | |
| }, | |
| "execution_count": 24, | |
| "metadata": {}, | |
| "output_type": "execute_result" | |
| } | |
| ], | |
| "source": [ | |
| "df" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 25, | |
| "metadata": { | |
| "collapsed": true | |
| }, | |
| "outputs": [], | |
| "source": [ | |
| "paneldf = df.to_panel()" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 26, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "data": { | |
| "text/plain": [ | |
| "<class 'pandas.core.panel.Panel'>\n", | |
| "Dimensions: 2 (items) x 2 (major_axis) x 2 (minor_axis)\n", | |
| "Items axis: A to B\n", | |
| "Major_axis axis: one to two\n", | |
| "Minor_axis axis: x to y" | |
| ] | |
| }, | |
| "execution_count": 26, | |
| "metadata": {}, | |
| "output_type": "execute_result" | |
| } | |
| ], | |
| "source": [ | |
| "paneldf" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": 27, | |
| "metadata": { | |
| "collapsed": false | |
| }, | |
| "outputs": [ | |
| { | |
| "data": { | |
| "text/html": [ | |
| "<div>\n", | |
| "<table border=\"1\" class=\"dataframe\">\n", | |
| " <thead>\n", | |
| " <tr style=\"text-align: right;\">\n", | |
| " <th></th>\n", | |
| " <th>x</th>\n", | |
| " <th>y</th>\n", | |
| " </tr>\n", | |
| " </thead>\n", | |
| " <tbody>\n", | |
| " <tr>\n", | |
| " <th>one</th>\n", | |
| " <td>4</td>\n", | |
| " <td>3</td>\n", | |
| " </tr>\n", | |
| " <tr>\n", | |
| " <th>two</th>\n", | |
| " <td>2</td>\n", | |
| " <td>1</td>\n", | |
| " </tr>\n", | |
| " </tbody>\n", | |
| "</table>\n", | |
| "</div>" | |
| ], | |
| "text/plain": [ | |
| " x y\n", | |
| "one 4 3\n", | |
| "two 2 1" | |
| ] | |
| }, | |
| "execution_count": 27, | |
| "metadata": {}, | |
| "output_type": "execute_result" | |
| } | |
| ], | |
| "source": [ | |
| "paneldf['A']" | |
| ] | |
| }, | |
| { | |
| "cell_type": "code", | |
| "execution_count": null, | |
| "metadata": { | |
| "collapsed": true | |
| }, | |
| "outputs": [], | |
| "source": [] | |
| } | |
| ], | |
| "metadata": { | |
| "kernelspec": { | |
| "display_name": "Python 3", | |
| "language": "python", | |
| "name": "python3" | |
| }, | |
| "language_info": { | |
| "codemirror_mode": { | |
| "name": "ipython", | |
| "version": 3 | |
| }, | |
| "file_extension": ".py", | |
| "mimetype": "text/x-python", | |
| "name": "python", | |
| "nbconvert_exporter": "python", | |
| "pygments_lexer": "ipython3", | |
| "version": "3.6.0" | |
| } | |
| }, | |
| "nbformat": 4, | |
| "nbformat_minor": 2 | |
| } |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment