Created
February 7, 2017 19:44
-
-
Save jivens/8383dcabb71857d1d4605d430aed6e24 to your computer and use it in GitHub Desktop.
New pandas dataframe load
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
{ | |
"cells": [ | |
{ | |
"cell_type": "code", | |
"execution_count": 2, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"import pandas as pd" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 3, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"import numpy as np" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 4, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"name": "stderr", | |
"output_type": "stream", | |
"text": [ | |
"/Users/amyfou/anaconda3/envs/ml/lib/python3.6/site-packages/matplotlib/font_manager.py:280: UserWarning: Matplotlib is building the font cache using fc-list. This may take a moment.\n", | |
" 'Matplotlib is building the font cache using fc-list. '\n" | |
] | |
} | |
], | |
"source": [ | |
"import matplotlib.pyplot as plt" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 5, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"# Structured array holding two zero-initialised records:\n", | |
"# 'A' is int32, 'B' is float32, 'C' is a 10-byte bytes field.\n", | |
"# 'S10' is the canonical spelling of the legacy 'a10' code (NumPy reports it as S10 either way).\n", | |
"data = np.zeros((2,), dtype=[('A', 'i4'), ('B', 'f4'), ('C', 'S10')])" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 6, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"array([(0, 0.0, b''), (0, 0.0, b'')], \n", | |
" dtype=[('A', '<i4'), ('B', '<f4'), ('C', 'S10')])" | |
] | |
}, | |
"execution_count": 6, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"data" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 7, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"# Overwrite both records in place; 'C' is a bytes field, so the text ends up stored as b'...'.\n", | |
"data[:] = [\n", | |
"    (1, 2.0, 'Hello'),\n", | |
"    (2, 3.0, 'World'),\n", | |
"]" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 8, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"array([(1, 2.0, b'Hello'), (2, 3.0, b'World')], \n", | |
" dtype=[('A', '<i4'), ('B', '<f4'), ('C', 'S10')])" | |
] | |
}, | |
"execution_count": 8, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"data" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": null, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [], | |
"source": [ | |
"# The constructor is spelled DataFrame (capital D); pd.dataFrame raises AttributeError.\n", | |
"# Each named field of the structured array becomes a column.\n", | |
"pd.DataFrame(data)" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 10, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/html": [ | |
"<div>\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th>A</th>\n", | |
" <th>B</th>\n", | |
" <th>C</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th>0</th>\n", | |
" <td>1</td>\n", | |
" <td>2.0</td>\n", | |
" <td>b'Hello'</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1</th>\n", | |
" <td>2</td>\n", | |
" <td>3.0</td>\n", | |
" <td>b'World'</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"</div>" | |
], | |
"text/plain": [ | |
" A B C\n", | |
"0 1 2.0 b'Hello'\n", | |
"1 2 3.0 b'World'" | |
] | |
}, | |
"execution_count": 10, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"pd.DataFrame(data)" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 11, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"# List of per-row dicts; only the second row has a 'c' key,\n", | |
"# so a DataFrame built from it shows NaN for 'c' in the first row.\n", | |
"data2 = [\n", | |
"    {'a': 1, 'b': 2},\n", | |
"    {'a': 5, 'b': 10, 'c': 20},\n", | |
"]" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 12, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"[{'a': 1, 'b': 2}, {'a': 5, 'b': 10, 'c': 20}]" | |
] | |
}, | |
"execution_count": 12, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"data2" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 13, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/html": [ | |
"<div>\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th>a</th>\n", | |
" <th>b</th>\n", | |
" <th>c</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th>0</th>\n", | |
" <td>1</td>\n", | |
" <td>2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1</th>\n", | |
" <td>5</td>\n", | |
" <td>10</td>\n", | |
" <td>20.0</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"</div>" | |
], | |
"text/plain": [ | |
" a b c\n", | |
"0 1 2 NaN\n", | |
"1 5 10 20.0" | |
] | |
}, | |
"execution_count": 13, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"pd.DataFrame(data2)" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": null, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [], | |
"source": [ | |
"# pandas has no read_tsv function (calling it raises AttributeError);\n", | |
"# read_csv with an explicit tab separator parses tab-separated files.\n", | |
"data3 = pd.read_csv('/Users/amyfou/Downloads/path_data.tsv', sep='\\t')" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 15, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"# Load the tab-separated file into a DataFrame.\n", | |
"data3 = pd.read_table(\n", | |
"    '/Users/amyfou/Downloads/path_data.tsv',\n", | |
"    sep='\\t',\n", | |
")" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 16, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/html": [ | |
"<div>\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th>Event</th>\n", | |
" <th>Trigger</th>\n", | |
" <th>Trigger Tags</th>\n", | |
" <th>Argument</th>\n", | |
" <th>Argument Type</th>\n", | |
" <th>Path</th>\n", | |
" <th>Path Length</th>\n", | |
" <th>Pattern Frequency</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th>0</th>\n", | |
" <td>Gene_expression</td>\n", | |
" <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>nn</td>\n", | |
" <td>1</td>\n", | |
" <td>382</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1</th>\n", | |
" <td>Gene_expression</td>\n", | |
" <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of</td>\n", | |
" <td>1</td>\n", | |
" <td>201</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2</th>\n", | |
" <td>Gene_expression</td>\n", | |
" <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of >nn</td>\n", | |
" <td>2</td>\n", | |
" <td>122</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>3</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>nn</td>\n", | |
" <td>1</td>\n", | |
" <td>121</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4</th>\n", | |
" <td>Gene_expression</td>\n", | |
" <td>trigger = [lemma='production' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>nn</td>\n", | |
" <td>1</td>\n", | |
" <td>91</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5</th>\n", | |
" <td>Phosphorylation</td>\n", | |
" <td>trigger = [lemma='phosphorylation' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of</td>\n", | |
" <td>1</td>\n", | |
" <td>46</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>6</th>\n", | |
" <td>Phosphorylation</td>\n", | |
" <td>trigger = [lemma='phosphorylation' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Site</td>\n", | |
" <td>Entity</td>\n", | |
" <td>>nn</td>\n", | |
" <td>1</td>\n", | |
" <td>45</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>7</th>\n", | |
" <td>Positive_regulation</td>\n", | |
" <td>trigger = [lemma='induce' & tag='VBD']</td>\n", | |
" <td>'VBD'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Gene_expression</td>\n", | |
" <td>>dobj</td>\n", | |
" <td>1</td>\n", | |
" <td>41</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8</th>\n", | |
" <td>Positive_regulation</td>\n", | |
" <td>trigger = [lemma='induction' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of</td>\n", | |
" <td>1</td>\n", | |
" <td>39</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>9</th>\n", | |
" <td>Positive_regulation</td>\n", | |
" <td>trigger = [lemma='activation' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of >nn</td>\n", | |
" <td>2</td>\n", | |
" <td>37</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>10</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of >nn</td>\n", | |
" <td>2</td>\n", | |
" <td>37</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>11</th>\n", | |
" <td>Positive_regulation</td>\n", | |
" <td>trigger = [lemma='induction' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>nn</td>\n", | |
" <td>1</td>\n", | |
" <td>35</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>12</th>\n", | |
" <td>Binding</td>\n", | |
" <td>trigger = [lemma='binding' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of</td>\n", | |
" <td>1</td>\n", | |
" <td>33</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>13</th>\n", | |
" <td>Localization</td>\n", | |
" <td>trigger = [lemma='secretion' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>nn</td>\n", | |
" <td>1</td>\n", | |
" <td>33</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>14</th>\n", | |
" <td>Gene_expression</td>\n", | |
" <td>trigger = [lemma='express' & tag='VBN']</td>\n", | |
" <td>'VBN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>nsubjpass</td>\n", | |
" <td>1</td>\n", | |
" <td>32</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>15</th>\n", | |
" <td>Positive_regulation</td>\n", | |
" <td>trigger = [lemma='activation' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>nn</td>\n", | |
" <td>1</td>\n", | |
" <td>32</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>16</th>\n", | |
" <td>Regulation</td>\n", | |
" <td>trigger = [lemma='regulation' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Gene_expression</td>\n", | |
" <td>>prep_of</td>\n", | |
" <td>1</td>\n", | |
" <td>31</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>17</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>nn</td>\n", | |
" <td>1</td>\n", | |
" <td>31</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>18</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of >nn</td>\n", | |
" <td>2</td>\n", | |
" <td>31</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>19</th>\n", | |
" <td>Localization</td>\n", | |
" <td>trigger = [lemma='translocation' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>ToLoc</td>\n", | |
" <td>Entity</td>\n", | |
" <td>>amod</td>\n", | |
" <td>1</td>\n", | |
" <td>30</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>20</th>\n", | |
" <td>Phosphorylation</td>\n", | |
" <td>trigger = [lemma='phosphorylation' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>nn</td>\n", | |
" <td>1</td>\n", | |
" <td>30</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>21</th>\n", | |
" <td>Positive_regulation</td>\n", | |
" <td>trigger = [lemma='induction' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of >nn</td>\n", | |
" <td>2</td>\n", | |
" <td>30</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>22</th>\n", | |
" <td>Positive_regulation</td>\n", | |
" <td>trigger = [lemma='activation' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of</td>\n", | |
" <td>1</td>\n", | |
" <td>30</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>23</th>\n", | |
" <td>Gene_expression</td>\n", | |
" <td>trigger = [lemma='production' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of</td>\n", | |
" <td>1</td>\n", | |
" <td>26</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>24</th>\n", | |
" <td>Positive_regulation</td>\n", | |
" <td>trigger = [lemma='induce' & tag='VBD']</td>\n", | |
" <td>'VBD'</td>\n", | |
" <td>Cause</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>nsubj</td>\n", | |
" <td>1</td>\n", | |
" <td>26</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>25</th>\n", | |
" <td>Regulation</td>\n", | |
" <td>trigger = [lemma='regulate' & tag='VBN']</td>\n", | |
" <td>'VBN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Gene_expression</td>\n", | |
" <td>>nsubjpass</td>\n", | |
" <td>1</td>\n", | |
" <td>25</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>26</th>\n", | |
" <td>Positive_regulation</td>\n", | |
" <td>trigger = [lemma='induction' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Gene_expression</td>\n", | |
" <td>>prep_of</td>\n", | |
" <td>1</td>\n", | |
" <td>24</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>27</th>\n", | |
" <td>Negative_regulation</td>\n", | |
" <td>trigger = [lemma='inhibit' & tag='VBD']</td>\n", | |
" <td>'VBD'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Positive_regulation</td>\n", | |
" <td>>dobj</td>\n", | |
" <td>1</td>\n", | |
" <td>23</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>28</th>\n", | |
" <td>Gene_expression</td>\n", | |
" <td>trigger = [lemma='overexpression' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of</td>\n", | |
" <td>1</td>\n", | |
" <td>22</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>29</th>\n", | |
" <td>Protein_catabolism</td>\n", | |
" <td>trigger = [lemma='degradation' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of</td>\n", | |
" <td>1</td>\n", | |
" <td>22</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>...</th>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4996</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of >dep</td>\n", | |
" <td>2</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4997</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='mrna' & tag='NN'] [lemma='le...</td>\n", | |
" <td>'NN' 'NNS'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_for >nn</td>\n", | |
" <td>2</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4998</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><prep_with >nsubjpass >prep_of >prep_on >nn</td>\n", | |
" <td>5</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4999</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcriptional' & tag='JJ']...</td>\n", | |
" <td>'JJ' 'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><prep_at >nsubjpass >dep >nn</td>\n", | |
" <td>4</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5000</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcriptional' & tag='JJ']</td>\n", | |
" <td>'JJ'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><amod >appos</td>\n", | |
" <td>2</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5001</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><prep_of <dobj <xcomp >prep_including >nn</td>\n", | |
" <td>5</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5002</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='at' & tag='IN'] [lemma='the'...</td>\n", | |
" <td>'IN' 'DT' 'NN' 'IN' 'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><prep_at >nsubj >nn</td>\n", | |
" <td>3</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5003</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><dobj >prep_together_with >nn</td>\n", | |
" <td>3</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5004</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcript' & tag='NN'] [lem...</td>\n", | |
" <td>'NN' 'NNS'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of >nn</td>\n", | |
" <td>2</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5005</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='production' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><prep_in <appos <nsubj</td>\n", | |
" <td>3</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5006</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='production' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><dep >amod >dep</td>\n", | |
" <td>3</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5007</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><conj_and >amod >prepc_without >xcomp</td>\n", | |
" <td>4</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5008</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='mrna' & tag='NN'] [lemma='ex...</td>\n", | |
" <td>'NN' 'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><prep_of >prep_of >appos</td>\n", | |
" <td>3</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5009</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><appos</td>\n", | |
" <td>1</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5010</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcript' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><nn <prep_with >nsubjpass</td>\n", | |
" <td>3</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5011</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcriptional' & tag='JJ']</td>\n", | |
" <td>'JJ'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><amod <prep_at >prep_on</td>\n", | |
" <td>3</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5012</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>conj_negcc >nn</td>\n", | |
" <td>2</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5013</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcript' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>nn</td>\n", | |
" <td>1</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5014</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of >prep_of >dep >appos</td>\n", | |
" <td>4</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5015</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><dobj >iobj >appos</td>\n", | |
" <td>3</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5016</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>conj_negcc >prep_of</td>\n", | |
" <td>2</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5017</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='concentration' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of >nn</td>\n", | |
" <td>2</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5018</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='transcription' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><conj_and >dep >xcomp</td>\n", | |
" <td>3</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5019</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='level' & tag='NNS']</td>\n", | |
" <td>'NNS'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><conj_and</td>\n", | |
" <td>1</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5020</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='expression' & tag='NN'] [lem...</td>\n", | |
" <td>'NN' 'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>prep_of >nn</td>\n", | |
" <td>2</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5021</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><prep_to >nsubj >nn</td>\n", | |
" <td>3</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5022</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='induction' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><dep</td>\n", | |
" <td>1</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5023</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='level' & tag='NNS']</td>\n", | |
" <td>'NNS'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><prep_in <prep_than <amod</td>\n", | |
" <td>3</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5024</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='expression' & tag='NN']</td>\n", | |
" <td>'NN'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td><nn</td>\n", | |
" <td>1</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5025</th>\n", | |
" <td>Transcription</td>\n", | |
" <td>trigger = [lemma='level' & tag='NNS']</td>\n", | |
" <td>'NNS'</td>\n", | |
" <td>Theme</td>\n", | |
" <td>Protein</td>\n", | |
" <td>>conj_or >nn</td>\n", | |
" <td>2</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"<p>5026 rows × 8 columns</p>\n", | |
"</div>" | |
], | |
"text/plain": [ | |
" Event Trigger \\\n", | |
"0 Gene_expression trigger = [lemma='expression' & tag='NN'] \n", | |
"1 Gene_expression trigger = [lemma='expression' & tag='NN'] \n", | |
"2 Gene_expression trigger = [lemma='expression' & tag='NN'] \n", | |
"3 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
"4 Gene_expression trigger = [lemma='production' & tag='NN'] \n", | |
"5 Phosphorylation trigger = [lemma='phosphorylation' & tag='NN'] \n", | |
"6 Phosphorylation trigger = [lemma='phosphorylation' & tag='NN'] \n", | |
"7 Positive_regulation trigger = [lemma='induce' & tag='VBD'] \n", | |
"8 Positive_regulation trigger = [lemma='induction' & tag='NN'] \n", | |
"9 Positive_regulation trigger = [lemma='activation' & tag='NN'] \n", | |
"10 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
"11 Positive_regulation trigger = [lemma='induction' & tag='NN'] \n", | |
"12 Binding trigger = [lemma='binding' & tag='NN'] \n", | |
"13 Localization trigger = [lemma='secretion' & tag='NN'] \n", | |
"14 Gene_expression trigger = [lemma='express' & tag='VBN'] \n", | |
"15 Positive_regulation trigger = [lemma='activation' & tag='NN'] \n", | |
"16 Regulation trigger = [lemma='regulation' & tag='NN'] \n", | |
"17 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
"18 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
"19 Localization trigger = [lemma='translocation' & tag='NN'] \n", | |
"20 Phosphorylation trigger = [lemma='phosphorylation' & tag='NN'] \n", | |
"21 Positive_regulation trigger = [lemma='induction' & tag='NN'] \n", | |
"22 Positive_regulation trigger = [lemma='activation' & tag='NN'] \n", | |
"23 Gene_expression trigger = [lemma='production' & tag='NN'] \n", | |
"24 Positive_regulation trigger = [lemma='induce' & tag='VBD'] \n", | |
"25 Regulation trigger = [lemma='regulate' & tag='VBN'] \n", | |
"26 Positive_regulation trigger = [lemma='induction' & tag='NN'] \n", | |
"27 Negative_regulation trigger = [lemma='inhibit' & tag='VBD'] \n", | |
"28 Gene_expression trigger = [lemma='overexpression' & tag='NN'] \n", | |
"29 Protein_catabolism trigger = [lemma='degradation' & tag='NN'] \n", | |
"... ... ... \n", | |
"4996 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
"4997 Transcription trigger = [lemma='mrna' & tag='NN'] [lemma='le... \n", | |
"4998 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
"4999 Transcription trigger = [lemma='transcriptional' & tag='JJ']... \n", | |
"5000 Transcription trigger = [lemma='transcriptional' & tag='JJ'] \n", | |
"5001 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
"5002 Transcription trigger = [lemma='at' & tag='IN'] [lemma='the'... \n", | |
"5003 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
"5004 Transcription trigger = [lemma='transcript' & tag='NN'] [lem... \n", | |
"5005 Transcription trigger = [lemma='production' & tag='NN'] \n", | |
"5006 Transcription trigger = [lemma='production' & tag='NN'] \n", | |
"5007 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
"5008 Transcription trigger = [lemma='mrna' & tag='NN'] [lemma='ex... \n", | |
"5009 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
"5010 Transcription trigger = [lemma='transcript' & tag='NN'] \n", | |
"5011 Transcription trigger = [lemma='transcriptional' & tag='JJ'] \n", | |
"5012 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
"5013 Transcription trigger = [lemma='transcript' & tag='NN'] \n", | |
"5014 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
"5015 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
"5016 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
"5017 Transcription trigger = [lemma='concentration' & tag='NN'] \n", | |
"5018 Transcription trigger = [lemma='transcription' & tag='NN'] \n", | |
"5019 Transcription trigger = [lemma='level' & tag='NNS'] \n", | |
"5020 Transcription trigger = [lemma='expression' & tag='NN'] [lem... \n", | |
"5021 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
"5022 Transcription trigger = [lemma='induction' & tag='NN'] \n", | |
"5023 Transcription trigger = [lemma='level' & tag='NNS'] \n", | |
"5024 Transcription trigger = [lemma='expression' & tag='NN'] \n", | |
"5025 Transcription trigger = [lemma='level' & tag='NNS'] \n", | |
"\n", | |
" Trigger Tags Argument Argument Type \\\n", | |
"0 'NN' Theme Protein \n", | |
"1 'NN' Theme Protein \n", | |
"2 'NN' Theme Protein \n", | |
"3 'NN' Theme Protein \n", | |
"4 'NN' Theme Protein \n", | |
"5 'NN' Theme Protein \n", | |
"6 'NN' Site Entity \n", | |
"7 'VBD' Theme Gene_expression \n", | |
"8 'NN' Theme Protein \n", | |
"9 'NN' Theme Protein \n", | |
"10 'NN' Theme Protein \n", | |
"11 'NN' Theme Protein \n", | |
"12 'NN' Theme Protein \n", | |
"13 'NN' Theme Protein \n", | |
"14 'VBN' Theme Protein \n", | |
"15 'NN' Theme Protein \n", | |
"16 'NN' Theme Gene_expression \n", | |
"17 'NN' Theme Protein \n", | |
"18 'NN' Theme Protein \n", | |
"19 'NN' ToLoc Entity \n", | |
"20 'NN' Theme Protein \n", | |
"21 'NN' Theme Protein \n", | |
"22 'NN' Theme Protein \n", | |
"23 'NN' Theme Protein \n", | |
"24 'VBD' Cause Protein \n", | |
"25 'VBN' Theme Gene_expression \n", | |
"26 'NN' Theme Gene_expression \n", | |
"27 'VBD' Theme Positive_regulation \n", | |
"28 'NN' Theme Protein \n", | |
"29 'NN' Theme Protein \n", | |
"... ... ... ... \n", | |
"4996 'NN' Theme Protein \n", | |
"4997 'NN' 'NNS' Theme Protein \n", | |
"4998 'NN' Theme Protein \n", | |
"4999 'JJ' 'NN' Theme Protein \n", | |
"5000 'JJ' Theme Protein \n", | |
"5001 'NN' Theme Protein \n", | |
"5002 'IN' 'DT' 'NN' 'IN' 'NN' Theme Protein \n", | |
"5003 'NN' Theme Protein \n", | |
"5004 'NN' 'NNS' Theme Protein \n", | |
"5005 'NN' Theme Protein \n", | |
"5006 'NN' Theme Protein \n", | |
"5007 'NN' Theme Protein \n", | |
"5008 'NN' 'NN' Theme Protein \n", | |
"5009 'NN' Theme Protein \n", | |
"5010 'NN' Theme Protein \n", | |
"5011 'JJ' Theme Protein \n", | |
"5012 'NN' Theme Protein \n", | |
"5013 'NN' Theme Protein \n", | |
"5014 'NN' Theme Protein \n", | |
"5015 'NN' Theme Protein \n", | |
"5016 'NN' Theme Protein \n", | |
"5017 'NN' Theme Protein \n", | |
"5018 'NN' Theme Protein \n", | |
"5019 'NNS' Theme Protein \n", | |
"5020 'NN' 'NN' Theme Protein \n", | |
"5021 'NN' Theme Protein \n", | |
"5022 'NN' Theme Protein \n", | |
"5023 'NNS' Theme Protein \n", | |
"5024 'NN' Theme Protein \n", | |
"5025 'NNS' Theme Protein \n", | |
"\n", | |
" Path Path Length \\\n", | |
"0 >nn 1 \n", | |
"1 >prep_of 1 \n", | |
"2 >prep_of >nn 2 \n", | |
"3 >nn 1 \n", | |
"4 >nn 1 \n", | |
"5 >prep_of 1 \n", | |
"6 >nn 1 \n", | |
"7 >dobj 1 \n", | |
"8 >prep_of 1 \n", | |
"9 >prep_of >nn 2 \n", | |
"10 >prep_of >nn 2 \n", | |
"11 >nn 1 \n", | |
"12 >prep_of 1 \n", | |
"13 >nn 1 \n", | |
"14 >nsubjpass 1 \n", | |
"15 >nn 1 \n", | |
"16 >prep_of 1 \n", | |
"17 >nn 1 \n", | |
"18 >prep_of >nn 2 \n", | |
"19 >amod 1 \n", | |
"20 >nn 1 \n", | |
"21 >prep_of >nn 2 \n", | |
"22 >prep_of 1 \n", | |
"23 >prep_of 1 \n", | |
"24 >nsubj 1 \n", | |
"25 >nsubjpass 1 \n", | |
"26 >prep_of 1 \n", | |
"27 >dobj 1 \n", | |
"28 >prep_of 1 \n", | |
"29 >prep_of 1 \n", | |
"... ... ... \n", | |
"4996 >prep_of >dep 2 \n", | |
"4997 >prep_for >nn 2 \n", | |
"4998 <prep_with >nsubjpass >prep_of >prep_on >nn 5 \n", | |
"4999 <prep_at >nsubjpass >dep >nn 4 \n", | |
"5000 <amod >appos 2 \n", | |
"5001 <prep_of <dobj <xcomp >prep_including >nn 5 \n", | |
"5002 <prep_at >nsubj >nn 3 \n", | |
"5003 <dobj >prep_together_with >nn 3 \n", | |
"5004 >prep_of >nn 2 \n", | |
"5005 <prep_in <appos <nsubj 3 \n", | |
"5006 <dep >amod >dep 3 \n", | |
"5007 <conj_and >amod >prepc_without >xcomp 4 \n", | |
"5008 <prep_of >prep_of >appos 3 \n", | |
"5009 <appos 1 \n", | |
"5010 <nn <prep_with >nsubjpass 3 \n", | |
"5011 <amod <prep_at >prep_on 3 \n", | |
"5012 >conj_negcc >nn 2 \n", | |
"5013 >nn 1 \n", | |
"5014 >prep_of >prep_of >dep >appos 4 \n", | |
"5015 <dobj >iobj >appos 3 \n", | |
"5016 >conj_negcc >prep_of 2 \n", | |
"5017 >prep_of >nn 2 \n", | |
"5018 <conj_and >dep >xcomp 3 \n", | |
"5019 <conj_and 1 \n", | |
"5020 >prep_of >nn 2 \n", | |
"5021 <prep_to >nsubj >nn 3 \n", | |
"5022 <dep 1 \n", | |
"5023 <prep_in <prep_than <amod 3 \n", | |
"5024 <nn 1 \n", | |
"5025 >conj_or >nn 2 \n", | |
"\n", | |
" Pattern Frequency \n", | |
"0 382 \n", | |
"1 201 \n", | |
"2 122 \n", | |
"3 121 \n", | |
"4 91 \n", | |
"5 46 \n", | |
"6 45 \n", | |
"7 41 \n", | |
"8 39 \n", | |
"9 37 \n", | |
"10 37 \n", | |
"11 35 \n", | |
"12 33 \n", | |
"13 33 \n", | |
"14 32 \n", | |
"15 32 \n", | |
"16 31 \n", | |
"17 31 \n", | |
"18 31 \n", | |
"19 30 \n", | |
"20 30 \n", | |
"21 30 \n", | |
"22 30 \n", | |
"23 26 \n", | |
"24 26 \n", | |
"25 25 \n", | |
"26 24 \n", | |
"27 23 \n", | |
"28 22 \n", | |
"29 22 \n", | |
"... ... \n", | |
"4996 1 \n", | |
"4997 1 \n", | |
"4998 1 \n", | |
"4999 1 \n", | |
"5000 1 \n", | |
"5001 1 \n", | |
"5002 1 \n", | |
"5003 1 \n", | |
"5004 1 \n", | |
"5005 1 \n", | |
"5006 1 \n", | |
"5007 1 \n", | |
"5008 1 \n", | |
"5009 1 \n", | |
"5010 1 \n", | |
"5011 1 \n", | |
"5012 1 \n", | |
"5013 1 \n", | |
"5014 1 \n", | |
"5015 1 \n", | |
"5016 1 \n", | |
"5017 1 \n", | |
"5018 1 \n", | |
"5019 1 \n", | |
"5020 1 \n", | |
"5021 1 \n", | |
"5022 1 \n", | |
"5023 1 \n", | |
"5024 1 \n", | |
"5025 1 \n", | |
"\n", | |
"[5026 rows x 8 columns]" | |
] | |
}, | |
"execution_count": 16, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"data3" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 19, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [], | |
"source": [ | |
"s1 = pd.Series(np.arange(5,10))" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 20, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"0 5\n", | |
"1 6\n", | |
"2 7\n", | |
"3 8\n", | |
"4 9\n", | |
"dtype: int64" | |
] | |
}, | |
"execution_count": 20, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"s1" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 21, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"255" | |
] | |
}, | |
"execution_count": 21, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"s1.dot(s1)" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 22, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"midx = pd.MultiIndex(levels=[['one', 'two'], ['x','y']], labels=[[1,1,0,0],[1,0,1,0]])" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 23, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"df = pd.DataFrame({'A' : [1, 2, 3, 4], 'B': [5, 6, 7, 8]}, index=midx)" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 24, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/html": [ | |
"<div>\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th></th>\n", | |
" <th>A</th>\n", | |
" <th>B</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th rowspan=\"2\" valign=\"top\">two</th>\n", | |
" <th>y</th>\n", | |
" <td>1</td>\n", | |
" <td>5</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>x</th>\n", | |
" <td>2</td>\n", | |
" <td>6</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th rowspan=\"2\" valign=\"top\">one</th>\n", | |
" <th>y</th>\n", | |
" <td>3</td>\n", | |
" <td>7</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>x</th>\n", | |
" <td>4</td>\n", | |
" <td>8</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"</div>" | |
], | |
"text/plain": [ | |
" A B\n", | |
"two y 1 5\n", | |
" x 2 6\n", | |
"one y 3 7\n", | |
" x 4 8" | |
] | |
}, | |
"execution_count": 24, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"df" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 25, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"paneldf = df.to_panel()" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 26, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"<class 'pandas.core.panel.Panel'>\n", | |
"Dimensions: 2 (items) x 2 (major_axis) x 2 (minor_axis)\n", | |
"Items axis: A to B\n", | |
"Major_axis axis: one to two\n", | |
"Minor_axis axis: x to y" | |
] | |
}, | |
"execution_count": 26, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"paneldf" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 27, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/html": [ | |
"<div>\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th>x</th>\n", | |
" <th>y</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th>one</th>\n", | |
" <td>4</td>\n", | |
" <td>3</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>two</th>\n", | |
" <td>2</td>\n", | |
" <td>1</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"</div>" | |
], | |
"text/plain": [ | |
" x y\n", | |
"one 4 3\n", | |
"two 2 1" | |
] | |
}, | |
"execution_count": 27, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"paneldf['A']" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": null, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [] | |
} | |
], | |
"metadata": { | |
"kernelspec": { | |
"display_name": "Python 3", | |
"language": "python", | |
"name": "python3" | |
}, | |
"language_info": { | |
"codemirror_mode": { | |
"name": "ipython", | |
"version": 3 | |
}, | |
"file_extension": ".py", | |
"mimetype": "text/x-python", | |
"name": "python", | |
"nbconvert_exporter": "python", | |
"pygments_lexer": "ipython3", | |
"version": "3.6.0" | |
} | |
}, | |
"nbformat": 4, | |
"nbformat_minor": 2 | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment