jimregan committed on
Commit
c62b96f
·
1 Parent(s): c6b1f01
kaggle-notebooks/wer/AWB_WER_plots.ipynb ADDED
@@ -0,0 +1,335 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "nbformat": 4,
3
+ "nbformat_minor": 0,
4
+ "metadata": {
5
+ "colab": {
6
+ "name": "AWB WER plots.ipynb",
7
+ "provenance": [],
8
+ "collapsed_sections": []
9
+ },
10
+ "kernelspec": {
11
+ "name": "python3",
12
+ "display_name": "Python 3"
13
+ },
14
+ "language_info": {
15
+ "name": "python"
16
+ }
17
+ },
18
+ "cells": [
19
+ {
20
+ "cell_type": "code",
21
+ "execution_count": 1,
22
+ "metadata": {
23
+ "id": "vK9KbVT8ClG0"
24
+ },
25
+ "outputs": [],
26
+ "source": [
27
+ "import matplotlib.pyplot as plt\n",
28
+ "import pandas as pd"
29
+ ]
30
+ },
31
+ {
32
+ "cell_type": "code",
33
+ "source": [
34
+ "MINS_DATA = \"\"\"\n",
35
+ "5\t0.057692307692307696\n",
36
+ "10\t0.057692307692307696\n",
37
+ "15\t0.05576923076923077\n",
38
+ "20\t0.046153846153846156\n",
39
+ "25\t0.038461538461538464\n",
40
+ "30\t0.046153846153846156\n",
41
+ "35\t0.03653846153846154\n",
42
+ "40\t0.03653846153846154\n",
43
+ "45\t0.025\n",
44
+ "50\t0.03653846153846154\n",
45
+ "55\t0.026923076923076925\n",
46
+ "60\t0.032692307692307694\n",
47
+ "\"\"\""
48
+ ],
49
+ "metadata": {
50
+ "id": "xTj5ZZWmEDoB"
51
+ },
52
+ "execution_count": 2,
53
+ "outputs": []
54
+ },
55
+ {
56
+ "cell_type": "code",
57
+ "source": [
58
+ "mins = []\n",
59
+ "wer = []\n",
60
+ "for line in MINS_DATA.split(\"\\n\"):\n",
61
+ " if \"\\t\" in line:\n",
62
+ " parts = line.split(\"\\t\")\n",
63
+ " mins.append(int(parts[0]))\n",
64
+ " wer.append(float(parts[1]) * 100)"
65
+ ],
66
+ "metadata": {
67
+ "id": "cbSr-TOTNy6m"
68
+ },
69
+ "execution_count": 3,
70
+ "outputs": []
71
+ },
72
+ {
73
+ "cell_type": "code",
74
+ "source": [
75
+ "pd.options.display.float_format = '{:,.2f}'.format\n",
76
+ "df = pd.DataFrame(data={\"Minutes\": mins, \"WER\": wer})"
77
+ ],
78
+ "metadata": {
79
+ "id": "F6pLJCGFN5e6"
80
+ },
81
+ "execution_count": 4,
82
+ "outputs": []
83
+ },
84
+ {
85
+ "cell_type": "code",
86
+ "source": [
87
+ "df"
88
+ ],
89
+ "metadata": {
90
+ "colab": {
91
+ "base_uri": "https://localhost:8080/",
92
+ "height": 425
93
+ },
94
+ "id": "saY52xevV9zo",
95
+ "outputId": "f3e8eb1c-b664-4949-c3df-b8dc9d5df5ac"
96
+ },
97
+ "execution_count": 5,
98
+ "outputs": [
99
+ {
100
+ "output_type": "execute_result",
101
+ "data": {
102
+ "text/plain": [
103
+ " Minutes WER\n",
104
+ "0 5 5.77\n",
105
+ "1 10 5.77\n",
106
+ "2 15 5.58\n",
107
+ "3 20 4.62\n",
108
+ "4 25 3.85\n",
109
+ "5 30 4.62\n",
110
+ "6 35 3.65\n",
111
+ "7 40 3.65\n",
112
+ "8 45 2.50\n",
113
+ "9 50 3.65\n",
114
+ "10 55 2.69\n",
115
+ "11 60 3.27"
116
+ ],
117
+ "text/html": [
118
+ "\n",
119
+ " <div id=\"df-9390132b-c2ff-4e3b-9528-b03b74f0357a\">\n",
120
+ " <div class=\"colab-df-container\">\n",
121
+ " <div>\n",
122
+ "<style scoped>\n",
123
+ " .dataframe tbody tr th:only-of-type {\n",
124
+ " vertical-align: middle;\n",
125
+ " }\n",
126
+ "\n",
127
+ " .dataframe tbody tr th {\n",
128
+ " vertical-align: top;\n",
129
+ " }\n",
130
+ "\n",
131
+ " .dataframe thead th {\n",
132
+ " text-align: right;\n",
133
+ " }\n",
134
+ "</style>\n",
135
+ "<table border=\"1\" class=\"dataframe\">\n",
136
+ " <thead>\n",
137
+ " <tr style=\"text-align: right;\">\n",
138
+ " <th></th>\n",
139
+ " <th>Minutes</th>\n",
140
+ " <th>WER</th>\n",
141
+ " </tr>\n",
142
+ " </thead>\n",
143
+ " <tbody>\n",
144
+ " <tr>\n",
145
+ " <th>0</th>\n",
146
+ " <td>5</td>\n",
147
+ " <td>5.77</td>\n",
148
+ " </tr>\n",
149
+ " <tr>\n",
150
+ " <th>1</th>\n",
151
+ " <td>10</td>\n",
152
+ " <td>5.77</td>\n",
153
+ " </tr>\n",
154
+ " <tr>\n",
155
+ " <th>2</th>\n",
156
+ " <td>15</td>\n",
157
+ " <td>5.58</td>\n",
158
+ " </tr>\n",
159
+ " <tr>\n",
160
+ " <th>3</th>\n",
161
+ " <td>20</td>\n",
162
+ " <td>4.62</td>\n",
163
+ " </tr>\n",
164
+ " <tr>\n",
165
+ " <th>4</th>\n",
166
+ " <td>25</td>\n",
167
+ " <td>3.85</td>\n",
168
+ " </tr>\n",
169
+ " <tr>\n",
170
+ " <th>5</th>\n",
171
+ " <td>30</td>\n",
172
+ " <td>4.62</td>\n",
173
+ " </tr>\n",
174
+ " <tr>\n",
175
+ " <th>6</th>\n",
176
+ " <td>35</td>\n",
177
+ " <td>3.65</td>\n",
178
+ " </tr>\n",
179
+ " <tr>\n",
180
+ " <th>7</th>\n",
181
+ " <td>40</td>\n",
182
+ " <td>3.65</td>\n",
183
+ " </tr>\n",
184
+ " <tr>\n",
185
+ " <th>8</th>\n",
186
+ " <td>45</td>\n",
187
+ " <td>2.50</td>\n",
188
+ " </tr>\n",
189
+ " <tr>\n",
190
+ " <th>9</th>\n",
191
+ " <td>50</td>\n",
192
+ " <td>3.65</td>\n",
193
+ " </tr>\n",
194
+ " <tr>\n",
195
+ " <th>10</th>\n",
196
+ " <td>55</td>\n",
197
+ " <td>2.69</td>\n",
198
+ " </tr>\n",
199
+ " <tr>\n",
200
+ " <th>11</th>\n",
201
+ " <td>60</td>\n",
202
+ " <td>3.27</td>\n",
203
+ " </tr>\n",
204
+ " </tbody>\n",
205
+ "</table>\n",
206
+ "</div>\n",
207
+ " <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-9390132b-c2ff-4e3b-9528-b03b74f0357a')\"\n",
208
+ " title=\"Convert this dataframe to an interactive table.\"\n",
209
+ " style=\"display:none;\">\n",
210
+ " \n",
211
+ " <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
212
+ " width=\"24px\">\n",
213
+ " <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
214
+ " <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
215
+ " </svg>\n",
216
+ " </button>\n",
217
+ " \n",
218
+ " <style>\n",
219
+ " .colab-df-container {\n",
220
+ " display:flex;\n",
221
+ " flex-wrap:wrap;\n",
222
+ " gap: 12px;\n",
223
+ " }\n",
224
+ "\n",
225
+ " .colab-df-convert {\n",
226
+ " background-color: #E8F0FE;\n",
227
+ " border: none;\n",
228
+ " border-radius: 50%;\n",
229
+ " cursor: pointer;\n",
230
+ " display: none;\n",
231
+ " fill: #1967D2;\n",
232
+ " height: 32px;\n",
233
+ " padding: 0 0 0 0;\n",
234
+ " width: 32px;\n",
235
+ " }\n",
236
+ "\n",
237
+ " .colab-df-convert:hover {\n",
238
+ " background-color: #E2EBFA;\n",
239
+ " box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
240
+ " fill: #174EA6;\n",
241
+ " }\n",
242
+ "\n",
243
+ " [theme=dark] .colab-df-convert {\n",
244
+ " background-color: #3B4455;\n",
245
+ " fill: #D2E3FC;\n",
246
+ " }\n",
247
+ "\n",
248
+ " [theme=dark] .colab-df-convert:hover {\n",
249
+ " background-color: #434B5C;\n",
250
+ " box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
251
+ " filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
252
+ " fill: #FFFFFF;\n",
253
+ " }\n",
254
+ " </style>\n",
255
+ "\n",
256
+ " <script>\n",
257
+ " const buttonEl =\n",
258
+ " document.querySelector('#df-9390132b-c2ff-4e3b-9528-b03b74f0357a button.colab-df-convert');\n",
259
+ " buttonEl.style.display =\n",
260
+ " google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
261
+ "\n",
262
+ " async function convertToInteractive(key) {\n",
263
+ " const element = document.querySelector('#df-9390132b-c2ff-4e3b-9528-b03b74f0357a');\n",
264
+ " const dataTable =\n",
265
+ " await google.colab.kernel.invokeFunction('convertToInteractive',\n",
266
+ " [key], {});\n",
267
+ " if (!dataTable) return;\n",
268
+ "\n",
269
+ " const docLinkHtml = 'Like what you see? Visit the ' +\n",
270
+ " '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
271
+ " + ' to learn more about interactive tables.';\n",
272
+ " element.innerHTML = '';\n",
273
+ " dataTable['output_type'] = 'display_data';\n",
274
+ " await google.colab.output.renderOutput(dataTable, element);\n",
275
+ " const docLink = document.createElement('div');\n",
276
+ " docLink.innerHTML = docLinkHtml;\n",
277
+ " element.appendChild(docLink);\n",
278
+ " }\n",
279
+ " </script>\n",
280
+ " </div>\n",
281
+ " </div>\n",
282
+ " "
283
+ ]
284
+ },
285
+ "metadata": {},
286
+ "execution_count": 5
287
+ }
288
+ ]
289
+ },
290
+ {
291
+ "cell_type": "code",
292
+ "source": [
293
+ "import numpy as np\n",
294
+ "ax = plt.gca()\n",
295
+ "ax.set_xticks(np.arange(5, 125, 5))\n",
296
+ "ax.set_xticklabels(labels=mins, minor=True)\n",
297
+ "\n",
298
+ "df.plot(kind='line', x='Minutes', y='WER', ax=ax)"
299
+ ],
300
+ "metadata": {
301
+ "colab": {
302
+ "base_uri": "https://localhost:8080/",
303
+ "height": 297
304
+ },
305
+ "id": "yxMFzpL4N9q3",
306
+ "outputId": "c4b04593-2e33-458f-8752-44fc1ba23830"
307
+ },
308
+ "execution_count": 7,
309
+ "outputs": [
310
+ {
311
+ "output_type": "execute_result",
312
+ "data": {
313
+ "text/plain": [
314
+ "<matplotlib.axes._subplots.AxesSubplot at 0x7f271c39dcd0>"
315
+ ]
316
+ },
317
+ "metadata": {},
318
+ "execution_count": 7
319
+ },
320
+ {
321
+ "output_type": "display_data",
322
+ "data": {
323
+ "text/plain": [
324
+ "<Figure size 432x288 with 1 Axes>"
325
+ ],
326
+ "image/png": "\n"
327
+ },
328
+ "metadata": {
329
+ "needs_background": "light"
330
+ }
331
+ }
332
+ ]
333
+ }
334
+ ]
335
+ }