diff --git a/src/explore.ipynb b/src/explore.ipynb index b9015d4d380de17e9deec8087c810fde68c0bf7f..3ab417adbfe8b8520dbf4c877296e47a7b1b0ef3 100644 --- a/src/explore.ipynb +++ b/src/explore.ipynb @@ -996,7 +996,7 @@ " <td>disallow</td>\n", " <td>1165</td>\n", " <td>Prevent indexing userspaces by newer users</td>\n", - " <td>wiki_policy?</td>\n", + " <td>wiki_policy, good_faith, seo</td>\n", " <td>https://en.wikipedia.org/wiki/Wikipedia:Contro...</td>\n", " </tr>\n", " <tr>\n", @@ -1222,7 +1222,7 @@ "158 vandalism?, spam?, sockpuppetry? \n", "171 vandalism \n", "234 bad_style?, misc? \n", - "239 wiki_policy? \n", + "239 wiki_policy, good_faith, seo \n", "268 vandalism? \n", "271 good_faith? \n", "302 vandalism \n", @@ -1303,182 +1303,182 @@ " <tbody>\n", " <tr>\n", " <th>0</th>\n", - " <td>201903</td>\n", - " <td>log</td>\n", + " <td>2019-03-01</td>\n", + " <td>log only</td>\n", " <td>14103</td>\n", " </tr>\n", " <tr>\n", " <th>1</th>\n", - " <td>201903</td>\n", + " <td>2019-03-01</td>\n", " <td>disallow</td>\n", " <td>9430</td>\n", " </tr>\n", " <tr>\n", " <th>2</th>\n", - " <td>201903</td>\n", + " <td>2019-03-01</td>\n", " <td>tag</td>\n", " <td>13283</td>\n", " </tr>\n", " <tr>\n", " <th>3</th>\n", - " <td>201903</td>\n", + " <td>2019-03-01</td>\n", " <td>warn</td>\n", " <td>6001</td>\n", " </tr>\n", " <tr>\n", " <th>4</th>\n", - " <td>201902</td>\n", - " <td>log</td>\n", + " <td>2019-02-01</td>\n", + " <td>log only</td>\n", " <td>73101</td>\n", " </tr>\n", " <tr>\n", " <th>5</th>\n", - " <td>201902</td>\n", + " <td>2019-02-01</td>\n", " <td>disallow</td>\n", " <td>47242</td>\n", " </tr>\n", " <tr>\n", " <th>6</th>\n", - " <td>201902</td>\n", + " <td>2019-02-01</td>\n", " <td>disallow,tag</td>\n", " <td>8</td>\n", " </tr>\n", " <tr>\n", " <th>7</th>\n", - " <td>201902</td>\n", + " <td>2019-02-01</td>\n", " <td>tag</td>\n", " <td>81279</td>\n", " </tr>\n", " <tr>\n", " <th>8</th>\n", - " <td>201902</td>\n", + " <td>2019-02-01</td>\n", " <td>warn</td>\n", " <td>34976</td>\n", " </tr>\n", " <tr>\n", " <th>9</th>\n", - " <td>201901</td>\n", - " <td>log</td>\n", + " <td>2019-01-01</td>\n", + " <td>log only</td>\n", " <td>81745</td>\n", " </tr>\n", " <tr>\n", " <th>10</th>\n", - " <td>201901</td>\n", + " <td>2019-01-01</td>\n", " <td>disallow</td>\n", " <td>44370</td>\n", " </tr>\n", " <tr>\n", " <th>11</th>\n", - " <td>201901</td>\n", + " <td>2019-01-01</td>\n", " <td>disallow,tag</td>\n", " <td>8</td>\n", " </tr>\n", " <tr>\n", " <th>12</th>\n", - " <td>201901</td>\n", + " <td>2019-01-01</td>\n", " <td>tag</td>\n", " <td>89263</td>\n", " </tr>\n", " <tr>\n", " <th>13</th>\n", - " <td>201901</td>\n", + " <td>2019-01-01</td>\n", " <td>warn</td>\n", " <td>37282</td>\n", " </tr>\n", " <tr>\n", " <th>14</th>\n", - " <td>201812</td>\n", - " <td>log</td>\n", + " <td>2018-12-01</td>\n", + " <td>log only</td>\n", " <td>83958</td>\n", " </tr>\n", " <tr>\n", " <th>15</th>\n", - " <td>201812</td>\n", + " <td>2018-12-01</td>\n", " <td>disallow</td>\n", " <td>33417</td>\n", " </tr>\n", " <tr>\n", " <th>16</th>\n", - " <td>201812</td>\n", + " <td>2018-12-01</td>\n", " <td>disallow,tag</td>\n", " <td>6</td>\n", " </tr>\n", " <tr>\n", " <th>17</th>\n", - " <td>201812</td>\n", + " <td>2018-12-01</td>\n", " <td>tag</td>\n", " <td>76257</td>\n", " </tr>\n", " <tr>\n", " <th>18</th>\n", - " <td>201812</td>\n", + " <td>2018-12-01</td>\n", " <td>warn</td>\n", " <td>32649</td>\n", " </tr>\n", " <tr>\n", " <th>19</th>\n", - " <td>201811</td>\n", - " <td>log</td>\n", + " <td>2018-11-01</td>\n", + " <td>log only</td>\n", " <td>83866</td>\n", " </tr>\n", " <tr>\n", " <th>20</th>\n", - " <td>201811</td>\n", + " <td>2018-11-01</td>\n", " <td>disallow</td>\n", " <td>43244</td>\n", " </tr>\n", " <tr>\n", " <th>21</th>\n", - " <td>201811</td>\n", + " <td>2018-11-01</td>\n", " <td>disallow,tag</td>\n", " <td>5</td>\n", " </tr>\n", " <tr>\n", " <th>22</th>\n", - " <td>201811</td>\n", + " <td>2018-11-01</td>\n", " <td>tag</td>\n", " <td>86062</td>\n", " </tr>\n", " <tr>\n", " <th>23</th>\n", - " <td>201811</td>\n", + " <td>2018-11-01</td>\n", " <td>warn</td>\n", " <td>40056</td>\n", " </tr>\n", " <tr>\n", " <th>24</th>\n", - " <td>201810</td>\n", - " <td>log</td>\n", + " <td>2018-10-01</td>\n", + " <td>log only</td>\n", " <td>87070</td>\n", " </tr>\n", " <tr>\n", " <th>25</th>\n", - " <td>201810</td>\n", + " <td>2018-10-01</td>\n", " <td>disallow</td>\n", " <td>38163</td>\n", " </tr>\n", " <tr>\n", " <th>26</th>\n", - " <td>201810</td>\n", + " <td>2018-10-01</td>\n", " <td>disallow,tag</td>\n", " <td>8</td>\n", " </tr>\n", " <tr>\n", " <th>27</th>\n", - " <td>201810</td>\n", + " <td>2018-10-01</td>\n", " <td>tag</td>\n", " <td>86140</td>\n", " </tr>\n", " <tr>\n", " <th>28</th>\n", - " <td>201810</td>\n", + " <td>2018-10-01</td>\n", " <td>warn</td>\n", " <td>45057</td>\n", " </tr>\n", " <tr>\n", " <th>29</th>\n", - " <td>201809</td>\n", - " <td>log</td>\n", + " <td>2018-09-01</td>\n", + " <td>log only</td>\n", " <td>88941</td>\n", " </tr>\n", " <tr>\n", @@ -1489,181 +1489,181 @@ " </tr>\n", " <tr>\n", " <th>547</th>\n", - " <td>200908</td>\n", + " <td>2009-08-01</td>\n", " <td>tag</td>\n", " <td>89814</td>\n", " </tr>\n", " <tr>\n", " <th>548</th>\n", - " <td>200908</td>\n", + " <td>2009-08-01</td>\n", " <td>warn</td>\n", " <td>53021</td>\n", " </tr>\n", " <tr>\n", " <th>549</th>\n", - " <td>200907</td>\n", - " <td>log</td>\n", + " <td>2009-07-01</td>\n", + " <td>log only</td>\n", " <td>15288</td>\n", " </tr>\n", " <tr>\n", " <th>550</th>\n", - " <td>200907</td>\n", + " <td>2009-07-01</td>\n", " <td>blockautopromote</td>\n", " <td>37</td>\n", " </tr>\n", " <tr>\n", " <th>551</th>\n", - " <td>200907</td>\n", + " <td>2009-07-01</td>\n", " <td>disallow</td>\n", " <td>4037</td>\n", " </tr>\n", " <tr>\n", " <th>552</th>\n", - " <td>200907</td>\n", + " <td>2009-07-01</td>\n", " <td>tag</td>\n", " <td>89516</td>\n", " </tr>\n", " <tr>\n", " <th>553</th>\n", - " <td>200907</td>\n", + " <td>2009-07-01</td>\n", " <td>warn</td>\n", " <td>52115</td>\n", " </tr>\n", " <tr>\n", " <th>554</th>\n", - " <td>200906</td>\n", - " <td>log</td>\n", + " <td>2009-06-01</td>\n", + " <td>log only</td>\n", " <td>13096</td>\n", " </tr>\n", " <tr>\n", " <th>555</th>\n", - " <td>200906</td>\n", + " <td>2009-06-01</td>\n", " <td>blockautopromote</td>\n", " <td>35</td>\n", " </tr>\n", " <tr>\n", " <th>556</th>\n", - " <td>200906</td>\n", + " <td>2009-06-01</td>\n", " <td>disallow</td>\n", " <td>4102</td>\n", " </tr>\n", " <tr>\n", " <th>557</th>\n", - " <td>200906</td>\n", + " <td>2009-06-01</td>\n", " <td>tag</td>\n", " <td>96801</td>\n", " </tr>\n", " <tr>\n", " <th>558</th>\n", - " <td>200906</td>\n", + " <td>2009-06-01</td>\n", " <td>warn</td>\n", " <td>65142</td>\n", " </tr>\n", " <tr>\n", " <th>559</th>\n", - " <td>200905</td>\n", - " <td>log</td>\n", + " <td>2009-05-01</td>\n", + " <td>log only</td>\n", " <td>56138</td>\n", " </tr>\n", " <tr>\n", " <th>560</th>\n", - " <td>200905</td>\n", + " <td>2009-05-01</td>\n", " <td>blockautopromote</td>\n", " <td>42</td>\n", " </tr>\n", " <tr>\n", " <th>561</th>\n", - " <td>200905</td>\n", + " <td>2009-05-01</td>\n", " <td>disallow</td>\n", " <td>4750</td>\n", " </tr>\n", " <tr>\n", " <th>562</th>\n", - " <td>200905</td>\n", + " <td>2009-05-01</td>\n", " <td>disallow,tag</td>\n", " <td>11</td>\n", " </tr>\n", " <tr>\n", " <th>563</th>\n", - " <td>200905</td>\n", + " <td>2009-05-01</td>\n", " <td>tag</td>\n", " <td>63420</td>\n", " </tr>\n", " <tr>\n", " <th>564</th>\n", - " <td>200905</td>\n", + " <td>2009-05-01</td>\n", " <td>warn</td>\n", " <td>87518</td>\n", " </tr>\n", " <tr>\n", " <th>565</th>\n", - " <td>200904</td>\n", - " <td>log</td>\n", + " <td>2009-04-01</td>\n", + " <td>log only</td>\n", " <td>52076</td>\n", " </tr>\n", " <tr>\n", " <th>566</th>\n", - " <td>200904</td>\n", + " <td>2009-04-01</td>\n", " <td>blockautopromote</td>\n", " <td>118</td>\n", " </tr>\n", " <tr>\n", " <th>567</th>\n", - " <td>200904</td>\n", + " <td>2009-04-01</td>\n", " <td>disallow</td>\n", " <td>4637</td>\n", " </tr>\n", " <tr>\n", " <th>568</th>\n", - " <td>200904</td>\n", + " <td>2009-04-01</td>\n", " <td>disallow,tag</td>\n", " <td>10</td>\n", " </tr>\n", " <tr>\n", " <th>569</th>\n", - " <td>200904</td>\n", + " <td>2009-04-01</td>\n", " <td>tag</td>\n", " <td>33447</td>\n", " </tr>\n", " <tr>\n", " <th>570</th>\n", - " <td>200904</td>\n", + " <td>2009-04-01</td>\n", " <td>warn</td>\n", " <td>88864</td>\n", " </tr>\n", " <tr>\n", " <th>571</th>\n", - " <td>200903</td>\n", - " <td>log</td>\n", + " <td>2009-03-01</td>\n", + " <td>log only</td>\n", " <td>24757</td>\n", " </tr>\n", " <tr>\n", " <th>572</th>\n", - " <td>200903</td>\n", + " <td>2009-03-01</td>\n", " <td>blockautopromote</td>\n", " <td>272</td>\n", " </tr>\n", " <tr>\n", " <th>573</th>\n", - " <td>200903</td>\n", + " <td>2009-03-01</td>\n", " <td>blockautopromote,tag</td>\n", " <td>2</td>\n", " </tr>\n", " <tr>\n", " <th>574</th>\n", - " <td>200903</td>\n", + " <td>2009-03-01</td>\n", " <td>disallow</td>\n", " <td>2807</td>\n", " </tr>\n", " <tr>\n", " <th>575</th>\n", - " <td>200903</td>\n", + " <td>2009-03-01</td>\n", " <td>tag</td>\n", " <td>17865</td>\n", " </tr>\n", " <tr>\n", " <th>576</th>\n", - " <td>200903</td>\n", + " <td>2009-03-01</td>\n", " <td>warn</td>\n", " <td>53305</td>\n", " </tr>\n", @@ -1673,73 +1673,73 @@ "</div>" ], "text/plain": [ - " LogMonth FilterActions Freq\n", - "0 201903 log 14103\n", - "1 201903 disallow 9430\n", - "2 201903 tag 13283\n", - "3 201903 warn 6001\n", - "4 201902 log 73101\n", - "5 201902 disallow 47242\n", - "6 201902 disallow,tag 8\n", - "7 201902 tag 81279\n", - "8 201902 warn 34976\n", - "9 201901 log 81745\n", - "10 201901 disallow 44370\n", - "11 201901 disallow,tag 8\n", - "12 201901 tag 89263\n", - "13 201901 warn 37282\n", - "14 201812 log 83958\n", - "15 201812 disallow 33417\n", - "16 201812 disallow,tag 6\n", - "17 201812 tag 76257\n", - "18 201812 warn 32649\n", - "19 201811 log 83866\n", - "20 201811 disallow 43244\n", - "21 201811 disallow,tag 5\n", - "22 201811 tag 86062\n", - "23 201811 warn 40056\n", - "24 201810 log 87070\n", - "25 201810 disallow 38163\n", - "26 201810 disallow,tag 8\n", - "27 201810 tag 86140\n", - "28 201810 warn 45057\n", - "29 201809 log 88941\n", - ".. ... ... ...\n", - "547 200908 tag 89814\n", - "548 200908 warn 53021\n", - "549 200907 log 15288\n", - "550 200907 blockautopromote 37\n", - "551 200907 disallow 4037\n", - "552 200907 tag 89516\n", - "553 200907 warn 52115\n", - "554 200906 log 13096\n", - "555 200906 blockautopromote 35\n", - "556 200906 disallow 4102\n", - "557 200906 tag 96801\n", - "558 200906 warn 65142\n", - "559 200905 log 56138\n", - "560 200905 blockautopromote 42\n", - "561 200905 disallow 4750\n", - "562 200905 disallow,tag 11\n", - "563 200905 tag 63420\n", - "564 200905 warn 87518\n", - "565 200904 log 52076\n", - "566 200904 blockautopromote 118\n", - "567 200904 disallow 4637\n", - "568 200904 disallow,tag 10\n", - "569 200904 tag 33447\n", - "570 200904 warn 88864\n", - "571 200903 log 24757\n", - "572 200903 blockautopromote 272\n", - "573 200903 blockautopromote,tag 2\n", - "574 200903 disallow 2807\n", - "575 200903 tag 17865\n", - "576 200903 warn 53305\n", + " LogMonth FilterActions Freq\n", + "0 2019-03-01 log only 14103\n", + "1 2019-03-01 disallow 9430\n", + "2 2019-03-01 tag 13283\n", + "3 2019-03-01 warn 6001\n", + "4 2019-02-01 log only 73101\n", + "5 2019-02-01 disallow 47242\n", + "6 2019-02-01 disallow,tag 8\n", + "7 2019-02-01 tag 81279\n", + "8 2019-02-01 warn 34976\n", + "9 2019-01-01 log only 81745\n", + "10 2019-01-01 disallow 44370\n", + "11 2019-01-01 disallow,tag 8\n", + "12 2019-01-01 tag 89263\n", + "13 2019-01-01 warn 37282\n", + "14 2018-12-01 log only 83958\n", + "15 2018-12-01 disallow 33417\n", + "16 2018-12-01 disallow,tag 6\n", + "17 2018-12-01 tag 76257\n", + "18 2018-12-01 warn 32649\n", + "19 2018-11-01 log only 83866\n", + "20 2018-11-01 disallow 43244\n", + "21 2018-11-01 disallow,tag 5\n", + "22 2018-11-01 tag 86062\n", + "23 2018-11-01 warn 40056\n", + "24 2018-10-01 log only 87070\n", + "25 2018-10-01 disallow 38163\n", + "26 2018-10-01 disallow,tag 8\n", + "27 2018-10-01 tag 86140\n", + "28 2018-10-01 warn 45057\n", + "29 2018-09-01 log only 88941\n", + ".. ... ... ...\n", + "547 2009-08-01 tag 89814\n", + "548 2009-08-01 warn 53021\n", + "549 2009-07-01 log only 15288\n", + "550 2009-07-01 blockautopromote 37\n", + "551 2009-07-01 disallow 4037\n", + "552 2009-07-01 tag 89516\n", + "553 2009-07-01 warn 52115\n", + "554 2009-06-01 log only 13096\n", + "555 2009-06-01 blockautopromote 35\n", + "556 2009-06-01 disallow 4102\n", + "557 2009-06-01 tag 96801\n", + "558 2009-06-01 warn 65142\n", + "559 2009-05-01 log only 56138\n", + "560 2009-05-01 blockautopromote 42\n", + "561 2009-05-01 disallow 4750\n", + "562 2009-05-01 disallow,tag 11\n", + "563 2009-05-01 tag 63420\n", + "564 2009-05-01 warn 87518\n", + "565 2009-04-01 log only 52076\n", + "566 2009-04-01 blockautopromote 118\n", + "567 2009-04-01 disallow 4637\n", + "568 2009-04-01 disallow,tag 10\n", + "569 2009-04-01 tag 33447\n", + "570 2009-04-01 warn 88864\n", + "571 2009-03-01 log only 24757\n", + "572 2009-03-01 blockautopromote 272\n", + "573 2009-03-01 blockautopromote,tag 2\n", + "574 2009-03-01 disallow 2807\n", + "575 2009-03-01 tag 17865\n", + "576 2009-03-01 warn 53305\n", "\n", "[577 rows x 3 columns]" ] }, - "execution_count": 3, + "execution_count": 22, "metadata": {}, "output_type": "execute_result" }