diff --git a/thesis/2-Background.tex b/thesis/2-Background.tex index afc908fd073a11feb9dd5a6a08853fa60b7650f9..cc40e9bda04dc10abfcd1ec7f68e8ea4f8a3a5e4 100644 --- a/thesis/2-Background.tex +++ b/thesis/2-Background.tex @@ -56,20 +56,26 @@ examples of disruptive editing: "Rejects or ignores community input: resists moderation and/or requests for comment, continuing to edit in pursuit of a certain point despite an opposing consensus from impartial editors." -\section{Algorithmic quality-control mechanisms on Wikipedia} +\section{Quality-control mechanisms on Wikipedia} %Context Context of work: algorithmic quality-control mechanisms (bots, ORES, humans) -> filter? %TODO Literature review! Distinction filters/Bots: what tasks are handled by bots and what by filters (and why)? What difference does it make for admins? For users whose edits are being targeted? -\subsection{Bots} +socio-technical assemblages (see Geiger) + +\subsection{Humans} \subsection{Semi-automatic tools} +\subsection{Bots} \subsection{ORES} -\subsection{Humans} %\section{Harassment and bullying} +\section{Algorithmic Governance} + +maybe move it to edit filters chapter + \begin{itemize} \item Hier sollte enthalten sein, welche Anwendungen in diesem Bereich bereits existieren und warum bei diesen ein Defizit besteht. \item Falls genutzt, sollten hier die entsprechenden Algorithmen erläutert werden. diff --git a/thesis/4-Data.tex b/thesis/4-Data.tex deleted file mode 100644 index a4decf97af249384b0f86b40f4086402d02f37f7..0000000000000000000000000000000000000000 --- a/thesis/4-Data.tex +++ /dev/null @@ -1,123 +0,0 @@ -\chapter{Data} -\label{chap:Data} - -For the present analysis we have analysed EN Wikipedia's policies and guidelines on the one hand, and the database tables of the AbuseFilter extension on the other. - -The \emph{abuse\_filter} and \emph{abuse\_filter\_action} tables from \emph{enwiki\_p} were downloaded on 6.01.2019 via quarry~\footnote{\url{https://quarry.wmflabs.org/}}. 
-The complete files can be found in the repository for the present paper~\cite{github}. % TODO add a more specific link - -These tables, along with \emph{abuse\_filter\_log} and \emph{abuse\_filter\_history}, are created and used by the AbuseFilter MediaWiki extension~\cite{gerrit-abusefilter}. -Selected queries have been run against the \emph{abuse\_filter\_log} table as well. -Unfortunately, currently the \emph{abuse\_filter\_history} table is not exposed to the public due to security/privacy concerns~\cite{phabricator}. -We hope to be shortly able to access a view of this table in order to conduct historic inquirements. - -The schemas of these tables can be viewed in Figures~\ref{fig:db-schemas-af},~\ref{fig:db-schemas-afl},~\ref{fig:db-schemas-afh} and~\ref{fig:db-schemas-afa}. - -\begin{figure*} -\begin{verbatim} -abuse_filter -+--------------------+---------------------+------+-----+---------+----------------+ -| Field | Type | Null | Key | Default | Extra | -+--------------------+---------------------+------+-----+---------+----------------+ -| af_id | bigint(20) unsigned | NO | PRI | NULL | auto_increment | -| af_pattern | blob | NO | | NULL | | -| af_user | bigint(20) unsigned | NO | MUL | NULL | | -| af_user_text | varbinary(255) | NO | | NULL | | -| af_timestamp | binary(14) | NO | | NULL | | -| af_enabled | tinyint(1) | NO | | 1 | | -| af_comments | blob | YES | | NULL | | -| af_public_comments | tinyblob | YES | | NULL | | -| af_hidden | tinyint(1) | NO | | 0 | | -| af_hit_count | bigint(20) | NO | | 0 | | -| af_throttled | tinyint(1) | NO | | 0 | | -| af_deleted | tinyint(1) | NO | | 0 | | -| af_actions | varbinary(255) | NO | | | | -| af_global | tinyint(1) | NO | | 0 | | -| af_group | varbinary(64) | NO | MUL | default | | -+--------------------+---------------------+------+-----+---------+----------------+ -\end{verbatim} - \caption{abuse\_filter schema}~\label{fig:db-schemas-af} -\end{figure*} - -\begin{figure*} -\begin{verbatim} -abuse_filter_log 
-+------------------+---------------------+------+-----+---------+----------------+ -| Field | Type | Null | Key | Default | Extra | -+------------------+---------------------+------+-----+---------+----------------+ -| afl_id | bigint(20) unsigned | NO | PRI | NULL | auto_increment | -| afl_filter | varbinary(64) | NO | MUL | NULL | | -| afl_user | bigint(20) unsigned | NO | MUL | NULL | | -| afl_user_text | varbinary(255) | NO | | NULL | | -| afl_ip | varbinary(255) | NO | MUL | NULL | | -| afl_action | varbinary(255) | NO | | NULL | | -| afl_actions | varbinary(255) | NO | | NULL | | -| afl_var_dump | blob | NO | | NULL | | -| afl_timestamp | binary(14) | NO | MUL | NULL | | -| afl_namespace | tinyint(4) | NO | MUL | NULL | | -| afl_title | varbinary(255) | NO | | NULL | | -| afl_wiki | varbinary(64) | YES | MUL | NULL | | -| afl_deleted | tinyint(1) | NO | | 0 | | -| afl_patrolled_by | int(10) unsigned | YES | | NULL | | -| afl_rev_id | int(10) unsigned | YES | MUL | NULL | | -| afl_log_id | int(10) unsigned | YES | MUL | NULL | | -+------------------+---------------------+------+-----+---------+----------------+ -\end{verbatim} - \caption{abuse\_filter\_log schema}~\label{fig:db-schemas-afl} -\end{figure*} - -\begin{figure*} -\begin{verbatim} -abuse_filter_history -+---------------------+---------------------+------+-----+---------+----------------+ -| Field | Type | Null | Key | Default | Extra | -+---------------------+---------------------+------+-----+---------+----------------+ -| afh_id | bigint(20) unsigned | NO | PRI | NULL | auto_increment | -| afh_filter | bigint(20) unsigned | NO | MUL | NULL | | -| afh_user | bigint(20) unsigned | NO | MUL | NULL | | -| afh_user_text | varbinary(255) | NO | MUL | NULL | | -| afh_timestamp | binary(14) | NO | MUL | NULL | | -| afh_pattern | blob | NO | | NULL | | -| afh_comments | blob | NO | | NULL | | -| afh_flags | tinyblob | NO | | NULL | | -| afh_public_comments | tinyblob | YES | | NULL | | -| afh_actions | 
blob | YES | | NULL | | -| afh_deleted | tinyint(1) | NO | | 0 | | -| afh_changed_fields | varbinary(255) | NO | | | | -| afh_group | varbinary(64) | YES | | NULL | | -+---------------------+---------------------+------+-----+---------+----------------+ -\end{verbatim} - \caption{abuse\_filter\_history schema}~\label{fig:db-schemas-afh} -\end{figure*} - -\begin{figure*} -\begin{verbatim} -abuse_filter_action -+-----------------+---------------------+------+-----+---------+-------+ -| Field | Type | Null | Key | Default | Extra | -+-----------------+---------------------+------+-----+---------+-------+ -| afa_filter | bigint(20) unsigned | NO | PRI | NULL | | -| afa_consequence | varbinary(255) | NO | PRI | NULL | | -| afa_parameters | tinyblob | NO | | NULL | | -+-----------------+---------------------+------+-----+---------+-------+ -\end{verbatim} - \caption{abuse\_filter\_action schema}~\label{fig:db-schemas-afa} -\end{figure*} - -\begin{comment} -* Describe analysed filter data set - * How does it look like? : describe schema? -* What other data sources can I explore? - * Interview with filter managers? with admins? with new editors? - -vgl \cite{GeiHal2017} -iterative mixed method -combination of: -* quantitative methods: mining big data sets/computational social science -"begin with one or -more large (but often thin) datasets generated by a software platform, which has recorded digital -traces that users leave in interacting on that platform. Such researchers then seek to mine as much -signal and significance from these found datasets as they can at scale in order to answer a research -question" -* more traditional social science/qualitative methods, e.g. 
interviews, observations, experiments -\end{comment} diff --git a/thesis/5-Edit-Filters.tex b/thesis/4-Edit-Filters.tex similarity index 93% rename from thesis/5-Edit-Filters.tex rename to thesis/4-Edit-Filters.tex index d6b0b0687f976daaef75c9b997dd4f887f906ec2..d370a880e658db136fec4a560dda710619b59fcd 100644 --- a/thesis/5-Edit-Filters.tex +++ b/thesis/4-Edit-Filters.tex @@ -1,8 +1,37 @@ -\chapter{Edit Filters} +\chapter{Edit Filters as part of Wikipedia's socio-technical infrastructure} \label{chap:filters} +algorithmic governance?/socio-technical assemblage +* humans +* software +* tech. infrastructure + \section{Genesis} +\section{Data} + +The foundations for the present chapter lie in EN Wikipedia's policies and guidelines. +The following pages were analysed in depth: <insert pages here>. + +The following other pages looked interesting or related, but were left out, mainly because of insufficient time. +(Is there a better rationale for why I looked at these specific pages, while leaving these other pages for later?) + +* for the edit filter chapter: which pages have I studied and which I haven't (why I limited the choice there? it's not possible to study everything, but study the things I study, well!) +(or should this go to limitations?) + +\begin{comment} +vgl \cite{GeiHal2017} +iterative mixed method +combination of: +* quantitative methods: mining big data sets/computational social science +"begin with one or +more large (but often thin) datasets generated by a software platform, which has recorded digital +traces that users leave in interacting on that platform. Such researchers then seek to mine as much +signal and significance from these found datasets as they can at scale in order to answer a research +question" +* more traditional social science/qualitative methods, e.g. 
interviews, observations, experiments +\end{comment} + \section{Definition} According to EN Wikipedia's own definition, an edit filter is ``a tool that allows editors in the edit filter manager group to set controls mainly[1] to address common patterns of harmful editing. @@ -88,8 +117,10 @@ Further down on the page it is clarified that it's administrators who can assign If editors wish to be given this permission, they can hone and prove their skills by helping with requested edit filters and false positives~\cite{Wikipedia:EditFilter}. The formal process for requesting the \emph{abusefilter-modify} permission is to raise it to the edit filter noticeboard~\footnote{\url{https://en.wikipedia.org/wiki/Wikipedia:Edit_filter_noticeboard}}. +%TODO who can raise the issue to the noticeboard? A discussion is held there, usually for 7 days, before a decision is reached~\cite{Wikipedia:EditFilter}. + \begin{comment} \url{https://en.wikipedia.org/wiki/Wikipedia:Edit_filter} "The assignment of the edit filter manager user right to non-admins is highly restricted. It should only be requested by and given to highly trusted users, when there is a clear and demonstrated need for it." @@ -120,6 +151,7 @@ Furthermore, on the noticeboard discussions take place about giving edit filter False positives among the filter hits are reported and discussed on a separate page~\footnote{\url{https://en.wikipedia.org/wiki/Wikipedia:Edit_filter/False_positives}}. Edit filter managers monitor this page and improve filters based on true false positives, give advice to good faith editors who tripped a filter or discourage authors of vandalism edits to continue with them. +%TODO who moderates the false positives page? where does the info come from that it is edit filter managers? Moreover, edit filter managers are advised to consult and comply with personal security best practices (such as choosing a strong password and using two-factor authentication). 
If such an account is compromised, it loses its edit filter manager rights and gets blocked, since this threatens site security~\cite{Wikipedia:EditFilter}. @@ -256,7 +288,41 @@ The groupings are which sets of people should have aggregate (shared) throttles. 2.9 Tagging: The edit or change can be 'tagged' with a particular tag, which will be shown on Recent Changes, contributions, logs, new pages, history, and everywhere else. These tags are styleable, so you can have items with a certain tag appear in a different colour or similar. \end{comment} +What happens when an editor triggers an edit filter? Do they notice this at all? + +As described in the previous section, a variety of different actions may occur when a filter gets tripped. +If a filter is set to ``warn'' or ``disallow'', the editor is notified that they hit a filter by a warning message (see Figure~\ref{fig:screenshot-warn-disallow}). +These warnings describe the problem that occurred and present the editor with possible actions: +complain on the FalsePositives page (\url{https://en.wikipedia.org/wiki/Wikipedia:Edit_filter/False_positives}) in case of a disallow, +or complain on the FalsePositives page and publish the change anyway in case of a warning. +(Of course, in case of a warning, the editor can modify their edit before publishing it.) +On the other hand, when the filter action is set to ``tag'' or ``log'' only, the editor doesn't really notice they tripped a filter unless they are looking more closely. +Tagged edits are marked as such in the page's revision history (see Figure~\ref{fig:tags-in-history}) +and all edits that trigger an edit filter are listed in the AbuseLog (\url{https://en.wikipedia.org/wiki/Special:AbuseLog}) (see Figure~\ref{fig:screenshot-abuse-log}). 
+ +\begin{figure} +\centering + \includegraphics[width=0.9\columnwidth]{pics/screenshots-filter-trigger/Screenshot-tags-in-revision-history.png} + \caption{Tagged edits are marked as such in a page's revision history}~\label{fig:tags-in-history} +\end{figure} + +\begin{figure} +\centering + \includegraphics[width=0.9\columnwidth]{pics/screenshots-filter-trigger/Screenshot-abuse-log.png} + \caption{Abuse Log showing all filter triggers by User Schnuppi4223}~\label{fig:screenshot-abuse-log} +\end{figure} + +If the filter is set to disallow, a specific template is shown to the editor: ``An automated filter has identified this edit as potentially unconstructive, so it has been disallowed. If this edit is constructive, please report this error. Disruptive editing may result in a block from editing.'' +``report this error'' links to the FalsePositives page: \url{https://en.wikipedia.org/wiki/Wikipedia:Edit_filter/False_positives} +``block from editing'' links to \url{https://en.wikipedia.org/wiki/Wikipedia:Blocking_policy} + +The edit is not saved. +\begin{figure} +\centering + \includegraphics[width=0.9\columnwidth]{pics/screenshots-filter-trigger/Screenshot-trigger-warning-filter.png} + \caption{Editor gets notified their edit triggered multiple edit filters}~\label{fig:screenshot-warn-disallow} +\end{figure} \subsection{what happens afterwards} @@ -299,45 +365,10 @@ statistics are info such as "Of the last 1,728 actions, this filter has matched "There is a bot reporting users tripping certain filters at WP:AIV and WP:UAA; you can specify the filters here." \url{https://en.wikipedia.org/wiki/User:DatBot/filters} +* consider collaborations filters/bots (e.g. MrZ Bot which puts editors found on the abuse log often on the AIV noticeboard.) are there further examples of this kind of collaboration? - -\section{Impact on editors} - -What happens when an editor triggers an edit filter? Do they notice this at all? 
- -As described in the previous section, a variety of different actions may occur when a filter gets tripped. -If a filter is set to ``warn'' or ``disallow'', the editor is notified that they hit a filter by a warning message (see~\ref{fig:screenshot-warn-disallow}). -These warnings describe the problem that occurred and present the editor with possible actions: -complain on the FalsePositives page (\url{https://en.wikipedia.org/wiki/Wikipedia:Edit_filter/False_positives}) in case of a disallow, -or, complain on the FalsePositives page and publish the change anyway in case of a warning. -(Of course, in case of a warning, the editor can modify their edit before publishing it.) -On the other hand, when the filter action is set to "tag" or "log" only, the editor doesn't really notice they tripped a filter unless they are looking more closely. -Tagged edits are marked as such in the page's revision history (see~\ref{fig:tags-in-history}) -and all edits that trigger an edit filter are listed in the AbuseLog (\url{https://en.wikipedia.org/wiki/Special:AbuseLog}) (see~\ref{fig:screenshot-abuse-log}). - -\begin{figure} -\centering - \includegraphics[width=0.9\columnwidth]{pics/screenshots-filter-trigger/Screenshot-tags-in-revision-history.png} - \caption{Tagged edits are marked as such in a page's revision history}~\label{fig:tags-in-history} -\end{figure} - -\begin{figure} -\centering - \includegraphics[width=0.9\columnwidth]{pics/screenshots-filter-trigger/Screenshot-abuse-log.png} - \caption{Abuse Log showing all filter triggers by User Schnuppi4223}~\label{fig:screenshot-abuse-log} -\end{figure} - -If the filter is set to disallow, a specific template is shown to the editor: "An automated filter has identified this edit as potentially unconstructive, so it has been disallowed. If this edit is constructive, please report this error. Disruptive editing may result in a block from editing." 
-"report this error" links to the FalsePositives page: \url{https://en.wikipedia.org/wiki/Wikipedia:Edit_filter/False_positives} -"block from editing" links to \url{https://en.wikipedia.org/wiki/Wikipedia:Blocking_policy} - -The edit is not saved. - -\begin{figure} -\centering - \includegraphics[width=0.9\columnwidth]{pics/screenshots-filter-trigger/Screenshot-trigger-warning-filter.png} - \caption{Editor gets notified their edit triggered multiple edit filters}~\label{fig:screenshot-warn-disallow} -\end{figure} +\url{https://en.wikipedia.org/wiki/Wikipedia:Administrator_intervention_against_vandalism} +\url{https://en.wikipedia.org/wiki/Wikipedia:Bots/Requests_for_approval/Mr.Z-bot_7} \begin{comment} Not sure where this fits in diff --git a/thesis/6-Overview-EN-Wiki.tex b/thesis/5-Overview-EN-Wiki.tex similarity index 72% rename from thesis/6-Overview-EN-Wiki.tex rename to thesis/5-Overview-EN-Wiki.tex index ffa4264bce233546ae6ce0b371d91d86204b15c4..f3e396bb3b1d50cb0411ebc28c0a8115c61e07e7 100644 --- a/thesis/6-Overview-EN-Wiki.tex +++ b/thesis/5-Overview-EN-Wiki.tex @@ -1,6 +1,123 @@ \chapter{Descriptive overview of Edit Filters on the English Wikipedia} \label{chap:overview-en-wiki} +\section{Data} + +\begin{comment} +vgl \cite{GeiHal2017} +iterative mixed method +combination of: +* quantitative methods: mining big data sets/computational social science +"begin with one or +more large (but often thin) datasets generated by a software platform, which has recorded digital +traces that users leave in interacting on that platform. Such researchers then seek to mine as much +signal and significance from these found datasets as they can at scale in order to answer a research +question" +* more traditional social science/qualitative methods, e.g. 
interviews, observations, experiments +\end{comment} + +The \emph{abuse\_filter} and \emph{abuse\_filter\_action} tables from \emph{enwiki\_p} were downloaded on 6.01.2019 via quarry~\footnote{\url{https://quarry.wmflabs.org/}}. +The complete files can be found in the repository for the present paper~\cite{github}. % TODO add a more specific link + +These tables, along with \emph{abuse\_filter\_log} and \emph{abuse\_filter\_history}, are created and used by the AbuseFilter MediaWiki extension~\cite{gerrit-abusefilter}. +Selected queries have been run against the \emph{abuse\_filter\_log} table as well. +Unfortunately, currently the \emph{abuse\_filter\_history} table is not exposed to the public due to security/privacy concerns~\cite{phabricator}. +We hope to shortly be able to access a view of this table in order to conduct historical inquiries. + +The schemas of these tables can be viewed in Figures~\ref{fig:db-schemas-af},~\ref{fig:db-schemas-afl},~\ref{fig:db-schemas-afh} and~\ref{fig:db-schemas-afa}. 
+ +\begin{figure*} +\begin{verbatim} +abuse_filter ++--------------------+---------------------+------+-----+---------+----------------+ +| Field | Type | Null | Key | Default | Extra | ++--------------------+---------------------+------+-----+---------+----------------+ +| af_id | bigint(20) unsigned | NO | PRI | NULL | auto_increment | +| af_pattern | blob | NO | | NULL | | +| af_user | bigint(20) unsigned | NO | MUL | NULL | | +| af_user_text | varbinary(255) | NO | | NULL | | +| af_timestamp | binary(14) | NO | | NULL | | +| af_enabled | tinyint(1) | NO | | 1 | | +| af_comments | blob | YES | | NULL | | +| af_public_comments | tinyblob | YES | | NULL | | +| af_hidden | tinyint(1) | NO | | 0 | | +| af_hit_count | bigint(20) | NO | | 0 | | +| af_throttled | tinyint(1) | NO | | 0 | | +| af_deleted | tinyint(1) | NO | | 0 | | +| af_actions | varbinary(255) | NO | | | | +| af_global | tinyint(1) | NO | | 0 | | +| af_group | varbinary(64) | NO | MUL | default | | ++--------------------+---------------------+------+-----+---------+----------------+ +\end{verbatim} + \caption{abuse\_filter schema}~\label{fig:db-schemas-af} +\end{figure*} + +\begin{figure*} +\begin{verbatim} +abuse_filter_log ++------------------+---------------------+------+-----+---------+----------------+ +| Field | Type | Null | Key | Default | Extra | ++------------------+---------------------+------+-----+---------+----------------+ +| afl_id | bigint(20) unsigned | NO | PRI | NULL | auto_increment | +| afl_filter | varbinary(64) | NO | MUL | NULL | | +| afl_user | bigint(20) unsigned | NO | MUL | NULL | | +| afl_user_text | varbinary(255) | NO | | NULL | | +| afl_ip | varbinary(255) | NO | MUL | NULL | | +| afl_action | varbinary(255) | NO | | NULL | | +| afl_actions | varbinary(255) | NO | | NULL | | +| afl_var_dump | blob | NO | | NULL | | +| afl_timestamp | binary(14) | NO | MUL | NULL | | +| afl_namespace | tinyint(4) | NO | MUL | NULL | | +| afl_title | varbinary(255) | NO | | NULL | | +| 
afl_wiki | varbinary(64) | YES | MUL | NULL | | +| afl_deleted | tinyint(1) | NO | | 0 | | +| afl_patrolled_by | int(10) unsigned | YES | | NULL | | +| afl_rev_id | int(10) unsigned | YES | MUL | NULL | | +| afl_log_id | int(10) unsigned | YES | MUL | NULL | | ++------------------+---------------------+------+-----+---------+----------------+ +\end{verbatim} + \caption{abuse\_filter\_log schema}~\label{fig:db-schemas-afl} +\end{figure*} + +\begin{figure*} +\begin{verbatim} +abuse_filter_history ++---------------------+---------------------+------+-----+---------+----------------+ +| Field | Type | Null | Key | Default | Extra | ++---------------------+---------------------+------+-----+---------+----------------+ +| afh_id | bigint(20) unsigned | NO | PRI | NULL | auto_increment | +| afh_filter | bigint(20) unsigned | NO | MUL | NULL | | +| afh_user | bigint(20) unsigned | NO | MUL | NULL | | +| afh_user_text | varbinary(255) | NO | MUL | NULL | | +| afh_timestamp | binary(14) | NO | MUL | NULL | | +| afh_pattern | blob | NO | | NULL | | +| afh_comments | blob | NO | | NULL | | +| afh_flags | tinyblob | NO | | NULL | | +| afh_public_comments | tinyblob | YES | | NULL | | +| afh_actions | blob | YES | | NULL | | +| afh_deleted | tinyint(1) | NO | | 0 | | +| afh_changed_fields | varbinary(255) | NO | | | | +| afh_group | varbinary(64) | YES | | NULL | | ++---------------------+---------------------+------+-----+---------+----------------+ +\end{verbatim} + \caption{abuse\_filter\_history schema}~\label{fig:db-schemas-afh} +\end{figure*} + +\begin{figure*} +\begin{verbatim} +abuse_filter_action ++-----------------+---------------------+------+-----+---------+-------+ +| Field | Type | Null | Key | Default | Extra | ++-----------------+---------------------+------+-----+---------+-------+ +| afa_filter | bigint(20) unsigned | NO | PRI | NULL | | +| afa_consequence | varbinary(255) | NO | PRI | NULL | | +| afa_parameters | tinyblob | NO | | NULL | | 
++-----------------+---------------------+------+-----+---------+-------+ +\end{verbatim} + \caption{abuse\_filter\_action schema}~\label{fig:db-schemas-afa} +\end{figure*} + + \textbf{Interesting questions} \begin{itemize} \item how many filters are there (were there over the years): 954 filters (stand: 06.01.2019); TODO: historically?; This includes deleted filters diff --git a/thesis/6-Discussion.tex b/thesis/6-Discussion.tex new file mode 100644 index 0000000000000000000000000000000000000000..c870ebdcb99c46a7f56bec24c62eff975ed10933 --- /dev/null +++ b/thesis/6-Discussion.tex @@ -0,0 +1,42 @@ +\chapter{Discussion and Limitations} +\label{chap:discussion} + +\section{Discussion} + +Discuss results: +so I've now explored and gathered understanding on Background(Context), general workings of the edit filter system and the state of the art of edit filters on the EN Wikipedia. +So what? What important/interesting insights have I gathered when contemplating all of this together? + +* also comment on negative results! + +* why get certain filters (and not others?) +* do filters solve effectively the task they were conjured up to life to fulfil? +* what kinds of biases/problems are there? +* who is allowed to edit edit filters? + +Alternative approaches to community management: +compare with Surviving the Eternal September paper~\cite{KieMonHill2016} +"importance of strong +systems of norm enforcement made possible by leadership, +community engagement, and technology." + +"emphasizing decentralized moderation" //all community members help enforce the norms +"ensuring enough leadership capacity is available +when an influx of newcomers is anticipated." +"Designers may +benefit by focusing on tools to let existing leaders bring others +on board and help them clearly communicate norms." +"designers should support an ecosystem of accessible and ap- +propriate moderator tools." 
+ + +\section{Limitations} + +This work presents a first attempt at analysing Wikipedia's edit filter system. +It has several limitations that we are aware of. +First, it focuses on English Wikipedia only. +We are convinced that there are valuable lessons to be learnt (about the communities, usefulness of filters, etc.) from comparing edit filter use across different language versions. +Second, unfortunately, including an ethnographic analysis was not possible. +This is partially due to the fact that we employ a computer science perspective on the question and partially due to limited time. +Third, the manual filter classification was undertaken by one person only, so biases of this person have certainly shaped the labels. + diff --git a/thesis/7-Discussion.tex b/thesis/7-Discussion.tex deleted file mode 100644 index 742567f61fc55f4bcb307450384f0c37711ddac5..0000000000000000000000000000000000000000 --- a/thesis/7-Discussion.tex +++ /dev/null @@ -1,65 +0,0 @@ -\chapter{Discussion and Limitations} -\label{chap:discussion} - -\section{Limitations} - -This work presents a first attempt at analysing Wikipedia's edit filter system. -It has several limitations (we could think of). -First, it focuses on English Wikipedia only. -We are convinced that there are valuable lessons to be learnt (about the communities, usefulness of filters, ..) from comparing edit filter use across different language versions. -Second, unfortunately, including an ethnographic analysis was not possible. -This is partially due to the fact that we employ a computer science perspective on the question and partially due to limited time. -Third, the manual filter classification was undertaken by one person only, so biases of this person have certainly shaped the labels. - -\section{Discussion} - -* why get certain filters (and not others?) -* do filters solve effectively the task they were conjured up to life to fulfil? -* what kinds of biases/problems are there? -* who is allowed to edit edit filters? 
- -Alternative approaches to community management: -compare with Surviving the Eternal September paper~\cite{KieMonHill2016} -"importance of strong -systems of norm enforcement made possible by leadership, -community engagement, and technology." - -"emphasizing decentralized moderation" //all community members help enforce the norms -"ensuring enough leadership capacity is available -when an influx of newcomers is anticipated." -"Designers may -benefit by focusing on tools to let existing leaders bring others -on board and help them clearly communicate norms." -"designers should support an ecosystem of accessible and ap- -propriate moderator tools." - - -\subsection{The bigger picture: Upload filters} - -The planned introduction of upload filters by the EU copyright reform is seen critically by Wikimedia Germany: -\begin{figure} -\centering - \includegraphics[width=0.9\columnwidth]{pics/Blackout_of_wikipediade_by_Wikimedia_Deutschland_-_March_2019.png} - \caption{Blackout of wikipedia.de by Wikimedia Deutschland}~\label{fig:blackout-upload-filters} -\end{figure} - -via -\url{https://de.wikipedia.org/wiki/Abschaltung_der_deutschsprachigen_Wikipedia_am_21._M%C3%A4rz_2019#/media/File:Blackout_of_wikipedia.de_by_Wikimedia_Deutschland_-_March_2019.png} - -see also -\url{https://wikimediafoundation.org/2019/03/20/four-wikipedias-to-black-out-over-eu-copyright-directive/} -"Volunteer editor communities in four language Wikipedias—German, Czech, Danish, and Slovak—have decided to black out the sites on 21 March in opposition to the current version of the proposed EU Copyright Directive. - -Those language editions of Wikipedia will redirect all visitors to a banner about the directive, blocking access to content on Wikipedia for 24 hours. 
" -"These independent language communities decided to black out in the same way most decisions are made on Wikipedia—through discussion and consensus, " - -and -\url{https://wikimediafoundation.org/2019/02/28/we-do-not-support-the-eu-copyright-directive-in-its-current-form-heres-why-you-shouldnt-either/} - -timeline -\url{https://edri.org/upload-filters-status-of-the-copyright-discussions-and-next-steps/} - -\url{https://en.wikipedia.org/wiki/Directive_on_Copyright_in_the_Digital_Single_Market#Positions} - -\subsection{Directions for further studies} -<insert long list of interesting questions here> diff --git a/thesis/conclusion.tex b/thesis/conclusion.tex index 358122d42504cbb19516eb4e84412c93115c2584..6e73ba0018816e9bd4fe1c24eafc0330c1de9919 100644 --- a/thesis/conclusion.tex +++ b/thesis/conclusion.tex @@ -8,6 +8,36 @@ \chapter{Conclusion} \label{chap:conclusion} +\section{The bigger picture: Upload filters} + +The planned introduction of upload filters by the EU copyright reform is seen critically by Wikimedia Germany: +\begin{figure} +\centering + \includegraphics[width=0.9\columnwidth]{pics/Blackout_of_wikipediade_by_Wikimedia_Deutschland_-_March_2019.png} + \caption{Blackout of wikipedia.de by Wikimedia Deutschland}~\label{fig:blackout-upload-filters} +\end{figure} + +via +\url{https://de.wikipedia.org/wiki/Abschaltung_der_deutschsprachigen_Wikipedia_am_21._M%C3%A4rz_2019#/media/File:Blackout_of_wikipedia.de_by_Wikimedia_Deutschland_-_March_2019.png} + +see also +\url{https://wikimediafoundation.org/2019/03/20/four-wikipedias-to-black-out-over-eu-copyright-directive/} +"Volunteer editor communities in four language Wikipedias—German, Czech, Danish, and Slovak—have decided to black out the sites on 21 March in opposition to the current version of the proposed EU Copyright Directive. + +Those language editions of Wikipedia will redirect all visitors to a banner about the directive, blocking access to content on Wikipedia for 24 hours. 
" +"These independent language communities decided to black out in the same way most decisions are made on Wikipedia—through discussion and consensus, " + +and +\url{https://wikimediafoundation.org/2019/02/28/we-do-not-support-the-eu-copyright-directive-in-its-current-form-heres-why-you-shouldnt-either/} + +timeline +\url{https://edri.org/upload-filters-status-of-the-copyright-discussions-and-next-steps/} + +\url{https://en.wikipedia.org/wiki/Directive_on_Copyright_in_the_Digital_Single_Market#Positions} + +\section{Directions for further studies} +<insert long list of interesting questions here> + \begin{itemize} \item Die Zusammenfassung sollte das Ziel der Arbeit und die zentralen Ergebnisse beschreiben. Des Weiteren sollten auch bestehende Probleme bei der Arbeit aufgezählt werden und Vorschläge herausgearbeitet werden, die helfen, diese Probleme zukünftig zu umgehen. Mögliche Erweiterungen für die umgesetzte Anwendung sollten hier auch beschrieben werden. \end{itemize} diff --git a/thesis/thesis_main.tex b/thesis/thesis_main.tex index a6ff88e4ba7c6fb468847e1b89ed76e69b9bd419..2b77a121c99fbb3d4807b5f81d83a4ddc26124b9 100755 --- a/thesis/thesis_main.tex +++ b/thesis/thesis_main.tex @@ -130,12 +130,11 @@ preface, introduction, 2-Background, 3-Methods, -4-Data, -5-Edit-Filters, -6-Overview-EN-Wiki, -7-Discussion, +4-Edit-Filters, +5-Overview-EN-Wiki, +6-Discussion, conclusion, -appendix +%appendix } %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% @@ -223,10 +222,9 @@ appendix \include{introduction} \include{2-Background} %Vandalism, Alg. quality control mechanisms, what gap is there in the research \include{3-Methods} %Trace ethnography, GT, .. 
-\include{4-Data} -\include{5-Edit-Filters} %Governance, Technic -\include{6-Overview-EN-Wiki} -\include{7-Discussion} %and limitations +\include{4-Edit-Filters} %Governance, Technic +\include{5-Overview-EN-Wiki} +\include{6-Discussion} %and limitations \include{conclusion} @@ -243,6 +241,6 @@ appendix %----- Appendix %--------------------------------------------------- \backmatter -\include{appendix} +%\include{appendix} \end{document}