{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Exploration of tools.wmflabs.org click events" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "# basic defaults, including study dates, common SQL exclusions and parquet files for anonymized data\n", "%run -i 'data-defaults.py'" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## tools.wmflabs.org link counts" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### 2019-07-26 [count of distinct page/externallink to tools.wmflabs.org](https://quarry.wmflabs.org/query/37908)\n", "\n", "```sql\n", "select count(distinct el_from, el_to) from externallinks where el_to like '%tools.wmflabs.org%';\n", "```\n", "\n", "| count(distinct el_from, el_to) |\n", "|--------------------------------|\n", "| 12804396 |" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### count of tools.wmflabs.org links in 20190420 externallinks table" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "+--------+\n", "| links|\n", "+--------+\n", "|12664610|\n", "+--------+\n", "\n" ] } ], "source": [ "# count of tools.wmflabs.org links in 20190420 externallinks table\n", "query = \"\"\"\n", "select count(distinct el_from, el_to) AS links \n", "FROM ryanmax.population_externallinks \n", "WHERE LOWER(el_to) LIKE '%tools.wmflabs.org%'\n", "\"\"\"\n", "spark.sql(query).show()" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | link_path | \n", "count | \n", "
|---|---|---|
| 0 | \n", "tools.wmflabs.org/geohack | \n", "1053717 | \n", "
| 1 | \n", "tools.wmflabs.org/os | \n", "15816 | \n", "
| 2 | \n", "tools.wmflabs.org/osm4wiki | \n", "11249 | \n", "
| 3 | \n", "tools.wmflabs.org/isin | \n", "2239 | \n", "
| 4 | \n", "tools.wmflabs.org/kmlexport | \n", "1966 | \n", "
| 5 | \n", "tools.wmflabs.org/timescale | \n", "1780 | \n", "
| 6 | \n", "tools.wmflabs.org/bibleversefinder2 | \n", "1331 | \n", "
| 7 | \n", "tools.wmflabs.org/ftl | \n", "1115 | \n", "
| 8 | \n", "tools.wmflabs.org/scholia | \n", "435 | \n", "
| 9 | \n", "tools.wmflabs.org/panoviewer | \n", "184 | \n", "
| 10 | \n", "tools.wmflabs.org/dupdet | \n", "50 | \n", "
| 11 | \n", "tools.wmflabs.org/wikidata-externalid-url | \n", "46 | \n", "
| 12 | \n", "tools.wmflabs.org/citeplato | \n", "41 | \n", "
| 13 | \n", "tools.wmflabs.org/zoomviewer | \n", "37 | \n", "
| 14 | \n", "tools.wmflabs.org/copyvios | \n", "30 | \n", "
| 15 | \n", "tools.wmflabs.org/wiwosm | \n", "28 | \n", "
| 16 | \n", "tools.wmflabs.org/family | \n", "26 | \n", "
| 17 | \n", "tools.wmflabs.org/reasonator | \n", "21 | \n", "
| 18 | \n", "tools.wmflabs.org/makeref | \n", "13 | \n", "
| 19 | \n", "tools.wmflabs.org/citations | \n", "11 | \n", "
| 20 | \n", "tools.wmflabs.org/dplbot | \n", "9 | \n", "
| 21 | \n", "tools.wmflabs.org/dispenser | \n", "6 | \n", "
| 22 | \n", "tools.wmflabs.org/refill | \n", "5 | \n", "
| 23 | \n", "tools.wmflabs.org/hashtags | \n", "4 | \n", "
| 24 | \n", "tools.wmflabs.org/wikivoyage | \n", "3 | \n", "
| 25 | \n", "tools.wmflabs.org/magnustools | \n", "3 | \n", "
| 26 | \n", "tools.wmflabs.org/citation-template-filling | \n", "2 | \n", "
| 27 | \n", "tools.wmflabs.org/denkmalliste | \n", "1 | \n", "
| 28 | \n", "tools.wmflabs.org/templatecount | \n", "1 | \n", "
| 29 | \n", "tools.wmflabs.org/pageviews | \n", "1 | \n", "
| 30 | \n", "tools.wmflabs.org/citer | \n", "1 | \n", "