{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "RendererRegistry.enable('mimetype')" ] }, "execution_count": 1, "metadata": {}, "output_type": "execute_result" } ], "source": [ "from splink.duckdb.duckdb_linker import DuckDBLinker\n", "import altair as alt\n", "alt.renderers.enable('mimetype')" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | unique_id | \n", "cluster | \n", "full_name | \n", "first_and_surname | \n", "first_name | \n", "surname | \n", "dob | \n", "birth_place | \n", "postcode_fake | \n", "gender | \n", "occupation | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "Q2296770-1 | \n", "Q2296770 | \n", "thomas clifford, 1st baron clifford of chudleigh | \n", "thomas chudleigh | \n", "thomas | \n", "chudleigh | \n", "1630-08-01 | \n", "devon | \n", "tq13 8df | \n", "male | \n", "politician | \n", "
1 | \n", "Q2296770-2 | \n", "Q2296770 | \n", "thomas of chudleigh | \n", "thomas chudleigh | \n", "thomas | \n", "chudleigh | \n", "1630-08-01 | \n", "devon | \n", "tq13 8df | \n", "male | \n", "politician | \n", "
2 | \n", "Q2296770-3 | \n", "Q2296770 | \n", "tom 1st baron clifford of chudleigh | \n", "tom chudleigh | \n", "tom | \n", "chudleigh | \n", "1630-08-01 | \n", "devon | \n", "tq13 8df | \n", "male | \n", "politician | \n", "
3 | \n", "Q2296770-4 | \n", "Q2296770 | \n", "thomas 1st chudleigh | \n", "thomas chudleigh | \n", "thomas | \n", "chudleigh | \n", "1630-08-01 | \n", "devon | \n", "tq13 8hu | \n", "None | \n", "politician | \n", "
4 | \n", "Q2296770-5 | \n", "Q2296770 | \n", "thomas clifford, 1st baron chudleigh | \n", "thomas chudleigh | \n", "thomas | \n", "chudleigh | \n", "1630-08-01 | \n", "devon | \n", "tq13 8df | \n", "None | \n", "politician | \n", "
\n", " | match_weight | \n", "match_probability | \n", "unique_id_l | \n", "unique_id_r | \n", "first_name_l | \n", "first_name_r | \n", "gamma_first_name | \n", "bf_first_name | \n", "surname_l | \n", "surname_r | \n", "... | \n", "bf_postcode_fake | \n", "birth_place_l | \n", "birth_place_r | \n", "gamma_birth_place | \n", "bf_birth_place | \n", "occupation_l | \n", "occupation_r | \n", "gamma_occupation | \n", "bf_occupation | \n", "match_key | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "19.641479 | \n", "0.999999 | \n", "Q2296770-1 | \n", "Q2296770-14 | \n", "thomas | \n", "thomas | \n", "3 | \n", "43.427885 | \n", "chudleigh | \n", "chudleigh | \n", "... | \n", "249.467633 | \n", "devon | \n", "NaN | \n", "-1 | \n", "1.000000 | \n", "politician | \n", "politician | \n", "1 | \n", "22.77665 | \n", "0 | \n", "
1 | \n", "5.048632 | \n", "0.970672 | \n", "Q2296770-10 | \n", "Q2296770-14 | \n", "thomas | \n", "thomas | \n", "3 | \n", "43.427885 | \n", "chudleigh | \n", "chudleigh | \n", "... | \n", "0.171118 | \n", "devon | \n", "NaN | \n", "-1 | \n", "1.000000 | \n", "politician | \n", "politician | \n", "1 | \n", "22.77665 | \n", "0 | \n", "
2 | \n", "25.497744 | \n", "1.000000 | \n", "Q1443188-1 | \n", "Q1443188-3 | \n", "frank | \n", "frank | \n", "3 | \n", "43.427885 | \n", "brightman | \n", "brightman | \n", "... | \n", "4874.614882 | \n", "bristol | \n", "bristol, city of | \n", "0 | \n", "0.160976 | \n", "liturgist | \n", "liturgist | \n", "1 | \n", "22.77665 | \n", "0 | \n", "
3 | \n", "25.497744 | \n", "1.000000 | \n", "Q1443188-2 | \n", "Q1443188-3 | \n", "frank | \n", "frank | \n", "3 | \n", "43.427885 | \n", "brightman | \n", "brightman | \n", "... | \n", "4874.614882 | \n", "bristol | \n", "bristol, city of | \n", "0 | \n", "0.160976 | \n", "liturgist | \n", "liturgist | \n", "1 | \n", "22.77665 | \n", "0 | \n", "
4 | \n", "9.131831 | \n", "0.998221 | \n", "Q1443188-4 | \n", "Q1443188-5 | \n", "francis | \n", "francis | \n", "3 | \n", "43.427885 | \n", "brightman | \n", "brightman | \n", "... | \n", "0.171118 | \n", "NaN | \n", "bristol, city of | \n", "-1 | \n", "1.000000 | \n", "liturgist | \n", "liturgist | \n", "1 | \n", "22.77665 | \n", "0 | \n", "
5 rows × 29 columns
\n", "