{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "eec04efd-3f8f-4032-8038-83d61bff1792",
"metadata": {},
"outputs": [],
"source": [
"import numpy as np\n",
"from scipy.stats import chi2_contingency\n",
"from statsmodels.stats.multitest import multipletests\n",
"import pandas as pd"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "e3fcbc08-25aa-47fd-bee3-b468982bf04b",
"metadata": {},
"outputs": [],
"source": [
"def corpus_stats(word, counts_recent, counts_reference, total_recent, total_reference):\n",
" \"\"\"\n",
" word : the word being tested\n",
" counts_recent : raw count in week 5\n",
" counts_reference : raw count in weeks 1-4\n",
" total_recent : total tokens in week 5\n",
" total_reference : total tokens in weeks 1-4\n",
" \"\"\"\n",
" a = counts_recent # word in recent\n",
" b = counts_reference # word in reference\n",
" c = total_recent - a # non-word in recent\n",
" d = total_reference - b # non-word in reference\n",
"\n",
" contingency = np.array([[a, b],\n",
" [c, d]])\n",
"\n",
" # --- Chi-Squared ---\n",
" chi2_stat, p_chi2, _, _ = chi2_contingency(contingency, correction=False)\n",
"\n",
" # --- Log-Likelihood (G²) ---\n",
" # G² = 2 * sum(observed * log(observed / expected))\n",
" # scipy's chi2_contingency with lambda_=\"log-likelihood\" computes this\n",
" g2_stat, p_g2, _, _ = chi2_contingency(contingency, lambda_=\"log-likelihood\")\n",
"\n",
" # --- Effect sizes ---\n",
" freq_recent = a / total_recent\n",
" freq_reference = b / total_reference\n",
"\n",
" pct_diff = (freq_recent - freq_reference) / freq_reference * 100\n",
"\n",
" # Avoid log(0) with a small epsilon\n",
" eps = 1e-9\n",
" log_ratio = np.log2((freq_recent + eps) / (freq_reference + eps))\n",
"\n",
" return {\n",
" \"word\": word,\n",
" \"freq_recent\": freq_recent,\n",
" \"freq_reference\": freq_reference,\n",
" \"pct_diff\": pct_diff,\n",
" \"log_ratio\": log_ratio,\n",
" \"chi2\": chi2_stat,\n",
" \"p_chi2\": p_chi2,\n",
" \"g2\": g2_stat,\n",
" \"p_g2\": p_g2,\n",
" }"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "2888f740-1539-4f62-a13e-73512a2be290",
"metadata": {},
"outputs": [],
"source": [
"counts_recent = {}\n",
"counts_reference = {}\n",
"with open(\"data.txt\", \"rt\", encoding=\"utf-8\") as fp:\n",
" for line in fp:\n",
" aa = line.split(\"\\t\")\n",
" counts_reference[aa[0]] = max(int(aa[1]), 0.5)\n",
" counts_recent[aa[0]] = max(int(aa[2]), 0.5)\n",
"total_recent = sum(counts_recent.values())\n",
"total_reference = sum(counts_reference.values())"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "5ef99c2b-50d9-450b-854c-bfa9d688c63b",
"metadata": {},
"outputs": [],
"source": [
"results = [\n",
" corpus_stats(word, counts_recent[word], counts_reference.get(word, 0),\n",
" total_recent, total_reference)\n",
" for word in counts_recent]"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "285064c8-bc52-4096-9aa5-bc57115fb813",
"metadata": {},
"outputs": [],
"source": [
"# FDR correction across all words\n",
"p_values = [r[\"p_g2\"] for r in results]\n",
"_, p_adjusted, _, _ = multipletests(p_values, method=\"fdr_bh\")\n",
"\n",
"for r, p_adj in zip(results, p_adjusted):\n",
" r[\"p_g2_adjusted\"] = p_adj"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "c0146062-608a-40dd-80b7-742df67ca9ee",
"metadata": {},
"outputs": [],
"source": [
"results = pd.DataFrame(results)"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "8805479d-461f-4e56-8b85-b5aa65fc7f33",
"metadata": {},
"outputs": [],
"source": [
"#pd.set_option('display.max_rows', None)\n",
"#pd.set_option('display.max_columns', None)"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "f992bc03-6529-4521-9c98-3f7fe36eb7e8",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"
\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" word | \n",
" freq_recent | \n",
" freq_reference | \n",
" pct_diff | \n",
" log_ratio | \n",
" chi2 | \n",
" p_chi2 | \n",
" g2 | \n",
" p_g2 | \n",
" p_g2_adjusted | \n",
"
\n",
" \n",
" \n",
" \n",
" | 4666 | \n",
" Ye | \n",
" 0.009191 | \n",
" 0.001412 | \n",
" 551.030639 | \n",
" 2.702725 | \n",
" 88.873013 | \n",
" 4.209875e-21 | \n",
" 73.611094 | \n",
" 9.512852e-18 | \n",
" 2.265010e-14 | \n",
"
\n",
" \n",
" | 2233 | \n",
" Kanye West | \n",
" 0.006175 | \n",
" 0.001150 | \n",
" 436.822849 | \n",
" 2.424445 | \n",
" 51.860997 | \n",
" 5.957208e-13 | \n",
" 42.512795 | \n",
" 7.022134e-11 | \n",
" 1.114647e-07 | \n",
"
\n",
" \n",
" | 2521 | \n",
" Lieke Marsman | \n",
" 0.002298 | \n",
" 0.000026 | \n",
" 8688.913621 | \n",
" 6.457558 | \n",
" 41.675092 | \n",
" 1.077733e-10 | \n",
" 34.046050 | \n",
" 5.382305e-09 | \n",
" 6.407634e-06 | \n",
"
\n",
" \n",
" | 55 | \n",
" Ahmed Marcouch | \n",
" 0.003016 | \n",
" 0.000261 | \n",
" 1053.544913 | \n",
" 3.527997 | \n",
" 38.897401 | \n",
" 4.466750e-10 | \n",
" 30.774198 | \n",
" 2.898665e-08 | \n",
" 2.760689e-05 | \n",
"
\n",
" \n",
" | 1343 | \n",
" Flavio Cobolli | \n",
" 0.002010 | \n",
" 0.000026 | \n",
" 7590.299418 | \n",
" 6.264913 | \n",
" 36.186456 | \n",
" 1.793125e-09 | \n",
" 29.023926 | \n",
" 7.148986e-08 | \n",
" 5.673912e-05 | \n",
"
\n",
" \n",
" | 4362 | \n",
" Van Dissel | \n",
" 0.002585 | \n",
" 0.000209 | \n",
" 1135.940978 | \n",
" 3.627532 | \n",
" 34.197157 | \n",
" 4.980167e-09 | \n",
" 26.757903 | \n",
" 2.306067e-07 | \n",
" 1.546231e-04 | \n",
"
\n",
" \n",
" | 2797 | \n",
" Marsman | \n",
" 0.001867 | \n",
" 0.000026 | \n",
" 7040.992317 | \n",
" 6.157998 | \n",
" 33.443641 | \n",
" 7.335924e-09 | \n",
" 26.527883 | \n",
" 2.597616e-07 | \n",
" 1.546231e-04 | \n",
"
\n",
" \n",
" | 2503 | \n",
" Lewis Hamilton | \n",
" 0.004021 | \n",
" 0.000784 | \n",
" 412.686628 | \n",
" 2.358076 | \n",
" 32.500200 | \n",
" 1.191803e-08 | \n",
" 26.104423 | \n",
" 3.234422e-07 | \n",
" 1.711368e-04 | \n",
"
\n",
" \n",
" | 673 | \n",
" Charles Leclerc | \n",
" 0.002872 | \n",
" 0.000418 | \n",
" 586.633877 | \n",
" 2.779538 | \n",
" 28.670638 | \n",
" 8.579474e-08 | \n",
" 22.442992 | \n",
" 2.164739e-06 | \n",
" 9.371352e-04 | \n",
"
\n",
" \n",
" | 1858 | \n",
" Jaap van Dissel | \n",
" 0.002872 | \n",
" 0.000418 | \n",
" 586.633877 | \n",
" 2.779538 | \n",
" 28.670638 | \n",
" 8.579474e-08 | \n",
" 22.442992 | \n",
" 2.164739e-06 | \n",
" 9.371352e-04 | \n",
"
\n",
" \n",
" | 4516 | \n",
" Vollering | \n",
" 0.001867 | \n",
" 0.000105 | \n",
" 1685.248079 | \n",
" 4.158040 | \n",
" 27.590589 | \n",
" 1.499064e-07 | \n",
" 21.070561 | \n",
" 4.426770e-06 | \n",
" 1.716105e-03 | \n",
"
\n",
" \n",
" | 2923 | \n",
" Mette-Marit | \n",
" 0.004595 | \n",
" 0.001307 | \n",
" 251.556545 | \n",
" 1.813756 | \n",
" 25.318681 | \n",
" 4.859791e-07 | \n",
" 20.713510 | \n",
" 5.333836e-06 | \n",
" 1.716105e-03 | \n",
"
\n",
" \n",
" | 1801 | \n",
" Ingrid Alexandra | \n",
" 0.002010 | \n",
" 0.000157 | \n",
" 1181.716570 | \n",
" 3.679997 | \n",
" 26.935070 | \n",
" 2.104062e-07 | \n",
" 20.564349 | \n",
" 5.765997e-06 | \n",
" 1.716105e-03 | \n",
"
\n",
" \n",
" | 3466 | \n",
" Pols | \n",
" 0.002010 | \n",
" 0.000157 | \n",
" 1181.716570 | \n",
" 3.679997 | \n",
" 26.935070 | \n",
" 2.104062e-07 | \n",
" 20.564349 | \n",
" 5.765997e-06 | \n",
" 1.716105e-03 | \n",
"
\n",
" \n",
" | 2717 | \n",
" Marcouch | \n",
" 0.002441 | \n",
" 0.000314 | \n",
" 678.185060 | \n",
" 2.960109 | \n",
" 26.234266 | \n",
" 3.024086e-07 | \n",
" 20.256468 | \n",
" 6.772409e-06 | \n",
" 1.897071e-03 | \n",
"
\n",
" \n",
" | 1053 | \n",
" Donald Pols | \n",
" 0.002154 | \n",
" 0.000261 | \n",
" 723.960652 | \n",
" 3.042571 | \n",
" 23.871944 | \n",
" 1.029615e-06 | \n",
" 18.209227 | \n",
" 1.979176e-05 | \n",
" 5.236021e-03 | \n",
"
\n",
" \n",
" | 3971 | \n",
" Sjoerdsma | \n",
" 0.001867 | \n",
" 0.000209 | \n",
" 792.624040 | \n",
" 3.158047 | \n",
" 21.542862 | \n",
" 3.460080e-06 | \n",
" 16.178300 | \n",
" 5.765077e-05 | \n",
" 1.372665e-02 | \n",
"
\n",
" \n",
" | 2734 | \n",
" Marianne Thieme | \n",
" 0.001149 | \n",
" 0.000026 | \n",
" 4294.456811 | \n",
" 5.457559 | \n",
" 19.755766 | \n",
" 8.799584e-06 | \n",
" 14.281240 | \n",
" 1.574261e-04 | \n",
" 2.404300e-02 | \n",
"
\n",
" \n",
" | 2583 | \n",
" Lotte van Kruistum | \n",
" 0.001149 | \n",
" 0.000026 | \n",
" 4294.456811 | \n",
" 5.457559 | \n",
" 19.755766 | \n",
" 8.799584e-06 | \n",
" 14.281240 | \n",
" 1.574261e-04 | \n",
" 2.404300e-02 | \n",
"
\n",
" \n",
" | 3003 | \n",
" Mirra Andreeva | \n",
" 0.001149 | \n",
" 0.000026 | \n",
" 4294.456811 | \n",
" 5.457559 | \n",
" 19.755766 | \n",
" 8.799584e-06 | \n",
" 14.281240 | \n",
" 1.574261e-04 | \n",
" 2.404300e-02 | \n",
"
\n",
" \n",
" | 2351 | \n",
" Kluytmans | \n",
" 0.001149 | \n",
" 0.000026 | \n",
" 4294.456811 | \n",
" 5.457559 | \n",
" 19.755766 | \n",
" 8.799584e-06 | \n",
" 14.281240 | \n",
" 1.574261e-04 | \n",
" 2.404300e-02 | \n",
"
\n",
" \n",
" | 249 | \n",
" Antonia Niedermaier | \n",
" 0.001149 | \n",
" 0.000026 | \n",
" 4294.456811 | \n",
" 5.457559 | \n",
" 19.755766 | \n",
" 8.799584e-06 | \n",
" 14.281240 | \n",
" 1.574261e-04 | \n",
" 2.404300e-02 | \n",
"
\n",
" \n",
" | 1791 | \n",
" Ilse Kuijt | \n",
" 0.001149 | \n",
" 0.000026 | \n",
" 4294.456811 | \n",
" 5.457559 | \n",
" 19.755766 | \n",
" 8.799584e-06 | \n",
" 14.281240 | \n",
" 1.574261e-04 | \n",
" 2.404300e-02 | \n",
"
\n",
" \n",
" | 742 | \n",
" Cobolli | \n",
" 0.001149 | \n",
" 0.000026 | \n",
" 4294.456811 | \n",
" 5.457559 | \n",
" 19.755766 | \n",
" 8.799584e-06 | \n",
" 14.281240 | \n",
" 1.574261e-04 | \n",
" 2.404300e-02 | \n",
"
\n",
" \n",
" | 4724 | \n",
" Zoë Slagter | \n",
" 0.001149 | \n",
" 0.000026 | \n",
" 4294.456811 | \n",
" 5.457559 | \n",
" 19.755766 | \n",
" 8.799584e-06 | \n",
" 14.281240 | \n",
" 1.574261e-04 | \n",
" 2.404300e-02 | \n",
"
\n",
" \n",
" | 278 | \n",
" Arjan Veurink | \n",
" 0.001580 | \n",
" 0.000157 | \n",
" 907.063019 | \n",
" 3.332074 | \n",
" 19.268029 | \n",
" 1.135926e-05 | \n",
" 14.174484 | \n",
" 1.666147e-04 | \n",
" 2.404300e-02 | \n",
"
\n",
" \n",
" | 3098 | \n",
" Naomi Mestrum | \n",
" 0.001292 | \n",
" 0.000105 | \n",
" 1135.940978 | \n",
" 3.627525 | \n",
" 17.091366 | \n",
" 3.562389e-05 | \n",
" 12.221543 | \n",
" 4.724085e-04 | \n",
" 6.103910e-02 | \n",
"
\n",
" \n",
" | 2665 | \n",
" Maja Chwalinska | \n",
" 0.001580 | \n",
" 0.000209 | \n",
" 655.297264 | \n",
" 2.917039 | \n",
" 16.686682 | \n",
" 4.408944e-05 | \n",
" 12.214228 | \n",
" 4.742643e-04 | \n",
" 6.103910e-02 | \n",
"
\n",
" \n",
" | 4420 | \n",
" Van der Breggen | \n",
" 0.001436 | \n",
" 0.000157 | \n",
" 815.511836 | \n",
" 3.194570 | \n",
" 16.772235 | \n",
" 4.214548e-05 | \n",
" 12.131568 | \n",
" 4.957543e-04 | \n",
" 6.212584e-02 | \n",
"
\n",
" \n",
" | 1731 | \n",
" Hitler | \n",
" 0.001005 | \n",
" 0.000026 | \n",
" 3745.149709 | \n",
" 5.264914 | \n",
" 17.027730 | \n",
" 3.683788e-05 | \n",
" 11.905641 | \n",
" 5.596421e-04 | \n",
" 6.345276e-02 | \n",
"
\n",
" \n",
" | 2519 | \n",
" Lieke | \n",
" 0.001005 | \n",
" 0.000026 | \n",
" 3745.149709 | \n",
" 5.264914 | \n",
" 17.027730 | \n",
" 3.683788e-05 | \n",
" 11.905641 | \n",
" 5.596421e-04 | \n",
" 6.345276e-02 | \n",
"
\n",
" \n",
" | 4176 | \n",
" Teunissen | \n",
" 0.001005 | \n",
" 0.000026 | \n",
" 3745.149709 | \n",
" 5.264914 | \n",
" 17.027730 | \n",
" 3.683788e-05 | \n",
" 11.905641 | \n",
" 5.596421e-04 | \n",
" 6.345276e-02 | \n",
"
\n",
" \n",
" | 4464 | \n",
" Veurink | \n",
" 0.001005 | \n",
" 0.000026 | \n",
" 3745.149709 | \n",
" 5.264914 | \n",
" 17.027730 | \n",
" 3.683788e-05 | \n",
" 11.905641 | \n",
" 5.596421e-04 | \n",
" 6.345276e-02 | \n",
"
\n",
" \n",
" | 968 | \n",
" Denzel Dumfries | \n",
" 0.002010 | \n",
" 0.000418 | \n",
" 380.643714 | \n",
" 2.264965 | \n",
" 15.359454 | \n",
" 8.887510e-05 | \n",
" 11.600092 | \n",
" 6.594857e-04 | \n",
" 7.303421e-02 | \n",
"
\n",
" \n",
" | 2329 | \n",
" Kimi Antonelli | \n",
" 0.003447 | \n",
" 0.001203 | \n",
" 186.595009 | \n",
" 1.519013 | \n",
" 14.294065 | \n",
" 1.563571e-04 | \n",
" 11.539896 | \n",
" 6.811844e-04 | \n",
" 7.372272e-02 | \n",
"
\n",
" \n",
" | 2465 | \n",
" Leclerc | \n",
" 0.001292 | \n",
" 0.000157 | \n",
" 723.960652 | \n",
" 3.042567 | \n",
" 14.318772 | \n",
" 1.543183e-04 | \n",
" 10.145781 | \n",
" 1.446319e-03 | \n",
" 1.306897e-01 | \n",
"
\n",
" \n",
" | 1250 | \n",
" Esther Ouwehand | \n",
" 0.001292 | \n",
" 0.000157 | \n",
" 723.960652 | \n",
" 3.042567 | \n",
" 14.318772 | \n",
" 1.543183e-04 | \n",
" 10.145781 | \n",
" 1.446319e-03 | \n",
" 1.306897e-01 | \n",
"
\n",
" \n",
" | 713 | \n",
" Christine Teunissen | \n",
" 0.001149 | \n",
" 0.000105 | \n",
" 998.614203 | \n",
" 3.457600 | \n",
" 14.529034 | \n",
" 1.380160e-04 | \n",
" 10.122801 | \n",
" 1.464463e-03 | \n",
" 1.306897e-01 | \n",
"
\n",
" \n",
" | 1917 | \n",
" Jan Kluytmans | \n",
" 0.001149 | \n",
" 0.000105 | \n",
" 998.614203 | \n",
" 3.457600 | \n",
" 14.529034 | \n",
" 1.380160e-04 | \n",
" 10.122801 | \n",
" 1.464463e-03 | \n",
" 1.306897e-01 | \n",
"
\n",
" \n",
" | 2124 | \n",
" Joost Luiten | \n",
" 0.001149 | \n",
" 0.000105 | \n",
" 998.614203 | \n",
" 3.457600 | \n",
" 14.529034 | \n",
" 1.380160e-04 | \n",
" 10.122801 | \n",
" 1.464463e-03 | \n",
" 1.306897e-01 | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" word freq_recent freq_reference pct_diff \\\n",
"4666 Ye 0.009191 0.001412 551.030639 \n",
"2233 Kanye West 0.006175 0.001150 436.822849 \n",
"2521 Lieke Marsman 0.002298 0.000026 8688.913621 \n",
"55 Ahmed Marcouch 0.003016 0.000261 1053.544913 \n",
"1343 Flavio Cobolli 0.002010 0.000026 7590.299418 \n",
"4362 Van Dissel 0.002585 0.000209 1135.940978 \n",
"2797 Marsman 0.001867 0.000026 7040.992317 \n",
"2503 Lewis Hamilton 0.004021 0.000784 412.686628 \n",
"673 Charles Leclerc 0.002872 0.000418 586.633877 \n",
"1858 Jaap van Dissel 0.002872 0.000418 586.633877 \n",
"4516 Vollering 0.001867 0.000105 1685.248079 \n",
"2923 Mette-Marit 0.004595 0.001307 251.556545 \n",
"1801 Ingrid Alexandra 0.002010 0.000157 1181.716570 \n",
"3466 Pols 0.002010 0.000157 1181.716570 \n",
"2717 Marcouch 0.002441 0.000314 678.185060 \n",
"1053 Donald Pols 0.002154 0.000261 723.960652 \n",
"3971 Sjoerdsma 0.001867 0.000209 792.624040 \n",
"2734 Marianne Thieme 0.001149 0.000026 4294.456811 \n",
"2583 Lotte van Kruistum 0.001149 0.000026 4294.456811 \n",
"3003 Mirra Andreeva 0.001149 0.000026 4294.456811 \n",
"2351 Kluytmans 0.001149 0.000026 4294.456811 \n",
"249 Antonia Niedermaier 0.001149 0.000026 4294.456811 \n",
"1791 Ilse Kuijt 0.001149 0.000026 4294.456811 \n",
"742 Cobolli 0.001149 0.000026 4294.456811 \n",
"4724 Zoë Slagter 0.001149 0.000026 4294.456811 \n",
"278 Arjan Veurink 0.001580 0.000157 907.063019 \n",
"3098 Naomi Mestrum 0.001292 0.000105 1135.940978 \n",
"2665 Maja Chwalinska 0.001580 0.000209 655.297264 \n",
"4420 Van der Breggen 0.001436 0.000157 815.511836 \n",
"1731 Hitler 0.001005 0.000026 3745.149709 \n",
"2519 Lieke 0.001005 0.000026 3745.149709 \n",
"4176 Teunissen 0.001005 0.000026 3745.149709 \n",
"4464 Veurink 0.001005 0.000026 3745.149709 \n",
"968 Denzel Dumfries 0.002010 0.000418 380.643714 \n",
"2329 Kimi Antonelli 0.003447 0.001203 186.595009 \n",
"2465 Leclerc 0.001292 0.000157 723.960652 \n",
"1250 Esther Ouwehand 0.001292 0.000157 723.960652 \n",
"713 Christine Teunissen 0.001149 0.000105 998.614203 \n",
"1917 Jan Kluytmans 0.001149 0.000105 998.614203 \n",
"2124 Joost Luiten 0.001149 0.000105 998.614203 \n",
"\n",
" log_ratio chi2 p_chi2 g2 p_g2 \\\n",
"4666 2.702725 88.873013 4.209875e-21 73.611094 9.512852e-18 \n",
"2233 2.424445 51.860997 5.957208e-13 42.512795 7.022134e-11 \n",
"2521 6.457558 41.675092 1.077733e-10 34.046050 5.382305e-09 \n",
"55 3.527997 38.897401 4.466750e-10 30.774198 2.898665e-08 \n",
"1343 6.264913 36.186456 1.793125e-09 29.023926 7.148986e-08 \n",
"4362 3.627532 34.197157 4.980167e-09 26.757903 2.306067e-07 \n",
"2797 6.157998 33.443641 7.335924e-09 26.527883 2.597616e-07 \n",
"2503 2.358076 32.500200 1.191803e-08 26.104423 3.234422e-07 \n",
"673 2.779538 28.670638 8.579474e-08 22.442992 2.164739e-06 \n",
"1858 2.779538 28.670638 8.579474e-08 22.442992 2.164739e-06 \n",
"4516 4.158040 27.590589 1.499064e-07 21.070561 4.426770e-06 \n",
"2923 1.813756 25.318681 4.859791e-07 20.713510 5.333836e-06 \n",
"1801 3.679997 26.935070 2.104062e-07 20.564349 5.765997e-06 \n",
"3466 3.679997 26.935070 2.104062e-07 20.564349 5.765997e-06 \n",
"2717 2.960109 26.234266 3.024086e-07 20.256468 6.772409e-06 \n",
"1053 3.042571 23.871944 1.029615e-06 18.209227 1.979176e-05 \n",
"3971 3.158047 21.542862 3.460080e-06 16.178300 5.765077e-05 \n",
"2734 5.457559 19.755766 8.799584e-06 14.281240 1.574261e-04 \n",
"2583 5.457559 19.755766 8.799584e-06 14.281240 1.574261e-04 \n",
"3003 5.457559 19.755766 8.799584e-06 14.281240 1.574261e-04 \n",
"2351 5.457559 19.755766 8.799584e-06 14.281240 1.574261e-04 \n",
"249 5.457559 19.755766 8.799584e-06 14.281240 1.574261e-04 \n",
"1791 5.457559 19.755766 8.799584e-06 14.281240 1.574261e-04 \n",
"742 5.457559 19.755766 8.799584e-06 14.281240 1.574261e-04 \n",
"4724 5.457559 19.755766 8.799584e-06 14.281240 1.574261e-04 \n",
"278 3.332074 19.268029 1.135926e-05 14.174484 1.666147e-04 \n",
"3098 3.627525 17.091366 3.562389e-05 12.221543 4.724085e-04 \n",
"2665 2.917039 16.686682 4.408944e-05 12.214228 4.742643e-04 \n",
"4420 3.194570 16.772235 4.214548e-05 12.131568 4.957543e-04 \n",
"1731 5.264914 17.027730 3.683788e-05 11.905641 5.596421e-04 \n",
"2519 5.264914 17.027730 3.683788e-05 11.905641 5.596421e-04 \n",
"4176 5.264914 17.027730 3.683788e-05 11.905641 5.596421e-04 \n",
"4464 5.264914 17.027730 3.683788e-05 11.905641 5.596421e-04 \n",
"968 2.264965 15.359454 8.887510e-05 11.600092 6.594857e-04 \n",
"2329 1.519013 14.294065 1.563571e-04 11.539896 6.811844e-04 \n",
"2465 3.042567 14.318772 1.543183e-04 10.145781 1.446319e-03 \n",
"1250 3.042567 14.318772 1.543183e-04 10.145781 1.446319e-03 \n",
"713 3.457600 14.529034 1.380160e-04 10.122801 1.464463e-03 \n",
"1917 3.457600 14.529034 1.380160e-04 10.122801 1.464463e-03 \n",
"2124 3.457600 14.529034 1.380160e-04 10.122801 1.464463e-03 \n",
"\n",
" p_g2_adjusted \n",
"4666 2.265010e-14 \n",
"2233 1.114647e-07 \n",
"2521 6.407634e-06 \n",
"55 2.760689e-05 \n",
"1343 5.673912e-05 \n",
"4362 1.546231e-04 \n",
"2797 1.546231e-04 \n",
"2503 1.711368e-04 \n",
"673 9.371352e-04 \n",
"1858 9.371352e-04 \n",
"4516 1.716105e-03 \n",
"2923 1.716105e-03 \n",
"1801 1.716105e-03 \n",
"3466 1.716105e-03 \n",
"2717 1.897071e-03 \n",
"1053 5.236021e-03 \n",
"3971 1.372665e-02 \n",
"2734 2.404300e-02 \n",
"2583 2.404300e-02 \n",
"3003 2.404300e-02 \n",
"2351 2.404300e-02 \n",
"249 2.404300e-02 \n",
"1791 2.404300e-02 \n",
"742 2.404300e-02 \n",
"4724 2.404300e-02 \n",
"278 2.404300e-02 \n",
"3098 6.103910e-02 \n",
"2665 6.103910e-02 \n",
"4420 6.212584e-02 \n",
"1731 6.345276e-02 \n",
"2519 6.345276e-02 \n",
"4176 6.345276e-02 \n",
"4464 6.345276e-02 \n",
"968 7.303421e-02 \n",
"2329 7.372272e-02 \n",
"2465 1.306897e-01 \n",
"1250 1.306897e-01 \n",
"713 1.306897e-01 \n",
"1917 1.306897e-01 \n",
"2124 1.306897e-01 "
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# stijgers\n",
"results[results.pct_diff > 0].sort_values('g2', ascending=False)[:40]"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "bccce269-9540-445e-a5f9-775d55b469b9",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" word | \n",
" freq_recent | \n",
" freq_reference | \n",
" pct_diff | \n",
" log_ratio | \n",
" chi2 | \n",
" p_chi2 | \n",
" g2 | \n",
" p_g2 | \n",
" p_g2_adjusted | \n",
"
\n",
" \n",
" \n",
" \n",
" | 1743 | \n",
" Hondius | \n",
" 0.000431 | \n",
" 0.010457 | \n",
" -95.880197 | \n",
" -4.601278 | \n",
" 66.470517 | \n",
" 3.551664e-16 | \n",
" 98.275792 | \n",
" 3.639886e-23 | \n",
" 1.733314e-19 | \n",
"
\n",
" \n",
" | 4215 | \n",
" Thymen Arensman | \n",
" 0.000072 | \n",
" 0.002353 | \n",
" -96.948294 | \n",
" -5.034221 | \n",
" 15.256919 | \n",
" 9.383239e-05 | \n",
" 20.686464 | \n",
" 5.409706e-06 | \n",
" 1.716105e-03 | \n",
"
\n",
" \n",
" | 1508 | \n",
" Gidi Markuszower | \n",
" 0.000072 | \n",
" 0.002091 | \n",
" -96.566831 | \n",
" -4.864296 | \n",
" 13.434157 | \n",
" 2.470840e-04 | \n",
" 17.811640 | \n",
" 2.438866e-05 | \n",
" 6.112569e-03 | \n",
"
\n",
" \n",
" | 4495 | \n",
" Vingegaard | \n",
" 0.000072 | \n",
" 0.001882 | \n",
" -96.185367 | \n",
" -4.712293 | \n",
" 11.977136 | \n",
" 5.385731e-04 | \n",
" 15.534557 | \n",
" 8.101072e-05 | \n",
" 1.837014e-02 | \n",
"
\n",
" \n",
" | 2782 | \n",
" Markuszower | \n",
" 0.000072 | \n",
" 0.001830 | \n",
" -96.076378 | \n",
" -4.671651 | \n",
" 11.613072 | \n",
" 6.548989e-04 | \n",
" 14.969018 | \n",
" 1.092909e-04 | \n",
" 2.365652e-02 | \n",
"
\n",
" \n",
" | 2109 | \n",
" Jonas Vingegaard | \n",
" 0.000431 | \n",
" 0.002667 | \n",
" -83.843909 | \n",
" -2.629847 | \n",
" 12.353905 | \n",
" 4.400650e-04 | \n",
" 14.707179 | \n",
" 1.255674e-04 | \n",
" 2.404300e-02 | \n",
"
\n",
" \n",
" | 3750 | \n",
" Rubio | \n",
" 0.000287 | \n",
" 0.002301 | \n",
" -87.515748 | \n",
" -3.001814 | \n",
" 11.757125 | \n",
" 6.061077e-04 | \n",
" 14.212300 | \n",
" 1.632996e-04 | \n",
" 2.404300e-02 | \n",
"
\n",
" \n",
" | 115 | \n",
" Ali B | \n",
" 0.000072 | \n",
" 0.001725 | \n",
" -95.838583 | \n",
" -4.586762 | \n",
" 10.885206 | \n",
" 9.693541e-04 | \n",
" 13.843023 | \n",
" 1.987332e-04 | \n",
" 2.783434e-02 | \n",
"
\n",
" \n",
" | 512 | \n",
" Botic van de Zandschulp | \n",
" 0.000072 | \n",
" 0.001621 | \n",
" -95.570104 | \n",
" -4.496564 | \n",
" 10.157724 | \n",
" 1.436979e-03 | \n",
" 12.724502 | \n",
" 3.608960e-04 | \n",
" 4.910248e-02 | \n",
"
\n",
" \n",
" | 921 | \n",
" De Jong | \n",
" 0.000574 | \n",
" 0.002562 | \n",
" -77.579302 | \n",
" -2.157095 | \n",
" 9.947317 | \n",
" 1.610840e-03 | \n",
" 11.220837 | \n",
" 8.088400e-04 | \n",
" 8.559325e-02 | \n",
"
\n",
" \n",
" | 4034 | \n",
" Starmer | \n",
" 0.000574 | \n",
" 0.002510 | \n",
" -77.112204 | \n",
" -2.127348 | \n",
" 9.611842 | \n",
" 1.933266e-03 | \n",
" 10.778088 | \n",
" 1.027087e-03 | \n",
" 1.060152e-01 | \n",
"
\n",
" \n",
" | 1054 | \n",
" Donald Trump | \n",
" 0.010196 | \n",
" 0.015529 | \n",
" -34.342080 | \n",
" -0.606959 | \n",
" 10.440052 | \n",
" 1.233118e-03 | \n",
" 10.743700 | \n",
" 1.046349e-03 | \n",
" 1.060152e-01 | \n",
"
\n",
" \n",
" | 4169 | \n",
" Tedros Adhanom Ghebreyesus | \n",
" 0.000072 | \n",
" 0.001412 | \n",
" -94.913823 | \n",
" -4.297255 | \n",
" 8.704154 | \n",
" 3.174857e-03 | \n",
" 10.514021 | \n",
" 1.184722e-03 | \n",
" 1.175343e-01 | \n",
"
\n",
" \n",
" | 269 | \n",
" Arensman | \n",
" 0.000072 | \n",
" 0.001359 | \n",
" -94.718201 | \n",
" -4.242808 | \n",
" 8.341110 | \n",
" 3.875791e-03 | \n",
" 9.967878 | \n",
" 1.592950e-03 | \n",
" 1.306897e-01 | \n",
"
\n",
" \n",
" | 3185 | \n",
" Noam Bettan | \n",
" 0.000072 | \n",
" 0.001307 | \n",
" -94.506929 | \n",
" -4.186224 | \n",
" 7.978231 | \n",
" 4.734318e-03 | \n",
" 9.424725 | \n",
" 2.140792e-03 | \n",
" 1.396500e-01 | \n",
"
\n",
" \n",
" | 3082 | \n",
" Máxima | \n",
" 0.002010 | \n",
" 0.004497 | \n",
" -55.288957 | \n",
" -1.161296 | \n",
" 8.263354 | \n",
" 4.045333e-03 | \n",
" 8.639908 | \n",
" 3.288780e-03 | \n",
" 2.088156e-01 | \n",
"
\n",
" \n",
" | 1099 | \n",
" Dylan Groenewegen | \n",
" 0.000072 | \n",
" 0.001203 | \n",
" -94.029271 | \n",
" -4.065930 | \n",
" 7.253040 | \n",
" 7.078107e-03 | \n",
" 8.348388 | \n",
" 3.860297e-03 | \n",
" 2.418781e-01 | \n",
"
\n",
" \n",
" | 4258 | \n",
" Tom Berendsen | \n",
" 0.000574 | \n",
" 0.002196 | \n",
" -73.842519 | \n",
" -1.934703 | \n",
" 7.626670 | \n",
" 5.751139e-03 | \n",
" 8.204369 | \n",
" 4.178964e-03 | \n",
" 2.456818e-01 | \n",
"
\n",
" \n",
" | 4598 | \n",
" Willem-Alexander | \n",
" 0.001436 | \n",
" 0.003555 | \n",
" -59.609772 | \n",
" -1.307921 | \n",
" 7.692603 | \n",
" 5.544761e-03 | \n",
" 8.044226 | \n",
" 4.564892e-03 | \n",
" 2.587859e-01 | \n",
"
\n",
" \n",
" | 3222 | \n",
" Oceanwide Expeditions | \n",
" 0.000072 | \n",
" 0.001150 | \n",
" -93.757874 | \n",
" -4.001800 | \n",
" 6.890771 | \n",
" 8.664187e-03 | \n",
" 7.815786 | \n",
" 5.179183e-03 | \n",
" 2.603795e-01 | \n",
"
\n",
" \n",
" | 1411 | \n",
" Freek | \n",
" 0.000072 | \n",
" 0.001150 | \n",
" -93.757874 | \n",
" -4.001800 | \n",
" 6.890771 | \n",
" 8.664187e-03 | \n",
" 7.815786 | \n",
" 5.179183e-03 | \n",
" 2.603795e-01 | \n",
"
\n",
" \n",
" | 2226 | \n",
" Kaja Kallas | \n",
" 0.000072 | \n",
" 0.001098 | \n",
" -93.460630 | \n",
" -3.934686 | \n",
" 6.528755 | \n",
" 1.061442e-02 | \n",
" 7.287350 | \n",
" 6.944183e-03 | \n",
" 2.603795e-01 | \n",
"
\n",
" \n",
" | 4454 | \n",
" Verhoeven | \n",
" 0.000072 | \n",
" 0.001098 | \n",
" -93.460630 | \n",
" -3.934686 | \n",
" 6.528755 | \n",
" 1.061442e-02 | \n",
" 7.287350 | \n",
" 6.944183e-03 | \n",
" 2.603795e-01 | \n",
"
\n",
" \n",
" | 1401 | \n",
" Fred Rutten | \n",
" 0.000072 | \n",
" 0.001098 | \n",
" -93.460630 | \n",
" -3.934686 | \n",
" 6.528755 | \n",
" 1.061442e-02 | \n",
" 7.287350 | \n",
" 6.944183e-03 | \n",
" 2.603795e-01 | \n",
"
\n",
" \n",
" | 1981 | \n",
" Jerdy Schouten | \n",
" 0.000072 | \n",
" 0.001046 | \n",
" -93.133661 | \n",
" -3.864296 | \n",
" 6.167024 | \n",
" 1.301534e-02 | \n",
" 6.763485 | \n",
" 9.304187e-03 | \n",
" 3.370342e-01 | \n",
"
\n",
" \n",
" | 2977 | \n",
" Mikel Arteta | \n",
" 0.000072 | \n",
" 0.001046 | \n",
" -93.133661 | \n",
" -3.864296 | \n",
" 6.167024 | \n",
" 1.301534e-02 | \n",
" 6.763485 | \n",
" 9.304187e-03 | \n",
" 3.370342e-01 | \n",
"
\n",
" \n",
" | 3013 | \n",
" Modi | \n",
" 0.000072 | \n",
" 0.001046 | \n",
" -93.133661 | \n",
" -3.864296 | \n",
" 6.167024 | \n",
" 1.301534e-02 | \n",
" 6.763485 | \n",
" 9.304187e-03 | \n",
" 3.370342e-01 | \n",
"
\n",
" \n",
" | 3237 | \n",
" Oleksandr Usyk | \n",
" 0.000072 | \n",
" 0.001046 | \n",
" -93.133661 | \n",
" -3.864296 | \n",
" 6.167024 | \n",
" 1.301534e-02 | \n",
" 6.763485 | \n",
" 9.304187e-03 | \n",
" 3.370342e-01 | \n",
"
\n",
" \n",
" | 417 | \n",
" Berendsen | \n",
" 0.000718 | \n",
" 0.002248 | \n",
" -68.063541 | \n",
" -1.646722 | \n",
" 6.509375 | \n",
" 1.073072e-02 | \n",
" 6.756171 | \n",
" 9.342400e-03 | \n",
" 3.370342e-01 | \n",
"
\n",
" \n",
" | 2016 | \n",
" Jetten | \n",
" 0.002441 | \n",
" 0.004601 | \n",
" -46.941928 | \n",
" -0.914356 | \n",
" 5.941062 | \n",
" 1.479210e-02 | \n",
" 5.969003 | \n",
" 1.455951e-02 | \n",
" 4.952314e-01 | \n",
"
\n",
" \n",
" | 1310 | \n",
" Felix Gall | \n",
" 0.000072 | \n",
" 0.000941 | \n",
" -92.370735 | \n",
" -3.712293 | \n",
" 5.444587 | \n",
" 1.962906e-02 | \n",
" 5.731410 | \n",
" 1.666410e-02 | \n",
" 5.501480e-01 | \n",
"
\n",
" \n",
" | 1167 | \n",
" Ellen ten Damme | \n",
" 0.000072 | \n",
" 0.000941 | \n",
" -92.370735 | \n",
" -3.712293 | \n",
" 5.444587 | \n",
" 1.962906e-02 | \n",
" 5.731410 | \n",
" 1.666410e-02 | \n",
" 5.501480e-01 | \n",
"
\n",
" \n",
" | 4101 | \n",
" Suzan & Freek | \n",
" 0.000072 | \n",
" 0.000941 | \n",
" -92.370735 | \n",
" -3.712293 | \n",
" 5.444587 | \n",
" 1.962906e-02 | \n",
" 5.731410 | \n",
" 1.666410e-02 | \n",
" 5.501480e-01 | \n",
"
\n",
" \n",
" | 4141 | \n",
" Tallon Griekspoor | \n",
" 0.000431 | \n",
" 0.001621 | \n",
" -73.420624 | \n",
" -1.911618 | \n",
" 5.554715 | \n",
" 1.843098e-02 | \n",
" 5.650035 | \n",
" 1.745502e-02 | \n",
" 5.501480e-01 | \n",
"
\n",
" \n",
" | 4655 | \n",
" Xi Jinping | \n",
" 0.001149 | \n",
" 0.002719 | \n",
" -57.745608 | \n",
" -1.242826 | \n",
" 5.484134 | \n",
" 1.918982e-02 | \n",
" 5.488524 | \n",
" 1.914170e-02 | \n",
" 5.501480e-01 | \n",
"
\n",
" \n",
" | 133 | \n",
" Amalia | \n",
" 0.000431 | \n",
" 0.001569 | \n",
" -72.534645 | \n",
" -1.864313 | \n",
" 5.230992 | \n",
" 2.218788e-02 | \n",
" 5.249197 | \n",
" 2.195690e-02 | \n",
" 5.501480e-01 | \n",
"
\n",
" \n",
" | 3767 | \n",
" Rutten | \n",
" 0.000072 | \n",
" 0.000889 | \n",
" -91.921954 | \n",
" -3.629831 | \n",
" 5.083988 | \n",
" 2.414777e-02 | \n",
" 5.224377 | \n",
" 2.227242e-02 | \n",
" 5.501480e-01 | \n",
"
\n",
" \n",
" | 2970 | \n",
" Mika Godts | \n",
" 0.000072 | \n",
" 0.000889 | \n",
" -91.921954 | \n",
" -3.629831 | \n",
" 5.083988 | \n",
" 2.414777e-02 | \n",
" 5.224377 | \n",
" 2.227242e-02 | \n",
" 5.501480e-01 | \n",
"
\n",
" \n",
" | 537 | \n",
" Brekelmans | \n",
" 0.000072 | \n",
" 0.000889 | \n",
" -91.921954 | \n",
" -3.629831 | \n",
" 5.083988 | \n",
" 2.414777e-02 | \n",
" 5.224377 | \n",
" 2.227242e-02 | \n",
" 5.501480e-01 | \n",
"
\n",
" \n",
" | 2712 | \n",
" Marco Rubio | \n",
" 0.000862 | \n",
" 0.002248 | \n",
" -61.676249 | \n",
" -1.383688 | \n",
" 5.236100 | \n",
" 2.212281e-02 | \n",
" 5.213944 | \n",
" 2.240645e-02 | \n",
" 5.501480e-01 | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" word freq_recent freq_reference pct_diff \\\n",
"1743 Hondius 0.000431 0.010457 -95.880197 \n",
"4215 Thymen Arensman 0.000072 0.002353 -96.948294 \n",
"1508 Gidi Markuszower 0.000072 0.002091 -96.566831 \n",
"4495 Vingegaard 0.000072 0.001882 -96.185367 \n",
"2782 Markuszower 0.000072 0.001830 -96.076378 \n",
"2109 Jonas Vingegaard 0.000431 0.002667 -83.843909 \n",
"3750 Rubio 0.000287 0.002301 -87.515748 \n",
"115 Ali B 0.000072 0.001725 -95.838583 \n",
"512 Botic van de Zandschulp 0.000072 0.001621 -95.570104 \n",
"921 De Jong 0.000574 0.002562 -77.579302 \n",
"4034 Starmer 0.000574 0.002510 -77.112204 \n",
"1054 Donald Trump 0.010196 0.015529 -34.342080 \n",
"4169 Tedros Adhanom Ghebreyesus 0.000072 0.001412 -94.913823 \n",
"269 Arensman 0.000072 0.001359 -94.718201 \n",
"3185 Noam Bettan 0.000072 0.001307 -94.506929 \n",
"3082 Máxima 0.002010 0.004497 -55.288957 \n",
"1099 Dylan Groenewegen 0.000072 0.001203 -94.029271 \n",
"4258 Tom Berendsen 0.000574 0.002196 -73.842519 \n",
"4598 Willem-Alexander 0.001436 0.003555 -59.609772 \n",
"3222 Oceanwide Expeditions 0.000072 0.001150 -93.757874 \n",
"1411 Freek 0.000072 0.001150 -93.757874 \n",
"2226 Kaja Kallas 0.000072 0.001098 -93.460630 \n",
"4454 Verhoeven 0.000072 0.001098 -93.460630 \n",
"1401 Fred Rutten 0.000072 0.001098 -93.460630 \n",
"1981 Jerdy Schouten 0.000072 0.001046 -93.133661 \n",
"2977 Mikel Arteta 0.000072 0.001046 -93.133661 \n",
"3013 Modi 0.000072 0.001046 -93.133661 \n",
"3237 Oleksandr Usyk 0.000072 0.001046 -93.133661 \n",
"417 Berendsen 0.000718 0.002248 -68.063541 \n",
"2016 Jetten 0.002441 0.004601 -46.941928 \n",
"1310 Felix Gall 0.000072 0.000941 -92.370735 \n",
"1167 Ellen ten Damme 0.000072 0.000941 -92.370735 \n",
"4101 Suzan & Freek 0.000072 0.000941 -92.370735 \n",
"4141 Tallon Griekspoor 0.000431 0.001621 -73.420624 \n",
"4655 Xi Jinping 0.001149 0.002719 -57.745608 \n",
"133 Amalia 0.000431 0.001569 -72.534645 \n",
"3767 Rutten 0.000072 0.000889 -91.921954 \n",
"2970 Mika Godts 0.000072 0.000889 -91.921954 \n",
"537 Brekelmans 0.000072 0.000889 -91.921954 \n",
"2712 Marco Rubio 0.000862 0.002248 -61.676249 \n",
"\n",
" log_ratio chi2 p_chi2 g2 p_g2 \\\n",
"1743 -4.601278 66.470517 3.551664e-16 98.275792 3.639886e-23 \n",
"4215 -5.034221 15.256919 9.383239e-05 20.686464 5.409706e-06 \n",
"1508 -4.864296 13.434157 2.470840e-04 17.811640 2.438866e-05 \n",
"4495 -4.712293 11.977136 5.385731e-04 15.534557 8.101072e-05 \n",
"2782 -4.671651 11.613072 6.548989e-04 14.969018 1.092909e-04 \n",
"2109 -2.629847 12.353905 4.400650e-04 14.707179 1.255674e-04 \n",
"3750 -3.001814 11.757125 6.061077e-04 14.212300 1.632996e-04 \n",
"115 -4.586762 10.885206 9.693541e-04 13.843023 1.987332e-04 \n",
"512 -4.496564 10.157724 1.436979e-03 12.724502 3.608960e-04 \n",
"921 -2.157095 9.947317 1.610840e-03 11.220837 8.088400e-04 \n",
"4034 -2.127348 9.611842 1.933266e-03 10.778088 1.027087e-03 \n",
"1054 -0.606959 10.440052 1.233118e-03 10.743700 1.046349e-03 \n",
"4169 -4.297255 8.704154 3.174857e-03 10.514021 1.184722e-03 \n",
"269 -4.242808 8.341110 3.875791e-03 9.967878 1.592950e-03 \n",
"3185 -4.186224 7.978231 4.734318e-03 9.424725 2.140792e-03 \n",
"3082 -1.161296 8.263354 4.045333e-03 8.639908 3.288780e-03 \n",
"1099 -4.065930 7.253040 7.078107e-03 8.348388 3.860297e-03 \n",
"4258 -1.934703 7.626670 5.751139e-03 8.204369 4.178964e-03 \n",
"4598 -1.307921 7.692603 5.544761e-03 8.044226 4.564892e-03 \n",
"3222 -4.001800 6.890771 8.664187e-03 7.815786 5.179183e-03 \n",
"1411 -4.001800 6.890771 8.664187e-03 7.815786 5.179183e-03 \n",
"2226 -3.934686 6.528755 1.061442e-02 7.287350 6.944183e-03 \n",
"4454 -3.934686 6.528755 1.061442e-02 7.287350 6.944183e-03 \n",
"1401 -3.934686 6.528755 1.061442e-02 7.287350 6.944183e-03 \n",
"1981 -3.864296 6.167024 1.301534e-02 6.763485 9.304187e-03 \n",
"2977 -3.864296 6.167024 1.301534e-02 6.763485 9.304187e-03 \n",
"3013 -3.864296 6.167024 1.301534e-02 6.763485 9.304187e-03 \n",
"3237 -3.864296 6.167024 1.301534e-02 6.763485 9.304187e-03 \n",
"417 -1.646722 6.509375 1.073072e-02 6.756171 9.342400e-03 \n",
"2016 -0.914356 5.941062 1.479210e-02 5.969003 1.455951e-02 \n",
"1310 -3.712293 5.444587 1.962906e-02 5.731410 1.666410e-02 \n",
"1167 -3.712293 5.444587 1.962906e-02 5.731410 1.666410e-02 \n",
"4101 -3.712293 5.444587 1.962906e-02 5.731410 1.666410e-02 \n",
"4141 -1.911618 5.554715 1.843098e-02 5.650035 1.745502e-02 \n",
"4655 -1.242826 5.484134 1.918982e-02 5.488524 1.914170e-02 \n",
"133 -1.864313 5.230992 2.218788e-02 5.249197 2.195690e-02 \n",
"3767 -3.629831 5.083988 2.414777e-02 5.224377 2.227242e-02 \n",
"2970 -3.629831 5.083988 2.414777e-02 5.224377 2.227242e-02 \n",
"537 -3.629831 5.083988 2.414777e-02 5.224377 2.227242e-02 \n",
"2712 -1.383688 5.236100 2.212281e-02 5.213944 2.240645e-02 \n",
"\n",
" p_g2_adjusted \n",
"1743 1.733314e-19 \n",
"4215 1.716105e-03 \n",
"1508 6.112569e-03 \n",
"4495 1.837014e-02 \n",
"2782 2.365652e-02 \n",
"2109 2.404300e-02 \n",
"3750 2.404300e-02 \n",
"115 2.783434e-02 \n",
"512 4.910248e-02 \n",
"921 8.559325e-02 \n",
"4034 1.060152e-01 \n",
"1054 1.060152e-01 \n",
"4169 1.175343e-01 \n",
"269 1.306897e-01 \n",
"3185 1.396500e-01 \n",
"3082 2.088156e-01 \n",
"1099 2.418781e-01 \n",
"4258 2.456818e-01 \n",
"4598 2.587859e-01 \n",
"3222 2.603795e-01 \n",
"1411 2.603795e-01 \n",
"2226 2.603795e-01 \n",
"4454 2.603795e-01 \n",
"1401 2.603795e-01 \n",
"1981 3.370342e-01 \n",
"2977 3.370342e-01 \n",
"3013 3.370342e-01 \n",
"3237 3.370342e-01 \n",
"417 3.370342e-01 \n",
"2016 4.952314e-01 \n",
"1310 5.501480e-01 \n",
"1167 5.501480e-01 \n",
"4101 5.501480e-01 \n",
"4141 5.501480e-01 \n",
"4655 5.501480e-01 \n",
"133 5.501480e-01 \n",
"3767 5.501480e-01 \n",
"2970 5.501480e-01 \n",
"537 5.501480e-01 \n",
"2712 5.501480e-01 "
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# dalers\n",
"results[results.pct_diff < 0].sort_values('g2', ascending=False)[:40]"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.13.5"
}
},
"nbformat": 4,
"nbformat_minor": 5
}