# %%
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import gc

# %%
# Trades snapshot read from the project's data directory (path is relative
# to the notebook's working directory).
unknown_traders = pd.read_parquet("../data/unknown_traders.parquet")

# %%
# Earlier snapshot of the same dataset, loaded to compare the covered periods.
old_unknown_traders = pd.read_parquet("../data/old_unknown_traders.parquet")

# %%
unknown_traders.columns

# %%
# Series.max()/min() are vectorised and skip NaT, whereas the Python builtins
# iterate element by element and give order-dependent results when NaT is present.
unknown_traders.creation_timestamp.max()

# %%
unknown_traders.creation_timestamp.min()

# %%
old_unknown_traders.creation_timestamp.max()

# %%
old_unknown_traders.creation_timestamp.min()
from datetime import datetime, timezone


def transform_to_datetime(x):
    """Convert a Unix timestamp in seconds to a timezone-aware UTC datetime.

    Args:
        x: Any value accepted by ``int()`` (int, float, numeric string).

    Returns:
        datetime: The corresponding moment with ``tzinfo`` set to UTC.

    Raises:
        ValueError / TypeError: If ``x`` cannot be converted with ``int()``.
    """
    return datetime.fromtimestamp(int(x), tz=timezone.utc)


def add_creation_date(df):
    """Add a midnight-normalised ``creation_date`` column to ``df``.

    Two input layouts are supported:

    * ``creationTimestamp`` holds epoch seconds: it is converted to UTC
      datetimes and mirrored into ``creation_timestamp``.
    * only ``creation_timestamp`` (already datetime-like) is present: it is
      used as is.

    The frame is modified in place and also returned, so both
    ``df = add_creation_date(df)`` and a bare call work. Calling the function
    again on its own output is safe.

    Args:
        df: DataFrame with a ``creationTimestamp`` and/or a datetime-like
            ``creation_timestamp`` column.

    Returns:
        pandas.DataFrame: The same ``df`` object with ``creation_date``
        (timezone-naive datetime64 at midnight) added.

    Raises:
        KeyError: If neither timestamp column exists.
        ValueError / TypeError: If ``creationTimestamp`` contains values that
            are not valid epoch seconds. These used to be swallowed silently.
    """
    if "creationTimestamp" in df.columns:
        raw = df["creationTimestamp"]
        # Already-converted columns (e.g. the cell was re-run) must not go
        # through int() again; that would raise on Timestamp values.
        if not pd.api.types.is_datetime64_any_dtype(raw):
            df["creationTimestamp"] = pd.to_datetime(
                raw.apply(transform_to_datetime), utc=True
            )
        df["creation_timestamp"] = pd.to_datetime(df["creationTimestamp"])
    elif "creation_timestamp" not in df.columns:
        raise KeyError(
            "expected a 'creationTimestamp' or 'creation_timestamp' column"
        )

    # .dt.date drops the time-of-day (and timezone); converting back yields a
    # datetime64 column that is convenient for grouping and plotting.
    df["creation_date"] = pd.to_datetime(df["creation_timestamp"].dt.date)
    return df
# %%
old_unknown_traders = add_creation_date(old_unknown_traders)

# %%
unknown_traders = add_creation_date(unknown_traders)

# %%
# Label every trade with its weekly period, formatted like "Jan-12-2025".
# Periods cannot carry a timezone, so the timezone is dropped explicitly
# (wall-clock time is kept) before converting; letting to_period() do it
# implicitly emits a UserWarning on every run.
unknown_traders["month_year_week"] = (
    pd.to_datetime(unknown_traders["creation_timestamp"])
    .dt.tz_localize(None)
    .dt.to_period("W")
    .dt.strftime("%b-%d-%Y")
)
\n", " | trader_address | \n", "market_creator | \n", "trade_id | \n", "creation_timestamp | \n", "title | \n", "market_status | \n", "collateral_amount | \n", "outcome_index | \n", "trade_fee_amount | \n", "outcomes_tokens_traded | \n", "... | \n", "redeemed | \n", "redeemed_amount | \n", "num_mech_calls | \n", "mech_fee_amount | \n", "net_earnings | \n", "roi | \n", "staking | \n", "nr_mech_calls | \n", "creation_date | \n", "month_year_week | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0x05e8bbdb89c84a14d05194bbbae81caf2340db72 | \n", "quickstart | \n", "0x083c9f03dfc4072082b9e10aa2137151346f6fd30x05... | \n", "2025-01-12 12:21:40+00:00 | \n", "Will federal prosecutors announce any new char... | \n", "CLOSED | \n", "0.204245 | \n", "1 | \n", "0.002042 | \n", "0.279142 | \n", "... | \n", "True | \n", "0.279142 | \n", "0 | \n", "0.0 | \n", "0.072854 | \n", "0.353167 | \n", "non_Olas | \n", "NaN | \n", "2025-01-12 | \n", "Jan-12-2025 | \n", "
1 | \n", "0x05e8bbdb89c84a14d05194bbbae81caf2340db72 | \n", "quickstart | \n", "0x0b52672f29f059b1d0c3a297b28670fb8d92c4bd0x05... | \n", "2024-12-27 00:21:40+00:00 | \n", "Will a third fight between Usyk and Fury be of... | \n", "CLOSED | \n", "0.943883 | \n", "1 | \n", "0.009439 | \n", "1.302968 | \n", "... | \n", "True | \n", "1.302968 | \n", "0 | \n", "0.0 | \n", "0.349646 | \n", "0.366766 | \n", "non_Olas | \n", "NaN | \n", "2024-12-27 | \n", "Dec-29-2024 | \n", "
2 | \n", "0x05e8bbdb89c84a14d05194bbbae81caf2340db72 | \n", "quickstart | \n", "0x0de08cc50fa523de23b95ce7ad773e038fb8590d0x05... | \n", "2025-01-09 06:21:15+00:00 | \n", "Will record-low temperatures be recorded in at... | \n", "CLOSED | \n", "2.185557 | \n", "1 | \n", "0.021856 | \n", "3.456138 | \n", "... | \n", "True | \n", "0.000000 | \n", "0 | \n", "0.0 | \n", "-2.207412 | \n", "-1.000000 | \n", "non_Olas | \n", "NaN | \n", "2025-01-09 | \n", "Jan-12-2025 | \n", "
3 | \n", "0x05e8bbdb89c84a14d05194bbbae81caf2340db72 | \n", "quickstart | \n", "0x0f90a2ea8a8b0fbca021405563e763acb9f7d9460x05... | \n", "2024-12-27 18:21:35+00:00 | \n", "Will any new unfair labor practice charges be ... | \n", "CLOSED | \n", "0.430373 | \n", "0 | \n", "0.004304 | \n", "0.586244 | \n", "... | \n", "True | \n", "0.586244 | \n", "0 | \n", "0.0 | \n", "0.151567 | \n", "0.348688 | \n", "non_Olas | \n", "NaN | \n", "2024-12-27 | \n", "Dec-29-2024 | \n", "
4 | \n", "0x05e8bbdb89c84a14d05194bbbae81caf2340db72 | \n", "quickstart | \n", "0x13e42a5f5422df80a05c4b7b8d01bd21be82289b0x05... | \n", "2025-01-08 18:22:00+00:00 | \n", "Will the Israeli government publicly acknowled... | \n", "CLOSED | \n", "3.227216 | \n", "1 | \n", "0.032272 | \n", "7.405353 | \n", "... | \n", "True | \n", "7.405353 | \n", "0 | \n", "0.0 | \n", "4.145865 | \n", "1.271938 | \n", "non_Olas | \n", "NaN | \n", "2025-01-08 | \n", "Jan-12-2025 | \n", "
5 rows × 24 columns
\n", "\n", " | trader_address | \n", "market_creator | \n", "trade_id | \n", "creation_timestamp | \n", "title | \n", "market_status | \n", "collateral_amount | \n", "outcome_index | \n", "trade_fee_amount | \n", "outcomes_tokens_traded | \n", "... | \n", "redeemed | \n", "redeemed_amount | \n", "num_mech_calls | \n", "mech_fee_amount | \n", "net_earnings | \n", "roi | \n", "staking | \n", "nr_mech_calls | \n", "creation_date | \n", "month_year_week | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0x05e8bbdb89c84a14d05194bbbae81caf2340db72 | \n", "quickstart | \n", "0x083c9f03dfc4072082b9e10aa2137151346f6fd30x05... | \n", "2025-01-12 12:21:40+00:00 | \n", "Will federal prosecutors announce any new char... | \n", "CLOSED | \n", "0.204245 | \n", "1 | \n", "0.002042 | \n", "0.279142 | \n", "... | \n", "True | \n", "0.279142 | \n", "0 | \n", "0.0 | \n", "0.072854 | \n", "0.353167 | \n", "non_Olas | \n", "NaN | \n", "2025-01-12 | \n", "Jan-06-2025 | \n", "
1 | \n", "0x05e8bbdb89c84a14d05194bbbae81caf2340db72 | \n", "quickstart | \n", "0x0b52672f29f059b1d0c3a297b28670fb8d92c4bd0x05... | \n", "2024-12-27 00:21:40+00:00 | \n", "Will a third fight between Usyk and Fury be of... | \n", "CLOSED | \n", "0.943883 | \n", "1 | \n", "0.009439 | \n", "1.302968 | \n", "... | \n", "True | \n", "1.302968 | \n", "0 | \n", "0.0 | \n", "0.349646 | \n", "0.366766 | \n", "non_Olas | \n", "NaN | \n", "2024-12-27 | \n", "Dec-23-2024 | \n", "
2 | \n", "0x05e8bbdb89c84a14d05194bbbae81caf2340db72 | \n", "quickstart | \n", "0x0de08cc50fa523de23b95ce7ad773e038fb8590d0x05... | \n", "2025-01-09 06:21:15+00:00 | \n", "Will record-low temperatures be recorded in at... | \n", "CLOSED | \n", "2.185557 | \n", "1 | \n", "0.021856 | \n", "3.456138 | \n", "... | \n", "True | \n", "0.000000 | \n", "0 | \n", "0.0 | \n", "-2.207412 | \n", "-1.000000 | \n", "non_Olas | \n", "NaN | \n", "2025-01-09 | \n", "Jan-06-2025 | \n", "
3 | \n", "0x05e8bbdb89c84a14d05194bbbae81caf2340db72 | \n", "quickstart | \n", "0x0f90a2ea8a8b0fbca021405563e763acb9f7d9460x05... | \n", "2024-12-27 18:21:35+00:00 | \n", "Will any new unfair labor practice charges be ... | \n", "CLOSED | \n", "0.430373 | \n", "0 | \n", "0.004304 | \n", "0.586244 | \n", "... | \n", "True | \n", "0.586244 | \n", "0 | \n", "0.0 | \n", "0.151567 | \n", "0.348688 | \n", "non_Olas | \n", "NaN | \n", "2024-12-27 | \n", "Dec-23-2024 | \n", "
4 | \n", "0x05e8bbdb89c84a14d05194bbbae81caf2340db72 | \n", "quickstart | \n", "0x13e42a5f5422df80a05c4b7b8d01bd21be82289b0x05... | \n", "2025-01-08 18:22:00+00:00 | \n", "Will the Israeli government publicly acknowled... | \n", "CLOSED | \n", "3.227216 | \n", "1 | \n", "0.032272 | \n", "7.405353 | \n", "... | \n", "True | \n", "7.405353 | \n", "0 | \n", "0.0 | \n", "4.145865 | \n", "1.271938 | \n", "non_Olas | \n", "NaN | \n", "2025-01-08 | \n", "Jan-06-2025 | \n", "
5 rows × 24 columns
\n", "\n", " | trader_address | \n", "market_creator | \n", "trade_id | \n", "creation_timestamp | \n", "title | \n", "market_status | \n", "collateral_amount | \n", "outcome_index | \n", "trade_fee_amount | \n", "outcomes_tokens_traded | \n", "... | \n", "is_invalid | \n", "winning_trade | \n", "earnings | \n", "redeemed | \n", "redeemed_amount | \n", "num_mech_calls | \n", "mech_fee_amount | \n", "net_earnings | \n", "roi | \n", "staking | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0x23522318aebb55b55879b60fb3ad4682abc6cc2f | \n", "quickstart | \n", "0xeeaadfc4d0ef3f3bb1c430bc96657ed01a52e3e20x23... | \n", "2024-12-23 12:36:05+00:00 | \n", "Will any additional Amazon facilities join the... | \n", "CLOSED | \n", "0.401540 | \n", "0 | \n", "0.004015 | \n", "0.939802 | \n", "... | \n", "False | \n", "True | \n", "0.939802 | \n", "True | \n", "0.939802 | \n", "0 | \n", "0.0 | \n", "0.534247 | \n", "1.317323 | \n", "non_Olas | \n", "
1 | \n", "0x8c4abc95e0091bf3bffe723d2b3c958edf642549 | \n", "quickstart | \n", "0x6df8ac2c78c8a801d6b6f30e19d3c193daf54f1e0x8c... | \n", "2024-12-24 07:22:50+00:00 | \n", "Will the World Health Organization issue an of... | \n", "CLOSED | \n", "0.298503 | \n", "0 | \n", "0.002985 | \n", "0.624681 | \n", "... | \n", "False | \n", "True | \n", "0.624681 | \n", "True | \n", "0.624681 | \n", "0 | \n", "0.0 | \n", "0.323193 | \n", "1.071994 | \n", "non_Olas | \n", "
2 | \n", "0xb3ead49f4797662511816d2798f774dee3603185 | \n", "quickstart | \n", "0x4cb63dbf490e1f8f7c10d1e62be7ae6bbbb6d0790xb3... | \n", "2024-12-23 12:50:40+00:00 | \n", "Will Dominion Energy announce any additional p... | \n", "CLOSED | \n", "0.423050 | \n", "1 | \n", "0.004230 | \n", "0.687175 | \n", "... | \n", "False | \n", "False | \n", "0.000000 | \n", "False | \n", "0.000000 | \n", "0 | \n", "0.0 | \n", "-0.427280 | \n", "-1.000000 | \n", "non_Olas | \n", "
3 | \n", "0x2dd9f5678484c1f59f97ed334725858b938b4102 | \n", "quickstart | \n", "0x005e5be235ba39c5f17622d25e77557ee79a2cba0x2d... | \n", "2024-12-22 02:40:35+00:00 | \n", "Will the Federal Reserve signal a plan to slow... | \n", "CLOSED | \n", "1.568561 | \n", "1 | \n", "0.015686 | \n", "2.474096 | \n", "... | \n", "False | \n", "False | \n", "0.000000 | \n", "True | \n", "0.000000 | \n", "0 | \n", "0.0 | \n", "-1.584247 | \n", "-1.000000 | \n", "non_Olas | \n", "
4 | \n", "0x2dd9f5678484c1f59f97ed334725858b938b4102 | \n", "quickstart | \n", "0x0080b3768232e8a2f187eaaf342923034275e0b90x2d... | \n", "2024-12-13 04:32:35+00:00 | \n", "Will Russia officially confirm Bashar al-Assad... | \n", "CLOSED | \n", "2.677632 | \n", "0 | \n", "0.026776 | \n", "5.135035 | \n", "... | \n", "False | \n", "True | \n", "5.135035 | \n", "True | \n", "5.135035 | \n", "0 | \n", "0.0 | \n", "2.430627 | \n", "0.898765 | \n", "non_Olas | \n", "
5 rows × 21 columns
\n", "