Spaces:

valory
/

trader_agents_performance

Running

App Files Files Community

cyberosa committed on Sep 27, 2024

Commit

12536a4

1 Parent(s): dc11fb3

Adjusting divergence graph

Browse files

Files changed (4) hide show

app.py +4 -11
data/closed_markets_div.parquet +2 -2
scripts/closed_markets_divergence.py +17 -0
tabs/market_plots.py +86 -3

app.py CHANGED Viewed

@@ -20,7 +20,7 @@ from tabs.trader_plots import (
     get_interpretation_text,
 )
-from tabs.market_plots import plot_kl_div_per_market
 def get_logger():
@@ -194,19 +194,12 @@ with demo:
                 )
             with gr.Row():
                 gr.Markdown(
-                    "The accuracy is measured as the difference between the distribution of the final outcome P = [prob(yes), prob(no)] and the final liquidity distribution of the market for the yes and no responses."
                 )
             with gr.Row():
-                gr.Markdown(
-                    "There are some edge cases in the Kullback-Leibler divergence formula that can lead to extreme or infinite values, particularly when the predicted probabilities are very different from the actual outcome. To handle these cases, we capped the maximum divergence value at 20. A high divergence value (close to or at 20) indicates markets where the predicted probabilities were significantly different from the real-world outcome, potentially even opposite to what actually occurred."
-                )
             with gr.Row():
-                metrics_text = get_metrics_text()
-            with gr.Row():
-                with gr.Column(scale=2):
-                    kl_div_plot = plot_kl_div_per_market(closed_markets=closed_markets)
-                with gr.Column(scale=1):
-                    interpretation_text = get_interpretation_text()
         with gr.TabItem("🎖️Weekly winning trades % per trader"):
             with gr.Row():

     get_interpretation_text,
 )
+from tabs.market_plots import plot_kl_div_per_market, plot_kl_div_per_market2
 def get_logger():
                 )
             with gr.Row():
                 gr.Markdown(
+                    "Aka, how much off is the market prediction’s accuracy from the real outcome of the event. Values capped at 20 for market outcomes completely opposite to the real outcome."
                 )
             with gr.Row():
+                trade_details_text = get_metrics_text()
             with gr.Row():
+                kl_div_plot = plot_kl_div_per_market2(closed_markets=closed_markets)
         with gr.TabItem("🎖️Weekly winning trades % per trader"):
             with gr.Row():

data/closed_markets_div.parquet CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:abdc271bdfd214e6497de73c32adeada50b680d847b1ad9b0bdf2c2fc442394b
-size 48595

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1e7aeecfea8085d6b11fe66ef37ddee2b5f35b88a8503230b829c4b4501d1de
+size 52381

scripts/closed_markets_divergence.py CHANGED Viewed

@@ -177,6 +177,20 @@ def market_KL_divergence(market_row: pd.DataFrame) -> float:
     return kl_divergence(P, Q)
 def compute_tokens_prob(token_amounts: list) -> list:
     first_token_amounts = token_amounts[0]
     second_token_amounts = token_amounts[1]
@@ -247,6 +261,9 @@ def prepare_closed_markets_data():
     closed_markets["kl_divergence"] = closed_markets.apply(
         lambda x: market_KL_divergence(x), axis=1
     )
     closed_markets.to_parquet(DATA_DIR / "closed_markets_div.parquet", index=False)
     print("Finished preparing final dataset for visualization")
     print(closed_markets.head())

     return kl_divergence(P, Q)
def off_by_values(market_row: pd.Series) -> float:
    """Return how far the market's final "yes" probability was from the outcome.

    The resolved answer is mapped to the true probability of the first
    ("yes") outcome: 0.0 when ``currentAnswer`` equals ``"no"``, and 1.0 for
    any other value. The result is the absolute gap between that true
    probability and ``first_outcome_prob``, multiplied by 100.

    Args:
        market_row: A single market record exposing the attributes
            ``currentAnswer`` and ``first_outcome_prob`` (e.g. the row passed
            by ``DataFrame.apply(..., axis=1)``).

    Returns:
        ``abs(true_prob - first_outcome_prob) * 100`` as a builtin float.
        NOTE(review): this lies in [0, 100] only if ``first_outcome_prob``
        is a probability in [0, 1] -- confirm upstream.
    """
    # Only the first ("yes") component is compared, so the complementary
    # "no" probabilities never need to be materialised.
    true_prob = 0.0 if market_row.currentAnswer == "no" else 1.0
    return float(abs(true_prob - market_row.first_outcome_prob) * 100.0)
 def compute_tokens_prob(token_amounts: list) -> list:
     first_token_amounts = token_amounts[0]
     second_token_amounts = token_amounts[1]
     closed_markets["kl_divergence"] = closed_markets.apply(
         lambda x: market_KL_divergence(x), axis=1
     )
+    closed_markets["off_by_perc"] = closed_markets.apply(
+        lambda x: off_by_values(x), axis=1
+    )
     closed_markets.to_parquet(DATA_DIR / "closed_markets_div.parquet", index=False)
     print("Finished preparing final dataset for visualization")
     print(closed_markets.head())

tabs/market_plots.py CHANGED Viewed

@@ -1,9 +1,8 @@
 import pandas as pd
 import gradio as gr
-import matplotlib.pyplot as plt
-import seaborn as sns
-from typing import Tuple
 import plotly.express as px
 def plot_kl_div_per_market(closed_markets: pd.DataFrame) -> gr.Plot:
@@ -35,3 +34,87 @@ def plot_kl_div_per_market(closed_markets: pd.DataFrame) -> gr.Plot:
     return gr.Plot(
         value=fig,
     )

 import pandas as pd
 import gradio as gr
 import plotly.express as px
+import plotly.graph_objects as go
+from plotly.subplots import make_subplots
 def plot_kl_div_per_market(closed_markets: pd.DataFrame) -> gr.Plot:
     return gr.Plot(
         value=fig,
     )
def plot_kl_div_per_market2(closed_markets: pd.DataFrame) -> gr.Plot:
    """Build grouped weekly box plots of KL divergence and off-by percentage.

    For each of the creators "pearl", "quickstart" and the synthetic "all"
    (every input row relabelled), two box traces are added per
    ``month_year_week`` value: ``kl_divergence`` on the left y-axis and
    ``off_by_perc`` on the right (secondary) y-axis.

    Args:
        closed_markets: Markets data containing the columns
            ``market_creator``, ``opening_datetime``, ``month_year_week``,
            ``kl_divergence`` and ``off_by_perc``.

    Returns:
        A ``gr.Plot`` wrapping the 1000x600 Plotly figure.
    """
    creators = ["pearl", "quickstart", "all"]
    # One colour per creator and metric; built once instead of per iteration.
    kl_colors = {
        "pearl": "purple",
        "quickstart": "goldenrod",
        "all": "darkgreen",
    }
    off_by_colors = {
        "pearl": "pink",
        "quickstart": "yellow",
        "all": "lightgreen",
    }

    # Duplicate every market under the creator "all" so the aggregate is
    # drawn as a third series next to the per-creator ones.
    all_markets = closed_markets.assign(market_creator="all")
    final_markets = pd.concat([closed_markets, all_markets], ignore_index=True)
    final_markets = final_markets.sort_values(by="opening_datetime", ascending=True)

    # Single subplot with a secondary y-axis for the off-by percentage.
    fig = make_subplots(specs=[[{"secondary_y": True}]])

    for creator in creators:
        # Filter once per creator and reuse the slice for both traces.
        creator_markets = final_markets[final_markets["market_creator"] == creator]
        weeks = creator_markets["month_year_week"]

        fig.add_trace(
            go.Box(
                x=weeks,
                y=creator_markets["kl_divergence"],
                name=f"{creator} kl-div",
                boxmean=True,
                marker_color=kl_colors[creator],
            ),
            secondary_y=False,
        )
        fig.add_trace(
            go.Box(
                x=weeks,
                y=creator_markets["off_by_perc"],
                name=f"{creator} off by",
                boxmean=True,
                marker_color=off_by_colors[creator],
            ),
            secondary_y=True,
        )

    fig.update_layout(
        xaxis_title="Markets closing Week",
        legend=dict(yanchor="top", y=0.5, xanchor="left", x=-0.5),
        boxmode="group",
        width=1000,  # Adjusted for better fit on laptop screens
        height=600,  # Adjusted for better fit on laptop screens
    )

    # Left axis: KL divergence; right axis: off-by percentage.
    fig.update_yaxes(
        title_text="Kullback–Leibler divergence", secondary_y=False, side="left"
    )
    fig.update_yaxes(
        title_text="Off by percentage between probabilities",
        secondary_y=True,
        side="right",
    )

    # NOTE(review): a date tick format only takes effect if the
    # month_year_week values are treated as dates by Plotly -- confirm.
    fig.update_xaxes(tickformat="%b %d\n%Y")

    return gr.Plot(
        value=fig,
    )