# === Setup: paths, imports, theme ===

from pathlib import Path
import sys
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

# Dev convenience
%load_ext autoreload
%autoreload 2

# Display options: show up to 120 columns and allow 120 characters of console width
pd.options.display.max_columns = 120
pd.options.display.width = 120

# Resolve repository root (if the working directory is notebooks/, step up one level)
_cwd = Path.cwd()
REPO_ROOT = _cwd.resolve().parent if _cwd.name.lower() == "notebooks" else _cwd.resolve()

# Canonical paths
DATA_DIR    = REPO_ROOT / "data"
RESULTS_DIR = REPO_ROOT / "results" / "eda"
FIG_DIR     = RESULTS_DIR / "figures"
TAB_DIR     = RESULTS_DIR / "tables"

# Ensure results dirs exist (parents=True also creates RESULTS_DIR itself)
FIG_DIR.mkdir(parents=True, exist_ok=True)
TAB_DIR.mkdir(parents=True, exist_ok=True)

# Dataset path
DATA_PATH = DATA_DIR / "raw" / "cs2_playstyle_roles_2024.csv"
# Raise explicitly rather than assert: assert statements are stripped under `python -O`,
# which would postpone the failure to a less clear error when the CSV is read.
if not DATA_PATH.exists():
    raise FileNotFoundError(f"Dataset not found at {DATA_PATH}")

# Local helpers: put src/ at the front of sys.path so the project modules are importable
SRC_DIR = REPO_ROOT / "src"
if str(SRC_DIR) not in sys.path:
    sys.path.insert(0, str(SRC_DIR))

from style import (
    set_mpl_theme,
    set_seaborn_theme,
    ROLE_COLOURS, 
    get_role_colour,
)
from stability import (
    rates_quantile_table,
    tapd_quantile_table,
    retained_summary,
)
from viz import (
    plot_rates_quantile,
    plot_tapd_quantile,
    plot_mapcount_hist,
    summarize_side_stats,
    plot_kdes_roles_by_side,
    plot_kdes_side_compare,
    summarize_role_stats_by_side, 
    plot_correlation_split_heatmap,
    compute_feature_correlations,
    plot_positioning_residuals_by_role
    )
from hypo_tests import (
    test_side_trade_increase,
    test_side_variability_ct_less,
    test_role_contrast,
    compute_role_distinctiveness,
)
from viz_plotly import (
    plot_role_radars_interactive,
    plot_positioning_regression_interactive,
)
from features import (
    fit_positioning_regressions,
    compute_positioning_residuals,
    
)
# Themes: matplotlib and seaborn share the same dark / Georgia settings
_theme_kwargs = {"mode": "dark", "preferred_font": "Georgia"}
set_mpl_theme(**_theme_kwargs)
set_seaborn_theme(**_theme_kwargs)

# Echo key paths (kept as the final expression so the notebook renders the tuple)
(REPO_ROOT, DATA_PATH, FIG_DIR, TAB_DIR)

(WindowsPath('P:/cs2-playstyle-analysis-2024'),
 WindowsPath('P:/cs2-playstyle-analysis-2024/data/raw/cs2_playstyle_roles_2024.csv'),
 WindowsPath('P:/cs2-playstyle-analysis-2024/results/eda/figures'),
 WindowsPath('P:/cs2-playstyle-analysis-2024/results/eda/tables'))

# Load dataset and run structural checks
df = pd.read_csv(DATA_PATH)

# Shape and a compact preview
print("shape:", df.shape)
display(df.head(3))

# Column summary: one row per column with its dtype and share of missing values,
# ordered by missingness (highest first) and then alphabetically
dtype_names = df.dtypes.astype(str)
missing_rate = df.isna().mean().round(4)
col_info = pd.DataFrame(
    {"column": df.columns, "dtype": dtype_names, "missing_rate": missing_rate}
).sort_values(by=["missing_rate", "column"], ascending=[False, True])
display(col_info.head(25))  # preview top 25 by missingness

# Quick counts by dtype for a high-level feel
dtype_counts = (
    col_info["dtype"]
    .value_counts()
    .rename_axis("dtype")
    .to_frame("n")
)
display(dtype_counts)

# Light check for commonly expected identifiers (report only, nothing is enforced)
expected = ["steamid", "player_name", "team_clan_name", "map_count"]
known_columns = set(df.columns)
present = [name for name in expected if name in known_columns]
missing = [name for name in expected if name not in known_columns]
print("present expected cols:", present)
print("missing expected cols:", missing)

# Detect side-suffixed families (useful for later grouping)
suffixes = ("_t", "_ct", "_overall")
side_cols = {
    suf: df.columns[df.columns.str.endswith(suf)].tolist()
    for suf in suffixes
}
# Final expression: number of columns found per suffix
{suf: len(cols) for suf, cols in side_cols.items()}

shape: (306, 25)

present expected cols: ['steamid', 'player_name', 'team_clan_name', 'map_count']
missing expected cols: []

{'_t': 7, '_ct': 7, '_overall': 7}

# Coverage summary, binned map-count table, role-label missingness, and threshold retention
# (pandas is already imported as `pd` in the setup section, so it is not re-imported here)

# A "player" is a distinct steamid everywhere in this cell, so counts and shares
# share one denominator.
n_unique_players = df["steamid"].nunique()

# Coverage summary: single-row table of player/team counts and map_count statistics
coverage = pd.DataFrame({
    "n_players": [n_unique_players],
    "n_teams": [df["team_clan_name"].nunique()],
    "mean_maps": [df["map_count"].mean()],
    "median_maps": [df["map_count"].median()],
    "p10_maps": [df["map_count"].quantile(0.10)],
    "p90_maps": [df["map_count"].quantile(0.90)],
    "min_maps": [df["map_count"].min()],
    "max_maps": [df["map_count"].max()],
}).round(2)
display(coverage)
coverage.to_csv(TAB_DIR / "eda_coverage_summary.csv", index=False)

# Binned map-count table (no plot); right=False makes the bins left-closed: [lo, hi)
bins = [0, 10, 20, 30, 40, 60, 80, 120, 160, 1_000]
map_bins = pd.cut(df["map_count"], bins=bins, right=False)
map_hist = (
    map_bins.value_counts()
    .sort_index()
    .rename_axis("map_count_bin")
    .reset_index(name="n_players")
)
display(map_hist)
map_hist.to_csv(TAB_DIR / "eda_mapcount_hist.csv", index=False)

# Role label missingness per field (only the role columns that are actually present)
role_cols = [c for c in ("role_overall", "role_t", "role_ct") if c in df.columns]
role_missing = df[role_cols].isna().mean().rename("missing_rate").to_frame()
display(role_missing)
role_missing.to_csv(TAB_DIR / "eda_role_missingness.csv")

# Players retained under common min-map thresholds (feeds into stability analysis).
# The numerator counts distinct steamids, matching the denominator; previously it
# counted rows, which would disagree if a steamid ever appeared on more than one row.
thresholds = [20, 30, 40, 60, 80, 100, 120]
thr_table = (
    pd.DataFrame({"min_map_count": thresholds})
      .assign(n_players=lambda t: t["min_map_count"].apply(
          lambda m: df.loc[df["map_count"] >= m, "steamid"].nunique()))
)
thr_table["share_players"] = (thr_table["n_players"] / n_unique_players).round(3)
display(thr_table)
thr_table.to_csv(TAB_DIR / "eda_threshold_coverage.csv", index=False)

# === Parameters ===

# Map-count bin edges for summaries and plots
MAP_BINS = [
    0, 10, 20, 30, 40, 50,
    60, 80, 100, 120, 140, 160,
]

# Trials-per-map assumptions (sensitivity moves levels, not shape)
K_OAP = 20.0
K_PODT = 18.0
K_POKT = 14.0

# Quantile used for the per-bin summary (p75 is conservative and robust)
Q = 0.75

# Decision lines drawn on the figures
MIN_MAPS = 40   # minimum map_count cutoff
TOL_PP = 2.0    # percentage points for rate metrics; set None to hide

# === Stability: rates (oap/podt/pokt), pQ in percentage points ===

rates_tbl = rates_quantile_table(
    df, MAP_BINS, k_oap=K_OAP, k_podt=K_PODT, k_pokt=K_POKT, q=Q, map_col="map_count"
)

# File names carry the quantile as a whole percent. round() is used instead of int()
# because int() truncates: e.g. 0.57 * 100 == 56.99999999999999 would be labeled "p56".
plot_rates_quantile(
    rates_tbl, q=Q, tol_pp=TOL_PP, min_maps=MIN_MAPS,
    savepath=FIG_DIR / f"stability_rates_p{round(Q * 100)}_pp.png",
    savepath_svg=FIG_DIR / f"stability_rates_p{round(Q * 100)}_pp.svg",
)

# === Stability: tapd (duration proxy), pQ in proxy units ===

# Only the first element of the returned pair (the table) is used here.
tapd_tbl, _ = tapd_quantile_table(
    df, MAP_BINS, q=Q, map_col="map_count", scale=None, ref_mask=None
)

# File names carry the quantile as a whole percent. round() is used instead of int()
# because int() truncates: e.g. 0.57 * 100 == 56.99999999999999 would be labeled "p56".
plot_tapd_quantile(
    tapd_tbl, q=Q, min_maps=MIN_MAPS,
    savepath=FIG_DIR / f"stability_tapd_p{round(Q * 100)}_proxy.png",
    savepath_svg=FIG_DIR / f"stability_tapd_p{round(Q * 100)}_proxy.svg",
)

# === Coverage: players by map_count and retention at MIN_MAPS ===

ret = retained_summary(df, MIN_MAPS, map_col="map_count")

# Histogram bin edges: 0, 20, ..., 160
hist_edges = list(range(0, 180, 20))
plot_mapcount_hist(
    df,
    bins=hist_edges,
    min_maps=MIN_MAPS,
    savepath=FIG_DIR / "mapcount_hist.png",
    savepath_svg=FIG_DIR / "mapcount_hist.svg",
)

# Report the retention figures taken from the summary dict
print(
    f"Total players: {ret['total']}",
    f"Retained at MIN_MAPS={ret['min_maps']}: {ret['retained']} ({ret['retained_pct']:.1f}%)",
    sep="\n",
)

Total players: 306
Retained at MIN_MAPS=40: 84 (27.5%)

# === Stable cohort: create df_stable and check for missing roles ===
# Keep only players with at least MIN_MAPS maps; copy so later edits do not touch df
is_stable = df["map_count"] >= MIN_MAPS
df_stable = df.loc[is_stable].copy()

# Sanity check: every role label in the stable cohort must be present and non-blank.
# With a lower threshold, roles may be missing and this check will fail.
role_cols = ["role_overall", "role_t", "role_ct"]
for col in role_cols:
    labels = df_stable[col]
    is_blank = labels.astype(str).str.strip().eq("")
    mask = labels.isna() | is_blank
    n = int(mask.sum())
    print(f"{col} missing: {n}")
    assert n == 0, f"Some players in the stable cohort are missing {col}."

role_overall missing: 0
role_t missing: 0
role_ct missing: 0

# === Role summaries and plots by side ===

plot_kdes_side_compare(
    df=df_stable,
    bw_adjust=1,
    min_map_count=None,  # Select a min_map_count if desired (use df instead of df_stable)
    savepath=FIG_DIR / "kde_side_compare.png",
    savepath_svg=FIG_DIR / "kde_side_compare.svg",
)

# Side summary table
stats_tbl = summarize_side_stats(df_stable, min_map_count=None)
display(stats_tbl.round(2))

# Saved via the canonical TAB_DIR (same location as RESULTS_DIR / "tables").
# NOTE(review): unlike the role tables, this export writes the DataFrame index too
# (no index=False) - confirm whether that is intended before changing it.
stats_tbl.round(3).to_csv(TAB_DIR / "side_kde_summary.csv")

# T roles to choose from: "AWPer","Spacetaker","Lurker","Half-Lurker"

t_roles = ["AWPer", "Spacetaker", "Lurker", "Half-Lurker"]

plot_kdes_roles_by_side(
    df=df_stable, side="t",
    roles_order=t_roles, min_role_n=8, bw_adjust=1.2, min_map_count=None,
    savepath=FIG_DIR / "kde_roles_T.png",
    savepath_svg=FIG_DIR / "kde_roles_T.svg",
)

# Summary table for T side, use wide=False for long format (easier role comparisons)
tbl_roles_t = summarize_role_stats_by_side(
    df_stable, side="t", roles_order=t_roles, min_role_n=8,
    round_to=2, wide=True
)
display(tbl_roles_t)

# Optional save, via the canonical TAB_DIR (same location as RESULTS_DIR / "tables")
tbl_roles_t.to_csv(TAB_DIR / "role_kde_summary_T.csv", index=False)

# CT roles to choose from: "AWPer","Anchor","Rotator","Mixed"
# Toggle which roles to include (optional)
ct_roles = ["AWPer", "Anchor", "Rotator", "Mixed"]


plot_kdes_roles_by_side(
    df=df_stable, side="ct",
    roles_order=ct_roles, min_role_n=8, bw_adjust=1.2, min_map_count=None,
    savepath=FIG_DIR / "kde_roles_CT.png",
    savepath_svg=FIG_DIR / "kde_roles_CT.svg",
)

# Summary table for CT side, use wide=False for long format (easier role comparisons)
tbl_roles_ct = summarize_role_stats_by_side(
    df_stable, side="ct", roles_order=ct_roles, min_role_n=8,
    round_to=2, wide=True
)
display(tbl_roles_ct)

# Optional save, via the canonical TAB_DIR (same location as RESULTS_DIR / "tables")
tbl_roles_ct.to_csv(TAB_DIR / "role_kde_summary_CT.csv", index=False)

# === Role radar plots (interactive) ===
# Use the shared MIN_MAPS cutoff (not a literal 40) so the radars follow the same
# threshold as the rest of the notebook when the parameter is changed.
fig = plot_role_radars_interactive(df, min_map_count=MIN_MAPS)
fig.show(renderer="notebook")

# Static PNG export requires Chrome and Kaleido; commented out for portability
# fig.write_image(FIG_DIR / "role_radars_t_vs_ct.png", width=1500, height=840)

# Saving as HTML with plotly.js embedded in the file. True is the documented value
# for embedding; the previous "embed" string is not a documented option.
fig.write_html(FIG_DIR / "role_radars_t_vs_ct.html", include_plotlyjs=True)

# === Hypothesis test: is trading higher on T? ===

# MIN_MAPS (minimum maps to include a player in the tests) comes from the Parameters
# section. It is deliberately not re-assigned here: a second assignment would override
# the parameter and let the tests diverge from the cutoff used for the stable cohort.
res_trades = test_side_trade_increase(df, min_maps=MIN_MAPS)
display(res_trades)

res_trades.to_csv(TAB_DIR / "hypo_test_t_more_trading.csv", index=False)

# === Hypothesis test #2: CT tighter spread (SD ratio + permutation test on IQR) ===
res_var = test_side_variability_ct_less(df, min_maps=MIN_MAPS)
display(res_var)

res_var.to_csv(TAB_DIR / "hypo_test_ct_tighter_variability.csv", index=False)

# Role contrast: Aggressive vs Passive roles

# T-side: Spacetaker (aggressive) vs Lurker (passive)
result_t = test_role_contrast(
    df=df,
    role_a='Spacetaker_t',
    role_b='Lurker_t',
    min_maps=MIN_MAPS
)

print("T-Side Role Contrast: Spacetaker vs Lurker")
print("=" * 80)
display(result_t)
# Saved via the canonical TAB_DIR (same location as RESULTS_DIR / "tables")
result_t.to_csv(TAB_DIR / "hypo_test_t_spac_vs_lurk.csv", index=False)

T-Side Role Contrast: Spacetaker vs Lurker
================================================================================

# CT-side: Rotator (aggressive) vs Anchor (passive)
result_ct = test_role_contrast(
    df=df,
    role_a='Rotator_ct',
    role_b='Anchor_ct',
    min_maps=MIN_MAPS
)

print("CT-Side Role Contrast: Rotator vs Anchor")
print("=" * 80)
display(result_ct)
# Saved via the canonical TAB_DIR (same location as RESULTS_DIR / "tables")
result_ct.to_csv(TAB_DIR / "hypo_test_ct_rot_vs_anc.csv", index=False)

CT-Side Role Contrast: Rotator vs Anchor
================================================================================

# T-side distinctiveness
distinct_t = compute_role_distinctiveness(
    df=df,
    side='t',
    min_maps=MIN_MAPS
)
# Saved via the canonical TAB_DIR (same location as RESULTS_DIR / "tables")
distinct_t.to_csv(TAB_DIR / "distinct_t_roles.csv", index=False)

print("T-Side Role Distinctiveness")
print("=" * 80)
display(distinct_t)

T-Side Role Distinctiveness
================================================================================

# CT-side distinctiveness
distinct_ct = compute_role_distinctiveness(
    df=df,
    side='ct',
    min_maps=MIN_MAPS
)
# Saved via the canonical TAB_DIR (same location as RESULTS_DIR / "tables")
distinct_ct.to_csv(TAB_DIR / "distinct_ct_roles.csv", index=False)

print("CT-Side Role Distinctiveness")
print("=" * 80)
display(distinct_ct)

CT-Side Role Distinctiveness
================================================================================

# Compute correlation matrices for each side (T first, then CT)
corr_t, corr_ct = (
    compute_feature_correlations(df, min_maps=MIN_MAPS, side=side_key)
    for side_key in ("t", "ct")
)

# Display tables, separated by a horizontal rule
print("T-side Feature Correlations (Pearson):")
display(corr_t.round(3))

print("\n" + "="*60 + "\n")

print("CT-side Feature Correlations (Pearson):")
display(corr_ct.round(3))

# Save the unrounded tables (index is written along with the values)
corr_t.to_csv(TAB_DIR / "correlation_matrix_t.csv")
corr_ct.to_csv(TAB_DIR / "correlation_matrix_ct.csv")

T-side Feature Correlations (Pearson):

============================================================

CT-side Feature Correlations (Pearson):

# Generate split-diagonal correlation heatmap
# n_stable: number of rows at or above the MIN_MAPS cutoff, passed to the plot helper
n_stable = df["map_count"].ge(MIN_MAPS).sum()

fig, ax = plot_correlation_split_heatmap(
    corr_t=corr_t, corr_ct=corr_ct,
    save_path=FIG_DIR / "correlation_heatmap_split",
    title="CT vs T Side Feature Correlations",
    n_stable=n_stable,
)

plt.show()

# Fit the positioning regressions; the result is reused by the residual steps below
models = fit_positioning_regressions(df, MIN_MAPS)

T-side regression: ADAT = 0.979 × ADNT + 0.012
CT-side regression: ADAT = 1.009 × ADNT + -0.006

pos_residuals_df = compute_positioning_residuals(df, models)
pos_residuals_df.head()

# Check, per side, the correlation between the ADNT rank and the ADAT residual
# among players at or above MIN_MAPS.
print("Correlation between ADNT and ADAT residuals:\n")

# The cohort filter does not depend on the side, so it is computed once up front
stable_data = pos_residuals_df[pos_residuals_df['map_count'] >= MIN_MAPS]

for side in ['t', 'ct']:
    adnt_col = f'adnt_rank_{side}'
    resid_col = f'adat_residual_{side}'

    # Off-diagonal entry of the 2x2 correlation matrix, looked up by label
    corr = stable_data[[adnt_col, resid_col]].corr().loc[adnt_col, resid_col]

    print(f"{side.upper()}-side: ρ(ADNT, residual) = {corr:.4f}")

Correlation between ADNT and ADAT residuals:

T-side: ρ(ADNT, residual) = 0.0000
CT-side: ρ(ADNT, residual) = 0.0000

fig_positioning = plot_positioning_regression_interactive(pos_residuals_df, models, MIN_MAPS)
fig_positioning.show(renderer="notebook")

# Save as HTML with plotly.js embedded in the file. True is the documented value
# for embedding; the previous "embed" string is not a documented option.
fig_positioning.write_html(FIG_DIR / "pos_features_scatter.html", include_plotlyjs=True)

fig_residuals = plot_positioning_residuals_by_role(pos_residuals_df, models, MIN_MAPS)
plt.show()

# Add residuals to original dataframe
# Use merge to ensure proper alignment on steamid (prevents NaN values from index misalignment).
# validate="many_to_one" makes pandas raise if steamid is not unique in the residual table,
# instead of silently duplicating rows in the enriched output.
enriched_df = df.merge(
    pos_residuals_df[['steamid', 'adat_residual_t', 'adat_residual_ct']],
    on='steamid',
    how='left',
    validate='many_to_one',
)

# Save as parquet. Only the results directories are created during setup, so make sure
# data/processed exists before writing into it.
processed_dir = DATA_DIR / "processed"
processed_dir.mkdir(parents=True, exist_ok=True)
enriched_df.to_parquet(processed_dir / "cs2_playstyles_2024_with_residuals.parquet", index=False)

	steamid	player_name	team_clan_name	map_count	tapd_ct	tapd_t	tapd_overall	oap_ct	oap_t	oap_overall	podt_ct	podt_t	podt_overall	pokt_ct	pokt_t	pokt_overall	adnt_rank_ct	adnt_rank_t	adnt_rank_overall	adat_rank_ct	adat_rank_t	adat_rank_overall	role_overall	role_t	role_ct
0	76561198041683378	NiKo	G2 Esports	158	60.952893	59.136540	60.136000	24.745965	24.093423	24.424242	21.020276	24.857741	22.507740	17.051295	21.586555	19.197995	0.562493	0.621199	0.593089	0.547525	0.695336	0.616046	Lurker	Spacetaker	Rotator
1	76561198012872053	huNter	G2 Esports	158	62.048685	62.871661	62.589800	16.852540	14.807692	15.847511	21.585198	27.994772	24.696747	17.195516	27.180894	22.538284	0.480859	0.643004	0.571875	0.406082	0.615021	0.455108	Flex	Lurker	Rotator
2	76561198074762801	m0NESY	G2 Esports	155	62.786553	66.632594	64.362519	23.914373	17.754078	20.873335	19.122381	23.094640	21.473108	17.397469	26.423178	21.056274	0.577785	0.423733	0.453028	0.515617	0.409889	0.427645	AWPer	AWPer	AWPer

	column	dtype	missing_rate
role_overall	role_overall	object	0.4183
role_ct	role_ct	object	0.3856
role_t	role_t	object	0.3856
adat_rank_ct	adat_rank_ct	float64	0.0000
adat_rank_overall	adat_rank_overall	float64	0.0000
adat_rank_t	adat_rank_t	float64	0.0000
adnt_rank_ct	adnt_rank_ct	float64	0.0000
adnt_rank_overall	adnt_rank_overall	float64	0.0000
adnt_rank_t	adnt_rank_t	float64	0.0000
map_count	map_count	int64	0.0000
oap_ct	oap_ct	float64	0.0000
oap_overall	oap_overall	float64	0.0000
oap_t	oap_t	float64	0.0000
player_name	player_name	object	0.0000
podt_ct	podt_ct	float64	0.0000
podt_overall	podt_overall	float64	0.0000
podt_t	podt_t	float64	0.0000
pokt_ct	pokt_ct	float64	0.0000
pokt_overall	pokt_overall	float64	0.0000
pokt_t	pokt_t	float64	0.0000
steamid	steamid	int64	0.0000
tapd_ct	tapd_ct	float64	0.0000
tapd_overall	tapd_overall	float64	0.0000
tapd_t	tapd_t	float64	0.0000
team_clan_name	team_clan_name	object	0.0000

	n
dtype
float64	18
object	5
int64	2

	map_count_bin	n_players
0	[0, 10)	111
1	[10, 20)	58
2	[20, 30)	23
3	[30, 40)	30
4	[40, 60)	10
5	[60, 80)	31
6	[80, 120)	16
7	[120, 160)	27
8	[160, 1000)	0

	Feature	CT μ	CT σ	T μ	T σ	n
0	Time Alive Per Death (TAPD) (s)	60.67	3.34	60.29	4.60	84
1	Opening Attempt % (OAP)	20.18	3.50	20.17	5.90	84
2	Proportion of Deaths Traded % (PODT)	19.66	2.82	24.27	3.33	84
3	Proportion of Kills that are Trades % (POKT)	16.07	2.13	23.66	3.72	84
4	Distance to Nearest Teammate (ADNT) – rank	0.60	0.11	0.60	0.14	84
5	Distance from Average Teammate (ADAT) – rank	0.60	0.15	0.60	0.15	84

01 - Exploratory Data Analysis and Feature Engineering¶

Executive Summary¶

Objectives¶

Outputs¶

1. Setup & Data Overview¶

Load & structural overview¶

Coverage overview¶

2. Stability threshold analysis (Map Count)¶

Parameters¶

Proportional Features¶

Time Alive Per Death (TAPD)¶

Coverage — players by map count¶

Summary & cutoff¶

3. Feature Distributions & Role Profiles¶

CT vs T — Distributions (KDE) + Side Summary Table¶

Roles — T Side (KDE) + Summary Table¶

Roles — CT Side (KDE) + Summary Table¶

Interactive Role Profile Radars¶

Summary and Interpretations¶

4. Exploratory Hypothesis Checks¶

#1 Are trades higher on T? (PODT & POKT)¶

#2 Are CT playstyle features tighter (less variable) than T?¶

#3 Do "aggressive" and "passive" roles show distinct behavioral profiles?¶

#4 Role Distinctiveness: Which roles have the most unique behavioral signatures?¶

Summary and Interpretations¶

5. Feature Correlations¶

Summary and Interpretations¶

6. Positional Feature Analysis & Engineering¶

Interactive Positioning Scatter: ADNT vs ADAT by Role¶

Role-Stratified Residual Analysis¶

Summary and Interpretations¶

Summary of Exploratory Data Analysis and Feature Engineering¶

	min_map_count	n_players	share_players
0	20	137	0.448
1	30	114	0.373
2	40	84	0.275
3	60	74	0.242
4	80	43	0.141
5	100	33	0.108
6	120	27	0.088

	Feature	AWPer μ	AWPer σ	Half-Lurker μ	Half-Lurker σ	Lurker μ	Lurker σ	Spacetaker μ	Spacetaker σ
0	Distance from Average Teammate (ADAT) – rank	0.43	0.06	0.66	0.09	0.75	0.08	0.55	0.10
1	Distance to Nearest Teammate (ADNT) – rank	0.43	0.08	0.65	0.08	0.72	0.09	0.57	0.11
2	Opening Attempt % (OAP)	14.20	2.85	22.42	4.12	17.68	3.82	24.51	5.30
3	Proportion of Deaths Traded % (PODT)	21.57	2.30	25.05	2.51	24.90	3.55	24.97	3.27
4	Proportion of Kills that are Trades % (POKT)	25.81	2.48	23.41	2.79	25.07	3.50	21.49	3.69
5	Time Alive Per Death (TAPD) (s)	64.36	4.40	57.24	3.78	61.89	3.25	58.00	3.77

	Feature	AWPer μ	AWPer σ	Anchor μ	Anchor σ	Mixed μ	Mixed σ	Rotator μ	Rotator σ
0	Distance from Average Teammate (ADAT) – rank	0.53	0.03	0.77	0.10	0.63	0.10	0.49	0.11
1	Distance to Nearest Teammate (ADNT) – rank	0.61	0.05	0.71	0.09	0.61	0.08	0.51	0.10
2	Opening Attempt % (OAP)	21.37	3.35	17.80	3.11	19.38	2.97	21.76	3.15
3	Proportion of Deaths Traded % (PODT)	18.80	2.69	19.06	2.44	20.42	3.46	20.15	2.60
4	Proportion of Kills that are Trades % (POKT)	15.86	2.21	15.88	2.30	16.39	2.44	16.15	1.78
5	Time Alive Per Death (TAPD) (s)	62.05	3.42	61.95	3.21	60.40	3.13	59.03	2.85

	feature	n	mean_delta	ci95_lo	ci95_hi	t_stat	p_one_sided	alternative	test	note
0	PODT	84	4.609876	3.898434	5.350810	12.486384	4.732547e-21	T > CT	paired_t (mean Δ)	Players with ≥40 maps; Δ = podt_t − podt_ct
1	POKT	84	7.587971	6.826470	8.352514	19.608965	3.363318e-33	T > CT	paired_t (mean Δ)	Players with ≥40 maps; Δ = pokt_t − pokt_ct

	feature	n_players	sd_ct	sd_t	sd_ratio_ct_over_t	ci95_lo_ratio	ci95_hi_ratio	iqr_ct	iqr_t	p_one_sided_perm_IQR
0	OAP	84	3.496475	5.903650	0.592256	0.488798	0.713436	4.467156	8.924401	0.000100
1	TAPD	84	3.335992	4.596741	0.725730	0.608445	0.871978	4.089794	6.483488	0.011199
2	PODT	84	2.818093	3.328184	0.846736	0.684628	1.054527	3.974669	4.594908	0.279072
3	POKT	84	2.126360	3.719068	0.571745	0.457596	0.716249	2.493735	4.831818	0.024998

	feature	n_Spacetaker	n_Lurker	mean_Spacetaker	mean_Lurker	cohens_d	t_stat	p_welch	U_stat	p_mw
0	OAP_T	31	24	24.509	17.683	1.447	5.545	9.59e-07	634.0	9.08e-06
1	TAPD_T	31	24	58.001	61.890	-1.095	-4.105	0.0001	167.0	0.0005
2	PODT_T	31	24	24.966	24.899	0.020	0.073	0.9425	375.0	0.9662
3	POKT_T	31	24	21.489	25.073	-0.993	-3.677	0.0006	186.0	0.0016
4	ADNT_RANK_T	31	24	0.572	0.722	-1.498	-5.602	8.15e-07	107.0	7.16e-06
5	ADAT_RANK_T	31	24	0.545	0.755	-2.205	-8.351	3.09e-11	46.0	3.31e-08

	feature	n_Rotator	n_Anchor	mean_Rotator	mean_Anchor	cohens_d	t_stat	p_welch	U_stat	p_mw
0	OAP_CT	28	21	21.756	17.804	1.261	4.376	7.44e-05	484.0	0.0001
1	TAPD_CT	28	21	59.032	61.949	-0.969	-3.299	0.0020	142.0	0.0022
2	PODT_CT	28	21	20.151	19.057	0.431	1.507	0.1388	372.0	0.1174
3	POKT_CT	28	21	16.150	15.878	0.135	0.449	0.6560	295.0	0.9919
4	ADNT_RANK_CT	28	21	0.512	0.711	-2.088	-7.323	3.52e-09	41.0	3.37e-07
5	ADAT_RANK_CT	28	21	0.493	0.773	-2.591	-9.100	8.65e-12	22.0	4.13e-08

	role	n	mahal_d_sq	oap_contrib	tapd_contrib	podt_contrib	pokt_contrib	adnt_contrib	adat_contrib
0	AWPer	17	4.396	1.607	1.234	1.036	0.523	2.318	2.052
1	Lurker	24	2.999	0.349	0.237	0.070	0.282	1.576	2.199
2	Spacetaker	31	2.126	1.354	0.623	0.110	0.858	0.082	0.308
3	Half-Lurker	12	0.922	0.196	0.600	0.074	0.006	0.211	0.223

	role	n	mahal_d_sq	oap_contrib	tapd_contrib	podt_contrib	pokt_contrib	adnt_contrib	adat_contrib
0	Anchor	21	2.746	0.822	0.263	0.082	0.015	1.693	2.462
1	AWPer	17	1.895	0.182	0.272	0.148	0.016	0.002	0.332
2	Rotator	28	1.757	0.456	0.539	0.068	0.003	1.408	1.233
3	Mixed	18	0.375	0.084	0.010	0.117	0.035	0.005	0.074

	TAPD	OAP	PODT	POKT	ADNT_RANK	ADAT_RANK
TAPD	1.000	-0.600	-0.146	0.402	-0.084	-0.077
OAP	-0.600	1.000	0.327	-0.601	0.051	0.047
PODT	-0.146	0.327	1.000	-0.091	0.033	0.098
POKT	0.402	-0.601	-0.091	1.000	-0.230	-0.159
ADNT_RANK	-0.084	0.051	0.033	-0.230	1.000	0.919
ADAT_RANK	-0.077	0.047	0.098	-0.159	0.919	1.000

	TAPD	OAP	PODT	POKT	ADNT_RANK	ADAT_RANK
TAPD	1.000	-0.567	-0.112	0.094	0.204	0.207
OAP	-0.567	1.000	0.099	-0.310	-0.195	-0.313
PODT	-0.112	0.099	1.000	0.090	-0.117	-0.060
POKT	0.094	-0.310	0.090	1.000	-0.214	-0.022
ADNT_RANK	0.204	-0.195	-0.117	-0.214	1.000	0.781
ADAT_RANK	0.207	-0.313	-0.060	-0.022	0.781	1.000