halo_comparison/sizes.py

from pathlib import Path
from sys import argv

import numpy as np
import pandas as pd
from matplotlib import pyplot as plt
from matplotlib.axes import Axes
from matplotlib.collections import QuadMesh
from matplotlib.colors import LogNorm
from matplotlib.figure import Figure
from numpy import inf

from halo_vis import get_comp_id
from paths import base_dir
from utils import figsize_from_page_fraction, rowcolumn_labels, waveforms, tex_fmt

# Gravitational constant in Mpc (km/s)^2 / (10^10 Msun).
# NOTE(review): the earlier comment here read "density like in Vr" --
# presumably this is the unit system of the halo finder; confirm.
G = 43.022682

# Upper limit of the logarithmic colour scale of the 2D histograms,
# keyed by the plotted property.
vmaxs = {
    "Mvir": 52,
    "Vmax": 93,
    "cNFW": 31,
}

# TeX snippets appended (in square brackets) to axis labels, keyed by property.
units = {
    "distance": "Mpc",
    "Mvir": r"10^{10} \textrm{M}_\odot",
    "Vmax": r"\textrm{km} \textrm{s}^{-1}",  # TODO
}


def concentration(row, halo_type: str) -> bool:
    """Tell whether the catalogued ``cNFW`` of a halo is a "normal" value.

    The answer is ``True`` only when all of the following hold:

    * ``R_200crit`` is positive,
    * ``Vmax^2 * R_200crit / (G * Mass_200crit)`` is not ``<= 1.05``,
    * the halo has at least 100 particles.

    In every other case the earlier revision of this function substituted a
    placeholder (``-1``) or a plain size ratio (``R_size / Rmax`` or
    ``R_200crit / Rmax``) for the concentration, so those halos are reported
    as not normal.

    :param row: mapping (e.g. one row of the comparison table) that provides
        ``<halo_type>_R_200crit``, ``<halo_type>_Mass_200crit``,
        ``<halo_type>_Vmax`` and ``<halo_type>_npart``
    :param halo_type: column prefix, ``"ref"`` or ``"comp"``
    :return: ``True`` if the ``<halo_type>_cNFW`` entry can be used as is
    """
    r_200crit = row[f'{halo_type}_R_200crit']
    if r_200crit <= 0:
        return False

    m_200crit = row[f'{halo_type}_Mass_200crit']
    # With zero mass the ratio below is a division by zero. numpy scalars
    # turn that into inf/nan (neither is "<= 1.05"), plain Python floats
    # raise ZeroDivisionError. Skip the division and keep the numpy outcome,
    # i.e. fall through to the particle-count criterion.
    if m_200crit != 0:
        vmax = row[f'{halo_type}_Vmax']  # largest velocity coming from enclosed mass profile calculation
        vmax_vvir2 = vmax ** 2 * r_200crit / (G * m_200crit)
        if vmax_vvir2 <= 1.05:
            return False

    # only groups with at least 100 particles carry a usable cNFW
    return bool(row[f'{halo_type}_npart'] >= 100)


def _binned_ratio_stats(x, ratio, edges, min_count=30):
    """Mean and sample standard deviation of ``ratio`` per bin of ``x``.

    Bin ``k`` covers ``edges[k] <= x < edges[k + 1]``; the last bin also
    includes its right edge. Bins holding fewer than ``min_count`` values are
    reported as NaN so that both result arrays always have
    ``len(edges) - 1`` entries and stay aligned with the bins.

    :return: tuple ``(means, stds)`` of float arrays
    """
    x = np.asarray(x, dtype=float)
    ratio = np.asarray(ratio, dtype=float)
    num_intervals = len(edges) - 1
    means = np.full(num_intervals, np.nan)
    stds = np.full(num_intervals, np.nan)
    for k, (left, right) in enumerate(zip(edges[:-1], edges[1:])):
        below_right = (x <= right) if k == num_intervals - 1 else (x < right)
        in_bin = (left <= x) & below_right
        if np.count_nonzero(in_bin) < min_count:
            continue
        values = ratio[in_bin]
        means[k] = values.mean()
        stds[k] = values.std(ddof=1)  # same normalisation as pandas' Series.std()
    return means, stds


def plot_comparison_hist2d(ax: Axes, file: Path, property: str):
    """Draw a 2D histogram of ``comp_<property> / ref_<property>`` against ``ref_<property>``.

    The table is read from ``file`` (CSV). The x axis is logarithmic with 100
    geometrically spaced bin edges, the ratio axis is split linearly between
    0 and 2. For ``cNFW`` only rows for which :func:`concentration` accepts
    both halos are kept. For ``Mvir`` a band of mean +- standard deviation of
    the ratio per mass bin is drawn on top. A horizontal line marks ratio 1.

    :param ax: axes to draw into
    :param file: CSV file containing the ``ref_``/``comp_`` columns
    :param property: column name without the ``ref_``/``comp_`` prefix
    :return: the names of the two columns that were used, ``(x_col, y_col)``
    """
    print("WARNING: Can only plot hist2d of properties with comp_ or ref_ right now!")
    print(f"         Selected property: {property}")
    x_col = f"ref_{property}"
    y_col = f"comp_{property}"
    df = pd.read_csv(file)

    # Logarithmic bins need a strictly positive range; placeholder values
    # such as -1 (or an empty table) must not define the edges.
    both_columns = pd.concat([df[x_col], df[y_col]])
    positive = both_columns[both_columns > 0]
    if positive.empty:
        print("WARNING: no positive values to plot")
        return x_col, y_col
    num_bins = 100
    bins = np.geomspace(positive.min(), positive.max(), num_bins)

    if property == 'cNFW':
        # Boolean mask instead of rebuilding the frame row by row: keeps the
        # column dtypes and also works when no row passes.
        keep = np.array(
            [
                concentration(row, halo_type="comp") and concentration(row, halo_type="ref")
                for _, row in df.iterrows()
            ],
            dtype=bool,
        )
        df = df.loc[keep]
        print(df)
        if df.empty:
            print("WARNING: no halos left to plot")
            return x_col, y_col

    ratio = df[y_col] / df[x_col]

    if property == "Mvir":
        means, stds = _binned_ratio_stats(df[x_col], ratio, bins)
        # one statistic per bin, drawn at the geometric centre of the bin
        centres = np.sqrt(bins[:-1] * bins[1:])
        band_style = {
            "color": "C2",
            "zorder": 10
        }
        ax.fill_between(centres, means - stds, means + stds, alpha=.2, **band_style)
        ax.plot(centres, means + stds, alpha=.5, **band_style)
        ax.plot(centres, means - stds, alpha=.5, **band_style)

    vmax = vmaxs.get(property)
    if vmax is None:
        print("WARNING: vmax not set")
    image: QuadMesh
    _, _, _, image = ax.hist2d(df[x_col], ratio, bins=(bins, np.linspace(0, 2, num_bins)),
                               norm=LogNorm(vmax=vmax))
    print("vmin/vmax", image.norm.vmin, image.norm.vmax)

    ax.set_xscale("log")
    # NOTE(review): the upper x limit is taken from the comp_ column although
    # the axis shows the ref_ column -- kept as before, confirm it is intended.
    x_low = df[x_col].min()
    x_high = df[y_col].max()
    ax.set_xlim(x_low, x_high)

    # reference line: comp and ref agree
    ax.plot([x_low, x_high], [1, 1], linewidth=1, color="C1", zorder=10)

    return x_col, y_col


def plot_comparison_hist(ax: Axes, file: Path, property: str, m_min=None, m_max=None):
    """Draw a 1D histogram of column ``property`` of the CSV table ``file``.

    * ``"distance"`` uses geometrically spaced bins and adds vertical lines
      for the mean and the median.
    * ``"match"`` is drawn as a normalised step histogram with a legend
      label describing the selected mass range.
    * everything else is a plain bar histogram with 100 bins.

    :param ax: axes to draw into
    :param file: CSV file to read
    :param property: name of the column to histogram
    :param m_min: exclusive lower bound on ``ref_Mvir``; ``None`` for no bound
    :param m_max: exclusive upper bound on ``ref_Mvir``; ``None`` for no bound
    """
    df = pd.read_csv(file)

    # Compare against None explicitly: a bound of 0 is a valid bound, and a
    # single bound on its own has to be honoured as well.
    has_mass_range = m_min is not None or m_max is not None
    if has_mass_range:
        lower = -inf if m_min is None else m_min
        upper = inf if m_max is None else m_max
        df = df.loc[(lower < df["ref_Mvir"]) & (df["ref_Mvir"] < upper)]
        mass_label = f"${lower} < M < {upper}$"
    else:
        # previously this case was labelled "$None < M < None$"
        mass_label = "all"

    num_bins = 100
    histtype = "bar"
    label = None
    density = False

    if property == "distance":
        bins = np.geomspace(min(df[property]), max(df[property]), num_bins)
        mean = df[property].mean()
        median = df[property].median()
        ax.axvline(mean, label="mean", color="C1")
        ax.axvline(median, label="median", color="C2")
    else:
        bins = num_bins
    if property == "match":
        histtype = "step"
        label = mass_label
        density = True

    ax.hist(df[property], bins=bins, histtype=histtype, label=label, density=density)


# (reference resolution, comparison resolution) pairs; each pair fills one
# column of the figure grid.
comparisons = [(256, 512), (256, 1024)]  # , (512, 1024)

# Properties drawn as 1D histograms; every other property is drawn as a
# 2D histogram of the comp/ref ratio.
hist_properties = ["distance", "match", "num_skipped_for_mass"]

# Directory in which the comparison tables are looked up.
comparisons_dir = base_dir / "comparisons"


def compare_property(property, show: bool):
    """Plot ``property`` for every waveform and resolution pair and save the figure.

    One subplot is created per (waveform, comparison) combination: waveforms
    along the rows, resolution pairs along the columns. Properties listed in
    ``hist_properties`` are drawn with :func:`plot_comparison_hist`, all
    others with :func:`plot_comparison_hist2d`. The figure is written to
    ``~/tmp/comparison_<property>.pdf``.

    :param property: name of the property/column to plot
    :param show: also open the figure in an interactive window
    """
    is_hist_property = property in hist_properties

    # (symbol, subscript) used for the axis labels of the 2D histograms
    ratio_labels = {
        "Mvir": ("M", "vir"),
        "Vmax": ("V", "max"),
        "cNFW": ("C", None),
    }
    # x axis labels of the 1D histograms
    hist_labels = {
        "match": "$J$",
        "distance": "$D$"
    }
    # Fallback label for properties without an entry above. Underscores are
    # escaped on the assumption that labels are rendered by LaTeX, as the
    # r"\# Halos" label below suggests -- TODO confirm.
    fallback_name = property.replace("_", r"\_")

    fig: Figure
    fig, axes = plt.subplots(
        len(waveforms), len(comparisons),
        sharey="all", sharex="all",
        squeeze=False,  # keep axes 2D even for a single row or column
        figsize=figsize_from_page_fraction(columns=2)
    )
    for i, waveform in enumerate(waveforms):
        for j, (ref_res, comp_res) in enumerate(comparisons):
            file_id = get_comp_id(waveform, ref_res, waveform, comp_res)
            file = comparisons_dir / file_id
            print(file)
            ax: Axes = axes[i, j]
            is_bottom_row = i == len(waveforms) - 1
            is_left_col = j == 0
            if not is_hist_property:
                plot_comparison_hist2d(ax, file, property)
                lab_a, lab_b = ratio_labels.get(property, (fallback_name, None))
                unit = f"[{units[property]}]" if units.get(property) else ""
                if is_bottom_row:
                    if lab_b:
                        ax.set_xlabel(tex_fmt(r"$AA_{\textrm{BB},CC} DD$", lab_a, lab_b, ref_res, unit))
                    else:
                        ax.set_xlabel(tex_fmt(r"$AA_{BB} CC$", lab_a, ref_res, unit))
                if is_left_col:
                    if lab_b:
                        ax.set_ylabel(
                            tex_fmt(r"$AA_{\textrm{BB},\textrm{comp}} / AA_{\textrm{BB},\textrm{CC}}$",
                                    lab_a, lab_b, ref_res))
                    else:
                        ax.set_ylabel(
                            tex_fmt(r"$AA_{\textrm{comp}} / AA_{\textrm{BB}}$",
                                    lab_a, ref_res))
            else:
                if property == "match":
                    # all halos first, then one histogram per mass range
                    plot_comparison_hist(ax, file, property)

                    mass_bins = [-inf, 30, 50, 100, inf]
                    for m_min, m_max in zip(mass_bins[:-1], mass_bins[1:]):
                        plot_comparison_hist(ax, file, property, m_min, m_max)
                    if is_bottom_row and is_left_col:
                        ax.legend()

                else:
                    plot_comparison_hist(ax, file, property)
                if is_bottom_row:
                    ax.set_xlabel(hist_labels.get(property, fallback_name))
                if is_left_col:
                    ax.set_ylabel(r"\# Halos")
            if property == "distance":
                ax.set_xscale("log")
                ax.set_yscale("log")
                if is_bottom_row and is_left_col:
                    ax.legend()

    rowcolumn_labels(axes, comparisons, isrow=False)
    rowcolumn_labels(axes, waveforms, isrow=True)
    fig.tight_layout()
    out_file = Path(f"~/tmp/comparison_{property}.pdf").expanduser()
    out_file.parent.mkdir(parents=True, exist_ok=True)  # savefig does not create directories
    fig.savefig(out_file)
    if show:
        plt.show()
    # release the figure; main() creates one per property
    plt.close(fig)


def main():
    """Plot every property named on the command line.

    Without arguments the default set ``Mvir``, ``Vmax`` and ``cNFW`` is
    plotted. The interactive window is only opened when exactly one property
    was passed.
    """
    # other columns that were listed here at some point:
    # 'group_size', 'Mass_200crit', 'Mass_tot', 'Mvir', 'R_200crit', 'Rvir', 'Vmax', 'cNFW', 'q', 's'
    requested = argv[1:]
    properties = requested if requested else ["Mvir", "Vmax", "cNFW"]

    show_interactively = len(argv) == 2
    for name in properties:
        compare_property(name, show=show_interactively)


if __name__ == '__main__':
    main()
# axis_ratios = ['q', 's'] #they look normal

# for property in axis_ratios:
#     plot_comparison_hist2d(file, property, 'no')
#     plot_comparison_hist2d(file, property, mode)

# plot_comparison_hist2d(file, 'cNFW_200mean', mode)

# ref_property = 'ref_cNFW_200crit'
# comp_property = 'comp_cNFW_200crit'

# df = pd.read_csv(file)
# all_ref_structure_types: pd.DataFrame = df[ref_property]
# all_comp_structure_types: pd.DataFrame = df[comp_property]

# df_odd: pd.DataFrame = df.loc[2 * df.ref_cNFW < df.comp_cNFW]
# odd_ref_structure_types: pd.DataFrame = df_odd[ref_property]
# odd_comp_structure_types: pd.DataFrame = df_odd[comp_property]

# print(all_ref_structure_types.mean(), all_comp_structure_types.mean())
# print(odd_ref_structure_types.mean(), odd_comp_structure_types.mean())


# ref_colour = []
# comp_colour = []
# ref_cnfw = []
# comp_cnfw = []
# df = pd.read_csv(file)
#
# for index, row in df.iterrows():
#     cnfw, colour = concentration(row)
#     ref_cnfw.append(cnfw[0])
#     ref_colour.append(colour[0])
#     comp_cnfw.append(cnfw[1])
#     comp_colour.append(colour[1])
#
# fig: Figure = plt.figure()
# ax: Axes = fig.gca()
#
# ax.scatter(ref_cnfw, comp_cnfw, s=1, c=comp_colour, alpha=.3)
# ax.set_xscale("log")
# ax.set_yscale("log")
# plt.show()

# #Maybe for later:
# if __name__ == '__main__':
#     print('Run with sizes.py <Path to file> <property: str> <mode: str>')
#     file = Path(argv[1])
#     property = str(argv[2])
#     mode = str(argv[3])


# #This is to find the median of the quality of our matches
# matches:pd.DataFrame=df["match"]
# print(matches)
# exit()
# print(matches.median())
# print(matches.std())
# exit()

# #This is to save weird concentration data to own csv
# df_odd: pd.DataFrame = df.loc[2 * df.ref_cNFW < df.comp_cNFW]
# df_odd.to_csv("weird_cnfw.csv")
# exit()
majorly improve comparisons 2022-05-24 17:06:49 +02:00			`from pathlib import Path`
better comparison 2022-07-21 16:05:27 +02:00			`from sys import argv`
comparison plots 2022-05-09 15:20:10 +02:00
many minor changes 2022-06-10 11:06:32 +02:00			`import numpy as np`
initial version 2022-05-04 13:42:57 +02:00			`import pandas as pd`
			`from matplotlib import pyplot as plt`
			`from matplotlib.axes import Axes`
assorted changes 2022-07-18 19:27:56 +02:00			`from matplotlib.collections import QuadMesh`
many minor changes 2022-06-10 11:06:32 +02:00			`from matplotlib.colors import LogNorm`
initial version 2022-05-04 13:42:57 +02:00			`from matplotlib.figure import Figure`
move comparison improvements 2022-08-01 11:33:50 +02:00			`from numpy import inf`
log-std 2022-07-28 00:43:26 +02:00
assorted changes 2022-07-18 19:27:56 +02:00			`from halo_vis import get_comp_id`
			`from paths import base_dir`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`from utils import figsize_from_page_fraction, rowcolumn_labels, waveforms, tex_fmt`

			`# density like in Vr:`
assorted changes 2022-07-18 19:27:56 +02:00
reorganize sizes.py 2022-07-12 16:09:52 +02:00			`G = 43.022682 # in Mpc (km/s)^2 / (10^10 Msun)`

strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`vmaxs = {`
			`"Mvir": 52,`
			`"Vmax": 93,`
			`"cNFW": 31`
			`}`
reorganize sizes.py 2022-07-12 16:09:52 +02:00
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`units = {`
			`"distance": "Mpc",`
move comparison improvements 2022-08-01 11:33:50 +02:00			`"Mvir": r"10^{10} \textrm{M}_\odot",`
			`"Vmax": r"\textrm{km} \textrm{s}^{-1}" # TODO`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`}`


			`def concentration(row, halo_type: str) -> bool:`
simplify sizes 2022-07-12 16:16:00 +02:00			`r_200crit = row[f'{halo_type}_R_200crit']`
			`if r_200crit <= 0:`
			`cnfw = -1`
			`colour = 'orange'`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`return False`
			`# return cnfw, colour`
reorganize sizes.py 2022-07-12 16:09:52 +02:00
simplify sizes 2022-07-12 16:16:00 +02:00			`r_size = row[f'{halo_type}_R_size'] # largest difference from center of mass to any halo particle`
			`m_200crit = row[f'{halo_type}_Mass_200crit']`
			`vmax = row[f'{halo_type}_Vmax'] # largest velocity coming from enclosed mass profile calculation`
			`rmax = row[f'{halo_type}_Rmax']`
			`npart = row[f'{halo_type}_npart']`
			`VmaxVvir2 = vmax ** 2 * r_200crit / (G * m_200crit)`
			`if VmaxVvir2 <= 1.05:`
			`if m_200crit == 0:`
			`cnfw = r_size / rmax`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`return False`
			`# colour = 'white'`
simplify sizes 2022-07-12 16:16:00 +02:00			`else:`
			`cnfw = r_200crit / rmax`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`return False`
			`# colour = 'white'`
simplify sizes 2022-07-12 16:16:00 +02:00			`else:`
			`if npart >= 100: # only calculate cnfw for groups with more than 100 particles`
			`cnfw = row[f'{halo_type}_cNFW']`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`return True`
			`# colour = 'black'`
reorganize sizes.py 2022-07-12 16:09:52 +02:00			`else:`
simplify sizes 2022-07-12 16:16:00 +02:00			`if m_200crit == 0:`
			`cnfw = r_size / rmax`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`return False`
			`# colour = 'white'`
reorganize sizes.py 2022-07-12 16:09:52 +02:00			`else:`
simplify sizes 2022-07-12 16:16:00 +02:00			`cnfw = r_200crit / rmax`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`return False`
			`# colour = 'white'`
			`# assert np.isclose(cnfw, row[f'{halo_type}_cNFW'])`
			`#`
			`# return cnfw, colour`
reorganize sizes.py 2022-07-12 16:09:52 +02:00

move comparison improvements 2022-08-01 11:33:50 +02:00			`def plot_comparison_hist2d(ax: Axes, file: Path, property: str):`
functions in sizes to study concentrations 2022-07-08 13:43:01 +02:00			`print("WARNING: Can only plot hist2d of properties with comp_ or ref_ right now!")`
			`print(f" Selected property: {property}")`
			`x_col = f"ref_{property}"`
			`y_col = f"comp_{property}"`
			`df = pd.read_csv(file)`
move comparison improvements 2022-08-01 11:33:50 +02:00			`# if mode == 'concentration_analysis':`
			`# min_x = min([min(df[x_col]), min(df[y_col])])`
			`# max_x = max([max(df[x_col]), max(df[y_col])])`
			`# df = df.loc[2 * df.ref_cNFW < df.comp_cNFW]`
			`# else:`
			`min_x = min([min(df[x_col]), min(df[y_col])])`
			`max_x = max([max(df[x_col]), max(df[y_col])])`
unify waveforms order 2022-07-21 12:34:57 +02:00			`num_bins = 100`
			`bins = np.geomspace(min_x, max_x, num_bins)`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`if property == 'cNFW':`
			`rows = []`
assert 2022-07-12 16:12:34 +02:00			`for i, row in df.iterrows():`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`comp_cnfw_normal = concentration(row, halo_type="comp")`

			`ref_cnfw_normal = concentration(row, halo_type='ref')`
			`cnfw_normal = comp_cnfw_normal and ref_cnfw_normal`
			`if cnfw_normal:`
			`rows.append(row)`
			`df = pd.concat(rows, axis=1).T`
			`print(df)`
			`if property == "Mvir":`
unify waveforms order 2022-07-21 12:34:57 +02:00			`stds = []`
log-std 2022-07-28 00:43:26 +02:00			`means = []`
unify waveforms order 2022-07-21 12:34:57 +02:00			`for rep_row in range(num_bins):`
			`rep_x_left = bins[rep_row]`
			`rep_x_right = bins[rep_row] + 1`
			`rep_bin = (rep_x_left < df[x_col]) & (df[x_col] < rep_x_right)`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`rep_values = df.loc[rep_bin][y_col] / df.loc[rep_bin][x_col]`
			`if len(rep_bin) < 30:`
			`continue`
log-std 2022-07-28 00:43:26 +02:00			`mean = rep_values.mean()`
			`std = rep_values.std()`
			`means.append(mean)`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`stds.append(std)`
log-std 2022-07-28 00:43:26 +02:00			`means = np.array(means)`
			`stds = np.array(stds)`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`args = {`
			`"color": "C2",`
			`"zorder": 10`
			`}`
			`ax.fill_between(bins, means - stds, means + stds, alpha=.2, **args)`
			`ax.plot(bins, means + stds, alpha=.5, **args)`
			`ax.plot(bins, means - stds, alpha=.5, **args)`
			`# ax_scatter.plot(bins, stds, label=f"{file.stem}")`

			`if property in vmaxs:`
			`vmax = vmaxs[property]`
			`else:`
			`vmax = None`
			`print("WARNING: vmax not set")`
			`image: QuadMesh`
			`_, _, _, image = ax.hist2d(df[x_col], df[y_col] / df[x_col], bins=(bins, np.linspace(0, 2, num_bins)),`
			`norm=LogNorm(vmax=vmax))`
			`# ax.plot([rep_x_left, rep_x_left], [mean - std, mean + std], c="C1")`
			`# ax.annotate(`
			`# text=f"std={std:.2f}", xy=(rep_x_left, mean + std),`
			`# textcoords="axes fraction", xytext=(0.1, 0.9),`
			`# arrowprops={}`
			`# )`
			`print("vmin/vmax", image.norm.vmin, image.norm.vmax)`
			`# fig.colorbar(hist)`

			`ax.set_xscale("log")`
functions in sizes to study concentrations 2022-07-08 13:43:01 +02:00			`# ax.set_yscale("log")`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`ax.set_xlim(min(df[x_col]), max(df[y_col]))`
functions in sizes to study concentrations 2022-07-08 13:43:01 +02:00
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`ax.plot([min(df[x_col]), max(df[y_col])], [1, 1], linewidth=1, color="C1", zorder=10)`
better comparison 2022-07-21 16:05:27 +02:00
assorted changes 2022-07-18 19:27:56 +02:00			`return x_col, y_col`
			`# ax.set_title(file.name)`
functions in sizes to study concentrations 2022-07-08 13:43:01 +02:00			`# fig.savefig(Path(f"~/tmp/comparison_{file.stem}.pdf").expanduser())`
assorted changes 2022-07-18 19:27:56 +02:00			`# fig.suptitle`
functions in sizes to study concentrations 2022-07-08 13:43:01 +02:00
reorganize sizes.py 2022-07-12 16:09:52 +02:00
move comparison improvements 2022-08-01 11:33:50 +02:00			`def plot_comparison_hist(ax: Axes, file: Path, property: str, m_min=None, m_max=None):`
functions in sizes to study concentrations 2022-07-08 13:43:01 +02:00			`df = pd.read_csv(file)`
move comparison improvements 2022-08-01 11:33:50 +02:00			`if m_min:`
			`df = df.loc[(m_min < df["ref_Mvir"]) & (df["ref_Mvir"] < m_max)]`

			`num_bins = 100`
			`histtype = "bar"`
			`label = None`
			`density = False`

			`if property == "distance":`
			`bins = np.geomspace(min(df[property]), max(df[property]), 100)`
			`mean = df[property].mean()`
			`median = df[property].median()`
			`ax.axvline(mean, label="mean", color="C1")`
			`ax.axvline(median, label="median", color="C2")`
			`else:`
			`bins = num_bins`
			`if property == "match":`
			`histtype = "step"`
			`label = f"${m_min} < M < {m_max}$"`
			`density = True`
more improvements 2022-05-06 13:23:31 +02:00
move comparison improvements 2022-08-01 11:33:50 +02:00			`ax.hist(df[property], bins=bins, histtype=histtype, label=label, density=density)`
reorganize sizes.py 2022-07-12 16:09:52 +02:00
New way of studying concentration comparisons; now compute cnfw ourselves for some cases 2022-07-12 15:55:43 +02:00
better comparison 2022-07-21 16:05:27 +02:00			`comparisons_dir = base_dir / "comparisons"`
			`hist_properties = ["distance", "match", "num_skipped_for_mass"]`
initial version 2022-05-04 13:42:57 +02:00
assorted changes 2022-07-18 19:27:56 +02:00			`comparisons = [(256, 512), (256, 1024)] # , (512, 1024)`
initial version 2022-05-04 13:42:57 +02:00
better comparison 2022-07-21 16:05:27 +02:00
move comparison improvements 2022-08-01 11:33:50 +02:00			`def compare_property(property, show: bool):`
better comparison 2022-07-21 16:05:27 +02:00			`is_hist_property = property in hist_properties`
assorted changes 2022-07-18 19:27:56 +02:00			`fig: Figure`
			`fig, axes = plt.subplots(`
			`len(waveforms), len(comparisons),`
			`sharey="all", sharex="all",`
			`figsize=figsize_from_page_fraction(columns=2)`
			`)`
			`for i, waveform in enumerate(waveforms):`
			`for j, (ref_res, comp_res) in enumerate(comparisons):`
			`file_id = get_comp_id(waveform, ref_res, waveform, comp_res)`
			`file = comparisons_dir / file_id`
			`print(file)`
			`ax: Axes = axes[i, j]`
better comparison 2022-07-21 16:05:27 +02:00			`is_bottom_row = i == len(waveforms) - 1`
			`is_left_col = j == 0`
			`if not is_hist_property:`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`x_labels = {`
			`"Mvir": ("M", "vir"),`
			`"Vmax": ("V", "max"),`
move comparison improvements 2022-08-01 11:33:50 +02:00			`"cNFW": ("C", None),`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`}`
move comparison improvements 2022-08-01 11:33:50 +02:00			`x_col, y_col = plot_comparison_hist2d(ax, file, property)`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`lab_a, lab_b = x_labels[property]`
			`unit = f"[{units[property]}]" if property in units and units[property] else ""`
better comparison 2022-07-21 16:05:27 +02:00			`if is_bottom_row:`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`if lab_b:`
			`ax.set_xlabel(tex_fmt(r"$AA_{\textrm{BB},CC} DD$", lab_a, lab_b, ref_res, unit))`
			`else:`
			`ax.set_xlabel(tex_fmt(r"$AA_{BB} CC$", lab_a, ref_res, unit))`
better comparison 2022-07-21 16:05:27 +02:00			`if is_left_col:`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`if lab_b:`
			`ax.set_ylabel(`
			`tex_fmt(r"$AA_{\textrm{BB},\textrm{comp}} / AA_{\textrm{BB},\textrm{CC}}$",`
			`lab_a, lab_b, ref_res))`
			`else:`
			`ax.set_ylabel(`
			`tex_fmt(r"$AA_{\textrm{comp}} / AA_{\textrm{BB}}$",`
			`lab_a, ref_res))`
			`# ax.set_ylabel(f"{property}_{{comp}}/{property}_{ref_res}")`
better comparison 2022-07-21 16:05:27 +02:00			`else:`
move comparison improvements 2022-08-01 11:33:50 +02:00			`if property == "match":`
			`# mass_bins = np.geomspace(10, 30000, num_mass_bins)`
			`plot_comparison_hist(ax, file, property)`

			`mass_bins = [-inf, 30, 50, 100, inf]`
			`for k in range(len(mass_bins) - 1):`
			`m_min = mass_bins[k]`
			`m_max = mass_bins[k + 1]`
			`plot_comparison_hist(ax, file, property, m_min, m_max)`
			`if is_bottom_row and is_left_col:`
			`ax.legend()`

			`else:`
			`plot_comparison_hist(ax, file, property)`
			`x_labels = {`
			`"match": "$J$",`
			`"distance": "$D$"`
			`}`
better comparison 2022-07-21 16:05:27 +02:00			`if is_bottom_row:`
move comparison improvements 2022-08-01 11:33:50 +02:00			`ax.set_xlabel(x_labels[property])`
better comparison 2022-07-21 16:05:27 +02:00			`if is_left_col:`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`ax.set_ylabel(r"\# Halos")`
move comparison improvements 2022-08-01 11:33:50 +02:00			`if property == "distance":`
			`ax.set_xscale("log")`
			`ax.set_yscale("log")`
			`if is_bottom_row and is_left_col:`
			`ax.legend()`
better comparison 2022-07-21 16:05:27 +02:00
assorted changes 2022-07-18 19:27:56 +02:00			`rowcolumn_labels(axes, comparisons, isrow=False)`
			`rowcolumn_labels(axes, waveforms, isrow=True)`
			`fig.tight_layout()`
			`fig.savefig(Path(f"~/tmp/comparison_{property}.pdf").expanduser())`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`if show:`
			`plt.show()`
better comparison 2022-07-21 16:05:27 +02:00

			`def main():`
			`# properties = ['group_size', 'Mass_200crit', 'Mass_tot', 'Mvir', 'R_200crit', 'Rvir', 'Vmax', 'cNFW', 'q',`
move comparison improvements 2022-08-01 11:33:50 +02:00			`# 's']`
better comparison 2022-07-21 16:05:27 +02:00			`if len(argv) > 1:`
			`properties = argv[1:]`
			`else:`
strongly improve comparison plots 2022-07-29 13:08:05 +02:00			`properties = ["Mvir", "Vmax", "cNFW"]`
better comparison 2022-07-21 16:05:27 +02:00
			`for property in properties:`
move comparison improvements 2022-08-01 11:33:50 +02:00			`compare_property(property, show=len(argv) == 2)`
better comparison 2022-07-21 16:05:27 +02:00

			`if __name__ == '__main__':`
			`main()`
functions in sizes to study concentrations 2022-07-08 13:43:01 +02:00			`# axis_ratios = ['q', 's'] #they look normal`
majorly improve comparisons 2022-05-24 17:06:49 +02:00
functions in sizes to study concentrations 2022-07-08 13:43:01 +02:00			`# for property in axis_ratios:`
			`# plot_comparison_hist2d(file, property, 'no')`
			`# plot_comparison_hist2d(file, property, mode)`
end of day 2022-06-30 18:14:20 +02:00
functions in sizes to study concentrations 2022-07-08 13:43:01 +02:00			`# plot_comparison_hist2d(file, 'cNFW_200mean', mode)`
many minor changes 2022-06-10 11:06:32 +02:00
New way of studying concentration comparisons; now compute cnfw ourselves for some cases 2022-07-12 15:55:43 +02:00			`# ref_property = 'ref_cNFW_200crit'`
			`# comp_property = 'comp_cNFW_200crit'`

			`# df = pd.read_csv(file)`
			`# all_ref_structure_types: pd.DataFrame = df[ref_property]`
			`# all_comp_structure_types: pd.DataFrame = df[comp_property]`

			`# df_odd: pd.DataFrame = df.loc[2 * df.ref_cNFW < df.comp_cNFW]`
			`# odd_ref_structure_types: pd.DataFrame = df_odd[ref_property]`
			`# odd_comp_structure_types: pd.DataFrame = df_odd[comp_property]`

			`# print(all_ref_structure_types.mean(), all_comp_structure_types.mean())`
			`# print(odd_ref_structure_types.mean(), odd_comp_structure_types.mean())`

majorly improve comparisons 2022-05-24 17:06:49 +02:00
reorganize sizes.py 2022-07-12 16:09:52 +02:00			`# ref_colour = []`
			`# comp_colour = []`
			`# ref_cnfw = []`
			`# comp_cnfw = []`
			`# df = pd.read_csv(file)`
			`#`
			`# for index, row in df.iterrows():`
			`# cnfw, colour = concentration(row)`
			`# ref_cnfw.append(cnfw[0])`
			`# ref_colour.append(colour[0])`
			`# comp_cnfw.append(cnfw[1])`
			`# comp_colour.append(colour[1])`
			`#`
			`# fig: Figure = plt.figure()`
			`# ax: Axes = fig.gca()`
			`#`
			`# ax.scatter(ref_cnfw, comp_cnfw, s=1, c=comp_colour, alpha=.3)`
			`# ax.set_xscale("log")`
			`# ax.set_yscale("log")`
			`# plt.show()`
initial version 2022-05-04 13:42:57 +02:00
functions in sizes to study concentrations 2022-07-08 13:43:01 +02:00			`# #Maybe for later:`
			`# if __name__ == '__main__':`
			`# print('Run with sizes.py <Path to file> <property: str> <mode: str>')`
			`# file = Path(argv[1])`
			`# property = str(argv[2])`
			`# mode = str(argv[3])`
comparison plots 2022-05-09 15:20:10 +02:00

reorganize sizes.py 2022-07-12 16:09:52 +02:00			`# #This is to find the median of the quality of our matches`
			`# matches:pd.DataFrame=df["match"]`
			`# print(matches)`
			`# exit()`
			`# print(matches.median())`
			`# print(matches.std())`
			`# exit()`
comparison plots 2022-05-09 15:20:10 +02:00
reorganize sizes.py 2022-07-12 16:09:52 +02:00			`# #This is to save weird concentration data to own csv`
			`# df_odd: pd.DataFrame = df.loc[2 * df.ref_cNFW < df.comp_cNFW]`
			`# df_odd.to_csv("weird_cnfw.csv")`
			`# exit()`