{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "%matplotlib inline\n", "import pandas as pd\n", "from pandas import DataFrame, Series\n", "import numpy as np\n", "import math\n", "\n", "import seaborn as sns\n", "import matplotlib.pyplot as plt\n", "import matplotlib.patches as mpatches\n", "import matplotlib.colors as colors\n", "from matplotlib.legend_handler import HandlerLine2D, HandlerTuple\n", "from matplotlib.colors import LinearSegmentedColormap\n", "from scipy import stats\n", "import scikit_posthocs as sp\n", "import sys\n", "\n", "from mpl_toolkits.mplot3d import axes3d" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "AllName=\"dataG.pkl\"\n", "ResizesName=\"dataM.pkl\"\n", "ItersName=\"dataL.pkl\"\n", "matrixIt_Total=\"data_L_Total.csv\"\n", "n_cores=20\n", "repet = 5 #CAMBIAR EL NUMERO SEGUN NUMERO DE EJECUCIONES POR CONFIG\n", "\n", "significance_value = 0.05\n", "processes = [2,10,20,40,80,120,160]\n", "\n", "positions = [321, 322, 323, 324, 325]\n", "positions_small = [221, 222, 223, 224]\n", "\n", "labels = ['(1,10)', '(1,20)', '(1,40)', '(1,80)', '(1,120)','(1,160)',\n", " '(10,1)', '(10,20)', '(10,40)', '(10,80)', '(10,120)','(10,160)',\n", " '(20,1)', '(20,10)', '(20,40)', '(20,80)', '(20,120)','(20,160)',\n", " '(40,1)', '(40,10)', '(40,20)', '(40,80)', '(40,120)','(40,160)',\n", " '(80,1)', '(80,10)', '(80,20)', '(80,40)', '(80,120)','(80,160)',\n", " '(120,1)','(120,10)', '(120,20)','(120,40)','(120,80)','(120,160)',\n", " '(160,1)','(160,10)', '(160,20)','(160,40)','(160,80)','(160,120)']\n", "\n", "labelsExpand = ['(1,10)', '(1,20)', '(1,40)', '(1,80)', '(1,120)','(1,160)',\n", " '(10,20)', '(10,40)', '(10,80)', '(10,120)','(10,160)',\n", " '(20,40)', '(20,80)', '(20,120)','(20,160)',\n", " '(40,80)', '(40,120)','(40,160)',\n", " '(80,120)','(80,160)',\n", " '(120,160)']\n", "labelsShrink = ['(10,1)', \n", " '(20,1)', '(20,10)',\n", " '(40,1)', '(40,10)', '(40,20)',\n", " '(80,1)', '(80,10)', '(80,20)', '(80,40)',\n", " '(120,1)','(120,10)', '(120,20)','(120,40)','(120,80)',\n", " '(160,1)','(160,10)', '(160,20)','(160,40)','(160,80)','(160,120)']\n", "\n", "# WORST BEST\n", "labels_dist = ['null', 'SpreadFit', 'CompactFit']\n", " #0 #1 #2 #3\n", "labelsMethods = ['Baseline', 'Baseline single','Baseline - Asynchronous','Baseline single - Asynchronous',\n", " 'Merge','Merge single','Merge - Asynchronous','Merge single - Asynchronous']\n", " #4 #5 #6 #7\n", " \n", "colors_m = ['green','springgreen','blue','darkblue','red','darkred','darkgoldenrod','olive','violet']\n", "linestyle_m = ['-', '--', '-.', ':']\n", "markers_m = ['.','v','s','p', 'h','d','X','P','^']\n", "\n", "OrMult_patch = mpatches.Patch(hatch='', facecolor='green', label='Baseline')\n", "OrSing_patch = mpatches.Patch(hatch='', facecolor='springgreen', label='Baseline single')\n", "OrPthMult_patch = mpatches.Patch(hatch='//', facecolor='blue', label='Baseline - Asyncrhonous')\n", "OrPthSing_patch = mpatches.Patch(hatch='\\\\', facecolor='darkblue', label='Baseline single - Asyncrhonous')\n", "MergeMult_patch = mpatches.Patch(hatch='||', facecolor='red', label='Merge')\n", "MergeSing_patch = mpatches.Patch(hatch='...', facecolor='darkred', label='Merge single')\n", "MergePthMult_patch = mpatches.Patch(hatch='xx', facecolor='yellow', label='Merge - Asyncrhonous')\n", "MergePthSing_patch = mpatches.Patch(hatch='++', facecolor='olive', label='Merge single - Asyncrhonous')\n", "\n", "handles_spawn = [OrMult_patch,OrSing_patch,OrPthMult_patch,OrPthSing_patch,MergeMult_patch,MergeSing_patch,MergePthMult_patch,MergePthSing_patch]" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "dfG = pd.read_pickle( AllName )\n", "\n", "dfG['ADR'] = round((dfG['ADR'] / dfG['DR']) * 100,1)\n", "dfG['SDR'] = round((dfG['SDR'] / dfG['DR']) * 100,1)\n", " \n", "out_group = dfG.groupby(['Groups', 'ADR','Spawn_Method','Redistribution_Method', 'Redistribution_Strategy'])['T_total']\n", "group = dfG.groupby(['ADR','Spawn_Method','Redistribution_Method', 'Redistribution_Strategy','Groups'])['T_total']\n", "\n", "grouped_aggG = group.agg(['median'])\n", "grouped_aggG.rename(columns={'median':'T_total'}, inplace=True) \n", "\n", "out_grouped_G = out_group.agg(['median'])\n", "out_grouped_G.rename(columns={'median':'T_total'}, inplace=True) " ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/tmp/ipykernel_19307/462116935.py:8: FutureWarning: Indexing with multiple keys (implicitly converted to a tuple of keys) will be deprecated, use a list instead.\n", " out_group = dfM.groupby(['NP','NC','ADR','Spawn_Method','Redistribution_Method', 'Redistribution_Strategy'])['T_Malleability','T_Redistribution','T_spawn','T_spawn_real','T_SR','T_AR']\n", "/tmp/ipykernel_19307/462116935.py:9: FutureWarning: Indexing with multiple keys (implicitly converted to a tuple of keys) will be deprecated, use a list instead.\n", " group = dfM.groupby(['ADR','Spawn_Method','Redistribution_Method', 'Redistribution_Strategy','NP','NC'])['T_Malleability','T_Redistribution','T_spawn','T_spawn_real','T_SR','T_AR']\n" ] } ], "source": [ "dfM = pd.read_pickle( ResizesName )\n", "\n", "dfM['ADR'] = round((dfM['ADR'] / dfM['DR']) * 100,1)\n", "dfM['SDR'] = round((dfM['SDR'] / dfM['DR']) * 100,1)\n", "dfM['T_Redistribution'] = dfM['T_SR'] + dfM['T_AR']\n", "dfM['T_Malleability'] = dfM['T_spawn'] + dfM['T_Redistribution']\n", " \n", "out_group = dfM.groupby(['NP','NC','ADR','Spawn_Method','Redistribution_Method', 'Redistribution_Strategy'])['T_Malleability','T_Redistribution','T_spawn','T_spawn_real','T_SR','T_AR']\n", "group = dfM.groupby(['ADR','Spawn_Method','Redistribution_Method', 'Redistribution_Strategy','NP','NC'])['T_Malleability','T_Redistribution','T_spawn','T_spawn_real','T_SR','T_AR']\n", "\n", "grouped_aggM = group.agg(['median'])\n", "grouped_aggM.columns = grouped_aggM.columns.get_level_values(0)\n", "\n", "out_grouped_M = out_group.agg(['median'])\n", "out_grouped_M.columns = out_grouped_M.columns.get_level_values(0)" ] }, { "cell_type": "code", "execution_count": 5, "metadata": {}, "outputs": [], "source": [ "dfL = pd.read_pickle( ItersName )\n", "\n", "dfL['ADR'] = round((dfL['ADR'] / dfL['DR']) * 100,1)\n", "dfL['SDR'] = round((dfL['SDR'] / dfL['DR']) * 100,1)\n", "dfL['ADR'].fillna(-1, inplace=True)\n", "dfL['SDR'].fillna(-1, inplace=True)\n", "dfL['DR'].fillna(-1, inplace=True)\n", " \n", "aux_df = dfL[(dfL.Asynch_Iters == True)]\n", "group = aux_df.groupby(['ADR','Spawn_Method','Redistribution_Method', 'Redistribution_Strategy','NP','NC'])['T_iter']\n", "grouped_aggLAsynch = group.agg(['median','count'])\n", "grouped_aggLAsynch.columns = grouped_aggLAsynch.columns.get_level_values(0)\n", "grouped_aggLAsynch['T_sum'] = grouped_aggLAsynch['count'] * grouped_aggLAsynch['median'] / repet\n", "grouped_aggLAsynch.rename(columns={'median':'T_iter'}, inplace=True) \n", "group = aux_df.groupby(['ADR','Spawn_Method','Redistribution_Method', 'Redistribution_Strategy','NP','NC'])['T_stages']\n", "aux_column = group.apply(list).apply(lambda x: np.median(x,0))\n", "grouped_aggLAsynch['T_stages'] = aux_column\n", "\n", "aux_df = dfL[(dfL.Asynch_Iters == False)]\n", "group = aux_df.groupby('NP')['T_iter']\n", "grouped_aggLSynch = group.agg(['median'])\n", "grouped_aggLSynch.rename(columns={'median':'T_iter'}, inplace=True)\n", "group = aux_df.groupby(['NP'])['T_stages']\n", "aux_column = group.apply(list).apply(lambda x: np.median(x,0))\n", "grouped_aggLSynch['T_stages'] = aux_column\n", "\n", "aux_df2 = aux_df[(aux_df.Is_Dynamic == True)]\n", "group = aux_df2.groupby(['ADR', 'Spawn_Method','Redistribution_Method', 'Redistribution_Strategy','NP','N_Parents'])['T_iter']\n", "grouped_aggLDyn = group.agg(['median'])\n", "grouped_aggLDyn.rename(columns={'median':'T_iter'}, inplace=True)\n", "group = aux_df2.groupby(['ADR', 'Spawn_Method','Redistribution_Method', 'Redistribution_Strategy','NP','N_Parents'])['T_stages']\n", "aux_column = group.apply(list).apply(lambda x: np.median(x,0))\n", "grouped_aggLDyn['T_stages'] = aux_column\n", "\n", "aux_df2 = aux_df[(aux_df.Is_Dynamic == False)]\n", "group = aux_df2.groupby('NP')['T_iter']\n", "grouped_aggLNDyn = group.agg(['median'])\n", "grouped_aggLNDyn.rename(columns={'median':'T_iter'}, inplace=True)\n", "group = aux_df2.groupby(['NP'])['T_stages']\n", "aux_column = group.apply(list).apply(lambda x: np.median(x,0))\n", "grouped_aggLNDyn['T_stages'] = aux_column" ] }, { "cell_type": "code", "execution_count": 6, "metadata": {}, "outputs": [], "source": [ "from bt_scheme import PartialSolution, BacktrackingSolver\n", "def elegirConf(parameters):\n", " class StatePS(PartialSolution):\n", " def __init__(self, config):\n", " self.config= config\n", " self.n= len(config) #Indica el valor a añadir\n", "\n", " def is_solution(self):\n", " return self.n == len(parameters)\n", "\n", " def get_solution(self):\n", " return tuple(self.config)\n", "\n", " def successors(self):\n", " array = parameters[self.n]\n", " for parameter_value in array: #Test all values of the next parameter\n", " self.config.append(parameter_value)\n", " yield StatePS(self.config)\n", " self.config.pop()\n", "\n", " initialPs= StatePS([])\n", " return BacktrackingSolver().solve(initialPs)\n", "\n", "\n", "def obtenerConfs(parameters):\n", " soluciones=[]\n", " for solucion in elegirConf(parameters):\n", " soluciones.append(solucion)\n", " return soluciones\n", "\n", "def modifyToGlobal(parameters, len_parameters, configuration):\n", " usable_configuration = []\n", " for i in range(len(parameters)):\n", " if len_parameters[i] > 1:\n", " aux = (parameters[i][0], configuration[i])\n", " else:\n", " aux = (configuration[i])\n", " usable_configuration.append(aux)\n", " \n", " return usable_configuration\n", "\n", "def modifyToLocalDynamic(parameters, len_parameters, configuration):\n", " usable_configuration = []\n", " for i in range(len(parameters)):\n", " if len_parameters[i] > 1:\n", " aux = (configuration[i], -1)\n", " else:\n", " aux = (-1)\n", " usable_configuration.append(aux)\n", " \n", " return tuple(usable_configuration)\n", "\n", "def CheckConfExists(configuration, dataSet, type_conf='global'):\n", " exists = False\n", " config = list(configuration)\n", " for np_aux in processes:\n", " for ns_aux in processes:\n", " if np_aux != ns_aux:\n", " \n", " if type_conf == 'global':\n", " config.append((np_aux, ns_aux))\n", " elif type_conf == 'malleability':\n", " config.append(np_aux)\n", " config.append(ns_aux)\n", " elif type_conf == 'local':\n", " config.append(np_aux)\n", " \n", " if tuple(config) in dataSet.index: \n", " exists = True # FIXME Return here true?\n", " config.pop()\n", " \n", " if type_conf == 'malleability':\n", " config.pop()\n", " return exists" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[[0, 0, 0, 1], [0, 0, 1, 1], [0, 1, 0, 1], [0, 1, 1, 1], [96.6, 0, 0, 1], [96.6, 0, 0, 2], [96.6, 0, 1, 1], [96.6, 0, 1, 2], [96.6, 1, 0, 1], [96.6, 1, 0, 2], [96.6, 1, 1, 1], [96.6, 1, 1, 2]]\n", "[[-1, (0, -1), (1, -1), (2, -1)], [-1, (0, -1), (0, -1), (2, -1)], [-1, (1, -1), (0, -1), (2, -1)], [-1, (1, -1), (1, -1), (1, -1)], [-1, (0, -1), (1, -1), (1, -1)], [-1, (0, -1), (0, -1), (1, -1)], [-1, (1, -1), (1, -1), (2, -1)], [-1, (1, -1), (0, -1), (1, -1)]]\n", "[[0, (0, 0), (0, 0), (1, 1)], [0, (0, 0), (0, 1), (1, 1)], [0, (0, 1), (0, 0), (1, 1)], [0, (0, 1), (0, 1), (1, 1)], [96.6, (0, 0), (0, 0), (1, 1)], [96.6, (0, 0), (0, 0), (1, 2)], [96.6, (0, 0), (0, 1), (1, 1)], [96.6, (0, 0), (0, 1), (1, 2)], [96.6, (0, 1), (0, 0), (1, 1)], [96.6, (0, 1), (0, 0), (1, 2)], [96.6, (0, 1), (0, 1), (1, 1)], [96.6, (0, 1), (0, 1), (1, 2)]]\n", "12\n" ] } ], "source": [ "adr = [0,96.6]\n", "sp_method = [0,1]\n", "rd_method = [0,1]\n", "rd_strat = [1,2]\n", "parameters = [adr, sp_method, rd_method, rd_strat]\n", "parameters_names = ['ADR', 'Spawn_Method', 'Redistribution_Method', 'Redistribution_Strategy']\n", "len_parameters = [1,2,2,2]\n", "configurations_aux = obtenerConfs(parameters)\n", "configurations = []\n", "configurations_local_dynamic = set()\n", "configurations_local = set()\n", "configurations_simple = []\n", "for checked_conf in configurations_aux:\n", " aux_conf = modifyToGlobal(parameters, len_parameters, checked_conf)\n", " if CheckConfExists(aux_conf, grouped_aggG):\n", " configurations.append(aux_conf)\n", "\n", " if CheckConfExists(checked_conf, grouped_aggM, 'malleability'):\n", " configurations_simple.append(list(checked_conf))\n", " \n", " aux_conf = modifyToLocalDynamic(parameters, len_parameters, checked_conf)\n", " if CheckConfExists(aux_conf, grouped_aggLDyn, 'local'):\n", " configurations_local_dynamic.add(aux_conf)\n", "\n", "configurations_local_dynamic = list(configurations_local_dynamic)\n", "for index in range(len(configurations_local_dynamic)):\n", " configurations_local_dynamic[index] = list(configurations_local_dynamic[index])\n", "\n", "print(configurations_simple)\n", "print(configurations_local_dynamic)\n", "print(configurations)\n", "print(len(configurations))" ] }, { "cell_type": "code", "execution_count": 8, "metadata": {}, "outputs": [], "source": [ "#ALPHA COMPUTATION\n", "def compute_alpha(config_a, config_b):\n", " for np_aux in processes:\n", " for ns_aux in processes:\n", " if np_aux != ns_aux:\n", " config_a.append(np_aux)\n", " config_a.append(ns_aux)\n", " config_b.append(np_aux)\n", " config_b.append(ns_aux)\n", " grouped_aggM.loc[tuple(config_b),'Alpha'] = grouped_aggM.loc[tuple(config_b),'T_Malleability'] / grouped_aggM.loc[tuple(config_a),'T_Malleability']\n", " config_a.pop()\n", " config_a.pop()\n", " config_b.pop()\n", " config_b.pop()\n", " \n", " \n", " config_a.insert(0,ns_aux)\n", " config_a.insert(0,np_aux)\n", " config_b.insert(0,ns_aux)\n", " config_b.insert(0,np_aux)\n", " out_grouped_M.loc[tuple(config_b),'Alpha'] = out_grouped_M.loc[tuple(config_b),'T_Malleability'] / out_grouped_M.loc[tuple(config_a),'T_Malleability']\n", " config_a.pop(0)\n", " config_a.pop(0)\n", " config_b.pop(0)\n", " config_b.pop(0)\n", "\n", "if not ('Alpha' in grouped_aggM.columns):\n", " for config_a in configurations_simple:\n", " for config_b in configurations_simple:\n", " if config_a[1:-1] == config_b[1:-1] and config_a[0] == 0 and config_b[0] != 0:\n", " compute_alpha(config_a, config_b)\n", "else:\n", " print(\"ALPHA already exists\")" ] }, { "cell_type": "code", "execution_count": 9, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/home/usuario/miniconda3/lib/python3.9/site-packages/pandas/core/algorithms.py:1537: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n", " return arr.searchsorted(value, side=side, sorter=sorter) # type: ignore[arg-type]\n", "/home/usuario/miniconda3/lib/python3.9/site-packages/pandas/core/algorithms.py:1537: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n", " return arr.searchsorted(value, side=side, sorter=sorter) # type: ignore[arg-type]\n" ] } ], "source": [ "#OMEGA COMPUTATION\n", "def compute_omega(config):\n", " for np_aux in processes:\n", " for ns_aux in processes:\n", " if np_aux != ns_aux:\n", " if len(config) > len(parameters):\n", " config.pop()\n", " config.pop()\n", " config.append(np_aux)\n", " config.append(ns_aux)\n", " grouped_aggLAsynch.at[tuple(config),'Omega'] = grouped_aggLAsynch.at[tuple(config),'T_iter'] / grouped_aggLSynch.at[np_aux,'T_iter']\n", " value = grouped_aggLAsynch.at[tuple(config),'T_stages'] / grouped_aggLSynch.at[np_aux,'T_stages']\n", " grouped_aggLAsynch.at[tuple(config),'Omega_Stages'] = value.astype(object)\n", " config.pop()\n", " config.pop()\n", "\n", "if not ('Omega' in grouped_aggLAsynch.columns):\n", " for config in configurations:\n", " if config[0] != 0:\n", " compute_omega(config)\n", "else:\n", " print(\"OMEGA already exists\")" ] }, { "cell_type": "code", "execution_count": 10, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/home/usuario/miniconda3/lib/python3.9/site-packages/pandas/core/algorithms.py:1537: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n", " return arr.searchsorted(value, side=side, sorter=sorter) # type: ignore[arg-type]\n", "/home/usuario/miniconda3/lib/python3.9/site-packages/pandas/core/algorithms.py:1537: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n", " return arr.searchsorted(value, side=side, sorter=sorter) # type: ignore[arg-type]\n" ] } ], "source": [ "#Dynamic Coherence COMPUTATION\n", "def compute_dyn_coherency(config):\n", " for np_aux in processes:\n", " for n_parents_aux in processes:\n", " if np_aux != n_parents_aux:\n", " config.append(np_aux)\n", " config.append(n_parents_aux)\n", " grouped_aggLDyn.at[tuple(config),'Dyn_Coherency'] = grouped_aggLDyn.at[tuple(config),'T_iter'] / grouped_aggLNDyn.at[np_aux,'T_iter']\n", " value = grouped_aggLDyn.at[tuple(config),'T_stages'] / grouped_aggLNDyn.at[np_aux,'T_stages']\n", " grouped_aggLDyn.at[tuple(config),'Dyn_Coherency_Stages'] = value.astype(object)\n", " config.pop()\n", " config.pop()\n", "\n", "if not ('Dyn_Coherency' in grouped_aggLDyn.columns):\n", " for config in configurations_local_dynamic:\n", " compute_dyn_coherency(config)\n", "else:\n", " print(\"Dyn_Coherency already exists\")" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] }, { "cell_type": "code", "execution_count": 68, "metadata": {}, "outputs": [], "source": [ "out_grouped_G.to_excel(\"resultG.xlsx\") \n", "out_grouped_M.to_excel(\"resultM.xlsx\") \n", "grouped_aggLAsynch.to_excel(\"AsynchIters.xlsx\")\n", "grouped_aggLDyn.to_excel(\"DynCoherence.xlsx\")" ] }, { "cell_type": "code", "execution_count": 101, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
T_iterT_stages
NP
20.633368[0.62166, 3.2e-05, 2e-06, 0.011353]
100.141878[0.123063, 4.4e-05, 5e-06, 0.018725]
200.100381[0.071352, 9.8e-05, 6e-06, 0.028533]
400.081748[0.035681, 0.000212, 8.4e-05, 0.045265]
800.070729[0.018738, 0.000522, 0.000155, 0.05006]
1200.069799[0.013387, 0.00101, 0.000148, 0.053359]
1600.069249[0.010712, 0.001345, 0.000194, 0.054343]
\n", "
" ], "text/plain": [ " T_iter T_stages\n", "NP \n", "2 0.633368 [0.62166, 3.2e-05, 2e-06, 0.011353]\n", "10 0.141878 [0.123063, 4.4e-05, 5e-06, 0.018725]\n", "20 0.100381 [0.071352, 9.8e-05, 6e-06, 0.028533]\n", "40 0.081748 [0.035681, 0.000212, 8.4e-05, 0.045265]\n", "80 0.070729 [0.018738, 0.000522, 0.000155, 0.05006]\n", "120 0.069799 [0.013387, 0.00101, 0.000148, 0.053359]\n", "160 0.069249 [0.010712, 0.001345, 0.000194, 0.054343]" ] }, "execution_count": 101, "metadata": {}, "output_type": "execute_result" } ], "source": [ "grouped_aggLSynch" ] }, { "cell_type": "code", "execution_count": 61, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/tmp/ipykernel_6934/552606136.py:3: SettingWithCopyWarning: \n", "A value is trying to be set on a copy of a slice from a DataFrame.\n", "Try using .loc[row_indexer,col_indexer] = value instead\n", "\n", "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n", " test[\"Resize_Coherency\"] = test[\"T_Malleability\"] >= (test[\"T_spawn\"] + test[\"T_SR\"] + test[\"T_AR\"])\n", "/tmp/ipykernel_6934/552606136.py:4: SettingWithCopyWarning: \n", "A value is trying to be set on a copy of a slice from a DataFrame.\n", "Try using .loc[row_indexer,col_indexer] = value instead\n", "\n", "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n", " test[\"Resize_Coherency2\"] = test[\"T_Malleability\"] >= 0\n" ] }, { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
NPNCTotal_StagesGranularitySDRADRDRRedistribution_MethodRedistribution_StrategySpawn_Method...T_iterT_stagesT_spawnT_spawn_realT_SRT_ART_RedistributionT_MalleabilityResize_CoherencyResize_Coherency2
8851608041000003.496.63947883503111...(0.138975, 0.138623, 0.145609, 0.143285, 0.135...((0.010725, 0.000534, 5e-05, 0.116726), (0.010...0.6999910.01.0338151.1073742.1411892.841180FalseTrue
8861608041000003.496.63947883503111...(0.144654, 0.134697, 0.144184, 0.139219, 0.143...((0.010724, 0.000413, 0.000297, 0.122341), (0....0.2894330.01.0240051.1026392.1266442.416077FalseTrue
8971201041000003.496.63947883503111...(0.137209, 0.149927, 0.148071, 0.153846, 0.161...((0.013391, 0.000532, 0.000137, 0.113001), (0....1.1039320.00.2602672.8950403.1553074.259239FalseTrue
9711201041000003.496.63947883503011...(0.171813, 0.159961, 0.133724, 0.160519, 0.143...((0.013379, 0.000184, 0.000238, 0.136431), (0....1.2318940.00.4276623.0077013.4353634.667257FalseTrue
9741201041000003.496.63947883503011...(0.153822, 0.140212, 0.149297, 0.35497, 0.1534...((0.013389, 0.000274, 0.000135, 0.132982), (0....0.2549330.00.2961342.9132443.2093783.464311FalseTrue
..................................................................
22744012041000003.496.63947883503110...(0.166288, 0.16779, 0.178504, 0.142442, 0.1775...((0.035714, 0.000122, 7.6e-05, 0.127336), (0.0...1.5199050.00.1119951.8950832.0070783.526983FalseFalse
24001208041000003.496.63947883503010...(0.149358, 0.153831, 0.153943, 0.1395, 0.14954...((0.013389, 0.000142, 0.000235, 0.127162), (0....1.6784220.03.4499851.6559735.1059586.784380FalseFalse
2414201041000003.496.63947883503010...(0.110498, 0.098226, 0.097971, 0.09784, 0.0977...((0.071338, 7.9e-05, 6e-06, 0.039075), (0.0713...1.1127220.00.3719962.0239962.3959923.508714FalseFalse
24271016041000003.496.63947883503010...(0.160399, 0.142582, 0.142452, 0.142528, 0.142...((0.123088, 8e-05, 4e-06, 0.03722), (0.12307, ...2.1270730.01.5880133.1855454.7735586.900631FalseTrue
24381012041000003.496.63947883503111...(0.157493, 0.1416, 0.141205, 0.141221, 0.14124...((0.123101, 1.2e-05, 4e-06, 0.034375), (0.1230...1.0074960.00.0494573.2699113.3193684.326864FalseTrue
\n", "

81 rows × 28 columns

\n", "
" ], "text/plain": [ " NP NC Total_Stages Granularity SDR ADR DR \\\n", "885 160 80 4 100000 3.4 96.6 3947883503 \n", "886 160 80 4 100000 3.4 96.6 3947883503 \n", "897 120 10 4 100000 3.4 96.6 3947883503 \n", "971 120 10 4 100000 3.4 96.6 3947883503 \n", "974 120 10 4 100000 3.4 96.6 3947883503 \n", "... ... ... ... ... ... ... ... \n", "2274 40 120 4 100000 3.4 96.6 3947883503 \n", "2400 120 80 4 100000 3.4 96.6 3947883503 \n", "2414 20 10 4 100000 3.4 96.6 3947883503 \n", "2427 10 160 4 100000 3.4 96.6 3947883503 \n", "2438 10 120 4 100000 3.4 96.6 3947883503 \n", "\n", " Redistribution_Method Redistribution_Strategy Spawn_Method ... \\\n", "885 1 1 1 ... \n", "886 1 1 1 ... \n", "897 1 1 1 ... \n", "971 0 1 1 ... \n", "974 0 1 1 ... \n", "... ... ... ... ... \n", "2274 1 1 0 ... \n", "2400 0 1 0 ... \n", "2414 0 1 0 ... \n", "2427 0 1 0 ... \n", "2438 1 1 1 ... \n", "\n", " T_iter \\\n", "885 (0.138975, 0.138623, 0.145609, 0.143285, 0.135... \n", "886 (0.144654, 0.134697, 0.144184, 0.139219, 0.143... \n", "897 (0.137209, 0.149927, 0.148071, 0.153846, 0.161... \n", "971 (0.171813, 0.159961, 0.133724, 0.160519, 0.143... \n", "974 (0.153822, 0.140212, 0.149297, 0.35497, 0.1534... \n", "... ... \n", "2274 (0.166288, 0.16779, 0.178504, 0.142442, 0.1775... \n", "2400 (0.149358, 0.153831, 0.153943, 0.1395, 0.14954... \n", "2414 (0.110498, 0.098226, 0.097971, 0.09784, 0.0977... \n", "2427 (0.160399, 0.142582, 0.142452, 0.142528, 0.142... \n", "2438 (0.157493, 0.1416, 0.141205, 0.141221, 0.14124... \n", "\n", " T_stages T_spawn \\\n", "885 ((0.010725, 0.000534, 5e-05, 0.116726), (0.010... 0.699991 \n", "886 ((0.010724, 0.000413, 0.000297, 0.122341), (0.... 0.289433 \n", "897 ((0.013391, 0.000532, 0.000137, 0.113001), (0.... 1.103932 \n", "971 ((0.013379, 0.000184, 0.000238, 0.136431), (0.... 1.231894 \n", "974 ((0.013389, 0.000274, 0.000135, 0.132982), (0.... 0.254933 \n", "... ... ... \n", "2274 ((0.035714, 0.000122, 7.6e-05, 0.127336), (0.0... 1.519905 \n", "2400 ((0.013389, 0.000142, 0.000235, 0.127162), (0.... 1.678422 \n", "2414 ((0.071338, 7.9e-05, 6e-06, 0.039075), (0.0713... 1.112722 \n", "2427 ((0.123088, 8e-05, 4e-06, 0.03722), (0.12307, ... 2.127073 \n", "2438 ((0.123101, 1.2e-05, 4e-06, 0.034375), (0.1230... 1.007496 \n", "\n", " T_spawn_real T_SR T_AR T_Redistribution T_Malleability \\\n", "885 0.0 1.033815 1.107374 2.141189 2.841180 \n", "886 0.0 1.024005 1.102639 2.126644 2.416077 \n", "897 0.0 0.260267 2.895040 3.155307 4.259239 \n", "971 0.0 0.427662 3.007701 3.435363 4.667257 \n", "974 0.0 0.296134 2.913244 3.209378 3.464311 \n", "... ... ... ... ... ... \n", "2274 0.0 0.111995 1.895083 2.007078 3.526983 \n", "2400 0.0 3.449985 1.655973 5.105958 6.784380 \n", "2414 0.0 0.371996 2.023996 2.395992 3.508714 \n", "2427 0.0 1.588013 3.185545 4.773558 6.900631 \n", "2438 0.0 0.049457 3.269911 3.319368 4.326864 \n", "\n", " Resize_Coherency Resize_Coherency2 \n", "885 False True \n", "886 False True \n", "897 False True \n", "971 False True \n", "974 False True \n", "... ... ... \n", "2274 False False \n", "2400 False False \n", "2414 False False \n", "2427 False True \n", "2438 False True \n", "\n", "[81 rows x 28 columns]" ] }, "execution_count": 61, "metadata": {}, "output_type": "execute_result" } ], "source": [] }, { "cell_type": "code", "execution_count": 65, "metadata": {}, "outputs": [], "source": [ "test=dfM[(dfM.Asynch_Iters > 0) & (dfM.Spawn_Strategy == 1)]\n", "\n", "for index in range(len(test)):\n", " time_malleability_aux = test[\"T_Malleability\"].values[index]\n", " \n", " total_asynch_iters = int(test[\"Asynch_Iters\"].values[index])\n", " asynch_iters = test[\"T_iter\"].values[index][-total_asynch_iters:]\n", " time_iters_aux = 0\n", " \n", " if total_asynch_iters > 1:\n", " time_iters_aux = np.sum(asynch_iters[:-1])\n", " \n", " if time_malleability_aux < time_iters_aux:\n", " \n", " print(test.iloc[index])\n", " print(asynch_iters)\n", " print(time_iters_aux)\n", " print(time_malleability_aux)\n", " print(\"\")" ] }, { "cell_type": "code", "execution_count": 11, "metadata": {}, "outputs": [], "source": [ "def create_group_boundary(rms_boundary, np_aux, ns_aux):\n", " tc_boundary = 0\n", " boundaries = None\n", " if rms_boundary != 0:\n", " # El porcentaje de tc_boundary se tiene en cuenta para eliminar aquellos\n", " # tiempos demasiado grandes en su malleability time respecto al más pequeño\n", " boundaries = get_np_ns_data(\"T_Malleability\", grouped_aggM, configurations_simple, np_aux, ns_aux)\n", " tc_boundary = min(boundaries)\n", " tc_boundary = tc_boundary + tc_boundary*rms_boundary\n", " return tc_boundary, boundaries\n", "\n", "# Aquellos grupos que tengán valores por encima del límite no se considerarán\n", "def check_groups_boundaries(dataLists, boundaries, tc_boundary):\n", " for index in range(len(boundaries)):\n", " if boundaries[index] > tc_boundary:\n", " dataLists[index] = float('infinity')\n" ] }, { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [], "source": [ "def get_perc_differences(dataLists, boundaries, tc_boundary):\n", " perc = 1.05\n", " if boundaries != None: # Si se usa perspectiva de RMS, se desconsideran valores muy altos\n", " check_groups_boundaries(dataLists, boundaries, tc_boundary) \n", " indexes = np.argsort(dataLists)\n", " \n", " best = -1\n", " bestMax = -1\n", " otherBest=[]\n", " for index in indexes: # Para cada metodo -- Empezando por el tiempo más bajo en media/mediana\n", " if best == -1:\n", " best = index\n", " bestMax = dataLists[best] * perc\n", " elif dataLists[index] <= bestMax: # Media/Medianas i < Media/Mediana best\n", " otherBest.append(index)\n", " \n", " otherBest.insert(0,best)\n", " return otherBest\n", "\n", "def get_stat_differences(dataLists, df_Res, boundaries, tc_boundary):\n", " if boundaries != None: # Si se usa perspectiva de RMS, se desconsideran valores muy altos\n", " check_groups_boundaries(dataLists, boundaries, tc_boundary) \n", " indexes = np.argsort(dataLists)\n", " \n", " best = -1\n", " otherBest=[] \n", " for index in indexes: # Para cada metodo -- Empezando por el tiempo más bajo en mediana\n", " if dataLists[index] != float('infinity'):\n", " if best == -1:\n", " best = index\n", " elif not df_Res.iat[best,index]: # df_Res == False indicates 'index' and 'best' have the same mean/median\n", " otherBest.append(index)\n", " \n", " otherBest.insert(0,best)\n", " return otherBest" ] }, { "cell_type": "code", "execution_count": 43, "metadata": {}, "outputs": [], "source": [ "grouped_np = [\"T_total\"]\n", "separated_np = [\"T_Malleability\", \"T_Redistribution\", \"T_spawn\", \"T_SR\", \"T_AR\", \"Alpha\", \"Omega\"]\n", "\n", "def get_np_ns_data(tipo, data_aux, used_config, np_aux, ns_aux):\n", " dataLists=[]\n", " for config in used_config:\n", " if tipo in grouped_np:\n", " config.append((np_aux,ns_aux))\n", " elif tipo in separated_np:\n", " config.append(np_aux)\n", " config.append(ns_aux)\n", " \n", " if tuple(config) in data_aux.index:\n", " aux_value = data_aux.loc[tuple(config),tipo]\n", " if isinstance(aux_value, pd.Series):\n", " aux_value = aux_value.values[0]\n", " if aux_value == 0: #Values of zero indicate it was not performed\n", " aux_value = float('infinity')\n", " else: # This configuration is not present in the dataset\n", " aux_value = float('infinity')\n", " dataLists.append(aux_value)\n", " config.pop()\n", " if tipo in separated_np:\n", " config.pop()\n", " return dataLists\n", "\n", "def get_config_data(tipo, data_aux, config):\n", " dataLists=[]\n", " for ns_aux in processes:\n", " for np_aux in processes:\n", " if np_aux != ns_aux:\n", " \n", " if tipo in grouped_np:\n", " config.append((np_aux,ns_aux))\n", " elif tipo in separated_np:\n", " config.append(np_aux)\n", " config.append(ns_aux)\n", " if tuple(config) in data_aux.index:\n", " aux_value = data_aux.loc[tuple(config),tipo]\n", " if isinstance(aux_value, pd.Series):\n", " aux_value = aux_value.values[0]\n", " if aux_value == 0: #Values of zero indicate it was not performed\n", " aux_value = float('infinity')\n", " else: # This configuration is not present in the dataset\n", " aux_value = float('infinity')\n", " dataLists.append(aux_value)\n", " config.pop()\n", " if tipo in separated_np:\n", " config.pop()\n", " return dataLists\n", "\n", "def get_df_np_ns_data(df_check, tipo, used_config, np_aux, ns_aux):\n", " dataLists=[]\n", " if tipo in grouped_np:\n", " tuple_data = (np_aux, ns_aux)\n", " df_npns_aux = df_check.loc[(df_check['Groups']==tuple_data)]\n", " elif tipo in separated_np:\n", " df_npns_aux = df_check.loc[(df_check['NP']==np_aux)]\n", " df_npns_aux = df_npns_aux.loc[(df_npns_aux['NC']==ns_aux)]\n", " \n", " for config in used_config:\n", " df_config_aux = df_npns_aux\n", " for index in range(len(config)):\n", " aux_name = parameters_names[index]\n", " aux_value = config[index]\n", " df_config_aux = df_config_aux.loc[(df_config_aux[aux_name] == aux_value)]\n", " \n", " aux_value = list(df_config_aux[tipo])\n", " if len(aux_value) > 0:\n", " dataLists.append(aux_value)\n", " return dataLists\n", "\n", "def get_df_config_data(df_check, tipo, config):\n", " dataLists=[]\n", " df_config_aux = df_check\n", " for index in range(len(config)):\n", " aux_name = parameters_names[index]\n", " aux_value = config[index]\n", " df_config_aux = df_config_aux.loc[(df_config_aux[aux_name] == aux_value)]\n", " \n", " for np_aux in processes:\n", " for ns_aux in processes:\n", " if np_aux != ns_aux:\n", " if tipo in grouped_np:\n", " tuple_data = (np_aux, ns_aux)\n", " df_aux = df_config_aux.loc[(df_config_aux['Groups']==tuple_data)]\n", " elif tipo in separated_np:\n", " df_aux = df_config_aux.loc[(df_config_aux['NP']==np_aux)]\n", " df_aux = df_aux.loc[(df_aux['NC']==ns_aux)]\n", " aux_value = list(df_aux[tipo])\n", " if len(aux_value) > 0:\n", " dataLists.append(aux_value)\n", " return dataLists\n", " \n", " " ] }, { "cell_type": "code", "execution_count": 50, "metadata": {}, "outputs": [], "source": [ "def check_normality(df_check, tipo, used_config, fast=True):\n", " normality_array=[True] * (len(processes) * (len(processes)-1) * len(used_config))\n", " normality = True\n", " total=0\n", " i=-1\n", " #Comprobar para cada configuración si se sigue una distribución normal/gaussiana\n", " for np_aux in processes:\n", " for ns_aux in processes:\n", " if np_aux != ns_aux:\n", " i+=1\n", " dataLists = get_df_np_ns_data(df_check, tipo, used_config, np_aux, ns_aux)\n", " for data_aux in dataLists:\n", " st,p = stats.shapiro(data_aux) # Tendrían que ser al menos 20 datos y menos de 50\n", " if p < significance_value: # Reject H0\n", " if fast:\n", " return False\n", " normality_array[i] = False\n", " normality = False\n", " total+=1\n", " print(\"Se sigue una distribución guassiana: \" + str(normality) + \"\\nUn total de: \" + str(total) + \" no siguen una gaussiana\")\n", " print(normality_array)\n", " return normality\n", "\n", "def check_homoscedasticity(df_check, tipo, used_config, fast=True):\n", " homoscedasticity_array=[True] * (len(processes) * (len(processes)-1))\n", " homoscedasticity = True\n", " total=0\n", " i=-1\n", " #Comprobar para cada configuración si se sigue una distribución normal/gaussiana\n", " for np_aux in processes:\n", " for ns_aux in processes:\n", " if np_aux != ns_aux:\n", " i+=1\n", " dataLists = get_df_np_ns_data(df_check, tipo, used_config, np_aux, ns_aux)\n", " st,p = stats.levene(*dataLists) # Tendrían que ser al menos 20 datos y menos de 50\n", " if p < significance_value: # Reject H0\n", " if fast:\n", " return False\n", " homoscedasticity_array[i] = False\n", " homoscedasticity = False\n", " total+=1\n", " print(\"Se sigue una distribución de datos Homocedastica: \" + str(homoscedasticity) + \"\\nUn total de: \" + str(total) + \" no siguen una homocedastica\")\n", " print(homoscedasticity_array)\n", " return homoscedasticity\n", "\n", "def compute_global_stat_difference(dataLists, parametric, np_aux, ns_aux):\n", " if parametric:\n", " st,p=stats.f_oneway(*dataLists)\n", " else:\n", " st,p=stats.kruskal(*dataLists)\n", " if p > significance_value:\n", " print(\"For NP \" + str(np_aux) + \" and \" + str(ns_aux) + \" is accepted H0\")\n", " return True # Equal values || Accept H0\n", " return False # Some groups are different || Reject H0\n", "\n", "def compute_global_posthoc(dataLists, parametric):\n", " data_stats=[]\n", " data_stats2=[]\n", " ini=0\n", " end=len(dataLists)\n", " if parametric:\n", " df_aux = sp.posthoc_ttest(dataLists)\n", " df_Res = df_aux.copy()\n", " for i in range(ini,end):\n", " data_stats.append(np.mean(dataLists[i]))\n", " \n", " for j in range(ini,end):\n", " if df_Res.iat[i,j] < significance_value: # Different means || Reject H1\n", " df_Res.iat[i, j] = True\n", " else:\n", " df_Res.iat[i, j] = False\n", " else:\n", " df_aux = sp.posthoc_conover(dataLists)\n", " df_Res = df_aux.copy()\n", " for i in range(ini,end):\n", " data_stats.append(np.median(dataLists[i]))\n", " data_stats2.append(stats.iqr(dataLists[i],axis=0))\n", " for j in range(ini,end):\n", " if df_Res.iat[i,j] < significance_value: # Different medians || Reject H1\n", " df_Res.iat[i, j] = True\n", " else:\n", " df_Res.iat[i, j] = False\n", " #print(df_Res)\n", " #print(df_aux)\n", " #print(data_stats)\n", " #print(data_stats2)\n", " #aux_value = min(data_stats)\n", " #print(data_stats.index(aux_value))\n", " return df_Res, data_stats" ] }, { "cell_type": "code", "execution_count": 15, "metadata": {}, "outputs": [], "source": [ "def results_with_perc(tipo, data_aux, used_config, rms_boundary=0):\n", " results = []\n", " for np_aux in processes:\n", " for ns_aux in processes:\n", " if np_aux != ns_aux:\n", " tc_boundary, boundaries = create_group_boundary(rms_boundary, np_aux, ns_aux)\n", " \n", " #Get all values for particular config with these number of processes\n", " dataLists = get_np_ns_data(tipo, data_aux, used_config, np_aux, ns_aux)\n", "\n", " aux_data = get_perc_differences(dataLists, boundaries, tc_boundary)\n", " results.append(aux_data)\n", " return results\n", "\n", "def results_with_stats(tipo, df_check, used_config, rms_boundary=0):\n", " results = []\n", " use_parametric = check_normality(df_check, tipo, used_config)\n", " if use_parametric:\n", " use_parametric = check_homoscedasticity(df_check, tipo, used_config)\n", " for np_aux in processes:\n", " for ns_aux in processes:\n", " if np_aux != ns_aux:\n", " tc_boundary, boundaries = create_group_boundary(rms_boundary, np_aux, ns_aux)\n", " \n", " #Get all values for particular config with these number of processes\n", " dataLists = get_df_np_ns_data(df_check, tipo, used_config, np_aux, ns_aux)\n", " equal_set = compute_global_stat_difference(dataLists, use_parametric, np_aux, ns_aux)\n", " if equal_set:\n", " aux_data = list(range(len(used_config))) # All data is equal\n", " else:\n", " res_aux, times_aux = compute_global_posthoc(dataLists, use_parametric)\n", " aux_data = get_stat_differences(times_aux, res_aux, boundaries, tc_boundary)\n", " \n", " results.append(aux_data)\n", " \n", " return results" ] }, { "cell_type": "code", "execution_count": 182, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[[1], [2], [1, 3], [1], [1], [1], [2, 1], [2], [3, 1], [1], [1], [1], [2], [2], [3, 2], [1], [1], [1], [2, 3], [2, 3], [2], [2], [3, 1], [3, 1], [3], [1], [1], [3, 2, 1], [2], [2, 3], [3], [1], [1], [1, 3], [3, 2], [2], [3], [1], [1], [3, 1, 2], [3, 2], [2, 3]]\n", "42\n" ] } ], "source": [ "checked_type='T_Malleability'\n", "use_perc = False\n", "select_first_winner = False\n", "prefer_first_winner = False\n", "rms_boundary=0 # Poner a 0 para perspectiva de app. Valor >0 y <1 para perspectiva de RMS\n", "if checked_type=='T_total':\n", " tipo=\"T_total\"\n", " if use_perc:\n", " data_aux = grouped_aggG\n", " else:\n", " data_aux = dfG\n", " used_config = configurations\n", "elif checked_type=='T_Malleability' or checked_type=='T_spawn' or checked_type=='T_SR' or checked_type=='T_AR' or checked_type=='T_Redistribution':\n", " tipo=checked_type\n", " \n", " if use_perc:\n", " data_aux = grouped_aggM\n", " else:\n", " data_aux = dfM\n", " if tipo == 'T_AR':\n", " data_aux = data_aux[(data_aux.ADR > 0)]\n", " elif tipo == 'T_SR':\n", " data_aux = data_aux[(data_aux.ADR == 0)]\n", " \n", " used_config = configurations_simple\n", " \n", "if use_perc:\n", " results = results_with_perc(tipo, data_aux, used_config, rms_boundary)\n", "else:\n", " results = results_with_stats(tipo, data_aux, used_config, rms_boundary)\n", " \n", "if not use_perc and tipo == 'T_AR': #FIXME!!!! No tiene en cuenta total de configuraciones sincronos\n", " for res_index in range(len(results)):\n", " for inner_index in range(len(results[res_index])):\n", " results[res_index][inner_index]+=4\n", "\n", "#Results is a 2 dimensional array. First dimension indicates lists of winners of a particulal number of processes (NP->NC). \n", "#Second dimension is an ordered preference of indexes in the array configurations.\n", "print(results)\n", "print(len(results))" ] }, { "cell_type": "code", "execution_count": 183, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[[-1 1 2 1 1 1 1]\n", " [ 1 -1 2 1 1 1 1]\n", " [ 2 2 -1 2 1 1 1]\n", " [ 2 2 2 -1 2 1 1]\n", " [ 3 1 1 1 -1 2 2]\n", " [ 3 1 1 1 2 -1 2]\n", " [ 3 1 1 1 2 2 4]]\n" ] } ], "source": [ "#Lista de indices de mayor a menor según el total de ocurrencias\n", "aux_array = []\n", "for data in results:\n", " aux_array+=data\n", "aux_keys, aux_counts = np.unique(aux_array, return_counts=True)\n", "aux_ordered_index=list(reversed(np.argsort(aux_counts)))\n", "\n", "#Lista de indices de mayor a menor según el total de ocurrencias del primero de cada grupo\n", "aux_array = [0] * len(results)\n", "for index in range(len(results)):\n", " aux_array[index] = results[index][0]\n", "aux_keys_best, aux_counts_best = np.unique(aux_array, return_counts = True)\n", "aux_ordered_best_index=list(reversed(np.argsort(aux_counts_best)))\n", "\n", "def heatmap_get_best(index, ordered_array, keys_array, counts_array, prefer_winner=False):\n", " valid_candidates_indexes = []\n", " prev_counts = -1\n", " for tested_index in ordered_array:\n", " if keys_array[tested_index] in results[index]:\n", " if counts_array[tested_index] >= prev_counts:\n", " prev_counts = counts_array[tested_index]\n", " valid_candidates_indexes.append(tested_index)\n", " else:\n", " break\n", " \n", " if prefer_winner: # Si esta activo, en caso de empate en ocurrencias se selecciona el menor tiempo\n", " for tested_index in results[index]:\n", " if tested_index in valid_candidates_indexes:\n", " return tested_index\n", " return min(valid_candidates_indexes) # En caso de empate se devuelve el que tiene menor valor (Suele ser la config más simple)\n", "\n", "i=0\n", "j=0\n", "used_aux=0\n", "heatmap=np.zeros((len(processes),len(processes))).astype(int)\n", "\n", "if select_first_winner:\n", " for i in range(len(processes)):\n", " for j in range(len(processes)):\n", " if i==j:\n", " heatmap[i][j]=-1\n", " used_aux+=1\n", " else:\n", " results_index = i*len(processes) + j - used_aux\n", " heatmap[i][j] = results[results_index][0]\n", "else:\n", " for i in range(len(processes)):\n", " for j in range(len(processes)):\n", " if i==j:\n", " heatmap[i][j]=-1\n", " used_aux+=1\n", " else:\n", " results_index = i*len(processes) + j - used_aux\n", " index = heatmap_get_best(results_index, aux_ordered_index, aux_keys, aux_counts, prefer_first_winner)\n", " heatmap[i][j]=aux_keys[index]\n", " #index = heatmap_get_best(results_index, aux_ordered_best_index, aux_keys_best, aux_counts_best, prefer_first_winner)\n", " #heatmap[i][j]=aux_keys_best[index]\n", "heatmap[-1][-1]=len(used_config)\n", "print(heatmap)" ] }, { "cell_type": "code", "execution_count": 184, "metadata": {}, "outputs": [], "source": [ "#Adapta results a una cadena asegurando que cada cadena no se sale de su celda\n", "def get_heatmap_multiple_strings(results): #FIXME Deprecated\n", " results_str = []\n", " max_counts = 1\n", " max_per_line = 3\n", " for i in range(len(results)):\n", " results_str.append(list())\n", " count = len(results[i])\n", " results_aux = results[i]\n", " if count > max_counts:\n", " count = max_counts\n", " results_aux = results[i][:count]\n", " \n", " remainder = count%max_per_line\n", " if count <= max_per_line:\n", " aux_str = str(results_aux).replace('[','').replace(']','')\n", " results_str[i].append(aux_str)\n", " else:\n", " if remainder == 0:\n", " index = count//2\n", " else:\n", " index = count - ((remainder-1)*max_per_line + 1)\n", " aux_str = str(results_aux[:index]).replace('[','').replace(']','')\n", " results_str[i].append(aux_str)\n", " aux_str = str(results_aux[index:]).replace('[','').replace(']','')\n", " results_str[i].append(aux_str)\n", " return results_str\n", "\n", "def get_heatmap_strings(heatmap):\n", " results_str = []\n", " for i in range(len(processes)):\n", " for j in range(len(processes)):\n", " if i!=j:\n", " results_str.append(list())\n", " results_str[-1].append(heatmap[i][j])\n", " return results_str" ] }, { "cell_type": "code", "execution_count": 186, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/tmp/ipykernel_2494/1414719895.py:49: UserWarning: FixedFormatter should only be used together with FixedLocator\n", " ax.set_xticklabels(['']+processes, fontsize=36)\n", "/tmp/ipykernel_2494/1414719895.py:50: UserWarning: FixedFormatter should only be used together with FixedLocator\n", " ax.set_yticklabels(['']+processes, fontsize=36)\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Filename: Heatmap_T_Malleability.png\n" ] }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "#Crea un heatmap teniendo en cuenta los colores anteriores\n", "f=plt.figure(figsize=(24, 12))\n", "ax=f.add_subplot(111)\n", "\n", "myColors = (colors.to_rgba(\"white\"), \n", " colors.to_rgba(\"green\"), \n", " colors.to_rgba(\"darkgreen\"), # En lugar de \"darkgreen\"\n", " colors.to_rgba(\"red\"), \n", " colors.to_rgba(\"darkred\"), # En lugar de \"darkred\"\n", " colors.to_rgba(\"mediumseagreen\"), # En lugar de \"mediumseagreen\"\n", " colors.to_rgba(\"seagreen\"), # En lugar de \"seagreen\"\n", " colors.to_rgba(\"palegreen\"), \n", " colors.to_rgba(\"springgreen\"), \n", " colors.to_rgba(\"indianred\"), \n", " colors.to_rgba(\"firebrick\"),\n", " colors.to_rgba(\"darkgoldenrod\"),\n", " colors.to_rgba(\"saddlebrown\"),\n", " colors.to_rgba(\"white\"))\n", "cmap = LinearSegmentedColormap.from_list('Custom', myColors, len(myColors))\n", "\n", "im = ax.imshow(heatmap,cmap=cmap,interpolation='nearest')\n", "\n", "# Loop over data dimensions and create text annotations.\n", "used_aux=0\n", "results_str = get_heatmap_strings(heatmap)\n", "for i in range(len(processes)):\n", " for j in range(len(processes)):\n", " if i!=j:\n", " aux_color=\"white\"\n", " if 0 <= heatmap[i, j] <= 1 or 4 <= heatmap[i, j] <= 7: # El 1 puede necesitar texto en negro\n", " aux_color=\"black\"\n", " results_index = i*len(processes) +j-used_aux\n", " if len(results_str[results_index]) == 1:\n", " text = results_str[results_index][0]\n", " ax.text(j, i, text, ha=\"center\", va=\"center\", color=aux_color, fontsize=36)\n", " else:\n", " add_aux = 0.33\n", " for line in range(len(results_str[results_index])):\n", " i_range = i - 0.5 + add_aux\n", " ax.text(j, i_range, results_str[results_index][line],\n", " ha=\"center\", va=\"center\", color=aux_color, fontsize=36)\n", " add_aux+=0.33\n", " else:\n", " used_aux+=1\n", "\n", "ax.set_ylabel(\"NP\", fontsize=36)\n", "ax.set_xlabel(\"NC\", fontsize=36)\n", "\n", "ax.set_xticklabels(['']+processes, fontsize=36)\n", "ax.set_yticklabels(['']+processes, fontsize=36)\n", "\n", "\n", "labelsMethods_aux = ['Baseline - AllS (0)', 'Baseline - P2PS (1)',\n", " 'Merge - AllS (2)','Merge - P2PS (3)',\n", " 'Baseline - AllA (4)', 'Baseline - AllT (5)','Baseline - P2PA (6)','Baseline - P2PT (7)',\n", " 'Merge - AllA (8)','Merge - AllT (9)','Merge - P2PA (10)','Merge - P2PT (11)']\n", "\n", "colorbar=f.colorbar(im, ax=ax)\n", "tick_bar = []\n", "for i in range(len(used_config)):\n", " tick_bar.append(0.37 + i*0.92) #Config de 12 valores\n", "colorbar.set_ticks(tick_bar) \n", "colorbar.set_ticklabels(labelsMethods_aux)\n", "colorbar.ax.tick_params(labelsize=32)\n", "#\n", "\n", "f.tight_layout()\n", "print(\"Filename: Heatmap_\"+tipo+\".png\")\n", "f.savefig(\"Images/Heatmap_\"+tipo+\".png\", format=\"png\")" ] }, { "cell_type": "code", "execution_count": 43, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[ 1 2 3 4 6 8 10 11]\n", "[ 1 17 20 1 1 22 27 1]\n", "[ 2 3 8 10 11]\n", "[ 5 9 11 16 1]\n" ] } ], "source": [ "aux_array = []\n", "for data in results:\n", " aux_array+=data\n", "aux_results, aux_counts = np.unique(aux_array, return_counts=True)\n", "print(aux_results)\n", "print(aux_counts)\n", "\n", "aux_array = [0] * len(results)\n", "for index in range(len(results)):\n", " aux_array[index] = results[index][0]\n", "aux_results, aux_counts = np.unique(aux_array, return_counts = True)\n", "print(aux_results)\n", "print(aux_counts)\n" ] }, { "cell_type": "raw", "metadata": {}, "source": [ "El siguiente código asume que para cada número de procesos padre/hijo existen valores en todas las configuraciones que se van a probar" ] }, { "cell_type": "code", "execution_count": 157, "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "used_direction='a'\n", "test_parameter='T_total' #Valores son \"alpha\" o \"omega\"\n", "\n", "if test_parameter == 'alpha':\n", " name_fig=\"Alpha_\"\n", " real_parameter='Alpha'\n", " name_legend = \"Values of α\"\n", " used_config = configurations_simple\n", " data_aux = grouped_aggM[grouped_aggM[real_parameter] > 0]\n", "elif test_parameter == 'omega':\n", " name_fig=\"Omega_\"\n", " real_parameter='Omega'\n", " name_legend = \"Values of ω\"\n", " used_config = configurations\n", " data_aux = grouped_aggLAsynch[grouped_aggLAsynch[real_parameter] > 0]\n", "elif test_parameter == 'T_total':\n", " name_fig=\"Ttotal\"\n", " real_parameter='T_total'\n", " name_legend = \"Time(s)\"\n", " used_config = configurations\n", " data_aux = grouped_aggG\n", " #data_aux = data_aux[data_aux.index.isin(df1.index)]\n", " \n", "if used_direction=='s':\n", " data_aux=data_aux.query('NP > NC')\n", " name_fig= name_fig+\"Shrink\"\n", "elif used_direction=='e':\n", " data_aux=data_aux.query('NP < NC')\n", " name_fig= name_fig+\"Expand\"\n", "elif used_direction=='a':\n", " name_fig= name_fig+\"All\" \n", "\n", "plot_data = []\n", "for config in used_config:\n", " if config[0] > 0:\n", " dataLists = get_config_data(real_parameter, data_aux, config)\n", " dataLists = list(filter(lambda x: x != float('infinity'), dataLists))\n", " plot_data.append(dataLists)\n", "\n", "labels_aux = []\n", "for ns_aux in processes:\n", " for np_aux in processes:\n", " if used_direction=='s' and np_aux > ns_aux or used_direction=='e' and np_aux < ns_aux or used_direction=='a' and np_aux != ns_aux:\n", " new_label = \"(\" + str(np_aux) + \",\" + str(ns_aux) + \")\"\n", " labels_aux.append(new_label)\n", "\n", "labelsMethods_aux = ['Baseline - AllA', 'Baseline - AllT','Baseline - P2PA','Baseline - P2PT',\n", " 'Merge - AllA','Merge - AllT','Merge - P2PA','Merge - P2PT']\n", "\n", "f=plt.figure(figsize=(22, 14))\n", "ax=f.add_subplot(111)\n", "x = np.arange(len(labels_aux))\n", "for index in range(len(plot_data)):\n", " array_aux = plot_data[index]\n", " ax.plot(x, array_aux, color=colors_m[index%len(colors_m)], linestyle=linestyle_m[index%len(linestyle_m)], \\\n", " marker=markers_m[index%len(markers_m)], markersize=18, label=labelsMethods_aux[index])\n", "\n", "ax.set_xlabel(\"(NP,NC)\", fontsize=36)\n", "ax.set_ylabel(name_legend, fontsize=36)\n", "plt.xticks(x, labels_aux,rotation=90)\n", "ax.tick_params(axis='both', which='major', labelsize=36)\n", "ax.tick_params(axis='both', which='minor', labelsize=36)\n", "plt.legend(loc='best', fontsize=30,ncol=2,framealpha=0.8)\n", " \n", "f.tight_layout()\n", "f.savefig(\"Images/LinePlot_\"+name_fig+\".png\", format=\"png\")" ] }, { "cell_type": "raw", "metadata": {}, "source}, { "cell_type": "raw", "metadata": {}, "source": [ "Gráfica de lineas para generar tiempos del grupo G." ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "used_direction='e'\n", "test_parameter='T_total' #Valores son \"alpha\" o \"omega\"\n", "\n", "if test_parameter == 'T_total':\n", " name_fig=\"Ttotal\"\n", " real_parameter='T_total'\n", " name_legend = \"Time(s)\"\n", " used_config = configurations\n", " data_aux = grouped_aggG\n", " #data_aux = data_aux[data_aux.index.isin(df1.index)]\n", " \n", "if used_direction=='s':\n", " data_aux_cmp=grouped_aggM.reset_index().query('NP > NC')\n", " name_fig= name_fig+\"Shrink\"\n", "elif used_direction=='e':\n", " data_aux_cmp=grouped_aggM.reset_index().query('NP < NC')\n", " name_fig= name_fig+\"Expand\"\n", "elif used_direction=='a':\n", " name_fig= name_fig+\"All\" \n", "\n", "if used_direction!='a':\n", " pruebaG = data_aux.reset_index()\n", " pruebaG = pruebaG.loc[pruebaG.index.intersection(data_aux_cmp.index)]\n", " data_aux = data_aux[(data_aux.T_total.isin(pruebaG.T_total))]\n", "\n", "plot_data = []\n", "for config in used_config:\n", " if config[0] == 0:\n", " dataLists = get_config_data(real_parameter, data_aux, config)\n", " dataLists = list(filter(lambda x: x != float('infinity'), dataLists))\n", " plot_data.append(dataLists)\n", "\n", "labels_aux = []\n", "for ns_aux in processes:\n", " for np_aux in processes:\n", " if used_direction=='s' and np_aux > ns_aux or used_direction=='e' and np_aux < ns_aux or used_direction=='a' and np_aux != ns_aux:\n", " new_label = \"(\" + str(np_aux) + \",\" + str(ns_aux) + \")\"\n", " labels_aux.append(new_label)\n", "\n", "labelsMethods_aux = ['Baseline - AllA', 'Baseline - AllT','Baseline - P2PA','Baseline - P2PT',\n", " 'Merge - AllA','Merge - AllT','Merge - P2PA','Merge - P2PT']\n", "\n", "f=plt.figure(figsize=(22, 14))\n", "ax=f.add_subplot(111)\n", "x = np.arange(len(labels_aux))\n", "for index in range(len(plot_data)):\n", " array_aux = plot_data[index]\n", " ax.plot(x, array_aux, color=colors_m[index%len(colors_m)], linestyle=linestyle_m[index%len(linestyle_m)], \\\n", " marker=markers_m[index%len(markers_m)], markersize=18, label=labelsMethods_aux[index])\n", "\n", "ax.set_ylim(0,140)\n", "ax.set_xlabel(\"(NP,NC)\", fontsize=36)\n", "ax.set_ylabel(name_legend, fontsize=36)\n", "plt.xticks(x, labels_aux,rotation=90)\n", "ax.tick_params(axis='both', which='major', labelsize=36)\n", "ax.tick_params(axis='both', which='minor', labelsize=36)\n", "plt.legend(loc='best', fontsize=30,ncol=2,framealpha=0.8)\n", " \n", "f.tight_layout()\n", "f.savefig(\"Images/LinePlot_\"+name_fig+\".png\", format=\"png\")" ] }, { "cell_type": "raw", "metadata": {}, "source": [ "El siguiente generá una imagen en 3d de T_total para cada una de las diferentes configuraciones." ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "def generate_3d_image(config, name):\n", " fig, ax = plt.subplots(1, 1, subplot_kw={'projection': '3d'}, figsize=(15, 15))\n", "\n", " Z = [None] * len(processes)\n", " X, Y = np.meshgrid(processes, processes)\n", " for i in range(len(processes)):\n", " np_aux = processes[i]\n", " Z[i] = [0] * len(processes)\n", " Z[i][i] = grouped_aggLSynch.loc[np_aux, 'T_iter'] * 1000\n", " for j in range(len(processes)):\n", " if i!=j:\n", " ns_aux = processes[j]\n", " config.append((np_aux,ns_aux))\n", " aux = grouped_aggG.loc[tuple(config),'T_total']\n", " config.pop()\n", " \n", " Z[i][j] = aux.values[0]\n", " #Z[i][j] = Z[i][j] / Z[i][i]\n", " #Z[i][i] = 1\n", "\n", " Z = np.array(Z)\n", "\n", " ax.plot_surface(X, Y, Z, rstride=1, cstride=1,\n", " cmap='viridis', edgecolor='none')\n", " ax.view_init(15, 25)\n", " ax.set_xlabel(\"NC\", fontsize=16)\n", " ax.set_ylabel(\"NP\", fontsize=16)\n", " ax.set_zlabel(\"Normalized time\", fontsize=16)\n", " ax.set_title(name, fontsize=10)\n", " plt.show()\n", " \n", "for index in range(len(configurations)):\n", " used_config = configurations[index]\n", " generate_3d_image(used_config,str(index))" ] }, { "cell_type": "raw", "metadata": {}, "source": [ "El siguiente código es computar la coherencia de T_malleability respecto a los tiempos internos de maleabilidad (Coherency1)\n", "y por otro lado de T_malleability respecto a iteraciones asíncronas más los pasos síncronos." ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "test=dfM[(dfM.Asynch_Iters > 0)]\n", "\n", "# El primer Coherency tendrá sentido cuando se recoga T_Malleability. Mas seguro con barriers en Malleability\n", "test[\"Resize_Coherency\"] = test[\"T_Malleability\"] >= (test[\"T_spawn\"] + test[\"T_SR\"] + test[\"T_AR\"])\n", "# El segundo Coherency tendrá sentido cuando se recoga T_Malleability. Mas seguro al usar Rigid para iteraciones\n", "test[\"Resize_Coherency2\"] = test[\"T_Malleability\"] >= 0\n", "\n", "for index in range(len(test)):\n", " time_malleability_aux = test[\"T_Malleability\"].values[index]\n", " time_synch_aux = test[\"T_SR\"].values[index]\n", " time_spawn_aux = test[\"T_spawn\"].values[index]\n", " is_asynch_spawn = (test[\"Spawn_Strategy\"].values[index] % 2 == 0)\n", " \n", " total_asynch_iters = int(test[\"Asynch_Iters\"].values[index])\n", " asynch_iters = test[\"T_iter\"].values[index][-total_asynch_iters:]\n", " time_iters_aux = np.sum(asynch_iters[:])\n", " \n", " sum_times = time_synch_aux + is_asynch_spawn * time_spawn_aux + time_iters_aux\n", " \n", " if time_malleability_aux < sum_times:\n", " real_index = test.index.values[index]\n", " test.at[real_index, \"Resize_Coherency2\"] = False\n", "test[(test.Resize_Coherency == False)]" ] }, { "cell_type": "raw", "metadata": {}, "source": [ "El siguiente código es para utilizar Dask. Una versión que paraleliza una serie de tareas de Pandas.\n", "Tras llamar a compute se realizan todas las tareas que se han pedido." ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "import dask.dataframe as dd\n", "ddf = dd.from_pandas(dfL[(dfL.Asynch_Iters == False)], npartitions=10)\n", "group = ddf.groupby('NP')['T_iter']\n", "grouped_aggLSynch = group.agg(['mean'])\n", "grouped_aggLSynch = grouped_aggLSynch.rename(columns={'mean':'T_iter'}) \n", "grouped_aggLSynch = grouped_aggLSynch.compute()" ] }, { "cell_type": "raw", "metadata": {}, "source}, { "cell_type": "code", "execution_count": 114, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[1.75676344 0.03701228 3.76439349]\n", "[0.20630784 0.96375203 0.04733157]\n", "[2.17054203 1.7721764 0.83496214 0.27720765 0.59800783 0.42146685]\n", "[0.19532397 0.24843587 0.47871884 0.76709983 0.5796655 0.67410377]\n" ] } ], "source": [ "a = np.array([[9.87, 9.03, 6.81],\n", " [7.18, 8.35, 7.00],\n", " [8.39, 7.58, 7.68],\n", " [7.45, 6.33, 9.35],\n", " [6.41, 7.10, 9.33],\n", " [8.00, 8.24, 8.44]])\n", "b = np.array([[6.35, 7.30, 7.16],\n", " [6.65, 6.68, 7.63],\n", " [5.72, 7.73, 6.72],\n", " [7.01, 9.19, 7.41],\n", " [7.75, 7.87, 8.30],\n", " [6.90, 7.97, 6.97]])\n", "c = np.array([[3.31, 8.77, 1.01],\n", " [8.25, 3.24, 3.62],\n", " [6.32, 8.81, 5.19],\n", " [7.48, 8.83, 8.91],\n", " [8.59, 6.01, 6.07],\n", " [3.07, 9.72, 7.48]])\n", "my_daa_aux = [a,b,c]\n", "\n", "F1, p_aux = stats.f_oneway(a, b, c)\n", "F2, p_aux2 = stats.f_oneway(*my_daa_aux,axis=0)\n", "\n", "print(F1)\n", "print(p_aux)\n", "print(F2)\n", "print(p_aux2)" ] }, { "cell_type": "code", "execution_count": 174, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
T_total
ADRSpawn_MethodRedistribution_MethodRedistribution_StrategyGroups
0.0(0, 0)(0, 0)(1, 1)(10, 2)396.244297
(20, 2)323.197388
(20, 10)122.029776
(40, 2)363.054878
(40, 10)115.773127
..................
96.6(0, 1)(0, 1)(1, 2)(160, 10)110.560542
(160, 20)91.163625
(160, 40)85.075558
(160, 80)73.307185
(160, 120)69.804638
\n", "

252 rows × 1 columns

\n", "
" ], "text/plain": [ " T_total\n", "ADR Spawn_Method Redistribution_Method Redistribution_Strategy Groups \n", "0.0 (0, 0) (0, 0) (1, 1) (10, 2) 396.244297\n", " (20, 2) 323.197388\n", " (20, 10) 122.029776\n", " (40, 2) 363.054878\n", " (40, 10) 115.773127\n", "... ...\n", "96.6 (0, 1) (0, 1) (1, 2) (160, 10) 110.560542\n", " (160, 20) 91.163625\n", " (160, 40) 85.075558\n", " (160, 80) 73.307185\n", " (160, 120) 69.804638\n", "\n", "[252 rows x 1 columns]" ] }, "execution_count": 174, "metadata": {}, "output_type": "execute_result" } ], "source": [ "pruebaG = grouped_aggG.reset_index()\n", "pruebaM = grouped_aggM.reset_index().query('NP > NC') #Shrink\n", "pruebaG = pruebaG.loc[pruebaG.index.intersection(pruebaM.index)]\n", "prueba2 = grouped_aggG[(grouped_aggG.T_total.isin(pruebaG.T_total))]\n", "prueba2" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7" } }, "nbformat": 4, "nbformat_minor": 4 }