"Codes/runValgrind.sh" did not exist on "c437c2128c7ed133ffb5dce2d96f2110bc567435"
Commit 5eb9cddd authored by Iker Martín
Browse files

Version 2 de aplicación

parent 2663ec23
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"%matplotlib inline\n",
"import pandas as pd\n",
"from pandas import DataFrame, Series\n",
"import numpy as np\n",
"import seaborn as sns\n",
"import matplotlib.pyplot as plt\n",
"from scipy import stats\n",
"import sys"
]
},
{
"cell_type": "code",
"execution_count": 29,
"metadata": {},
"outputs": [],
"source": [
"# Input CSV files read by the loading cells of this notebook.\n",
"matrixMalEX = \"data_GG.csv\"\n",
"matrixMal = \"data_GM.csv\"\n",
"matrixIt = \"data_L.csv\"\n",
"\n",
"# Change according to the number of nodes used.\n",
"n_qty = 2\n",
"# Change the first factor according to the number of executions per configuration.\n",
"repet = 3 * 2\n",
"\n",
"# Threshold the t-test p-values are compared against.\n",
"p_value = 0.05\n",
"# Process counts iterated over as numP and numC in the comparison cells.\n",
"values = [2, 4, 8, 16, 32]\n",
"# Display names indexed by distribution id; the comparison loops use ids 1 and 2.\n",
"dist_names = ['null', 'BestFit', 'WorstFit']"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [],
"source": [
"def speedUp(arr, seq, df):\n",
"    \"\"\"Divide the 'EX' values of seq for arr's process count by the mean of arr.\n",
"\n",
"    The process count is the NP value of the df row labelled by the first\n",
"    index entry of arr; seq is filtered to the rows whose NP equals it.\n",
"    \"\"\"\n",
"    first_label = arr.index[0]\n",
"    procs = df.loc[first_label].NP\n",
"    baseline = seq[seq.NP == procs]['EX']\n",
"    return baseline / arr.mean()"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [],
"source": [
"# Load the CSV named by matrixMalEX and discard its first column.\n",
"dfG = pd.read_csv(matrixMalEX)\n",
"dfG = dfG.drop(columns=dfG.columns[0])\n",
"\n",
"# Keep the original 'N' as 'S', make 'N' the sum S + %Async, and express\n",
"# '%Async' as a percentage of that sum.\n",
"dfG['S'] = dfG['N']\n",
"dfG['N'] = dfG['S'] + dfG['%Async']\n",
"dfG['%Async'] = dfG['%Async'].div(dfG['N']).mul(100)\n",
"\n",
"# 'Dist' is only part of the grouping key when n_qty is not 1.\n",
"group = dfG.groupby(\n",
"    ['%Async', 'Groups'] if n_qty == 1 else ['Dist', '%Async', 'Groups']\n",
")['TE']\n",
"\n",
"# Mean TE per group, with the aggregated column named 'TE'.\n",
"grouped_aggG = group.agg(['mean']).rename(columns={'mean': 'TE'})"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"from natsort import index_natsorted\n",
"\n",
"# Show grouped_aggG with its rows in natural order of the \"Groups\" labels.\n",
"# The key receives the \"Groups\" values and returns, for each row, its rank\n",
"# in natural order (the `key` argument needs pandas >= 1.1).\n",
"# sort_values returns a new frame, so the result is kept under its own name\n",
"# and displayed; grouped_aggG itself is left untouched for the other cells.\n",
"grouped_aggG_sorted = grouped_aggG.sort_values(\n",
"    by=\"Groups\",\n",
"    key=lambda x: np.argsort(index_natsorted(x))\n",
")\n",
"grouped_aggG_sorted"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [],
"source": [
"# Load the CSV named by matrixMal and discard its first column.\n",
"dfM = pd.read_csv( matrixMal )\n",
"dfM = dfM.drop(columns=dfM.columns[0])\n",
"\n",
"# Keep the original 'N' as 'S', make 'N' the sum S + %Async, and express\n",
"# '%Async' as a percentage of that sum. TR is the sum of TC, TS and TA.\n",
"dfM['S'] = dfM['N']\n",
"dfM['N'] = dfM['S'] + dfM['%Async']\n",
"dfM[\"TR\"] = dfM[\"TC\"] + dfM[\"TS\"] + dfM[\"TA\"]\n",
"dfM['%Async'] = (dfM['%Async'] / dfM['N']) * 100\n",
"\n",
"# Columns are selected with a list: indexing a GroupBy with a bare tuple of\n",
"# names is deprecated since pandas 1.0 and rejected by pandas 2.x.\n",
"# 'Dist' is only part of the grouping key when n_qty is not 1.\n",
"if n_qty == 1:\n",
"    groupM = dfM.groupby(['%Async', 'NP', 'NS'])[['TC', 'TS', 'TA', 'TR']]\n",
"else:\n",
"    groupM = dfM.groupby(['Dist', '%Async', 'NP', 'NS'])[['TC', 'TS', 'TA', 'TR']]\n",
"\n",
"# agg(['mean']) produces (column, 'mean') column labels; keep only the column names.\n",
"grouped_aggM = groupM.agg(['mean'])\n",
"grouped_aggM.columns = grouped_aggM.columns.get_level_values(0)"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:16: FutureWarning: set_axis currently defaults to operating inplace.\n",
"This will change in a future version of pandas, use inplace=True to avoid this warning.\n",
" app.launch_new_instance()\n"
]
}
],
"source": [
"# Load the CSV named by matrixIt and discard its first column.\n",
"dfL = pd.read_csv( matrixIt )\n",
"dfL = dfL.drop(columns=dfL.columns[0])\n",
"\n",
"# Keep the original 'N' as 'S', make 'N' the sum S + %Async, and express\n",
"# '%Async' as a percentage of that sum.\n",
"dfL['S'] = dfL['N']\n",
"dfL['N'] = dfL['S'] + dfL['%Async']\n",
"dfL['%Async'] = (dfL['%Async'] / dfL['N']) * 100\n",
"\n",
"# Rows with NS == 0 are excluded before grouping. Columns are selected with\n",
"# a list: indexing a GroupBy with a bare tuple of names is deprecated since\n",
"# pandas 1.0 and rejected by pandas 2.x.\n",
"if n_qty == 1:\n",
"    groupL = dfL[dfL['NS'] != 0].groupby(['Tt', '%Async', 'NP', 'NS'])[['Ti', 'To']]\n",
"else:\n",
"    groupL = dfL[dfL['NS'] != 0].groupby(['Tt', 'Dist', '%Async', 'NP', 'NS'])[['Ti', 'To']]\n",
"\n",
"# The aggregation yields (Ti, mean), (Ti, count), (To, mean), (To, count).\n",
"# The flat names are assigned directly instead of through set_axis, whose\n",
"# default stopped being in-place in pandas 1.0 (the rename would be lost).\n",
"grouped_aggL = groupL.agg(['mean', 'count'])\n",
"grouped_aggL.columns = ['Ti', 'Iters', 'To', 'Iters2']\n",
"\n",
"# Scale the row counts by the configured number of repetitions (repet),\n",
"# rounding up, instead of a hard-coded divisor.\n",
"grouped_aggL['Iters'] = np.ceil(grouped_aggL['Iters'] / repet)\n",
"grouped_aggL['Iters2'] = np.ceil(grouped_aggL['Iters2'] / repet)"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [],
"source": [
"# Write each aggregated table to its own Excel workbook.\n",
"grouped_aggL.to_excel(excel_writer=\"resultL.xlsx\")\n",
"grouped_aggM.to_excel(excel_writer=\"resultM.xlsx\")\n",
"grouped_aggG.to_excel(excel_writer=\"resultG.xlsx\")"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>N</th>\n",
" <th>%Async</th>\n",
" <th>Groups</th>\n",
" <th>Dist</th>\n",
" <th>Matrix</th>\n",
" <th>Time</th>\n",
" <th>Iters</th>\n",
" <th>TE</th>\n",
" <th>S</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <td>0</td>\n",
" <td>1000000000</td>\n",
" <td>0.0</td>\n",
" <td>8,32</td>\n",
" <td>2,2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>31.525710</td>\n",
" <td>1000000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>1</td>\n",
" <td>1000000000</td>\n",
" <td>0.0</td>\n",
" <td>8,32</td>\n",
" <td>2,2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>33.315857</td>\n",
" <td>1000000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>2</td>\n",
" <td>1000000000</td>\n",
" <td>0.0</td>\n",
" <td>8,32</td>\n",
" <td>2,2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>33.347537</td>\n",
" <td>1000000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>3</td>\n",
" <td>1000000000</td>\n",
" <td>75.0</td>\n",
" <td>4,32</td>\n",
" <td>1,1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>57.219027</td>\n",
" <td>250000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>4</td>\n",
" <td>1000000000</td>\n",
" <td>75.0</td>\n",
" <td>4,32</td>\n",
" <td>1,1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>55.469166</td>\n",
" <td>250000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <td>595</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>4,8</td>\n",
" <td>2,2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>73.771357</td>\n",
" <td>500000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>596</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>4,8</td>\n",
" <td>2,2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>75.557508</td>\n",
" <td>500000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>597</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>16,8</td>\n",
" <td>1,1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>35.949913</td>\n",
" <td>500000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>598</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>16,8</td>\n",
" <td>1,1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>37.900348</td>\n",
" <td>500000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>599</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>16,8</td>\n",
" <td>1,1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>36.012772</td>\n",
" <td>500000000</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>600 rows × 9 columns</p>\n",
"</div>"
],
"text/plain": [
" N %Async Groups Dist Matrix Time Iters TE \\\n",
"0 1000000000 0.0 8,32 2,2 100000 0.1 1000 31.525710 \n",
"1 1000000000 0.0 8,32 2,2 100000 0.1 1000 33.315857 \n",
"2 1000000000 0.0 8,32 2,2 100000 0.1 1000 33.347537 \n",
"3 1000000000 75.0 4,32 1,1 100000 0.1 1000 57.219027 \n",
"4 1000000000 75.0 4,32 1,1 100000 0.1 1000 55.469166 \n",
".. ... ... ... ... ... ... ... ... \n",
"595 1000000000 50.0 4,8 2,2 100000 0.1 1000 73.771357 \n",
"596 1000000000 50.0 4,8 2,2 100000 0.1 1000 75.557508 \n",
"597 1000000000 50.0 16,8 1,1 100000 0.1 1000 35.949913 \n",
"598 1000000000 50.0 16,8 1,1 100000 0.1 1000 37.900348 \n",
"599 1000000000 50.0 16,8 1,1 100000 0.1 1000 36.012772 \n",
"\n",
" S \n",
"0 1000000000 \n",
"1 1000000000 \n",
"2 1000000000 \n",
"3 250000000 \n",
"4 250000000 \n",
".. ... \n",
"595 500000000 \n",
"596 500000000 \n",
"597 500000000 \n",
"598 500000000 \n",
"599 500000000 \n",
"\n",
"[600 rows x 9 columns]"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"dfG"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th>TE</th>\n",
" </tr>\n",
" <tr>\n",
" <th>Dist</th>\n",
" <th>%Async</th>\n",
" <th>Groups</th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <td rowspan=\"5\" valign=\"top\">1,1</td>\n",
" <td rowspan=\"5\" valign=\"top\">0.0</td>\n",
" <td>16,2</td>\n",
" <td>112.087769</td>\n",
" </tr>\n",
" <tr>\n",
" <td>16,32</td>\n",
" <td>18.394706</td>\n",
" </tr>\n",
" <tr>\n",
" <td>16,4</td>\n",
" <td>61.887052</td>\n",
" </tr>\n",
" <tr>\n",
" <td>16,8</td>\n",
" <td>37.986463</td>\n",
" </tr>\n",
" <tr>\n",
" <td>2,16</td>\n",
" <td>113.187865</td>\n",
" </tr>\n",
" <tr>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <td rowspan=\"5\" valign=\"top\">2,2</td>\n",
" <td rowspan=\"5\" valign=\"top\">100.0</td>\n",
" <td>4,8</td>\n",
" <td>74.864688</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8,16</td>\n",
" <td>37.999586</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8,2</td>\n",
" <td>123.584176</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8,32</td>\n",
" <td>31.730297</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8,4</td>\n",
" <td>74.052463</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>200 rows × 1 columns</p>\n",
"</div>"
],
"text/plain": [
" TE\n",
"Dist %Async Groups \n",
"1,1 0.0 16,2 112.087769\n",
" 16,32 18.394706\n",
" 16,4 61.887052\n",
" 16,8 37.986463\n",
" 2,16 113.187865\n",
"... ...\n",
"2,2 100.0 4,8 74.864688\n",
" 8,16 37.999586\n",
" 8,2 123.584176\n",
" 8,32 31.730297\n",
" 8,4 74.052463\n",
"\n",
"[200 rows x 1 columns]"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"grouped_aggG"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>N</th>\n",
" <th>%Async</th>\n",
" <th>NP</th>\n",
" <th>NS</th>\n",
" <th>Dist</th>\n",
" <th>Matrix</th>\n",
" <th>Time</th>\n",
" <th>Iters</th>\n",
" <th>TC</th>\n",
" <th>TS</th>\n",
" <th>TA</th>\n",
" <th>S</th>\n",
" <th>TR</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <td>0</td>\n",
" <td>1000000000</td>\n",
" <td>0.0</td>\n",
" <td>8</td>\n",
" <td>32</td>\n",
" <td>2,2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>1.341434</td>\n",
" <td>0.695848</td>\n",
" <td>0.000000</td>\n",
" <td>1000000000</td>\n",
" <td>2.037282</td>\n",
" </tr>\n",
" <tr>\n",
" <td>1</td>\n",
" <td>1000000000</td>\n",
" <td>0.0</td>\n",
" <td>8</td>\n",
" <td>32</td>\n",
" <td>2,2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>1.405911</td>\n",
" <td>0.639849</td>\n",
" <td>0.000000</td>\n",
" <td>1000000000</td>\n",
" <td>2.045760</td>\n",
" </tr>\n",
" <tr>\n",
" <td>2</td>\n",
" <td>1000000000</td>\n",
" <td>0.0</td>\n",
" <td>8</td>\n",
" <td>32</td>\n",
" <td>2,2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>1.346017</td>\n",
" <td>0.747863</td>\n",
" <td>0.000000</td>\n",
" <td>1000000000</td>\n",
" <td>2.093880</td>\n",
" </tr>\n",
" <tr>\n",
" <td>3</td>\n",
" <td>1000000000</td>\n",
" <td>75.0</td>\n",
" <td>4</td>\n",
" <td>32</td>\n",
" <td>1,1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.688062</td>\n",
" <td>0.064900</td>\n",
" <td>0.364941</td>\n",
" <td>250000000</td>\n",
" <td>1.117903</td>\n",
" </tr>\n",
" <tr>\n",
" <td>4</td>\n",
" <td>1000000000</td>\n",
" <td>75.0</td>\n",
" <td>4</td>\n",
" <td>32</td>\n",
" <td>1,1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.702200</td>\n",
" <td>0.068039</td>\n",
" <td>0.412072</td>\n",
" <td>250000000</td>\n",
" <td>1.182311</td>\n",
" </tr>\n",
" <tr>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <td>595</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>2,2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.390444</td>\n",
" <td>0.142287</td>\n",
" <td>0.338576</td>\n",
" <td>500000000</td>\n",
" <td>0.871307</td>\n",
" </tr>\n",
" <tr>\n",
" <td>596</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>2,2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.351690</td>\n",
" <td>0.154699</td>\n",
" <td>0.354917</td>\n",
" <td>500000000</td>\n",
" <td>0.861306</td>\n",
" </tr>\n",
" <tr>\n",
" <td>597</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>16</td>\n",
" <td>8</td>\n",
" <td>1,1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.337472</td>\n",
" <td>0.081077</td>\n",
" <td>0.243481</td>\n",
" <td>500000000</td>\n",
" <td>0.662030</td>\n",
" </tr>\n",
" <tr>\n",
" <td>598</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>16</td>\n",
" <td>8</td>\n",
" <td>1,1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.351262</td>\n",
" <td>0.103176</td>\n",
" <td>0.261565</td>\n",
" <td>500000000</td>\n",
" <td>0.716003</td>\n",
" </tr>\n",
" <tr>\n",
" <td>599</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>16</td>\n",
" <td>8</td>\n",
" <td>1,1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.349151</td>\n",
" <td>0.094121</td>\n",
" <td>0.221750</td>\n",
" <td>500000000</td>\n",
" <td>0.665022</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>600 rows × 13 columns</p>\n",
"</div>"
],
"text/plain": [
" N %Async NP NS Dist Matrix Time Iters TC TS \\\n",
"0 1000000000 0.0 8 32 2,2 100000 0.1 1000 1.341434 0.695848 \n",
"1 1000000000 0.0 8 32 2,2 100000 0.1 1000 1.405911 0.639849 \n",
"2 1000000000 0.0 8 32 2,2 100000 0.1 1000 1.346017 0.747863 \n",
"3 1000000000 75.0 4 32 1,1 100000 0.1 1000 0.688062 0.064900 \n",
"4 1000000000 75.0 4 32 1,1 100000 0.1 1000 0.702200 0.068039 \n",
".. ... ... .. .. ... ... ... ... ... ... \n",
"595 1000000000 50.0 4 8 2,2 100000 0.1 1000 0.390444 0.142287 \n",
"596 1000000000 50.0 4 8 2,2 100000 0.1 1000 0.351690 0.154699 \n",
"597 1000000000 50.0 16 8 1,1 100000 0.1 1000 0.337472 0.081077 \n",
"598 1000000000 50.0 16 8 1,1 100000 0.1 1000 0.351262 0.103176 \n",
"599 1000000000 50.0 16 8 1,1 100000 0.1 1000 0.349151 0.094121 \n",
"\n",
" TA S TR \n",
"0 0.000000 1000000000 2.037282 \n",
"1 0.000000 1000000000 2.045760 \n",
"2 0.000000 1000000000 2.093880 \n",
"3 0.364941 250000000 1.117903 \n",
"4 0.412072 250000000 1.182311 \n",
".. ... ... ... \n",
"595 0.338576 500000000 0.871307 \n",
"596 0.354917 500000000 0.861306 \n",
"597 0.243481 500000000 0.662030 \n",
"598 0.261565 500000000 0.716003 \n",
"599 0.221750 500000000 0.665022 \n",
"\n",
"[600 rows x 13 columns]"
]
},
"execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"dfM"
]
},
{
"cell_type": "code",
"execution_count": 11,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th>TC</th>\n",
" <th>TS</th>\n",
" <th>TA</th>\n",
" <th>TR</th>\n",
" </tr>\n",
" <tr>\n",
" <th>Dist</th>\n",
" <th>%Async</th>\n",
" <th>NP</th>\n",
" <th>NS</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <td rowspan=\"5\" valign=\"top\">1,1</td>\n",
" <td rowspan=\"5\" valign=\"top\">0.0</td>\n",
" <td rowspan=\"4\" valign=\"top\">2</td>\n",
" <td>4</td>\n",
" <td>0.220380</td>\n",
" <td>0.314893</td>\n",
" <td>0.000000</td>\n",
" <td>0.535273</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8</td>\n",
" <td>0.248143</td>\n",
" <td>0.375003</td>\n",
" <td>0.000000</td>\n",
" <td>0.623146</td>\n",
" </tr>\n",
" <tr>\n",
" <td>16</td>\n",
" <td>0.339042</td>\n",
" <td>0.486650</td>\n",
" <td>0.000000</td>\n",
" <td>0.825692</td>\n",
" </tr>\n",
" <tr>\n",
" <td>32</td>\n",
" <td>0.743840</td>\n",
" <td>0.506385</td>\n",
" <td>0.000000</td>\n",
" <td>1.250225</td>\n",
" </tr>\n",
" <tr>\n",
" <td>4</td>\n",
" <td>2</td>\n",
" <td>0.197858</td>\n",
" <td>0.311136</td>\n",
" <td>0.000000</td>\n",
" <td>0.508994</td>\n",
" </tr>\n",
" <tr>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <td rowspan=\"5\" valign=\"top\">2,2</td>\n",
" <td rowspan=\"5\" valign=\"top\">100.0</td>\n",
" <td>16</td>\n",
" <td>32</td>\n",
" <td>1.358891</td>\n",
" <td>0.000000</td>\n",
" <td>1.419016</td>\n",
" <td>2.777907</td>\n",
" </tr>\n",
" <tr>\n",
" <td rowspan=\"4\" valign=\"top\">32</td>\n",
" <td>2</td>\n",
" <td>0.591882</td>\n",
" <td>0.000000</td>\n",
" <td>2.477300</td>\n",
" <td>3.069183</td>\n",
" </tr>\n",
" <tr>\n",
" <td>4</td>\n",
" <td>0.804965</td>\n",
" <td>0.000000</td>\n",
" <td>1.729638</td>\n",
" <td>2.534603</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8</td>\n",
" <td>0.935128</td>\n",
" <td>0.000000</td>\n",
" <td>1.520682</td>\n",
" <td>2.455810</td>\n",
" </tr>\n",
" <tr>\n",
" <td>16</td>\n",
" <td>1.221248</td>\n",
" <td>0.000000</td>\n",
" <td>1.541904</td>\n",
" <td>2.763152</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>200 rows × 4 columns</p>\n",
"</div>"
],
"text/plain": [
" TC TS TA TR\n",
"Dist %Async NP NS \n",
"1,1 0.0 2 4 0.220380 0.314893 0.000000 0.535273\n",
" 8 0.248143 0.375003 0.000000 0.623146\n",
" 16 0.339042 0.486650 0.000000 0.825692\n",
" 32 0.743840 0.506385 0.000000 1.250225\n",
" 4 2 0.197858 0.311136 0.000000 0.508994\n",
"... ... ... ... ...\n",
"2,2 100.0 16 32 1.358891 0.000000 1.419016 2.777907\n",
" 32 2 0.591882 0.000000 2.477300 3.069183\n",
" 4 0.804965 0.000000 1.729638 2.534603\n",
" 8 0.935128 0.000000 1.520682 2.455810\n",
" 16 1.221248 0.000000 1.541904 2.763152\n",
"\n",
"[200 rows x 4 columns]"
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"grouped_aggM"
]
},
{
"cell_type": "code",
"execution_count": 12,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>N</th>\n",
" <th>%Async</th>\n",
" <th>NP</th>\n",
" <th>N_par</th>\n",
" <th>NS</th>\n",
" <th>Dist</th>\n",
" <th>Matrix</th>\n",
" <th>Time</th>\n",
" <th>Iters</th>\n",
" <th>Ti</th>\n",
" <th>Tt</th>\n",
" <th>To</th>\n",
" <th>S</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <td>0</td>\n",
" <td>1000000000</td>\n",
" <td>0.0</td>\n",
" <td>32</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.005463</td>\n",
" <td>0.0</td>\n",
" <td>6.0</td>\n",
" <td>1000000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>1</td>\n",
" <td>1000000000</td>\n",
" <td>0.0</td>\n",
" <td>32</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.005350</td>\n",
" <td>0.0</td>\n",
" <td>6.0</td>\n",
" <td>1000000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>2</td>\n",
" <td>1000000000</td>\n",
" <td>0.0</td>\n",
" <td>32</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.005355</td>\n",
" <td>0.0</td>\n",
" <td>6.0</td>\n",
" <td>1000000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>3</td>\n",
" <td>1000000000</td>\n",
" <td>0.0</td>\n",
" <td>32</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.005354</td>\n",
" <td>0.0</td>\n",
" <td>6.0</td>\n",
" <td>1000000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>4</td>\n",
" <td>1000000000</td>\n",
" <td>0.0</td>\n",
" <td>32</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.005352</td>\n",
" <td>0.0</td>\n",
" <td>6.0</td>\n",
" <td>1000000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <td>1199995</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>8</td>\n",
" <td>16</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.024075</td>\n",
" <td>0.0</td>\n",
" <td>27.0</td>\n",
" <td>500000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>1199996</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>8</td>\n",
" <td>16</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.024076</td>\n",
" <td>0.0</td>\n",
" <td>27.0</td>\n",
" <td>500000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>1199997</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>8</td>\n",
" <td>16</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.024076</td>\n",
" <td>0.0</td>\n",
" <td>27.0</td>\n",
" <td>500000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>1199998</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>8</td>\n",
" <td>16</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.024411</td>\n",
" <td>0.0</td>\n",
" <td>27.0</td>\n",
" <td>500000000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>1199999</td>\n",
" <td>1000000000</td>\n",
" <td>50.0</td>\n",
" <td>8</td>\n",
" <td>16</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>100000</td>\n",
" <td>0.1</td>\n",
" <td>1000</td>\n",
" <td>0.024075</td>\n",
" <td>0.0</td>\n",
" <td>27.0</td>\n",
" <td>500000000</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>1200000 rows × 13 columns</p>\n",
"</div>"
],
"text/plain": [
" N %Async NP N_par NS Dist Matrix Time Iters \\\n",
"0 1000000000 0.0 32 8 0 2 100000 0.1 1000 \n",
"1 1000000000 0.0 32 8 0 2 100000 0.1 1000 \n",
"2 1000000000 0.0 32 8 0 2 100000 0.1 1000 \n",
"3 1000000000 0.0 32 8 0 2 100000 0.1 1000 \n",
"4 1000000000 0.0 32 8 0 2 100000 0.1 1000 \n",
"... ... ... .. ... .. ... ... ... ... \n",
"1199995 1000000000 50.0 8 16 0 1 100000 0.1 1000 \n",
"1199996 1000000000 50.0 8 16 0 1 100000 0.1 1000 \n",
"1199997 1000000000 50.0 8 16 0 1 100000 0.1 1000 \n",
"1199998 1000000000 50.0 8 16 0 1 100000 0.1 1000 \n",
"1199999 1000000000 50.0 8 16 0 1 100000 0.1 1000 \n",
"\n",
" Ti Tt To S \n",
"0 0.005463 0.0 6.0 1000000000 \n",
"1 0.005350 0.0 6.0 1000000000 \n",
"2 0.005355 0.0 6.0 1000000000 \n",
"3 0.005354 0.0 6.0 1000000000 \n",
"4 0.005352 0.0 6.0 1000000000 \n",
"... ... ... ... ... \n",
"1199995 0.024075 0.0 27.0 500000000 \n",
"1199996 0.024076 0.0 27.0 500000000 \n",
"1199997 0.024076 0.0 27.0 500000000 \n",
"1199998 0.024411 0.0 27.0 500000000 \n",
"1199999 0.024075 0.0 27.0 500000000 \n",
"\n",
"[1200000 rows x 13 columns]"
]
},
"execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"dfL"
]
},
{
"cell_type": "code",
"execution_count": 13,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th>Ti</th>\n",
" <th>Iters</th>\n",
" <th>To</th>\n",
" <th>Iters2</th>\n",
" </tr>\n",
" <tr>\n",
" <th>Tt</th>\n",
" <th>Dist</th>\n",
" <th>%Async</th>\n",
" <th>NP</th>\n",
" <th>NS</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <td rowspan=\"5\" valign=\"top\">0.0</td>\n",
" <td rowspan=\"5\" valign=\"top\">1</td>\n",
" <td rowspan=\"5\" valign=\"top\">0.0</td>\n",
" <td rowspan=\"4\" valign=\"top\">2</td>\n",
" <td>4</td>\n",
" <td>0.099861</td>\n",
" <td>500.0</td>\n",
" <td>112.000000</td>\n",
" <td>500.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8</td>\n",
" <td>0.099849</td>\n",
" <td>500.0</td>\n",
" <td>112.000000</td>\n",
" <td>500.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>16</td>\n",
" <td>0.099860</td>\n",
" <td>500.0</td>\n",
" <td>112.000000</td>\n",
" <td>500.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>32</td>\n",
" <td>0.099853</td>\n",
" <td>500.0</td>\n",
" <td>112.000000</td>\n",
" <td>500.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>4</td>\n",
" <td>2</td>\n",
" <td>0.049642</td>\n",
" <td>500.0</td>\n",
" <td>55.666667</td>\n",
" <td>500.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <td rowspan=\"5\" valign=\"top\">1.0</td>\n",
" <td rowspan=\"5\" valign=\"top\">2</td>\n",
" <td rowspan=\"5\" valign=\"top\">100.0</td>\n",
" <td>16</td>\n",
" <td>32</td>\n",
" <td>0.034899</td>\n",
" <td>21.0</td>\n",
" <td>14.000000</td>\n",
" <td>21.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td rowspan=\"4\" valign=\"top\">32</td>\n",
" <td>2</td>\n",
" <td>0.012084</td>\n",
" <td>101.0</td>\n",
" <td>7.000000</td>\n",
" <td>101.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>4</td>\n",
" <td>0.015599</td>\n",
" <td>54.0</td>\n",
" <td>7.000000</td>\n",
" <td>54.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8</td>\n",
" <td>0.012685</td>\n",
" <td>54.0</td>\n",
" <td>7.000000</td>\n",
" <td>54.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>16</td>\n",
" <td>0.015421</td>\n",
" <td>44.0</td>\n",
" <td>7.000000</td>\n",
" <td>44.0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>360 rows × 4 columns</p>\n",
"</div>"
],
"text/plain": [
" Ti Iters To Iters2\n",
"Tt Dist %Async NP NS \n",
"0.0 1 0.0 2 4 0.099861 500.0 112.000000 500.0\n",
" 8 0.099849 500.0 112.000000 500.0\n",
" 16 0.099860 500.0 112.000000 500.0\n",
" 32 0.099853 500.0 112.000000 500.0\n",
" 4 2 0.049642 500.0 55.666667 500.0\n",
"... ... ... ... ...\n",
"1.0 2 100.0 16 32 0.034899 21.0 14.000000 21.0\n",
" 32 2 0.012084 101.0 7.000000 101.0\n",
" 4 0.015599 54.0 7.000000 54.0\n",
" 8 0.012685 54.0 7.000000 54.0\n",
" 16 0.015421 44.0 7.000000 44.0\n",
"\n",
"[360 rows x 4 columns]"
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"grouped_aggL"
]
},
{
"cell_type": "code",
"execution_count": 26,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"TIEMPO EJECUCCION\n",
"Distribución BestFit -------------------------\n",
"Para 2 padres\n",
"EX numC= 4 p = 0.039 Diff = 0.09 Asíncrono\n",
"Para 4 padres\n",
"Para 8 padres\n",
"EX numC= 4 p = 0.0 Diff = 1.411 Síncrono\n",
"Para 16 padres\n",
"EX numC= 2 p = 0.014 Diff = 3.662 Asíncrono\n",
"Para 32 padres\n",
"EX numC= 4 p = 0.002 Diff = 4.589 Asíncrono\n",
"Distribución WorstFit -------------------------\n",
"Para 2 padres\n",
"Para 4 padres\n",
"EX numC= 16 p = 0.046 Diff = 0.304 Síncrono\n",
"EX numC= 32 p = 0.012 Diff = 0.542 Síncrono\n",
"Para 8 padres\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:10: UserWarning: Boolean Series key will be reindexed to match DataFrame index.\n",
" # Remove the CWD from sys.path while we load stuff.\n",
"/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:11: UserWarning: Boolean Series key will be reindexed to match DataFrame index.\n",
" # This is added back by InteractiveShellApp.init_path()\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"Para 16 padres\n",
"EX numC= 2 p = 0.023 Diff = 6.349 Asíncrono\n",
"EX numC= 4 p = 0.0 Diff = 1.799 Asíncrono\n",
"EX numC= 8 p = 0.046 Diff = 0.261 Asíncrono\n",
"Para 32 padres\n",
"EX numC= 2 p = 0.01 Diff = 18.514 Asíncrono\n",
"EX numC= 4 p = 0.0 Diff = 4.454 Asíncrono\n",
"EX numC= 8 p = 0.003 Diff = 1.92 Asíncrono\n"
]
}
],
"source": [
"# For each distribution and each (numP, numC) pair with numP != numC, run a\n",
"# two-sample t-test between the TE samples at %Async == 0 and %Async == 100.\n",
"# Pairs whose p-value is below p_value are printed with the absolute\n",
"# difference of the aggregated TE means and a label telling which of the two\n",
"# means was lower.\n",
"print(\"TIEMPO EJECUCCION\")\n",
"for dist in [1,2]:\n",
"    print(\"Distribución \" + dist_names[dist] + \" -------------------------\")\n",
"    dist_v = str(dist)+\",\"+str(dist)\n",
"    for numP in values:\n",
"        print(\"Para \", numP, \" padres\")\n",
"        for numC in values:\n",
"            if numP != numC:\n",
"                group = str(numP) + \",\" + str(numC)\n",
"                # One combined mask per sample: chaining dfG[m1][m2][m3] makes pandas\n",
"                # reindex each full-length mask and emit a UserWarning.\n",
"                v1 = dfG.loc[(dfG[\"%Async\"] == 0.0) & (dfG.Groups == group) & (dfG[\"Dist\"] == dist_v), 'TE']\n",
"                v2 = dfG.loc[(dfG[\"%Async\"] == 100.0) & (dfG.Groups == group) & (dfG[\"Dist\"] == dist_v), 'TE']\n",
"                res = stats.ttest_ind(v1, v2)\n",
"                # Mean at %Async == 0 minus mean at %Async == 100.\n",
"                diff = grouped_aggG['TE'].loc[(dist_v, 0.0, group)] - grouped_aggG['TE'].loc[(dist_v, 100.0, group)]\n",
"                if diff > 0:\n",
"                    mejor = \"Asíncrono\"\n",
"                else:\n",
"                    mejor = \"Síncrono\"\n",
"\n",
"                if res[1] < p_value:\n",
"                    print(\"EX numC=\", numC, \"p =\", round(res[1],3), \"Diff =\", abs(round(diff,3)), mejor)"
]
},
{
"cell_type": "code",
"execution_count": 19,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"TIEMPO MALLEABILITY\n",
"Distribución 1 -------------------------\n",
"Para 2 padres\n",
"TR numC= 8 p = 0.0 Diff = 0.029 Síncrono\n",
"Para 4 padres\n",
"TR numC= 8 p = 0.006 Diff = 0.043 Síncrono\n",
"TR numC= 32 p = 0.025 Diff = 0.052 Síncrono\n",
"Para 8 padres\n",
"TR numC= 4 p = 0.016 Diff = 0.022 Asíncrono\n",
"TR numC= 16 p = 0.009 Diff = 0.031 Síncrono\n",
"TR numC= 32 p = 0.0 Diff = 0.483 Síncrono\n",
"Para 16 padres\n",
"TR numC= 8 p = 0.002 Diff = 0.072 Síncrono\n",
"TR numC= 32 p = 0.019 Diff = 0.549 Síncrono\n",
"Para 32 padres\n",
"TR numC= 4 p = 0.002 Diff = 0.981 Síncrono\n",
"TR numC= 8 p = 0.001 Diff = 0.972 Síncrono\n",
"TR numC= 16 p = 0.001 Diff = 0.831 Síncrono\n",
"Distribución 2 -------------------------\n",
"Para 2 padres\n",
"TR numC= 4 p = 0.0 Diff = 0.069 Síncrono\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:9: UserWarning: Boolean Series key will be reindexed to match DataFrame index.\n",
" if __name__ == '__main__':\n",
"/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:10: UserWarning: Boolean Series key will be reindexed to match DataFrame index.\n",
" # Remove the CWD from sys.path while we load stuff.\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"TR numC= 8 p = 0.029 Diff = 0.035 Síncrono\n",
"Para 4 padres\n",
"TR numC= 8 p = 0.02 Diff = 0.031 Síncrono\n",
"TR numC= 32 p = 0.009 Diff = 0.601 Síncrono\n",
"Para 8 padres\n",
"TR numC= 16 p = 0.011 Diff = 0.729 Síncrono\n",
"TR numC= 32 p = 0.018 Diff = 0.423 Síncrono\n",
"Para 16 padres\n",
"TR numC= 4 p = 0.001 Diff = 0.884 Síncrono\n",
"TR numC= 32 p = 0.021 Diff = 0.36 Síncrono\n",
"Para 32 padres\n",
"TR numC= 2 p = 0.029 Diff = 1.548 Síncrono\n",
"TR numC= 4 p = 0.008 Diff = 0.84 Síncrono\n",
"TR numC= 8 p = 0.011 Diff = 0.726 Síncrono\n",
"TR numC= 16 p = 0.004 Diff = 0.606 Síncrono\n"
]
}
],
"source": [
"print(\"TIEMPO MALLEABILITY\")\n",
"for dist in [1,2]:\n",
" print(\"Distribución \" + dist_names[dist] + \" -------------------------\")\n",
" dist_v = str(dist)+\",\"+str(dist)\n",
" for numP in values:\n",
" print(\"Para \", numP, \" padres\")\n",
" for numC in values:\n",
" if numP != numC:\n",
" v1 = dfM[(dfM[\"%Async\"] == 0.0)][(dfM.NP == numP)][(dfM.NS == numC)][(dfM[\"Dist\"] == dist_v)]['TS']\n",
" v2 = dfM[(dfM[\"%Async\"] == 100.0)][(dfM.NP == numP)][(dfM.NS == numC)][(dfM[\"Dist\"] == dist_v)]['TA']\n",
" res = stats.ttest_ind(v1, v2)\n",
" diff = grouped_aggM['TS'].loc[(dist_v, 0.0, numP, numC)] - grouped_aggM['TA'].loc[(dist_v, 100.0, numP, numC)]\n",
" if diff > 0:\n",
" mejor = \"Asíncrono\"\n",
" else:\n",
" mejor = \"Síncrono\"\n",
" if res[1] < p_value:\n",
" print(\"TR numC=\", numC, \"p =\", round(res[1],3), \"Diff =\", abs(round(diff,3)), mejor)"
]
},
{
"cell_type": "code",
"execution_count": 28,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"TIEMPO Iters\n",
"Distribución BestFit -------------------------\n",
"Para 2 padres\n",
"Ti numC= 4 p = 0.035 Diff = 0.0001 Síncrono\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:12: UserWarning: Boolean Series key will be reindexed to match DataFrame index.\n",
" if sys.path[0] == '':\n",
"/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:13: UserWarning: Boolean Series key will be reindexed to match DataFrame index.\n",
" del sys.path[0]\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"Ti numC= 8 p = 0.025 Diff = 0.0001 Síncrono\n",
"Ti numC= 16 p = 0.002 Diff = 0.0001 Síncrono\n",
"Ti numC= 32 p = 0.007 Diff = 0.0001 Síncrono\n",
"Para 4 padres\n",
"Ti numC= 16 p = 0.0 Diff = 0.0006 Síncrono\n",
"Para 8 padres\n",
"Ti numC= 4 p = 0.0 Diff = 0.0009 Síncrono\n",
"Ti numC= 32 p = 0.007 Diff = 0.0029 Síncrono\n",
"Para 16 padres\n",
"Ti numC= 32 p = 0.0 Diff = 0.0097 Síncrono\n",
"Para 32 padres\n",
"Ti numC= 2 p = 0.0 Diff = 0.0029 Síncrono\n",
"Ti numC= 4 p = 0.0 Diff = 0.0056 Síncrono\n",
"Ti numC= 8 p = 0.0 Diff = 0.0055 Síncrono\n",
"Ti numC= 16 p = 0.0 Diff = 0.0053 Síncrono\n",
"Distribución WorstFit -------------------------\n",
"Para 2 padres\n",
"Ti numC= 32 p = 0.024 Diff = 0.0256 Síncrono\n",
"Para 4 padres\n",
"Ti numC= 16 p = 0.0 Diff = 0.0243 Síncrono\n",
"Ti numC= 32 p = 0.0 Diff = 0.0343 Síncrono\n",
"Para 8 padres\n",
"Ti numC= 4 p = 0.036 Diff = 0.0044 Síncrono\n",
"Ti numC= 16 p = 0.0 Diff = 0.008 Síncrono\n",
"Ti numC= 32 p = 0.0 Diff = 0.0225 Síncrono\n",
"Para 16 padres\n",
"Ti numC= 2 p = 0.0 Diff = 0.0067 Síncrono\n",
"Ti numC= 4 p = 0.0 Diff = 0.0092 Síncrono\n",
"Ti numC= 8 p = 0.0 Diff = 0.0098 Síncrono\n",
"Ti numC= 32 p = 0.0 Diff = 0.0224 Síncrono\n",
"Para 32 padres\n",
"Ti numC= 2 p = 0.0 Diff = 0.0058 Síncrono\n",
"Ti numC= 4 p = 0.0 Diff = 0.0094 Síncrono\n",
"Ti numC= 8 p = 0.0 Diff = 0.0064 Síncrono\n",
"Ti numC= 16 p = 0.0 Diff = 0.0092 Síncrono\n"
]
}
],
"source": [
"print(\"TIEMPO Iters\")\n",
"for dist in [1,2]:\n",
" print(\"Distribución \" + dist_names[dist] + \" -------------------------\")\n",
" dist_v = str(dist)+\",\"+str(dist)\n",
" for numP in values:\n",
" print(\"Para \", numP, \" padres\")\n",
" for numC in values:\n",
" if numP != numC:\n",
" #exp = dfL[(dfL[\"Tt\"] == 0)][(dfL[\"Dist\"] == 1)][(dfL[\"%Async\"] == 0.0)][(dfL.NP == numP)][(dfL.NS == numC)]\n",
" #TimeOp = exp['Ti'] \n",
" #print(TimeOp)\n",
" v1 = dfL[(dfL[\"Tt\"] == 0)][(dfL[\"Dist\"] == dist)][(dfL[\"%Async\"] == 100.0)][(dfL.NP == numP)][(dfL.NS == numC)]['Ti']\n",
" v2 = dfL[(dfL[\"Tt\"] == 1)][(dfL[\"Dist\"] == dist)][(dfL[\"%Async\"] == 100.0)][(dfL.NP == numP)][(dfL.NS == numC)]['Ti']\n",
" res = stats.ttest_ind(v1, v2, equal_var = False)\n",
" diff = grouped_aggL['Ti'].loc[(0, dist, 0.0, numP, numC)] - grouped_aggL['Ti'].loc[(1, dist, 100.0, numP, numC)]\n",
" if diff > 0:\n",
" mejor = \"Asíncrono\"\n",
" else:\n",
" mejor = \"Síncrono\"\n",
" if res[1] < p_value:\n",
" #and abs(diff) > grouped_aggL['Ti'].loc[(0, dist, 0.0, numP, numC)]\n",
" print(\"Ti numC=\", numC, \"p =\", round(res[1],3), \"Diff =\", abs(round(diff,4)), mejor)"
]
},
{
"cell_type": "code",
"execution_count": 22,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Distribución BestFit -------------------------\n",
"Para 2 padres\n",
"NC=4 Es mejor Asíncrono con una diff de 0.123\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:10: UserWarning: Boolean Series key will be reindexed to match DataFrame index.\n",
" # Remove the CWD from sys.path while we load stuff.\n",
"/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:14: UserWarning: Boolean Series key will be reindexed to match DataFrame index.\n",
" \n",
"/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:16: UserWarning: Boolean Series key will be reindexed to match DataFrame index.\n",
" app.launch_new_instance()\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"NC=8 Es mejor Asíncrono con una diff de 0.07\n",
"NC=16 Es mejor Asíncrono con una diff de 0.046\n",
"NC=32 Es mejor Asíncrono con una diff de 0.014\n",
"Para 4 padres\n",
"NC=2 Es mejor Asíncrono con una diff de 0.645\n",
"NC=8 Es mejor Asíncrono con una diff de 0.13\n",
"NC=16 Es mejor Asíncrono con una diff de 0.052\n",
"NC=32 Es mejor Síncrono con una diff de 0.005\n",
"Para 8 padres\n",
"NC=2 Es mejor Asíncrono con una diff de 1.523\n",
"NC=4 Es mejor Asíncrono con una diff de 0.354\n",
"NC=16 Es mejor Asíncrono con una diff de 0.066\n",
"NC=32 Es mejor Síncrono con una diff de 0.327\n",
"Para 16 padres\n",
"NC=2 Es mejor Asíncrono con una diff de 3.676\n",
"NC=4 Es mejor Asíncrono con una diff de 1.235\n",
"NC=8 Es mejor Asíncrono con una diff de 0.406\n",
"NC=32 Es mejor Síncrono con una diff de 0.304\n",
"Para 32 padres\n",
"NC=2 Es mejor Asíncrono con una diff de 16.171\n",
"NC=4 Es mejor Asíncrono con una diff de 4.551\n",
"NC=8 Es mejor Asíncrono con una diff de 1.599\n",
"NC=16 Es mejor Asíncrono con una diff de 0.12\n",
"Distribución WorstFit -------------------------\n",
"Para 2 padres\n",
"NC=4 Es mejor Asíncrono con una diff de 0.13\n",
"NC=8 Es mejor Asíncrono con una diff de 0.064\n",
"NC=16 Es mejor Asíncrono con una diff de 0.034\n",
"NC=32 Es mejor Síncrono con una diff de 0.151\n",
"Para 4 padres\n",
"NC=2 Es mejor Asíncrono con una diff de 0.637\n",
"NC=8 Es mejor Asíncrono con una diff de 0.142\n",
"NC=16 Es mejor Síncrono con una diff de 0.28\n",
"NC=32 Es mejor Síncrono con una diff de 0.499\n",
"Para 8 padres\n",
"NC=2 Es mejor Asíncrono con una diff de 1.575\n",
"NC=4 Es mejor Asíncrono con una diff de 0.344\n",
"NC=16 Es mejor Síncrono con una diff de 0.32\n",
"NC=32 Es mejor Síncrono con una diff de 0.278\n",
"Para 16 padres\n",
"NC=2 Es mejor Asíncrono con una diff de 6.404\n",
"NC=4 Es mejor Asíncrono con una diff de 1.803\n",
"NC=8 Es mejor Asíncrono con una diff de 0.308\n",
"NC=32 Es mejor Síncrono con una diff de 0.113\n",
"Para 32 padres\n",
"NC=2 Es mejor Asíncrono con una diff de 18.438\n",
"NC=4 Es mejor Asíncrono con una diff de 4.533\n",
"NC=8 Es mejor Asíncrono con una diff de 1.927\n",
"NC=16 Es mejor Asíncrono con una diff de 0.481\n"
]
}
],
"source": [
"iters = dfM['Iters'].mean()\n",
"resultados = [0,0]\n",
"for dist in [1,2]:\n",
" print(\"Distribución \" + dist_names[dist] + \" -------------------------\")\n",
" dist_v = str(dist)+\",\"+str(dist)\n",
" for numP in values:\n",
" print(\"Para \", numP, \" padres\")\n",
" for numC in values:\n",
" if numP != numC:\n",
" Titer = dfL[(dfL[\"Tt\"] == 0)][(dfL[\"Dist\"] == dist)][(dfL.NP == numC)]['Ti'].mean() #Tiempo por iteracion\n",
" i=0\n",
" for adr in [0.0, 100.0]:\n",
" \n",
" auxExp = dfM[(dfM[\"Dist\"] == dist_v)][(dfM[\"%Async\"] == adr)][(dfM.NP == numP)][(dfM.NS == numC)]\n",
" Tr = auxExp['TS'].mean() + auxExp['TA'].mean() #Tiempo de redistribucion\n",
" M_it = dfL[(dfL[\"Tt\"] == 1)][(dfL[\"Dist\"] == dist)][(dfL[\"%Async\"] == adr)][(dfL.NP == numP)][(dfL.NS == numC)]['Ti'].count()/3 #Iteraciones asincronas\n",
" #No se presupone una diferencia temporal entre iteraciones sincronas y asincronas\n",
" if(M_it > iters):\n",
" M_it = iters\n",
" resultados[i] = (iters - M_it) * Titer + Tr\n",
" i+=1\n",
" #print(M_it)\n",
" #print(Titer)\n",
" #print((iters - M_it) * Titer)\n",
" #print(Tr)\n",
" #print(\"End\")\n",
" \n",
" if resultados[0] > resultados[1]:\n",
" mejor = \"Asíncrono\"\n",
" else:\n",
" mejor = \"Síncrono\"\n",
" diff = abs(round(resultados[0] - resultados[1], 3))\n",
" print(\"NC=\"+ str(numC) + \" Es mejor \" + mejor + \" con una diff de \"+ str(diff))\n",
" #TODO Comprobar"
]
},
{
"cell_type": "code",
"execution_count": 48,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th>Ti</th>\n",
" <th>Iters</th>\n",
" <th>To</th>\n",
" <th>Iters2</th>\n",
" </tr>\n",
" <tr>\n",
" <th>Tt</th>\n",
" <th>Dist</th>\n",
" <th>%Async</th>\n",
" <th>NP</th>\n",
" <th>NS</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <td rowspan=\"5\" valign=\"top\">0.0</td>\n",
" <td rowspan=\"5\" valign=\"top\">1</td>\n",
" <td rowspan=\"5\" valign=\"top\">0.0</td>\n",
" <td rowspan=\"4\" valign=\"top\">2</td>\n",
" <td>4</td>\n",
" <td>0.099861</td>\n",
" <td>500.0</td>\n",
" <td>112.000000</td>\n",
" <td>500.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8</td>\n",
" <td>0.099849</td>\n",
" <td>500.0</td>\n",
" <td>112.000000</td>\n",
" <td>500.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>16</td>\n",
" <td>0.099860</td>\n",
" <td>500.0</td>\n",
" <td>112.000000</td>\n",
" <td>500.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>32</td>\n",
" <td>0.099853</td>\n",
" <td>500.0</td>\n",
" <td>112.000000</td>\n",
" <td>500.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>4</td>\n",
" <td>2</td>\n",
" <td>0.049642</td>\n",
" <td>500.0</td>\n",
" <td>55.666667</td>\n",
" <td>500.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <td rowspan=\"5\" valign=\"top\">1.0</td>\n",
" <td rowspan=\"5\" valign=\"top\">2</td>\n",
" <td rowspan=\"5\" valign=\"top\">100.0</td>\n",
" <td>16</td>\n",
" <td>32</td>\n",
" <td>0.034899</td>\n",
" <td>21.0</td>\n",
" <td>14.000000</td>\n",
" <td>21.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td rowspan=\"4\" valign=\"top\">32</td>\n",
" <td>2</td>\n",
" <td>0.012084</td>\n",
" <td>101.0</td>\n",
" <td>7.000000</td>\n",
" <td>101.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>4</td>\n",
" <td>0.015599</td>\n",
" <td>54.0</td>\n",
" <td>7.000000</td>\n",
" <td>54.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8</td>\n",
" <td>0.012685</td>\n",
" <td>54.0</td>\n",
" <td>7.000000</td>\n",
" <td>54.0</td>\n",
" </tr>\n",
" <tr>\n",
" <td>16</td>\n",
" <td>0.015421</td>\n",
" <td>44.0</td>\n",
" <td>7.000000</td>\n",
" <td>44.0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>360 rows × 4 columns</p>\n",
"</div>"
],
"text/plain": [
" Ti Iters To Iters2\n",
"Tt Dist %Async NP NS \n",
"0.0 1 0.0 2 4 0.099861 500.0 112.000000 500.0\n",
" 8 0.099849 500.0 112.000000 500.0\n",
" 16 0.099860 500.0 112.000000 500.0\n",
" 32 0.099853 500.0 112.000000 500.0\n",
" 4 2 0.049642 500.0 55.666667 500.0\n",
"... ... ... ... ...\n",
"1.0 2 100.0 16 32 0.034899 21.0 14.000000 21.0\n",
" 32 2 0.012084 101.0 7.000000 101.0\n",
" 4 0.015599 54.0 7.000000 54.0\n",
" 8 0.012685 54.0 7.000000 54.0\n",
" 16 0.015421 44.0 7.000000 44.0\n",
"\n",
"[360 rows x 4 columns]"
]
},
"execution_count": 48,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"grouped_aggL"
]
},
{
"cell_type": "code",
"execution_count": 88,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 720x504 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
},
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 720x504 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"for dist in [1,2]:\n",
" v1 = grouped_aggL.loc[(0,dist,100.0,slice(None))]\n",
" v2 = grouped_aggL.loc[(1,dist,100.0,slice(None))]\n",
" aux_aggL = v1['Ti'].values / v2['Ti'].values\n",
"\n",
" colors = ['r', 'orange', 'g', 'm', 'y']\n",
" markers = ['+', 'x', '1', '2', 'X']\n",
"\n",
" f=plt.figure(figsize=(10, 7))\n",
" ax1 = f.add_subplot(111)\n",
" plt.xlim(0, max(values)+1)\n",
" plt.ylim(0, 1.2)\n",
" plt.xticks(values)\n",
" ax1.set_ylabel('Decremento velocidad')\n",
" ax1.set_xlabel('Procesos hijo')\n",
" ax1.set_title(\"Aumento de velocidad en las iteraciones al realizar redistribuciones asíncronas\")\n",
"\n",
"\n",
" for i in range(len(values)):\n",
" numP = values[i]\n",
" c = colors[i]\n",
" \n",
" mini = i * (len(values)-1)\n",
" maxi = (i+1) * (len(values)-1)\n",
" array_values = aux_aggL[mini:maxi]\n",
" indexes = np.arange(len(values)-1)\n",
" aux_j=0\n",
" for j in range(len(values)):\n",
" if(values[j] != numP):\n",
" indexes[aux_j] = values[j]\n",
" aux_j+=1\n",
" \n",
" x = indexes\n",
" y = array_values\n",
" label = str(numP) + ' padres'\n",
" ax1.axvline(numP)\n",
" plt.plot(x, y, color=colors[i], label=label, marker=markers[1], markersize=10)\n",
" \n",
" ax1.axhline(1, color='k')\n",
" f.legend()\n",
" #f.tight_layout()\n",
" f.savefig(\"Images/\"+\"Iters\"+ dist_names[dist] +\"_SpeedUp\", format=\"png\")\n"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.7.4"
}
},
"nbformat": 4,
"nbformat_minor": 4
}
%% Cell type:code id: tags:
``` python
%matplotlib inline
import pandas as pd
from pandas import DataFrame, Series
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
from scipy import stats
import sys
```
%% Cell type:code id: tags:
``` python
# Input CSV files, one per table loaded by the following cells.
matrixMalEX, matrixMal, matrixIt = "data_GG.csv", "data_GM.csv", "data_L.csv"

# Change according to the number of nodes used.
n_qty = 2
# Change the first factor according to the number of executions per configuration.
repet = 3 * 2

# Threshold the t-test p-values are compared against in the analysis cells.
p_value = 0.05
# Process counts iterated as both parent (numP) and child (numC) group sizes.
values = [2, 4, 8, 16, 32]
# Display names indexed by the distribution id (1 and 2 are the ids iterated later).
dist_names = ["null", "BestFit", "WorstFit"]
```
%% Cell type:code id: tags:
``` python
def speedUp(arr, seq, df):
    """Divide the matching ``EX`` values of ``seq`` by the mean of ``arr``.

    Parameters
    ----------
    arr : pandas.Series
        Values to average; the label of its first element is used to look up
        the process count in ``df``.
    seq : pandas.DataFrame
        Frame with ``NP`` and ``EX`` columns; rows whose ``NP`` equals the
        looked-up process count supply the numerator.
    df : pandas.DataFrame
        Frame indexed like ``arr`` that holds an ``NP`` column.

    Returns
    -------
    pandas.Series
        ``seq['EX'] / arr.mean()`` restricted to the rows with the matching ``NP``.
    """
    # Single-step label lookup instead of building a whole row first.
    numP = df.loc[arr.index[0], 'NP']
    return seq.loc[seq.NP == numP, 'EX'] / arr.mean()
```
%% Cell type:code id: tags:
``` python
# Read the table named by matrixMalEX and discard its first column
# (presumably the index column written when the CSV was saved - TODO confirm).
dfG = pd.read_csv(matrixMalEX)
dfG = dfG.drop(columns=dfG.columns[0])

# Keep the original 'N' as 'S', make 'N' the sum of 'S' and the raw '%Async'
# value, then express '%Async' as a percentage of that sum.
dfG['S'] = dfG['N']
dfG['N'] = dfG['S'] + dfG['%Async']
dfG['%Async'] = (dfG['%Async'] / dfG['N']) * 100

# 'Dist' only takes part in the grouping when n_qty is not 1.
group = dfG.groupby(
    ['%Async', 'Groups'] if n_qty == 1 else ['Dist', '%Async', 'Groups']
)['TE']

# Mean 'TE' per group, stored in a one-column frame named 'TE'.
grouped_aggG = group.agg(['mean']).rename(columns={'mean': 'TE'})
```
%% Cell type:code id: tags:
``` python
from natsort import index_natsorted

# Show the aggregated times with the "Groups" index level in natural order
# (numeric parts compared as numbers rather than character by character).
# The key receives the "Groups" values themselves; the previous version read
# them from an undefined name `df` and then displayed the unsorted frame.
# grouped_aggG is left untouched so the later .loc lookups keep working on the
# groupby-sorted index. Requires a pandas version whose sort_values accepts `key`.
grouped_aggG.sort_values(
    by="Groups",
    key=lambda groups: np.argsort(index_natsorted(groups)),
    kind="mergesort",  # stable: keeps the existing order inside each group label
)
```
%% Cell type:code id: tags:
``` python
# Read the table named by matrixMal and discard its first column
# (presumably the index column written when the CSV was saved - TODO confirm).
dfM = pd.read_csv(matrixMal)
dfM = dfM.drop(columns=dfM.columns[0])

# Keep the original 'N' as 'S' and make 'N' the sum of 'S' and the raw '%Async' value.
dfM['S'] = dfM['N']
dfM['N'] = dfM['S'] + dfM['%Async']
# 'TR' is the sum of the three timing columns.
dfM["TR"] = dfM["TC"] + dfM["TS"] + dfM["TA"]
# Express '%Async' as a percentage of the new 'N'.
dfM['%Async'] = (dfM['%Async'] / dfM['N']) * 100

# Select the columns with a list: the tuple form ['TC', 'TS', ...] on a groupby
# is deprecated and rejected by current pandas releases.
if n_qty == 1:
    groupM = dfM.groupby(['%Async', 'NP', 'NS'])[['TC', 'TS', 'TA', 'TR']]
else:
    groupM = dfM.groupby(['Dist', '%Async', 'NP', 'NS'])[['TC', 'TS', 'TA', 'TR']]

# Mean of every timing column per group; drop the extra 'mean' column level.
grouped_aggM = groupM.agg(['mean'])
grouped_aggM.columns = grouped_aggM.columns.get_level_values(0)
```
%% Cell type:code id: tags:
``` python
# Read the table named by matrixIt and discard its first column
# (presumably the index column written when the CSV was saved - TODO confirm).
dfL = pd.read_csv(matrixIt)
dfL = dfL.drop(columns=dfL.columns[0])

# Keep the original 'N' as 'S', make 'N' the sum of 'S' and the raw '%Async'
# value, then express '%Async' as a percentage of that sum.
dfL['S'] = dfL['N']
dfL['N'] = dfL['S'] + dfL['%Async']
dfL['%Async'] = (dfL['%Async'] / dfL['N']) * 100

# Rows with NS == 0 are left out of the aggregation. Columns are selected with
# a list because the tuple form is deprecated and rejected by current pandas.
if n_qty == 1:
    groupL = dfL[dfL['NS'] != 0].groupby(['Tt', '%Async', 'NP', 'NS'])[['Ti', 'To']]
else:
    groupL = dfL[dfL['NS'] != 0].groupby(['Tt', 'Dist', '%Async', 'NP', 'NS'])[['Ti', 'To']]

# agg yields (Ti, mean), (Ti, count), (To, mean), (To, count) in that order.
grouped_aggL = groupL.agg(['mean', 'count'])
# Assign the flat names directly: set_axis only renamed in place on old pandas
# versions, so relying on it silently left duplicated 'Ti'/'To' labels elsewhere.
grouped_aggL.columns = ['Ti', 'Iters', 'To', 'Iters2']
# Row counts divided by the configured repetitions (repet, previously a
# hard-coded 6) - assumes repet matches the runs actually performed; TODO confirm.
grouped_aggL['Iters'] = np.ceil(grouped_aggL['Iters'] / repet)
grouped_aggL['Iters2'] = np.ceil(grouped_aggL['Iters2'] / repet)
```
%%%% Output: stream
/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:16: FutureWarning: set_axis currently defaults to operating inplace.
This will change in a future version of pandas, use inplace=True to avoid this warning.
app.launch_new_instance()
%% Cell type:code id: tags:
``` python
# Write each aggregated table to its own Excel workbook.
for workbook, table in (
    ("resultL.xlsx", grouped_aggL),
    ("resultM.xlsx", grouped_aggM),
    ("resultG.xlsx", grouped_aggG),
):
    table.to_excel(workbook)
```
%% Cell type:code id: tags:
``` python
# Display the table read from matrixMalEX, including the derived 'S', 'N' and '%Async' columns.
dfG
```
%%%% Output: execute_result
N %Async Groups Dist Matrix Time Iters TE \
0 1000000000 0.0 8,32 2,2 100000 0.1 1000 31.525710
1 1000000000 0.0 8,32 2,2 100000 0.1 1000 33.315857
2 1000000000 0.0 8,32 2,2 100000 0.1 1000 33.347537
3 1000000000 75.0 4,32 1,1 100000 0.1 1000 57.219027
4 1000000000 75.0 4,32 1,1 100000 0.1 1000 55.469166
.. ... ... ... ... ... ... ... ...
595 1000000000 50.0 4,8 2,2 100000 0.1 1000 73.771357
596 1000000000 50.0 4,8 2,2 100000 0.1 1000 75.557508
597 1000000000 50.0 16,8 1,1 100000 0.1 1000 35.949913
598 1000000000 50.0 16,8 1,1 100000 0.1 1000 37.900348
599 1000000000 50.0 16,8 1,1 100000 0.1 1000 36.012772
S
0 1000000000
1 1000000000
2 1000000000
3 250000000
4 250000000
.. ...
595 500000000
596 500000000
597 500000000
598 500000000
599 500000000
[600 rows x 9 columns]
%% Cell type:code id: tags:
``` python
# Display the mean 'TE' per group computed from dfG.
grouped_aggG
```
%%%% Output: execute_result
TE
Dist %Async Groups
1,1 0.0 16,2 112.087769
16,32 18.394706
16,4 61.887052
16,8 37.986463
2,16 113.187865
... ...
2,2 100.0 4,8 74.864688
8,16 37.999586
8,2 123.584176
8,32 31.730297
8,4 74.052463
[200 rows x 1 columns]
%% Cell type:code id: tags:
``` python
# Display the table read from matrixMal, including the derived 'S', 'N', 'TR' and '%Async' columns.
dfM
```
%%%% Output: execute_result
N %Async NP NS Dist Matrix Time Iters TC TS \
0 1000000000 0.0 8 32 2,2 100000 0.1 1000 1.341434 0.695848
1 1000000000 0.0 8 32 2,2 100000 0.1 1000 1.405911 0.639849
2 1000000000 0.0 8 32 2,2 100000 0.1 1000 1.346017 0.747863
3 1000000000 75.0 4 32 1,1 100000 0.1 1000 0.688062 0.064900
4 1000000000 75.0 4 32 1,1 100000 0.1 1000 0.702200 0.068039
.. ... ... .. .. ... ... ... ... ... ...
595 1000000000 50.0 4 8 2,2 100000 0.1 1000 0.390444 0.142287
596 1000000000 50.0 4 8 2,2 100000 0.1 1000 0.351690 0.154699
597 1000000000 50.0 16 8 1,1 100000 0.1 1000 0.337472 0.081077
598 1000000000 50.0 16 8 1,1 100000 0.1 1000 0.351262 0.103176
599 1000000000 50.0 16 8 1,1 100000 0.1 1000 0.349151 0.094121
TA S TR
0 0.000000 1000000000 2.037282
1 0.000000 1000000000 2.045760
2 0.000000 1000000000 2.093880
3 0.364941 250000000 1.117903
4 0.412072 250000000 1.182311
.. ... ... ...
595 0.338576 500000000 0.871307
596 0.354917 500000000 0.861306
597 0.243481 500000000 0.662030
598 0.261565 500000000 0.716003
599 0.221750 500000000 0.665022
[600 rows x 13 columns]
%% Cell type:code id: tags:
``` python
# Display the per-group means of 'TC', 'TS', 'TA' and 'TR' computed from dfM.
grouped_aggM
```
%%%% Output: execute_result
TC TS TA TR
Dist %Async NP NS
1,1 0.0 2 4 0.220380 0.314893 0.000000 0.535273
8 0.248143 0.375003 0.000000 0.623146
16 0.339042 0.486650 0.000000 0.825692
32 0.743840 0.506385 0.000000 1.250225
4 2 0.197858 0.311136 0.000000 0.508994
... ... ... ... ...
2,2 100.0 16 32 1.358891 0.000000 1.419016 2.777907
32 2 0.591882 0.000000 2.477300 3.069183
4 0.804965 0.000000 1.729638 2.534603
8 0.935128 0.000000 1.520682 2.455810
16 1.221248 0.000000 1.541904 2.763152
[200 rows x 4 columns]
%% Cell type:code id: tags:
``` python
# Display the table read from matrixIt, including the derived 'S', 'N' and '%Async' columns.
dfL
```
%%%% Output: execute_result
N %Async NP N_par NS Dist Matrix Time Iters \
0 1000000000 0.0 32 8 0 2 100000 0.1 1000
1 1000000000 0.0 32 8 0 2 100000 0.1 1000
2 1000000000 0.0 32 8 0 2 100000 0.1 1000
3 1000000000 0.0 32 8 0 2 100000 0.1 1000
4 1000000000 0.0 32 8 0 2 100000 0.1 1000
... ... ... .. ... .. ... ... ... ...
1199995 1000000000 50.0 8 16 0 1 100000 0.1 1000
1199996 1000000000 50.0 8 16 0 1 100000 0.1 1000
1199997 1000000000 50.0 8 16 0 1 100000 0.1 1000
1199998 1000000000 50.0 8 16 0 1 100000 0.1 1000
1199999 1000000000 50.0 8 16 0 1 100000 0.1 1000
Ti Tt To S
0 0.005463 0.0 6.0 1000000000
1 0.005350 0.0 6.0 1000000000
2 0.005355 0.0 6.0 1000000000
3 0.005354 0.0 6.0 1000000000
4 0.005352 0.0 6.0 1000000000
... ... ... ... ...
1199995 0.024075 0.0 27.0 500000000
1199996 0.024076 0.0 27.0 500000000
1199997 0.024076 0.0 27.0 500000000
1199998 0.024411 0.0 27.0 500000000
1199999 0.024075 0.0 27.0 500000000
[1200000 rows x 13 columns]
%% Cell type:code id: tags:
``` python
# Display the per-group 'Ti'/'To' means and the derived 'Iters'/'Iters2' columns computed from dfL.
grouped_aggL
```
%%%% Output: execute_result
Ti Iters To Iters2
Tt Dist %Async NP NS
0.0 1 0.0 2 4 0.099861 500.0 112.000000 500.0
8 0.099849 500.0 112.000000 500.0
16 0.099860 500.0 112.000000 500.0
32 0.099853 500.0 112.000000 500.0
4 2 0.049642 500.0 55.666667 500.0
... ... ... ... ...
1.0 2 100.0 16 32 0.034899 21.0 14.000000 21.0
32 2 0.012084 101.0 7.000000 101.0
4 0.015599 54.0 7.000000 54.0
8 0.012685 54.0 7.000000 54.0
16 0.015421 44.0 7.000000 44.0
[360 rows x 4 columns]
%% Cell type:code id: tags:
``` python
# For every distribution and every (parents, children) pair, t-test the 'TE'
# samples at %Async == 0.0 against those at %Async == 100.0 and print the pairs
# whose p-value is below p_value, with the difference of the group means.
# The grouped_aggG lookups use a (Dist, %Async, Groups) key, i.e. the index
# built when n_qty != 1.
print("TIEMPO EJECUCCION")
for dist in [1, 2]:
    print("Distribución " + dist_names[dist] + " -------------------------")
    dist_v = str(dist) + "," + str(dist)
    in_dist = dfG["Dist"] == dist_v
    for numP in values:
        print("Para ", numP, " padres")
        for numC in values:
            if numP == numC:
                continue
            # Named group_key so the groupby object called `group` is not overwritten.
            group_key = str(numP) + "," + str(numC)
            in_group = in_dist & (dfG.Groups == group_key)
            # One combined mask per sample: chaining df[m1][m2][m3] applies
            # full-length masks to already-filtered frames and triggers
            # "Boolean Series key will be reindexed" warnings.
            v1 = dfG.loc[in_group & (dfG["%Async"] == 0.0), 'TE']
            v2 = dfG.loc[in_group & (dfG["%Async"] == 100.0), 'TE']
            res = stats.ttest_ind(v1, v2)
            diff = (grouped_aggG['TE'].loc[(dist_v, 0.0, group_key)]
                    - grouped_aggG['TE'].loc[(dist_v, 100.0, group_key)])
            # A positive diff means the 0.0 mean is larger than the 100.0 mean.
            mejor = "Asíncrono" if diff > 0 else "Síncrono"

            if res[1] < p_value:
                print("EX numC=", numC, "p =", round(res[1],3), "Diff =", abs(round(diff,3)), mejor)
```
%%%% Output: stream
TIEMPO EJECUCCION
Distribución BestFit -------------------------
Para 2 padres
EX numC= 4 p = 0.039 Diff = 0.09 Asíncrono
Para 4 padres
Para 8 padres
EX numC= 4 p = 0.0 Diff = 1.411 Síncrono
Para 16 padres
EX numC= 2 p = 0.014 Diff = 3.662 Asíncrono
Para 32 padres
EX numC= 4 p = 0.002 Diff = 4.589 Asíncrono
Distribución WorstFit -------------------------
Para 2 padres
Para 4 padres
EX numC= 16 p = 0.046 Diff = 0.304 Síncrono
EX numC= 32 p = 0.012 Diff = 0.542 Síncrono
Para 8 padres
%%%% Output: stream
/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:10: UserWarning: Boolean Series key will be reindexed to match DataFrame index.
# Remove the CWD from sys.path while we load stuff.
/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:11: UserWarning: Boolean Series key will be reindexed to match DataFrame index.
# This is added back by InteractiveShellApp.init_path()
%%%% Output: stream
Para 16 padres
EX numC= 2 p = 0.023 Diff = 6.349 Asíncrono
EX numC= 4 p = 0.0 Diff = 1.799 Asíncrono
EX numC= 8 p = 0.046 Diff = 0.261 Asíncrono
Para 32 padres
EX numC= 2 p = 0.01 Diff = 18.514 Asíncrono
EX numC= 4 p = 0.0 Diff = 4.454 Asíncrono
EX numC= 8 p = 0.003 Diff = 1.92 Asíncrono
%% Cell type:code id: tags:
``` python
# For every distribution and every (parents, children) pair, t-test the 'TS'
# samples at %Async == 0.0 against the 'TA' samples at %Async == 100.0 and
# print the pairs whose p-value is below p_value, with the difference of the
# corresponding group means. The grouped_aggM lookups use a
# (Dist, %Async, NP, NS) key, i.e. the index built when n_qty != 1.
print("TIEMPO MALLEABILITY")
for dist in [1, 2]:
    print("Distribución " + dist_names[dist] + " -------------------------")
    dist_v = str(dist) + "," + str(dist)
    in_dist = dfM["Dist"] == dist_v
    for numP in values:
        print("Para ", numP, " padres")
        for numC in values:
            if numP == numC:
                continue
            resize = in_dist & (dfM.NP == numP) & (dfM.NS == numC)
            # One combined mask per sample: chaining df[m1][m2][m3] applies
            # full-length masks to already-filtered frames and triggers
            # "Boolean Series key will be reindexed" warnings.
            v1 = dfM.loc[resize & (dfM["%Async"] == 0.0), 'TS']
            v2 = dfM.loc[resize & (dfM["%Async"] == 100.0), 'TA']
            res = stats.ttest_ind(v1, v2)
            diff = (grouped_aggM['TS'].loc[(dist_v, 0.0, numP, numC)]
                    - grouped_aggM['TA'].loc[(dist_v, 100.0, numP, numC)])
            # A positive diff means the 'TS' mean is larger than the 'TA' mean.
            mejor = "Asíncrono" if diff > 0 else "Síncrono"
            if res[1] < p_value:
                print("TR numC=", numC, "p =", round(res[1],3), "Diff =", abs(round(diff,3)), mejor)
```
%%%% Output: stream
TIEMPO MALLEABILITY
Distribución 1 -------------------------
Para 2 padres
TR numC= 8 p = 0.0 Diff = 0.029 Síncrono
Para 4 padres
TR numC= 8 p = 0.006 Diff = 0.043 Síncrono
TR numC= 32 p = 0.025 Diff = 0.052 Síncrono
Para 8 padres
TR numC= 4 p = 0.016 Diff = 0.022 Asíncrono
TR numC= 16 p = 0.009 Diff = 0.031 Síncrono
TR numC= 32 p = 0.0 Diff = 0.483 Síncrono
Para 16 padres
TR numC= 8 p = 0.002 Diff = 0.072 Síncrono
TR numC= 32 p = 0.019 Diff = 0.549 Síncrono
Para 32 padres
TR numC= 4 p = 0.002 Diff = 0.981 Síncrono
TR numC= 8 p = 0.001 Diff = 0.972 Síncrono
TR numC= 16 p = 0.001 Diff = 0.831 Síncrono
Distribución 2 -------------------------
Para 2 padres
TR numC= 4 p = 0.0 Diff = 0.069 Síncrono
%%%% Output: stream
/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:9: UserWarning: Boolean Series key will be reindexed to match DataFrame index.
if __name__ == '__main__':
/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:10: UserWarning: Boolean Series key will be reindexed to match DataFrame index.
# Remove the CWD from sys.path while we load stuff.
%%%% Output: stream
TR numC= 8 p = 0.029 Diff = 0.035 Síncrono
Para 4 padres
TR numC= 8 p = 0.02 Diff = 0.031 Síncrono
TR numC= 32 p = 0.009 Diff = 0.601 Síncrono
Para 8 padres
TR numC= 16 p = 0.011 Diff = 0.729 Síncrono
TR numC= 32 p = 0.018 Diff = 0.423 Síncrono
Para 16 padres
TR numC= 4 p = 0.001 Diff = 0.884 Síncrono
TR numC= 32 p = 0.021 Diff = 0.36 Síncrono
Para 32 padres
TR numC= 2 p = 0.029 Diff = 1.548 Síncrono
TR numC= 4 p = 0.008 Diff = 0.84 Síncrono
TR numC= 8 p = 0.011 Diff = 0.726 Síncrono
TR numC= 16 p = 0.004 Diff = 0.606 Síncrono
%% Cell type:code id: tags:
``` python
# For every distribution and every (parents, children) pair, compare the 'Ti'
# samples with Tt == 0 against those with Tt == 1, both taken at
# %Async == 100.0, using Welch's t-test (equal_var=False). Pairs whose p-value
# is below p_value are printed with the difference of the group means.
# The grouped_aggL lookups use a (Tt, Dist, %Async, NP, NS) key, i.e. the
# index built when n_qty != 1.
print("TIEMPO Iters")
for dist in [1, 2]:
    print("Distribución " + dist_names[dist] + " -------------------------")
    # Built once per distribution: dfL is large and these masks do not depend
    # on the inner loops.
    async_rows = (dfL["Dist"] == dist) & (dfL["%Async"] == 100.0)
    for numP in values:
        print("Para ", numP, " padres")
        for numC in values:
            if numP == numC:
                continue
            resize = async_rows & (dfL.NP == numP) & (dfL.NS == numC)
            # One combined mask per sample: chaining df[m1][m2][m3] applies
            # full-length masks to already-filtered frames and triggers
            # "Boolean Series key will be reindexed" warnings.
            v1 = dfL.loc[resize & (dfL["Tt"] == 0), 'Ti']
            v2 = dfL.loc[resize & (dfL["Tt"] == 1), 'Ti']
            res = stats.ttest_ind(v1, v2, equal_var=False)
            # The reported difference now uses the means of the same two
            # samples that were tested; it previously took the Tt == 0 mean
            # at %Async == 0.0 while the test used %Async == 100.0.
            diff = (grouped_aggL['Ti'].loc[(0, dist, 100.0, numP, numC)]
                    - grouped_aggL['Ti'].loc[(1, dist, 100.0, numP, numC)])
            # A positive diff means the Tt == 0 mean is larger than the Tt == 1 mean.
            mejor = "Asíncrono" if diff > 0 else "Síncrono"
            if res[1] < p_value:
                print("Ti numC=", numC, "p =", round(res[1],3), "Diff =", abs(round(diff,4)), mejor)
```
%%%% Output: stream
TIEMPO Iters
Distribución BestFit -------------------------
Para 2 padres
Ti numC= 4 p = 0.035 Diff = 0.0001 Síncrono
%%%% Output: stream
/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:12: UserWarning: Boolean Series key will be reindexed to match DataFrame index.
if sys.path[0] == '':
/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:13: UserWarning: Boolean Series key will be reindexed to match DataFrame index.
del sys.path[0]
%%%% Output: stream
Ti numC= 8 p = 0.025 Diff = 0.0001 Síncrono
Ti numC= 16 p = 0.002 Diff = 0.0001 Síncrono
Ti numC= 32 p = 0.007 Diff = 0.0001 Síncrono
Para 4 padres
Ti numC= 16 p = 0.0 Diff = 0.0006 Síncrono
Para 8 padres
Ti numC= 4 p = 0.0 Diff = 0.0009 Síncrono
Ti numC= 32 p = 0.007 Diff = 0.0029 Síncrono
Para 16 padres
Ti numC= 32 p = 0.0 Diff = 0.0097 Síncrono
Para 32 padres
Ti numC= 2 p = 0.0 Diff = 0.0029 Síncrono
Ti numC= 4 p = 0.0 Diff = 0.0056 Síncrono
Ti numC= 8 p = 0.0 Diff = 0.0055 Síncrono
Ti numC= 16 p = 0.0 Diff = 0.0053 Síncrono
Distribución WorstFit -------------------------
Para 2 padres
Ti numC= 32 p = 0.024 Diff = 0.0256 Síncrono
Para 4 padres
Ti numC= 16 p = 0.0 Diff = 0.0243 Síncrono
Ti numC= 32 p = 0.0 Diff = 0.0343 Síncrono
Para 8 padres
Ti numC= 4 p = 0.036 Diff = 0.0044 Síncrono
Ti numC= 16 p = 0.0 Diff = 0.008 Síncrono
Ti numC= 32 p = 0.0 Diff = 0.0225 Síncrono
Para 16 padres
Ti numC= 2 p = 0.0 Diff = 0.0067 Síncrono
Ti numC= 4 p = 0.0 Diff = 0.0092 Síncrono
Ti numC= 8 p = 0.0 Diff = 0.0098 Síncrono
Ti numC= 32 p = 0.0 Diff = 0.0224 Síncrono
Para 32 padres
Ti numC= 2 p = 0.0 Diff = 0.0058 Síncrono
Ti numC= 4 p = 0.0 Diff = 0.0094 Síncrono
Ti numC= 8 p = 0.0 Diff = 0.0064 Síncrono
Ti numC= 16 p = 0.0 Diff = 0.0092 Síncrono
%% Cell type:code id: tags:
``` python
# Estimate, for every distribution and (parents, children) pair, a cost for
# %Async == 0.0 and for %Async == 100.0 as
#     (iters - M_it) * Titer + Tr
# and print which of the two is lower and by how much.
iters = dfM['Iters'].mean()
resultados = [0, 0]
for dist in [1, 2]:
    print("Distribución " + dist_names[dist] + " -------------------------")
    dist_v = str(dist) + "," + str(dist)
    # Masks that only depend on the distribution are built once here instead of
    # inside the innermost loop; dfL is large.
    m_dist = dfM["Dist"] == dist_v
    l_dist = dfL["Dist"] == dist
    l_tt0 = l_dist & (dfL["Tt"] == 0)
    l_tt1 = l_dist & (dfL["Tt"] == 1)
    for numP in values:
        print("Para ", numP, " padres")
        for numC in values:
            if numP == numC:
                continue
            # Time per iteration: mean 'Ti' of the Tt == 0 rows whose NP equals numC.
            Titer = dfL.loc[l_tt0 & (dfL.NP == numC), 'Ti'].mean()
            m_resize = m_dist & (dfM.NP == numP) & (dfM.NS == numC)
            l_resize = l_tt1 & (dfL.NP == numP) & (dfL.NS == numC)
            for i, adr in enumerate([0.0, 100.0]):
                # Combined masks replace chained df[m1][m2]... indexing, which
                # triggers "Boolean Series key will be reindexed" warnings.
                auxExp = dfM[m_resize & (dfM["%Async"] == adr)]
                # Redistribution time.
                Tr = auxExp['TS'].mean() + auxExp['TA'].mean()
                # Asynchronous iterations: number of Tt == 1 rows divided by 3
                # (presumably the runs per configuration - TODO confirm).
                M_it = dfL.loc[l_resize & (dfL["%Async"] == adr), 'Ti'].count() / 3
                # No time difference is assumed between synchronous and
                # asynchronous iterations; cap the count at the total iterations.
                M_it = min(M_it, iters)
                resultados[i] = (iters - M_it) * Titer + Tr

            # resultados[0] is the %Async == 0.0 estimate, resultados[1] the 100.0 one.
            mejor = "Asíncrono" if resultados[0] > resultados[1] else "Síncrono"
            diff = abs(round(resultados[0] - resultados[1], 3))
            print("NC="+ str(numC) + " Es mejor " + mejor + " con una diff de "+ str(diff))
            # TODO: verify this estimate.
```
%%%% Output: stream
Distribución BestFit -------------------------
Para 2 padres
NC=4 Es mejor Asíncrono con una diff de 0.123
%%%% Output: stream
/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:10: UserWarning: Boolean Series key will be reindexed to match DataFrame index.
# Remove the CWD from sys.path while we load stuff.
/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:14: UserWarning: Boolean Series key will be reindexed to match DataFrame index.
/home/usuario/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:16: UserWarning: Boolean Series key will be reindexed to match DataFrame index.
app.launch_new_instance()
%%%% Output: stream
NC=8 Es mejor Asíncrono con una diff de 0.07
NC=16 Es mejor Asíncrono con una diff de 0.046
NC=32 Es mejor Asíncrono con una diff de 0.014
Para 4 padres
NC=2 Es mejor Asíncrono con una diff de 0.645
NC=8 Es mejor Asíncrono con una diff de 0.13
NC=16 Es mejor Asíncrono con una diff de 0.052
NC=32 Es mejor Síncrono con una diff de 0.005
Para 8 padres
NC=2 Es mejor Asíncrono con una diff de 1.523
NC=4 Es mejor Asíncrono con una diff de 0.354
NC=16 Es mejor Asíncrono con una diff de 0.066
NC=32 Es mejor Síncrono con una diff de 0.327
Para 16 padres
NC=2 Es mejor Asíncrono con una diff de 3.676
NC=4 Es mejor Asíncrono con una diff de 1.235
NC=8 Es mejor Asíncrono con una diff de 0.406
NC=32 Es mejor Síncrono con una diff de 0.304
Para 32 padres
NC=2 Es mejor Asíncrono con una diff de 16.171
NC=4 Es mejor Asíncrono con una diff de 4.551
NC=8 Es mejor Asíncrono con una diff de 1.599
NC=16 Es mejor Asíncrono con una diff de 0.12
Distribución WorstFit -------------------------
Para 2 padres
NC=4 Es mejor Asíncrono con una diff de 0.13
NC=8 Es mejor Asíncrono con una diff de 0.064
NC=16 Es mejor Asíncrono con una diff de 0.034
NC=32 Es mejor Síncrono con una diff de 0.151
Para 4 padres
NC=2 Es mejor Asíncrono con una diff de 0.637
NC=8 Es mejor Asíncrono con una diff de 0.142
NC=16 Es mejor Síncrono con una diff de 0.28
NC=32 Es mejor Síncrono con una diff de 0.499
Para 8 padres
NC=2 Es mejor Asíncrono con una diff de 1.575
NC=4 Es mejor Asíncrono con una diff de 0.344
NC=16 Es mejor Síncrono con una diff de 0.32
NC=32 Es mejor Síncrono con una diff de 0.278
Para 16 padres
NC=2 Es mejor Asíncrono con una diff de 6.404
NC=4 Es mejor Asíncrono con una diff de 1.803
NC=8 Es mejor Asíncrono con una diff de 0.308
NC=32 Es mejor Síncrono con una diff de 0.113
Para 32 padres
NC=2 Es mejor Asíncrono con una diff de 18.438
NC=4 Es mejor Asíncrono con una diff de 4.533
NC=8 Es mejor Asíncrono con una diff de 1.927
NC=16 Es mejor Asíncrono con una diff de 0.481
%% Cell type:code id: tags:
``` python
grouped_aggL
```
%%%% Output: execute_result
Ti Iters To Iters2
Tt Dist %Async NP NS
0.0 1 0.0 2 4 0.099861 500.0 112.000000 500.0
8 0.099849 500.0 112.000000 500.0
16 0.099860 500.0 112.000000 500.0
32 0.099853 500.0 112.000000 500.0
4 2 0.049642 500.0 55.666667 500.0
... ... ... ... ...
1.0 2 100.0 16 32 0.034899 21.0 14.000000 21.0
32 2 0.012084 101.0 7.000000 101.0
4 0.015599 54.0 7.000000 54.0
8 0.012685 54.0 7.000000 54.0
16 0.015421 44.0 7.000000 44.0
[360 rows x 4 columns]
%% Cell type:code id: tags:
``` python
# One figure per distribution: ratio between the mean Ti of the Tt == 0 rows
# and the mean Ti of the Tt == 1 rows (both taken at %Async == 100), drawn as
# one line per number of parent processes against the number of children.
for dist in [1, 2]:
    tt0_rows = grouped_aggL.loc[(0, dist, 100.0, slice(None))]
    tt1_rows = grouped_aggL.loc[(1, dist, 100.0, slice(None))]
    aux_aggL = tt0_rows['Ti'].values / tt1_rows['Ti'].values

    colors = ['r', 'orange', 'g', 'm', 'y']
    markers = ['+', 'x', '1', '2', 'X']

    f = plt.figure(figsize=(10, 7))
    ax1 = f.add_subplot(111)
    plt.xlim(0, max(values)+1)
    plt.ylim(0, 1.2)
    plt.xticks(values)
    ax1.set_ylabel('Decremento velocidad')
    ax1.set_xlabel('Procesos hijo')
    ax1.set_title("Aumento de velocidad en las iteraciones al realizar redistribuciones asíncronas")

    per_parent = len(values) - 1  # every parent count is paired with all the other values
    for i, numP in enumerate(values):
        # Slice of the ratio vector that belongs to this number of parents
        y = aux_aggL[i * per_parent:(i + 1) * per_parent]
        # Children counts: every value except the parent count itself
        x = np.array([v for v in values if v != numP])
        ax1.axvline(numP)
        plt.plot(x, y, color=colors[i], label=str(numP) + ' padres', marker=markers[1], markersize=10)

    ax1.axhline(1, color='k')
    f.legend()
    #f.tight_layout()
    f.savefig("Images/"+"Iters"+ dist_names[dist] +"_SpeedUp", format="png")
```
%%%% Output: display_data
[Hidden Image Output]
%%%% Output: display_data
[Hidden Image Output]
%% Cell type:code id: tags:
``` python
```
import sys
import glob
import numpy as np
import pandas as pd
def getData(lineS, outData, tp, hasIter = False):
    """Copy the "time" (and optionally "iters") value of a tokenised line into outData.

    lineS   -- list of "key=value" tokens.
    outData -- mutable sequence that receives the values.
    tp      -- index in outData where the time is stored; the iteration count,
               when requested, goes to tp + 1.
    hasIter -- when True, the "iters" token is read as well.

    A key that is not present in lineS leaves None in its slot. Previously the
    function failed with UnboundLocalError in that case.
    """
    time = None
    iters = None
    for data in lineS:
        k_v = data.split('=')
        if k_v[0] == "time":
            time = float(k_v[1])
        elif k_v[0] == "iters" and hasIter:
            iters = int(k_v[1])

    outData[tp] = time
    if hasIter:
        outData[tp+1] = iters
#-----------------------------------------------
def record(f, observation, line):
    """Fill `observation` from `line` and the six lines that follow it in `f`.

    line        -- first line of the record; tokens 1..6 are "key=value"
                   integers stored in observation[1..6].
    f           -- iterator over the remaining lines of the file.
    observation -- mutable sequence filled in place.
    """
    # First line: general information
    header = line.split()
    for pos in range(1, 7):
        observation[pos] = int(header[pos].split('=')[1])

    # Next line: process counts, stored from index 7 onwards
    for slot, key_value in enumerate(next(f).split(), start=7):
        observation[slot] = int(key_value.split('=')[1])

    # Four lines carrying only a time, stored at indices 9..12
    for slot in range(9, 13):
        getData(next(f).split(), observation, slot)

    # Last line carries both a time and an iteration count (indices 13 and 14)
    getData(next(f).split(), observation, 13, True)
#-----------------------------------------------
# Parse one "Global" results file, appending one row per "Config" line to both
# dataA (8 fields) and dataB (11 fields).
#
# f      -- iterable of text lines (the opened results file).
# dataA  -- list of rows, extended and filled in place.
# dataB  -- list of rows, extended and filled in place.
# it     -- index of the last row already stored; the script starts with -1.
# Returns the index of the last row written, to be passed to the next call.
#
# Expected input, as documented next to this function in the file:
#   Config loaded: resizes=2, matrix=1000, sdr=..., adr=0, aib=0, time=2.0 || grp=1
#   Resize 0: Iters=100, Procs=2, Factors=1.000000, Phy=2
#   Tspawn: / Tsync: / Tasync: / Tex: <value>
#
# NOTE(review): indentation was lost in this copy of the file; the nesting of
# the statements (in particular `previousNP = npr`) must be confirmed against
# the original before editing.
def read_file(f, dataA, dataB, it):
recording = False
# Number of "Resize" lines still expected for the current run
resizes = 0
# Countdown that selects which column the next timing line fills
timer = 0
previousNP = 0
for line in f:
lineS = line.split()
if len(lineS) > 0:
if lineS[0] == "Config": # CONFIG LINE
recording = True
it += 1
dataA.append([None]*8)
dataB.append([None]*11)
# Each token looks like "key=value,"; keep the text between '=' and ','
resizes = int(lineS[2].split('=')[1].split(',')[0])
matrix = int(lineS[3].split('=')[1].split(',')[0])
sdr = int(lineS[4].split('=')[1].split(',')[0])
adr = int(lineS[5].split('=')[1].split(',')[0]) #TODO Take it as a percentage
time = float(lineS[7].split('=')[1])
dataB[it][5] = matrix
dataB[it][0] = sdr
dataB[it][1] = adr
dataB[it][6] = time
# Dist is built up as a comma-separated string, one entry per Resize line
dataB[it][4] = ""
dataA[it][4] = matrix
dataA[it][0] = sdr
dataA[it][1] = adr
dataA[it][5] = time
dataA[it][3] = ""
elif recording and resizes != 0: # RESIZE LINE
iters = int(lineS[2].split('=')[1].split(',')[0])
npr = int(lineS[3].split('=')[1].split(',')[0])
# Token 5 is "Phy=<n>"; it is kept as text
dist = lineS[5].split('=')[1]
dataB[it][7] = iters
dataA[it][6] = iters
resizes = resizes - 1
if resizes == 0:
# Last Resize line of the run: close the strings and arm the timer
dataB[it][3] = npr
dataB[it][4] += dist
dataA[it][3] += dist
dataA[it][2] = str(previousNP) + "," + str(npr)
timer = 3
else:
dataB[it][2] = npr
dataB[it][4] += dist + ","
dataA[it][3] += dist + ","
previousNP = npr
else: # SAVE TIMES
# timer 3, 2, 1 fill dataB columns 8, 9, 10 (TC, TS, TA in columnsB);
# any other value stores the line in dataA column 7 (TE in columnsA)
if timer == 3:
dataB[it][8] = float(lineS[1])
elif timer == 2:
dataB[it][9] = float(lineS[1])
elif timer == 1:
dataB[it][10] = float(lineS[1])
else:
dataA[it][7] = float(lineS[1])
timer = timer - 1
return it
#columnsA1 = ["N", "%Async", "Groups", "Dist", "Matrix", "Time", "Iters", "TE"] #7
#columnsB1 = ["N", "%Async", "NP", "NS", "Dist", "Matrix", "Time", "Iters", "TC", "TS", "TA"] #10
#Config loaded: resizes=2, matrix=1000, sdr=1000000000, adr=0, aib=0, time=2.000000 || grp=1
#Resize 0: Iters=100, Procs=2, Factors=1.000000, Phy=2
#Resize 1: Iters=100, Procs=4, Factors=0.500000, Phy=2
#Tspawn: 0.249393
#Tsync: 0.330391
#Tasync: 0
#Tex: 301.428615
#-----------------------------------------------
# Command-line driver.
#   argv[1]  common prefix of the result files (required)
#   argv[2]  directory holding the Run*/ sub-directories (optional)
#   argv[3]  base name of the CSV files to write (optional, default "data")
# Every "<prefix>*Global.o*" file found under <directory>Run*/ is parsed with
# read_file and the rows are written to <name>_G.csv and <name>_M.csv.
if len(sys.argv) < 2:
    print("The files name is missing\nUsage: python3 iterTimes.py resultsName directory csvOutName")
    sys.exit(1)

if len(sys.argv) >= 3:
    BaseDir = sys.argv[2]
    print("Searching in directory: "+ BaseDir)
else:
    # No directory given: search from the current directory. The previous
    # code read sys.argv[2] here as well, which raised IndexError.
    BaseDir = ""

if len(sys.argv) >= 4:
    # Report the names of the files that are actually written below
    print("Csv name will be: " + sys.argv[3] + "_G.csv & " + sys.argv[3] + "_M.csv")
    name = sys.argv[3]
else:
    name = "data"

insideDir = "Run"
lista = glob.glob("./" + BaseDir + insideDir + "*/" + sys.argv[1]+ "*Global.o*")
print("Number of files found: "+ str(len(lista)))

it = -1  # read_file increments it before writing, so the first row gets index 0
dataA = []
dataB = []
columnsA = ["N", "%Async", "Groups", "Dist", "Matrix", "Time", "Iters", "TE"] #7
columnsB = ["N", "%Async", "NP", "NS", "Dist", "Matrix", "Time", "Iters", "TC", "TS", "TA"] #10

for elem in lista:
    # The context manager closes the file even if parsing fails
    with open(elem, "r") as f:
        it = read_file(f, dataA, dataB, it)

dfA = pd.DataFrame(dataA, columns=columnsA)
dfA.to_csv(name + '_G.csv')
dfB = pd.DataFrame(dataB, columns=columnsB)
dfB.to_csv(name + '_M.csv')
import sys
import glob
import numpy as np
import pandas as pd
#-----------------------------------------------
# Parse one per-group iteration file and append one 11-field row per recorded
# iteration to `data`.
#
# f     -- iterable of text lines (the opened results file).
# data  -- list of rows, extended and filled in place.
# it    -- index of the next free row in `data`; the script starts with 0.
# Returns the index of the next free row after this file.
#
# Expected input, as documented next to this function in the file:
#   Config: matrix=1000, sdr=..., adr=0, aib=0 time=2.000000
#   Config Group: iters=100, factor=1.0, phy=2, procs=2, parents=0, sons=4
#   followed by three data lines, each a label plus one value per iteration.
#
# NOTE(review): indentation was lost in this copy of the file; confirm the
# nesting against the original before editing.
def read_file(f, data, it):
matrix = 0
sdr = 0
adr = 0
time = 0
recording = False
# Which of the three data lines of the current group comes next (0, 1 or 2)
it_line = 0
# Offset of the current iteration inside the group being read
aux_it = 0
iters = 0
# NOTE: this local hides the module-level `np` (numpy) alias inside the function
np = 0
np_par = 0
ns = 0
for line in f:
lineS = line.split()
if len(lineS) > 1:
if recording:
aux_it = 0
if it_line==0:
# First data line: create one row per value and store it in column 8 (Ti)
lineS.pop(0)
for observation in lineS:
data.append([None]*11)
data[it+aux_it][0] = sdr
data[it+aux_it][1] = adr
data[it+aux_it][2] = np
data[it+aux_it][3] = np_par
data[it+aux_it][4] = ns
data[it+aux_it][5] = matrix
data[it+aux_it][6] = time
data[it+aux_it][7] = iters
data[it+aux_it][8] = float(observation)
aux_it+=1
it_line = it_line + 1
elif it_line==1:
# Second data line: column 9 (Tt) of the rows created above
lineS.pop(0)
for observation in lineS:
data[it+aux_it][9] = float(observation)
aux_it+=1
it_line = it_line + 1
else:
# Third data line: column 10 (To); the group is then complete
lineS.pop(0)
for observation in lineS:
data[it+aux_it][10] = float(observation)
aux_it+=1
it = it + aux_it
recording = False
it_line = 0
#TODO Take adr as a percentage
if lineS[0] == "Config:":
# Tokens look like "key=value,"; keep the text between '=' and ','
matrix = int(lineS[1].split('=')[1].split(',')[0])
sdr = int(lineS[2].split('=')[1].split(',')[0])
adr = int(lineS[3].split('=')[1].split(',')[0])
time = float(lineS[5].split('=')[1])
elif lineS[0] == "Config":
# "Config Group:" line: the data lines that follow are recorded
recording = True
iters = int(lineS[2].split('=')[1].split(',')[0])
np = int(lineS[5].split('=')[1].split(',')[0])
np_par = int(lineS[6].split('=')[1].split(',')[0])
ns = int(float(lineS[7].split('=')[1]))
return it
#-----------------------------------------------
#Config: matrix=1000, sdr=1000000000, adr=0, aib=0 time=2.000000
#Config Group: iters=100, factor=1.000000, phy=2, procs=2, parents=0, sons=4
#Ttype: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0
# Command-line driver.
#   argv[1]  common prefix of the result files (required)
#   argv[2]  directory holding the Run*/ sub-directories (optional)
#   argv[3]  base name of the CSV file to write (optional, default "data")
# Every "<prefix>*ID*.o*" file found under <directory>Run*/ is parsed with
# read_file and the rows are written to <name>.csv.
if len(sys.argv) < 2:
    print("The files name is missing\nUsage: python3 iterTimes.py resultsName directory csvOutName")
    sys.exit(1)

if len(sys.argv) >= 3:
    BaseDir = sys.argv[2]
    print("Searching in directory: "+ BaseDir)
else:
    # No directory given: search from the current directory. The previous
    # code read sys.argv[2] here as well, which raised IndexError.
    BaseDir = ""

if len(sys.argv) >= 4:
    print("Csv name will be: " + sys.argv[3] + ".csv")
    name = sys.argv[3]
else:
    name = "data"

insideDir = "Run"
lista = glob.glob("./" + BaseDir + insideDir + "*/" + sys.argv[1]+ "*ID*.o*")
print("Number of files found: "+ str(len(lista)))

it = 0
data = [] #0 #1 #2 #3 #4 #5 #6 #7 #8 #9 #10
columns = ["N", "%Async", "NP", "N_par", "NS", "Matrix", "Time", "Iters", "Ti", "Tt", "To"] #11

for elem in lista:
    # The context manager closes the file even if parsing fails
    with open(elem, "r") as f:
        it = read_file(f, data, it)

df = pd.DataFrame(data, columns=columns)
df.to_csv(name + '.csv')
import sys
import glob
import numpy as np
import pandas as pd
def getData(lineS, outData, tp, hasIter = False):
    """Copy the "time" (and optionally "iters") value of a tokenised line into outData.

    lineS   -- list of "key=value" tokens.
    outData -- mutable sequence that receives the values.
    tp      -- index in outData where the time is stored; the iteration count,
               when requested, goes to tp + 1.
    hasIter -- when True, the "iters" token is read as well.

    A key that is not present in lineS leaves None in its slot. Previously the
    function failed with UnboundLocalError in that case.
    """
    time = None
    iters = None
    for data in lineS:
        k_v = data.split('=')
        if k_v[0] == "time":
            time = float(k_v[1])
        elif k_v[0] == "iters" and hasIter:
            iters = int(k_v[1])

    outData[tp] = time
    if hasIter:
        outData[tp+1] = iters
#-----------------------------------------------
def record(f, observation, line):
    """Fill `observation` from `line` and the six lines that follow it in `f`.

    line        -- first line of the record; tokens 1..6 are "key=value"
                   integers stored in observation[1..6].
    f           -- iterator over the remaining lines of the file.
    observation -- mutable sequence filled in place.
    """
    # First line: general information
    header = line.split()
    for pos in range(1, 7):
        observation[pos] = int(header[pos].split('=')[1])

    # Next line: process counts, stored from index 7 onwards
    for slot, key_value in enumerate(next(f).split(), start=7):
        observation[slot] = int(key_value.split('=')[1])

    # Four lines carrying only a time, stored at indices 9..12
    for slot in range(9, 13):
        getData(next(f).split(), observation, slot)

    # Last line carries both a time and an iteration count (indices 13 and 14)
    getData(next(f).split(), observation, 13, True)
#-----------------------------------------------
# Parse one "Global" results file, appending one row per "Config" line to both
# dataA (13 fields) and dataB (15 fields).
#
# f      -- iterable of text lines (the opened results file).
# dataA  -- list of rows, extended and filled in place.
# dataB  -- list of rows, extended and filled in place.
# it     -- index of the last row already stored; the script starts with -1.
# Returns the index of the last row written, to be passed to the next call.
#
# Column positions below follow the columnsA / columnsB lists of this script.
#
# NOTE(review): indentation was lost in this copy of the file; the nesting of
# the statements (in particular `previousNP = npr`) must be confirmed against
# the original before editing.
def read_file(f, dataA, dataB, it):
recording = False
# Number of "Resize" lines still expected for the current run
resizes = 0
# Countdown that selects which column the next timing line fills
timer = 0
previousNP = 0
for line in f:
lineS = line.split()
if len(lineS) > 0:
if lineS[0] == "Config": # CONFIG LINE
recording = True
it += 1
dataA.append([None]*13)
dataB.append([None]*15)
#resizes = int(lineS[2].split('=')[1].split(',')[0])
# The value in the file is ignored: exactly two Resize lines are expected
resizes = 2
# Each token looks like "key=value,"; keep the text between '=' and ','
compute_tam = int(lineS[3].split('=')[1].split(',')[0])
comm_tam = int(lineS[4].split('=')[1].split(',')[0])
sdr = int(lineS[5].split('=')[1].split(',')[0])
adr = int(lineS[6].split('=')[1].split(',')[0]) #TODO Take it as a percentage
css = int(lineS[8].split('=')[1].split(',')[0])
cst = int(lineS[9].split('=')[1].split(',')[0])
# TODO Read Aib as well
time = float(lineS[10].split('=')[1])
dataB[it][0] = sdr
dataB[it][1] = adr
# Dist (4) and Iters (10) are built up as comma-separated strings
dataB[it][4] = ""
dataB[it][5] = compute_tam
dataB[it][6] = comm_tam
dataB[it][7] = cst
dataB[it][8] = css
dataB[it][9] = time
dataB[it][10] = ""
dataA[it][0] = sdr
dataA[it][1] = adr
# Dist (5) and Iters (11) are built up as comma-separated strings
dataA[it][5] = ""
dataA[it][6] = compute_tam
dataA[it][7] = comm_tam
dataA[it][8] = cst
dataA[it][9] = css
dataA[it][10] = time
dataA[it][11] = ""
elif recording and resizes != 0: # RESIZE LINE
iters = int(lineS[2].split('=')[1].split(',')[0])
npr = int(lineS[3].split('=')[1].split(',')[0])
# Token 5 is kept as text
dist = lineS[5].split('=')[1]
resizes = resizes - 1
if resizes == 0:
# Last Resize line of the run: close the strings and arm the timer
dataB[it][3] = npr
dataB[it][4] += dist
dataB[it][10] += str(iters)
dataA[it][4] = npr #FIXME Will not be correct with more than one reconfiguration
dataA[it][2] = str(previousNP) + "," + str(npr)
dataA[it][5] += dist
dataA[it][11] += str(iters)
timer = 4
else:
dataB[it][2] = npr
dataB[it][4] += dist + ","
dataB[it][10] += str(iters) + ","
dataA[it][3] = npr
dataA[it][5] += dist + ","
dataA[it][11] += str(iters) + ","
previousNP = npr
else: # SAVE TIMES
# timer 4, 3, 2, 1 fill dataB columns 11..14 (TC, TH, TS, TA in columnsB);
# any other value stores the line in dataA column 12 (TE in columnsA)
if timer == 4:
dataB[it][11] = float(lineS[1])
elif timer == 3:
dataB[it][12] = float(lineS[1])
elif timer == 2:
dataB[it][13] = float(lineS[1])
elif timer == 1:
dataB[it][14] = float(lineS[1])
else:
dataA[it][12] = float(lineS[1])
timer = timer - 1
return it
#columnsA1 = ["N", "%Async", "Groups", "Dist", "Matrix", "CommTam", "Cst", "Css", "Time", "Iters", "TE"] #8
#columnsB1 = ["N", "%Async", "NP", "NS", "Dist", "Matrix", "CommTam", "Cst", "Css", "Time", "Iters", "TC", "TS", "TA"] #12
#Config loaded: resizes=2, matrix=1000, sdr=1000000000, adr=0, aib=0, time=2.000000 || grp=1
#Resize 0: Iters=100, Procs=2, Factors=1.000000, Phy=2
#Resize 1: Iters=100, Procs=4, Factors=0.500000, Phy=2
#Tspawn: 0.249393
#Tthread: 0
#Tsync: 0.330391
#Tasync: 0
#Tex: 301.428615
#Config loaded: resizes=1, matrix=0, comm_tam=0, sdr=0, adr=0, aib=0, cst=3, css=1, time=1 || grp=1
#-----------------------------------------------
# Command-line driver.
#   argv[1]  common prefix of the result files (required)
#   argv[2]  directory holding the Run*/ sub-directories (optional)
#   argv[3]  base name of the CSV files to write (optional, default "data")
# Every "<prefix>*Global.o*" file found under <directory>Run*/ is parsed with
# read_file and the rows are written to <name>G.csv and <name>M.csv.
if len(sys.argv) < 2:
    print("The files name is missing\nUsage: python3 iterTimes.py resultsName directory csvOutName")
    sys.exit(1)

if len(sys.argv) >= 3:
    BaseDir = sys.argv[2]
    print("Searching in directory: "+ BaseDir)
else:
    # No directory given: search from the current directory. The previous
    # code read sys.argv[2] here as well, which raised IndexError.
    BaseDir = ""

if len(sys.argv) >= 4:
    print("Csv name will be: " + sys.argv[3] + "G.csv & " + sys.argv[3] + "M.csv")
    name = sys.argv[3]
else:
    name = "data"

insideDir = "Run"
lista = glob.glob("./" + BaseDir + insideDir + "*/" + sys.argv[1]+ "*Global.o*")
print("Number of files found: "+ str(len(lista)))

it = -1  # read_file increments it before writing, so the first row gets index 0
dataA = []
dataB = []
columnsA = ["N", "%Async", "Groups", "NP", "NS", "Dist", "Matrix", "CommTam", "Cst", "Css", "Time", "Iters", "TE"] #13
columnsB = ["N", "%Async", "NP", "NS", "Dist", "Matrix", "CommTam", "Cst", "Css", "Time", "Iters", "TC", "TH", "TS", "TA"] #15

for elem in lista:
    # The context manager closes the file even if parsing fails
    with open(elem, "r") as f:
        it = read_file(f, dataA, dataB, it)

dfA = pd.DataFrame(dataA, columns=columnsA)
dfA.to_csv(name + 'G.csv')

dfB = pd.DataFrame(dataB, columns=columnsB)
# Put the real value in TC and the one needed by the application in TH:
# the two columns are swapped on every row whose TH is not zero.
cond = dfB.TH != 0
dfB.loc[cond, ['TC', 'TH']] = dfB.loc[cond, ['TH', 'TC']].values
dfB.to_csv(name + 'M.csv')
Esta carpeta contiene códigos para poder analizar los resultados obtenidos.
Para utilizar los códigos es necesario Python con los módulos Numpy y Pandas.
El código analyser.ipynb necesita, además, la aplicación JupyterLab.
Los códigos son los siguientes:
- Malltimes.py: Recoge los tiempos globales de maleabilidad y ejecución de todos los ficheros pasados como argumento y
los almacena en dos ficheros CSV para ser utilizados en analyser.ipynb
- Itertimes.py: Recoge los tiempos locales de iteraciones de un grupo de procesos de todos los ficheros pasados como
argumento y los almacena en un fichero CSV para ser utilizado en analyser.ipynb
+ Ejemplo de uso de ambos códigos (Esperan los mismos argumentos):
python3 Malltimes.py NombreFicheros DirectorioFicheros/ NombreCSV
NombreFicheros: La parte común de los ficheros, los códigos buscan solo aquellos nombres que empiecen por esta cadena.
Por defecto, con poner "R" es suficiente.
DirectorioFicheros/: Nombre del directorio donde se encuentran todos los resultados. Está pensado para que busque
en todos los subdirectorios que tenga en el primer nivel, pero no en segundos niveles o más.
NombreCSV: Nombre del fichero CSV en el que escribir la recopilación de resultados.
- analyser.ipynb: Código para ser ejecutado por JupyterNotebook. Dentro del mismo hay que indicar los nombres de los
ficheros CSV a analizar y, tras ello, ejecutar las celdas. Como resultado se obtienen tres ficheros XLSX e imágenes
en el directorio "Images", y además varios resultados de T-test entre distintas configuraciones, que se muestran
en la salida estándar de JupyterNotebook.
This source diff could not be displayed because it is too large. You can view the blob instead.
import sys
import glob
import numpy as numpy
import pandas as pd
#-----------------------------------------------
# Parse one per-group iteration file.
#   dataA receives one 15-field row per recorded iteration.
#   dataB receives one 14-field row per group whose `sons` value is not 0,
#   holding the tuple of kept iteration times and their sum.
#
# f      -- iterable of text lines (the opened results file).
# dataA  -- list of rows, extended and filled in place.
# dataB  -- list of rows, extended and filled in place.
# itA    -- index of the next free row in dataA; the script starts with 0.
# itB    -- index of the next free row in dataB; the script starts with 0.
# Returns the updated (itA, itB) pair.
#
# NOTE(review): indentation was lost in this copy of the file; the nesting of
# the statements (in particular `array = []`) must be confirmed against the
# original before editing.
def read_file(f, dataA, dataB, itA, itB):
compute_tam = 0
comm_tam = 0
sdr = 0
adr = 0
dist = 0
css = 0
cst = 0
time = 0
recording = False
# Number of data lines of the current group already consumed
it_line = 0
# Offset of the current iteration inside the group being read
aux_itA = 0
aux_itB = 0
iters = 0
np = 0
np_par = 0
ns = 0
# Iteration times of the current group that end up in dataB
array = []
# Labels of the three data lines that are recorded
columnas = ['Titer','Ttype','Top']
#print(f)
for line in f:
lineS = line.split()
if len(lineS) > 1:
if recording and lineS[0].split(':')[0] in columnas: #Record data
aux_itA = 0
# Drop the label so only the values remain
lineS.pop(0)
if it_line==0:
# First data line: create one row per value and store it in column 12 (Ti)
for observation in lineS:
dataA.append([None]*15)
dataA[itA+aux_itA][0] = sdr
dataA[itA+aux_itA][1] = adr
dataA[itA+aux_itA][2] = np
dataA[itA+aux_itA][3] = np_par
dataA[itA+aux_itA][4] = ns
dataA[itA+aux_itA][5] = dist
dataA[itA+aux_itA][6] = compute_tam
dataA[itA+aux_itA][7] = comm_tam
dataA[itA+aux_itA][8] = cst
dataA[itA+aux_itA][9] = css
dataA[itA+aux_itA][10] = time
dataA[itA+aux_itA][11] = iters
dataA[itA+aux_itA][12] = float(observation)
array.append(float(observation))
aux_itA+=1
elif it_line==1:
# Second data line: column 13 (Tt). Iterations whose value is 0 are
# removed from `array`; `deleted` compensates for the index shift.
deleted = 0
for observation in lineS:
dataA[itA+aux_itA][13] = float(observation)
if float(observation) == 0:
array.pop(aux_itA - deleted)
deleted+=1
aux_itA+=1
else:
# Third data line: column 14 (To)
for observation in lineS:
dataA[itA+aux_itA][14] = float(observation)
aux_itA+=1
it_line += 1
if(it_line % 3 == 0): # Check whether this execution has been fully read
recording = False
it_line = 0
itA = itA + aux_itA
if ns != 0: # Only collect data from groups that have children
dataB.append([None]*14)
dataB[itB][0] = sdr
dataB[itB][1] = adr
dataB[itB][2] = np
dataB[itB][3] = np_par
dataB[itB][4] = ns
dataB[itB][5] = dist
dataB[itB][6] = compute_tam
dataB[itB][7] = comm_tam
dataB[itB][8] = cst
dataB[itB][9] = css
dataB[itB][10] = time
dataB[itB][11] = iters
dataB[itB][12] = tuple(array)
dataB[itB][13] = numpy.sum(array)
itB+=1
array = []
if lineS[0] == "Config:":
# Tokens look like "key=value,"; keep the text between '=' and ','
compute_tam = int(lineS[1].split('=')[1].split(',')[0])
comm_tam = int(lineS[2].split('=')[1].split(',')[0])
sdr = int(lineS[3].split('=')[1].split(',')[0])
adr = int(lineS[4].split('=')[1].split(',')[0])
css = int(lineS[6].split('=')[1].split(',')[0])
cst = int(lineS[7].split('=')[1].split(',')[0])
time = float(lineS[8].split('=')[1])
elif lineS[0] == "Config":
# "Config Group:" line: the data lines that follow are recorded
recording = True
iters = int(lineS[2].split('=')[1].split(',')[0])
dist = int(lineS[4].split('=')[1].split(',')[0])
np = int(lineS[5].split('=')[1].split(',')[0])
np_par = int(lineS[6].split('=')[1].split(',')[0])
ns = int(float(lineS[7].split('=')[1]))
return itA,itB
#-----------------------------------------------
#Config: matrix=1000, sdr=1000000000, adr=0, aib=0 time=2.000000
#Config Group: iters=100, factor=1.000000, phy=2, procs=2, parents=0, sons=4
#Ttype: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0
# Command-line driver.
#   argv[1]  common prefix of the result files (required)
#   argv[2]  directory holding the Run*/ sub-directories (optional)
#   argv[3]  base name of the CSV files to write (optional, default "data")
# Every "<prefix>*ID*.o*" file found under <directory>Run*/ is parsed with
# read_file; per-iteration rows go to <name>.csv and per-group rows to
# <name>_Total.csv.
if len(sys.argv) < 2:
    print("The files name is missing\nUsage: python3 iterTimes.py resultsName directory csvOutName")
    sys.exit(1)

if len(sys.argv) >= 3:
    BaseDir = sys.argv[2]
    print("Searching in directory: "+ BaseDir)
else:
    # No directory given: search from the current directory. The previous
    # code read sys.argv[2] here as well, which raised IndexError.
    BaseDir = ""

if len(sys.argv) >= 4:
    print("Csv name will be: " + sys.argv[3] + ".csv and "+ sys.argv[3] + "_Total.csv")
    name = sys.argv[3]
else:
    name = "data"

insideDir = "Run"
lista = glob.glob("./" + BaseDir + insideDir + "*/" + sys.argv[1]+ "*ID*.o*")
print("Number of files found: "+ str(len(lista)))

itA = itB = 0
dataA = []
dataB = [] #0 #1 #2 #3 #4 #5 #6 #7 #8 #9 #10 #11 #12 #13 #14
columnsA = ["N", "%Async", "NP", "N_par", "NS", "Dist", "Compute_tam", "Comm_tam", "Cst", "Css","Time", "Iters", "Ti", "Tt", "To"] #15
columnsB = ["N", "%Async", "NP", "N_par", "NS", "Dist", "Compute_tam", "Comm_tam", "Cst", "Css","Time", "Iters", "Ti", "Sum"] #14

for elem in lista:
    # The context manager closes the file even if parsing fails
    with open(elem, "r") as f:
        itA, itB = read_file(f, dataA, dataB, itA, itB)

dfA = pd.DataFrame(dataA, columns=columnsA)
dfB = pd.DataFrame(dataB, columns=columnsB)

# "N" initially holds the sdr value and "%Async" the adr value; turn them into
# the total (sdr + adr) and the asynchronous share of that total in percent.
dfA['N'] += dfA['%Async']
dfA['%Async'] = (dfA['%Async'] / dfA['N']) * 100
dfA.to_csv(name + '.csv')

dfB['N'] += dfB['%Async']
dfB['%Async'] = (dfB['%Async'] / dfB['N']) * 100
dfB.to_csv(name + '_Total.csv')
import sys
import glob
import numpy as numpy
import pandas as pd
# Command-line driver: concatenate two CSV files into one.
#   argv[1], argv[2]  CSV files to join (required)
#   argv[3]           base name of the output CSV (optional, default "dataJOINED")
if len(sys.argv) < 3:
    print("The files name is missing\nUsage: python3 joinDf.py resultsName1.csv resultsName2.csv csvOutName")
    # sys.exit is used because the bare exit() helper is provided by the site
    # module for interactive use and is not guaranteed to exist in a program.
    sys.exit(1)

if len(sys.argv) >= 4:
    print("Csv name will be: " + sys.argv[3] + ".csv")
    name = sys.argv[3]
else:
    name = "dataJOINED"

df1 = pd.read_csv( sys.argv[1] )
df2 = pd.read_csv( sys.argv[2] )

df3 = pd.concat([df1, df2])
# The first column of each input is dropped before the result is written
df3 = df3.drop(columns=df3.columns[0])
df3.to_csv(name + '.csv')
......@@ -33,12 +33,18 @@ static int handler(void* user, const char* section, const char* name,
} else if (MATCH("general", "matrix_tam")) {
pconfig->matrix_tam = atoi(value);
} else if (MATCH("general", "comm_tam")) {
pconfig->comm_tam = atoi(value);
} else if (MATCH("general", "SDR")) {
pconfig->sdr = atoi(value);
} else if (MATCH("general", "ADR")) {
pconfig->adr = atoi(value);
} else if (MATCH("general", "AIB")) {
} else if (MATCH("general", "AIB")) { //TODO Refactor cambiar nombre
pconfig->aib = atoi(value);
} else if (MATCH("general", "CST")) {
pconfig->cst = atoi(value);
} else if (MATCH("general", "CSS")) {
pconfig->css = atoi(value);
} else if (MATCH("general", "time")) {
pconfig->general_time = atof(value);
......@@ -134,8 +140,8 @@ void free_config(configuration *user_config) {
void print_config(configuration *user_config, int grp) {
if(user_config != NULL) {
int i;
printf("Config loaded: resizes=%d, matrix=%d, sdr=%d, adr=%d, aib=%d, time=%f || grp=%d\n",
user_config->resizes, user_config->matrix_tam, user_config->sdr, user_config->adr, user_config->aib, user_config->general_time, grp);
printf("Config loaded: resizes=%d, matrix=%d, comm_tam=%d, sdr=%d, adr=%d, aib=%d, css=%d, cst=%d, time=%f || grp=%d\n",
user_config->resizes, user_config->matrix_tam, user_config->comm_tam, user_config->sdr, user_config->adr, user_config->aib, user_config->css, user_config->cst, user_config->general_time, grp);
for(i=0; i<user_config->resizes; i++) {
printf("Resize %d: Iters=%d, Procs=%d, Factors=%f, Phy=%d\n",
i, user_config->iters[i], user_config->procs[i], user_config->factors[i], user_config->phy_dist[i]);
......@@ -159,8 +165,8 @@ void print_config_group(configuration *user_config, int grp) {
sons = user_config->procs[grp+1];
}
printf("Config: matrix=%d, sdr=%d, adr=%d, aib=%d time=%f\n",
user_config->matrix_tam, user_config->sdr, user_config->adr, user_config->aib, user_config->general_time);
printf("Config: matrix=%d, comm_tam=%d, sdr=%d, adr=%d, aib=%d, css=%d, cst=%d, time=%f\n",
user_config->matrix_tam, user_config->comm_tam, user_config->sdr, user_config->adr, user_config->aib, user_config->css, user_config->cst, user_config->general_time);
printf("Config Group: iters=%d, factor=%f, phy=%d, procs=%d, parents=%d, sons=%d\n",
user_config->iters[grp], user_config->factors[grp], user_config->phy_dist[grp], user_config->procs[grp], parents, sons);
}
......@@ -245,15 +251,15 @@ configuration *recv_config_file(int root, MPI_Comm intercomm) {
* de la estructura de configuracion con una sola comunicacion.
*/
void def_struct_config_file(configuration *config_file, MPI_Datatype *config_type) {
int i, counts = 8;
int blocklengths[8] = {1, 1, 1, 1, 1, 1, 1, 1};
int i, counts = 11;
int blocklengths[11] = {1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1};
MPI_Aint displs[counts], dir;
MPI_Datatype types[counts];
// Rellenar vector types
types[0] = types[1] = types[2] = types[3] = types[4] = types[5] = MPI_INT;
types[6] = MPI_FLOAT;
types[7] = MPI_DOUBLE;
types[0] = types[1] = types[2] = types[3] = types[4] = types[5] = types[6] = types[7] = types[8] = MPI_INT;
types[9] = MPI_FLOAT;
types[10] = MPI_DOUBLE;
// Rellenar vector displs
MPI_Get_address(config_file, &dir);
......@@ -261,11 +267,14 @@ void def_struct_config_file(configuration *config_file, MPI_Datatype *config_typ
MPI_Get_address(&(config_file->resizes), &displs[0]);
MPI_Get_address(&(config_file->actual_resize), &displs[1]);
MPI_Get_address(&(config_file->matrix_tam), &displs[2]);
MPI_Get_address(&(config_file->sdr), &displs[3]);
MPI_Get_address(&(config_file->adr), &displs[4]);
MPI_Get_address(&(config_file->aib), &displs[5]);
MPI_Get_address(&(config_file->general_time), &displs[6]);
MPI_Get_address(&(config_file->Top), &displs[7]);
MPI_Get_address(&(config_file->comm_tam), &displs[3]);
MPI_Get_address(&(config_file->sdr), &displs[4]);
MPI_Get_address(&(config_file->adr), &displs[5]);
MPI_Get_address(&(config_file->aib), &displs[6]);
MPI_Get_address(&(config_file->css), &displs[7]);
MPI_Get_address(&(config_file->cst), &displs[8]);
MPI_Get_address(&(config_file->general_time), &displs[9]);
MPI_Get_address(&(config_file->Top), &displs[10]);
for(i=0;i<counts;i++) displs[i] -= dir;
......
......@@ -7,7 +7,8 @@ typedef struct
{
int resizes;
int actual_resize;
int matrix_tam, sdr, adr;
int matrix_tam, comm_tam, sdr, adr;
int css, cst;
int aib;
float general_time;
double Top;
......
......@@ -11,7 +11,7 @@ void def_results_type(results_data *results, int resizes, MPI_Datatype *results_
//======================================================||
//======================================================||
//TODO Generalizar ambas funciones en una sola
/*
* Envia una estructura de resultados al grupo de procesos al que se
* enlaza este grupo a traves del intercomunicador pasado como argumento.
......@@ -57,17 +57,17 @@ void recv_results(results_data *results, int root, int resizes, MPI_Comm interco
* Define un tipo derivado de MPI para mandar los tiempos
* con una sola comunicacion.
*
* En concreto son tres escales y un vector de tamaño "resizes"
* En concreto son tres escalares y dos vectores de tamaño "resizes"
*/
void def_results_type(results_data *results, int resizes, MPI_Datatype *results_type) {
int i, counts = 4;
int blocklengths[4] = {1, 1, 1, 1};
int i, counts = 5;
int blocklengths[] = {1, 1, 1, 1, 1};
MPI_Aint displs[counts], dir;
MPI_Datatype types[counts];
// Rellenar vector types
types[0] = types[1] = types[2] = types[3] = MPI_DOUBLE;
blocklengths[3] = resizes;
types[0] = types[1] = types[2] = types[3] = types[4] = MPI_DOUBLE;
blocklengths[3] = blocklengths[4] = resizes;
// Rellenar vector displs
MPI_Get_address(results, &dir);
......@@ -75,13 +75,65 @@ void def_results_type(results_data *results, int resizes, MPI_Datatype *results_
MPI_Get_address(&(results->sync_start), &displs[0]);
MPI_Get_address(&(results->async_start), &displs[1]);
MPI_Get_address(&(results->exec_start), &displs[2]);
MPI_Get_address(&(results->spawn_time[0]), &displs[3]); //TODO Revisar si se puede simplificar
MPI_Get_address(&(results->spawn_real_time[0]), &displs[3]);
MPI_Get_address(&(results->spawn_time[0]), &displs[4]); //TODO Revisar si se puede simplificar //FIXME Si hay mas de un spawn error?
for(i=0;i<counts;i++) displs[i] -= dir;
MPI_Type_create_struct(counts, blocklengths, displs, types, results_type);
MPI_Type_commit(results_type);
}
//======================================================||
//======================================================||
//================SET RESULTS FUNCTIONS=================||
//======================================================||
//======================================================||
/*
 * Stores the data-redistribution times of group "grp" after a
 * reconfiguration. To be called by the children once the redistribution
 * has finished and the configuration has been received.
 *
 * A phase is recorded as 0 when its amount of data ("sdr" for the
 * synchronous phase, "adr" for the asynchronous one) is 0; otherwise the
 * difference between its end and start timestamps is stored.
 */
void set_results_post_reconfig(results_data *results, int grp, int sdr, int adr) {
  results->sync_time[grp] = sdr ? results->sync_end - results->sync_start : 0;
  results->async_time[grp] = adr ? results->async_end - results->async_start : 0;
}
/*
 * Sets to 0 the index of the next element to write in the vectors related
 * to the iterations.
 * As a result, every value previously stored in those vectors becomes
 * invalid for any external code that tries to read it.
 *
 * This function only needs to be called after an expansion performed with
 * the MERGE method.
 */
void reset_results_index(results_data *results) {
results->iter_index = 0;
}
/*
 * Reduces, for every recorded iteration, the time of all the processes in
 * "comm" to their maximum, leaving the result in the "iters_time" vector of
 * the process "root".
 *
 * The maximum is taken because it is the value that represents the real
 * time the iteration needed.
 */
void compute_results_iter(results_data *results, int myId, int root, MPI_Comm comm) {
  if(myId != root) {
    // Contributors only send; their receive buffer is not used
    MPI_Reduce(results->iters_time, NULL, results->iter_index, MPI_DOUBLE, MPI_MAX, root, comm);
    return;
  }

  // The root reduces in place, overwriting its own vector with the maxima
  MPI_Reduce(MPI_IN_PLACE, results->iters_time, results->iter_index, MPI_DOUBLE, MPI_MAX, root, comm);
}
//======================================================||
//======================================================||
......@@ -95,22 +147,22 @@ void def_results_type(results_data *results, int resizes, MPI_Datatype *results_
* por iteracion, el tipo (Normal o durante communicacion asincrona)
* y cuantas operaciones internas se han realizado en cada iteracion.
*/
void print_iter_results(results_data *results, int last_normal_iter_index) {
void print_iter_results(results_data results, int last_normal_iter_index) {
int i, aux;
printf("Titer: ");
for(i=0; i< results->iter_index; i++) {
printf("%lf ", results->iters_time[i]);
for(i=0; i< results.iter_index; i++) {
printf("%lf ", results.iters_time[i]);
}
printf("\nTtype: "); //FIXME modificar a imprimir solo la cantidad de asincronas
for(i=0; i< results->iter_index; i++) {
printf("%d ", results->iters_type[i] == 0);
for(i=0; i< results.iter_index; i++) {
printf("%d ", results.iters_type[i] == 0);
}
printf("\nTop: "); //FIXME modificar a imprimir solo cuantas operaciones cuestan una iteracion
for(i=0; i< results->iter_index; i++) {
aux = results->iters_type[i] == 0 ? results->iters_type[last_normal_iter_index] : results->iters_type[i];
printf("\nTop: "); //TODO modificar a imprimir solo cuantas operaciones cuestan una iteracion?
for(i=0; i< results.iter_index; i++) {
aux = results.iters_type[i] == 0 ? results.iters_type[last_normal_iter_index] : results.iters_type[i];
printf("%d ", aux);
}
printf("\n");
......@@ -121,25 +173,30 @@ void print_iter_results(results_data *results, int last_normal_iter_index) {
* Estos son el tiempo de creacion de procesos, los de comunicacion
* asincrona y sincrona y el tiempo total de ejecucion.
*/
void print_global_results(results_data *results, int resizes) {
void print_global_results(results_data results, int resizes) {
int i;
printf("Tspawn: ");
printf("Tspawn: "); // FIXME REFACTOR Cambiar nombre a T_resize_real
for(i=0; i< resizes - 1; i++) {
printf("%lf ", results->spawn_time[i]);
printf("%lf ", results.spawn_time[i]);
}
printf("\nTspawn_real: "); // FIXME REFACTOR Cambiar nombre a T_resize
for(i=0; i< resizes - 1; i++) {
printf("%lf ", results.spawn_real_time[i]);
}
printf("\nTsync: ");
for(i=1; i < resizes; i++) {
printf("%lf ", results->sync_time[i]);
printf("%lf ", results.sync_time[i]);
}
printf("\nTasync: ");
for(i=1; i < resizes; i++) {
printf("%lf ", results->async_time[i]);
printf("%lf ", results.async_time[i]);
}
printf("\nTex: %lf\n", results->exec_time);
printf("\nTex: %lf\n", results.exec_time);
}
//======================================================||
......@@ -154,27 +211,50 @@ void print_global_results(results_data *results, int resizes) {
* Los argumentos "resizes" y "iters_size" se necesitan para obtener el tamaño
* de los vectores de resultados.
*/
void init_results_data(results_data **results, int resizes, int iters_size) {
*results = malloc(1 * sizeof(results_data));
void init_results_data(results_data *results, int resizes, int iters_size) {
//*results = malloc(1 * sizeof(results_data)); FIXME Borrar
results->spawn_time = calloc(resizes, sizeof(double));
results->spawn_real_time = calloc(resizes, sizeof(double));
results->sync_time = calloc(resizes, sizeof(double));
results->async_time = calloc(resizes, sizeof(double));
(*results)->spawn_time = calloc(resizes, sizeof(double));
(*results)->sync_time = calloc(resizes, sizeof(double));
(*results)->async_time = calloc(resizes, sizeof(double));
results->iters_size = iters_size + 100;
results->iters_time = calloc(iters_size + 100, sizeof(double)); //FIXME Numero magico
results->iters_type = calloc(iters_size + 100, sizeof(int));
results->iter_index = 0;
(*results)->iters_time = calloc(iters_size * 20, sizeof(double)); //FIXME Numero magico - Añadir funcion que amplie tamaño
(*results)->iters_type = calloc(iters_size * 20, sizeof(int));
(*results)->iter_index = 0;
}
/*
 * Resizes both per-iteration result vectors ("iters_time" and "iters_type")
 * so that each can hold "needed" elements, and records the new capacity in
 * "iters_size".
 *
 * If either reallocation fails, an error is written to stderr and the
 * application is aborted through MPI_Abort.
 */
void realloc_results_iters(results_data *results, int needed) {
  double *time_aux;
  int *type_aux;

  time_aux = realloc(results->iters_time, (size_t) needed * sizeof *time_aux);
  type_aux = realloc(results->iters_type, (size_t) needed * sizeof *type_aux);

  if(time_aux == NULL || type_aux == NULL) {
    fprintf(stderr, "Fatal error - No se ha podido realojar la memoria de resultados\n");
    MPI_Abort(MPI_COMM_WORLD, 1);
  }

  results->iters_time = time_aux;
  results->iters_type = type_aux;
  // Keep the recorded capacity in sync with the vectors. Callers compare
  // "iter_index" against "iters_size" to decide when to grow; without this
  // update the vectors would only grow once and later writes would overflow.
  results->iters_size = needed;
}
/*
* Libera toda la memoria asociada con una estructura de resultados.
* TODO Asegurar que ha sido inicializado?
*/
void free_results_data(results_data **results) {
free((*results)->spawn_time);
free((*results)->sync_time);
free((*results)->async_time);
free((*results)->iters_time);
free((*results)->iters_type);
free(*results);
void free_results_data(results_data *results) {
if(results != NULL) {
free(results->spawn_time);
free(results->spawn_real_time);
free(results->sync_time);
free(results->async_time);
free(results->iters_time);
free(results->iters_type);
}
//free(*results); FIXME Borrar
}
......@@ -2,23 +2,31 @@
#include <stdlib.h>
#include <mpi.h>
#define RESULTS_INIT_DATA_QTY 100
typedef struct {
// Iters data
double *iters_time;
int *iters_type, iter_index;
int *iters_type, iter_index, iters_size;
// Spawn, Sync and Async time
double spawn_start, *spawn_time;
double sync_start, *sync_time;
double async_start, *async_time;
// Spawn, Thread, Sync, Async and Exec time
double spawn_start, *spawn_time, *spawn_real_time;
double sync_start, sync_end, *sync_time;
double async_start, async_end, *async_time;
double exec_start, exec_time;
//Overcharge time is time spent in malleability that is from IO modules
} results_data;
void send_results(results_data *results, int root, int resizes, MPI_Comm intercomm);
void recv_results(results_data *results, int root, int resizes, MPI_Comm intercomm);
void print_iter_results(results_data *results, int last_normal_iter_index);
void print_global_results(results_data *results, int resizes);
void init_results_data(results_data **results, int resizes, int iters_size);
void free_results_data(results_data **results);
void set_results_post_reconfig(results_data *results, int grp, int sdr, int adr);
void reset_results_index(results_data *results);
void compute_results_iter(results_data *results, int myId, int root, MPI_Comm comm);
void print_iter_results(results_data results, int last_normal_iter_index);
void print_global_results(results_data results, int resizes);
void init_results_data(results_data *results, int resizes, int iters_size);
void realloc_results_iters(results_data *results, int needed);
void free_results_data(results_data *results);
......@@ -2,36 +2,25 @@
#include <stdlib.h>
#include <mpi.h>
#include <fcntl.h>
#include <unistd.h>
#include <sys/stat.h>
#include <pthread.h>
#include "computing_func.h"
#include "../IOcodes/read_ini.h"
#include "../IOcodes/results.h"
#include "../malleability/ProcessDist.h"
#include "../malleability/CommDist.h"
#include "../malleability/malleabilityManager.h"
#include "../malleability/malleabilityStates.h"
#define ROOT 0
int work();
void Sons_init();
int checkpoint(int iter, int state, MPI_Request **comm_req);
void TC(int numS);
int start_redistribution(int numS, MPI_Request **comm_req);
int check_redistribution(int iter, MPI_Request **comm_req);
int end_redistribution(int iter);
int thread_creation();
int thread_check();
void* thread_async_work(void* void_arg);
void iterate(double *matrix, int n, int async_comm);
void iterate(double *matrix, int n, int async_comm, int iter);
void init_group_struct(char *argv[], int argc, int myId, int numP);
void init_application();
void obtain_op_times();
void free_application_data();
void print_general_info(int myId, int grp, int numP);
int print_local_results();
int print_final_results();
int create_out_file(char *nombre, int *ptr, int newstdout);
......@@ -43,58 +32,152 @@ typedef struct {
int argc;
int numS; // Cantidad de procesos hijos
int commAsync;
MPI_Comm children, parents;
char *compute_comm_array;
char **argv;
char *sync_array, *async_array;
} group_data;
typedef struct {
int myId, numP, numS, adr;
MPI_Comm children;
char *sync_array;
} thread_data;
configuration *config_file;
group_data *group;
results_data *results;
MPI_Comm comm;
int run_id = 0; // Utilizado para diferenciar más fácilmente ejecuciones en el análisis
pthread_t async_thread; // TODO Cambiar de sitio?
int main(int argc, char *argv[]) {
int numP, myId, res;
int req;
int im_child;
MPI_Init_thread(&argc, &argv, MPI_THREAD_SINGLE, &req);
//FIXME El codigo no es capaz de hacer mas de una redistribucion - Arreglar malleabilityTypes.c
int num_cpus, num_nodes; //nodelist_len; //FIXME Eliminar cuando se utilice Slurm
char *nodelist = NULL;
num_cpus = 20; //FIXME NUMERO MAGICO
if (argc >= 5) {
nodelist = argv[3];
//nodelist_len = strlen(nodelist);
num_nodes = atoi(argv[4]);
num_cpus = num_nodes * num_cpus;
}
MPI_Init_thread(&argc, &argv, MPI_THREAD_MULTIPLE, &req);
MPI_Comm_size(MPI_COMM_WORLD, &numP);
MPI_Comm_rank(MPI_COMM_WORLD, &myId);
comm = MPI_COMM_WORLD;
if(req != MPI_THREAD_MULTIPLE) {
printf("No se ha obtenido la configuración de hilos necesaria\nSolicitada %d -- Devuelta %d\n", req, MPI_THREAD_MULTIPLE);
}
init_group_struct(argv, argc, myId, numP);
//FIXME No funciona en OpenMPI
im_child = init_malleability(myId, numP, ROOT, comm, argv[0], nodelist, num_cpus, num_nodes);
MPI_Comm_get_parent(&(group->parents));
if(group->parents == MPI_COMM_NULL ) { // Si son el primer grupo de procesos, recogen la configuracion inicial
if(!im_child) { //TODO REFACTOR Simplificar inicio
init_application();
} else { // Si son procesos hijos deben comunicarse con las padres
Sons_init();
set_benchmark_grp(group->grp);
set_benchmark_configuration(config_file);
set_benchmark_results(results);
MPI_Barrier(comm);
results->exec_start = MPI_Wtime();
} else { //Init hijos
get_malleability_user_comm(&comm);
get_benchmark_configuration(&config_file);
get_benchmark_results(&results);
set_results_post_reconfig(results, group->grp, config_file->sdr, config_file->adr); //TODO Cambio al añadir nueva redistribucion
if(config_file->comm_tam) {
group->compute_comm_array = malloc(config_file->comm_tam * sizeof(char));
}
// TODO Refactor - Que sea una unica funcion
// Obtiene las variables que van a utilizar los hijos
void *value = NULL;
malleability_get_data(&value, 0, 1, 1);
group->grp = *((int *)value);
free(value);
malleability_get_data(&value, 1, 1, 1);
run_id = *((int *)value);
free(value);
malleability_get_data(&value, 2, 1, 1);
group->iter_start = *((int *)value);
free(value);
//FIXME Eliminar cuando se utilice SLURM
/*
malleability_get_data(&value, 4, 1, 1);
num_nodes = *((int *)value);
free(value);
malleability_get_data(&value, 5, 1, 1);
nodelist = (char *)value;
//free(value);
nodelist_len = strlen(nodelist);
*/
group->grp = group->grp + 1;
}
//
// EMPIEZA LA EJECUCION-------------------------------
//
group->grp = group->grp - 1; // TODO REFACTOR???
do {
group->grp = group->grp + 1;
set_benchmark_grp(group->grp);
get_malleability_user_comm(&comm);
MPI_Comm_size(comm, &(group->numP));
MPI_Comm_rank(comm, &(group->myId));
if(config_file->resizes != group->grp + 1) {
set_malleability_configuration(config_file->cst, config_file->css, config_file->phy_dist[group->grp+1], -1, config_file->aib, -1);
set_children_number(config_file->procs[group->grp+1]); // TODO TO BE DEPRECATED
if(group->grp == 0) {
MPI_Barrier(MPI_COMM_WORLD);
results->exec_start = MPI_Wtime();
malleability_add_data(&(group->grp), 1, MAL_INT, 1, 1);
malleability_add_data(&run_id, 1, MAL_INT, 1, 1);
malleability_add_data(&(group->iter_start), 1, MAL_INT, 1, 1);
//FIXME Eliminar cuando se utilice SLURM
//malleability_add_data(&num_nodes, 1, MAL_INT, 1, 1);
//malleability_add_data(&nodelist, nodelist_len, MAL_CHAR, 1, 1);
}
}
res = work();
if(res == MAL_ZOMBIE) break;
print_local_results();
reset_results_index(results);
} while((config_file->resizes > group->grp + 1) && (config_file->cst == COMM_SPAWN_MERGE || config_file->cst == COMM_SPAWN_MERGE_PTHREAD));
//
// TERMINA LA EJECUCION ----------------------------------------------------------
//
if(res) { // Se he llegado al final de la aplicacion
MPI_Barrier(MPI_COMM_WORLD);
if(res==1) { // Se he llegado al final de la aplicacion
MPI_Barrier(comm); // TODO Posible error al utilizar SHRINK
results->exec_time = MPI_Wtime() - results->exec_start;
}
print_final_results(); // Pasado este punto ya no pueden escribir los procesos
print_final_results();
if(comm != MPI_COMM_WORLD && comm != MPI_COMM_NULL) {
MPI_Comm_free(&comm);
}
if(group->myId == ROOT && (config_file->cst == COMM_SPAWN_MERGE || config_file->cst == COMM_SPAWN_MERGE_PTHREAD)) {
MPI_Abort(MPI_COMM_WORLD, -100);
}
free_application_data();
MPI_Finalize();
return 0;
}
......@@ -115,274 +198,35 @@ int main(int argc, char *argv[]) {
*/
int work() {
int iter, maxiter, state, res;
double *matrix;
MPI_Request *async_comm;
double *matrix = NULL;
maxiter = config_file->iters[group->grp];
//initMatrix(&matrix, config_file->matrix_tam);
state = MAL_COMM_UNINITIALIZED;
state = MAL_NOT_STARTED;
res = 0;
for(iter=group->iter_start; iter < maxiter; iter++) {
iterate(matrix, config_file->matrix_tam, state);
iterate(matrix, config_file->matrix_tam, state, iter);
}
state = checkpoint(iter, state, &async_comm);
if(config_file->resizes != group->grp + 1)
state = malleability_checkpoint();
iter = 0;
while(state == MAL_ASYNC_PENDING) {
iterate(matrix, config_file->matrix_tam, state);
while(state == MAL_DIST_PENDING || state == MAL_SPAWN_PENDING || state == MAL_SPAWN_SINGLE_PENDING) {
if(iter < config_file->iters[group->grp+1]) {
iterate(matrix, config_file->matrix_tam, state, iter);
iter++;
state = checkpoint(iter, state, &async_comm);
group->iter_start = iter;
}
state = malleability_checkpoint();
}
if(config_file->resizes - 1 == group->grp) res=1;
if(state == MAL_ZOMBIE) res=state;
return res;
}
/*
 * Performs the resize of the process group from the parents' side.
 *
 * The new processes are created with the configured physical distribution
 * and the information is then sent to them.
 *
 * If there is asynchronous data to send, that transfer is started first and
 * the function returns; it has to be called again to find out whether the
 * transfer has finished. Synchronous data, if any, is not sent yet.
 *
 * If there is only synchronous data, it is sent right after the processes
 * are created and the two groups of processes are then disconnected.
 *
 * Returns the new state of the redistribution.
 */
int checkpoint(int iter, int state, MPI_Request **comm_req) {
  if(state == MAL_COMM_UNINITIALIZED) {
    // A resize only happens once this group has run all of its iterations
    // and it is not the last configured group
    int resize_due = config_file->iters[group->grp] <= iter
                     && config_file->resizes != group->grp + 1;
    if(!resize_due) {
      return MAL_COMM_UNINITIALIZED;
    }

    group->numS = config_file->procs[group->grp +1];

    // Time spent creating the children
    results->spawn_start = MPI_Wtime();
    TC(group->numS);
    results->spawn_time[group->grp] = MPI_Wtime() - results->spawn_start;

    return start_redistribution(group->numS, comm_req);
  }

  if(state == MAL_ASYNC_PENDING) {
    int new_state = thread_check();
    if(new_state == MAL_COMM_COMPLETED) {
      end_redistribution(iter);
    }
    //new_state = check_redistribution(iter, comm_req);
    return new_state;
  }

  return state;
}
/*
 * Creates the child processes.
 */
void TC(int numS){
  int spawn_status;
  // Physical distribution configured for the next group of processes
  int phy_dist = config_file->phy_dist[group->grp +1];

  // Start the communication with SLURM
  init_slurm_comm(group->argv, group->myId, numS, ROOT, phy_dist, COMM_SPAWN_SERIAL);

  // Poll until the communication and the creation of processes have finished
  do {
    spawn_status = check_slurm_comm(group->myId, ROOT, MPI_COMM_WORLD, &(group->children));
  } while(spawn_status != MPI_SUCCESS);
}
/*
 * Starts the redistribution of data towards the new group of processes.
 *
 * The group number, the run identifier and the configuration are sent to the
 * children first. If there is asynchronous data ("adr" > 0), the background
 * transfer is started and its state is returned; otherwise the redistribution
 * is completed right away through end_redistribution().
 */
int start_redistribution(int numS, MPI_Request **comm_req) {
  // Intercommunicator broadcast: the sending root uses MPI_ROOT, the rest of
  // the parents use MPI_PROC_NULL
  int rootBcast = (group->myId == ROOT) ? MPI_ROOT : MPI_PROC_NULL;

  // Tell the children which group of processes they are
  MPI_Bcast(&(group->grp), 1, MPI_INT, rootBcast, group->children);
  MPI_Bcast(&run_id, 1, MPI_INT, rootBcast, group->children);
  send_config_file(config_file, rootBcast, group->children);

  if(!(config_file->adr > 0)) {
    return end_redistribution(0);
  }

  results->async_start = MPI_Wtime();
  return thread_creation();
}
/*
 * Creates a thread that runs a communication in the background.
 *
 * Returns MAL_ASYNC_PENDING when the thread has been created. On failure the
 * application is aborted (-1 is the formal return value).
 */
int thread_creation() {
  int err = pthread_create(&async_thread, NULL, thread_async_work, NULL);

  if(err == 0) {
    return MAL_ASYNC_PENDING;
  }

  printf("Error al crear el hilo\n");
  MPI_Abort(MPI_COMM_WORLD, -1);
  return -1;
}
/*
 * Check made by the master thread to find out whether the worker thread has
 * finished its background communication.
 *
 * Returns the state of the communication: MAL_ASYNC_PENDING while it is still
 * running, MAL_COMM_COMPLETED once the worker has been joined. If the join
 * fails the application is aborted (-2 is the formal return value).
 */
int thread_check() {
  if(group->commAsync != MAL_COMM_COMPLETED) {
    return MAL_ASYNC_PENDING;
  }

  if(pthread_join(async_thread, NULL) != 0) {
    printf("Error al esperar al hilo\n");
    MPI_Abort(MPI_COMM_WORLD, -1);
    return -2;
  }

  return MAL_COMM_COMPLETED;
}
/*
* Function executed by a thread.
* Runs a synchronous communication with the children which, from the
* user's point of view, can be considered to happen in the background.
*
* When the communication ends, the master thread can find out through
* the value of "commAsync".
*
* The argument "void_arg" is not used.
*
* NOTE(review): "commAsync" is written here and read in thread_check()
* with no synchronization visible in this file -- confirm that this
* plain flag is enough for the handshake between both threads.
*/
void* thread_async_work(void* void_arg) {
// Blocking send of the asynchronous data array to the children
send_sync(group->async_array, config_file->adr, group->myId, group->numP, ROOT, group->children, group->numS);
// Signal completion to the master thread
group->commAsync = MAL_COMM_COMPLETED;
pthread_exit(NULL);
}
/*
 * @deprecated
 * Checks whether the asynchronous redistribution has finished.
 * If it has not, the function returns saying so; otherwise it goes on with
 * the synchronous communication, the sending of results and the
 * disconnection of the groups of processes.
 *
 * Two modes are supported when checking for completion:
 * with "MAL_USE_NORMAL" the transfer is considered finished when the parents
 * have finished sending; with "MAL_USE_IBARRIER" it is considered finished
 * when the children have finished receiving.
 */
int check_redistribution(int iter, MPI_Request **comm_req) {
  int completed, all_completed, test_err;
  // Request 0 is the one tested in MAL_USE_NORMAL mode; request 1 otherwise
  // (MAL_USE_IBARRIER)
  int watched = (config_file->aib == MAL_USE_NORMAL) ? 0 : 1;
  MPI_Request *req_completed = &(*comm_req)[watched];

  test_err = MPI_Test(req_completed, &completed, MPI_STATUS_IGNORE);
  if (!(test_err == MPI_SUCCESS || test_err == MPI_ERR_PENDING)) {
    printf("P%d aborting -- Test Async\n", group->myId);
    MPI_Abort(MPI_COMM_WORLD, test_err);
  }

  // Continue only if the asynchronous send has ended on every process
  MPI_Allreduce(&completed, &all_completed, 1, MPI_INT, MPI_MIN, MPI_COMM_WORLD);
  if(all_completed == 0) {
    return MAL_ASYNC_PENDING;
  }

  MPI_Wait(req_completed, MPI_STATUS_IGNORE);
  if(config_file->aib == MAL_USE_IBARRIER) {
    // Mark the asynchronous send as completed. MPI has to be told that it
    // has finished before both groups can be disconnected, even though this
    // point can only be reached once it has finished.
    MPI_Wait(&(*comm_req)[0], MPI_STATUS_IGNORE);
  }

  free(*comm_req);
  return end_redistribution(iter);
}
/*
 * Ends the redistribution of data with the children.
 *
 * If iterations were executed while a background communication was running
 * ("iter" > 0), the children are told in which iteration to start. The
 * synchronous communication is then performed, if there is any, and finally
 * the timing results are sent to the children before disconnecting from them.
 *
 * Always returns MAL_COMM_COMPLETED.
 */
int end_redistribution(int iter) {
  int rootBcast = (group->myId == ROOT) ? MPI_ROOT : MPI_PROC_NULL;

  // Tell the children the iteration in which to start
  if(iter > 0) {
    MPI_Bcast(&iter, 1, MPI_INT, rootBcast, group->children);
  }

  // Synchronous send
  if(config_file->sdr > 0) {
    results->sync_start = MPI_Wtime();
    send_sync(group->sync_array, config_file->sdr, group->myId, group->numP, ROOT, group->children, group->numS);
  }

  send_results(results, rootBcast, config_file->resizes, group->children);

  // Disconnect the intercommunicator with the children
  MPI_Comm_disconnect(&(group->children));

  return MAL_COMM_COMPLETED;
}
/*
 * Initialization of the children's data.
 * The children receive from the parents the configuration of the execution
 * and the data sent synchronously, asynchronously or both, followed by the
 * timing results gathered so far. The intercommunicator with the parents is
 * disconnected at the end.
 */
void Sons_init() {
  // Receive from the parents which group of processes this one is
  MPI_Bcast(&(group->grp), 1, MPI_INT, ROOT, group->parents);
  MPI_Bcast(&run_id, 1, MPI_INT, ROOT, group->parents);
  group->grp++;

  config_file = recv_config_file(ROOT, group->parents);
  int numP_parents = config_file->procs[group->grp -1];

  // The time vectors are indexed with "group->grp", which reaches
  // "resizes - 1" for the last group, so they need "resizes" elements
  // (the same size used by the first group in init_application).
  init_results_data(&results, config_file->resizes, config_file->iters[group->grp]);

  if(config_file->adr > 0) { // Receive asynchronous data
    recv_sync(&(group->async_array), config_file->adr, group->myId, group->numP, ROOT, group->parents, numP_parents);
    results->async_time[group->grp] = MPI_Wtime();
    // Iteration in which this group has to start
    MPI_Bcast(&(group->iter_start), 1, MPI_INT, ROOT, group->parents);
  }
  if(config_file->sdr > 0) { // Receive synchronous data
    recv_sync(&(group->sync_array), config_file->sdr, group->myId, group->numP, ROOT, group->parents, numP_parents);
    results->sync_time[group->grp] = MPI_Wtime();
  }

  // Store the results of this transmission
  recv_results(results, ROOT, config_file->resizes, group->parents);

  if(config_file->sdr > 0) { // With no synchronous data the time is 0
    results->sync_time[group->grp] = MPI_Wtime() - results->sync_start;
  } else {
    results->sync_time[group->grp] = 0;
  }
  if(config_file->adr > 0) { // With no asynchronous data the time is 0
    results->async_time[group->grp] = MPI_Wtime() - results->async_start;
  } else {
    results->async_time[group->grp] = 0;
  }

  // Disconnect the intercommunicator with the parents
  MPI_Comm_disconnect(&(group->parents));
}
/////////////////////////////////////////
/////////////////////////////////////////
......@@ -395,24 +239,45 @@ void Sons_init() {
* Simula la ejecución de una iteración de computo en la aplicación
* que dura al menos un tiempo de "time" segundos.
*/
void iterate(double *matrix, int n, int async_comm) {
void iterate(double *matrix, int n, int async_comm, int iter) {
double start_time, actual_time;
double time = config_file->general_time * config_file->factors[group->grp];
double Top = config_file->Top;
int i, operations = 0;
double aux = 0;
start_time = actual_time = MPI_Wtime();
start_time = MPI_Wtime();
operations = time / Top; //FIXME Calcular una sola vez
operations = time / Top;
for(i=0; i < operations; i++) {
aux += computePiSerial(n);
}
/*
if(time >= 1) {
sleep(time);
}
else {
unsigned int sleep_time = time * 1000000;
usleep(sleep_time);
}
*/
if(config_file->comm_tam) {
MPI_Bcast(group->compute_comm_array, config_file->comm_tam, MPI_CHAR, ROOT, comm);
}
actual_time = MPI_Wtime(); // Guardar tiempos
if(async_comm == MAL_ASYNC_PENDING) { // Se esta realizando una redistribucion de datos asincrona
// TODO Que diferencie entre ambas en el IO
if(async_comm == MAL_DIST_PENDING || async_comm == MAL_SPAWN_PENDING || async_comm == MAL_SPAWN_SINGLE_PENDING) { // Se esta realizando una redistribucion de datos asincrona
operations=0;
}
if(results->iter_index == results->iters_size) { // Aumentar tamaño de ambos vectores de resultados
realloc_results_iters(results, results->iters_size + 100);
}
results->iters_time[results->iter_index] = actual_time - start_time;
results->iters_type[results->iter_index] = operations;
results->iter_index = results->iter_index + 1;
......@@ -440,17 +305,18 @@ void print_general_info(int myId, int grp, int numP) {
free(version);
}
/*
* Pide al proceso raiz imprimir los datos sobre las iteraciones realizadas por el grupo de procesos.
*
* Si es el ultimo grupo de procesos, muestra los datos obtenidos de tiempo de ejecucion, creacion de procesos
* y las comunicaciones.
*/
int print_final_results() {
int ptr_local, ptr_global, err;
int print_local_results() {
int ptr_local, ptr_out, err;
char *file_name;
compute_results_iter(results, group->myId, ROOT, comm);
if(group->myId == ROOT) {
ptr_out = dup(1);
file_name = NULL;
file_name = malloc(40 * sizeof(char));
if(file_name == NULL) return -1; // No ha sido posible alojar la memoria
......@@ -459,9 +325,26 @@ int print_final_results() {
create_out_file(file_name, &ptr_local, 1);
print_config_group(config_file, group->grp);
print_iter_results(results, config_file->iters[group->grp] -1);
print_iter_results(*results, config_file->iters[group->grp] - 1);
free(file_name);
fflush(stdout);
close(1);
dup(ptr_out);
}
return 0;
}
/*
* Si es el ultimo grupo de procesos, pide al proceso raiz mostrar los datos obtenidos de tiempo de ejecucion, creacion de procesos
* y las comunicaciones.
*/
int print_final_results() {
int ptr_global, err;
char *file_name;
if(group->myId == ROOT) {
if(group->grp == config_file->resizes -1) {
file_name = NULL;
file_name = malloc(20 * sizeof(char));
......@@ -471,7 +354,8 @@ int print_final_results() {
create_out_file(file_name, &ptr_global, 1);
print_config(config_file, group->grp);
print_global_results(results, config_file->resizes);
print_global_results(*results, config_file->resizes);
fflush(stdout);
free(file_name);
}
......@@ -488,7 +372,6 @@ void init_group_struct(char *argv[], int argc, int myId, int numP) {
group->numP = numP;
group->grp = 0;
group->iter_start = 0;
group->commAsync = MAL_COMM_UNINITIALIZED;
group->argc = argc;
group->argv = argv;
}
......@@ -505,48 +388,67 @@ void init_group_struct(char *argv[], int argc, int myId, int numP) {
void init_application() {
if(group->argc < 2) {
printf("Falta el fichero de configuracion. Uso:\n./programa config.ini id\nEl argumento numerico id es opcional\n");
exit(0);
MPI_Abort(MPI_COMM_WORLD, -1);
}
if(group->argc > 2) {
run_id = atoi(group->argv[2]);
}
config_file = read_ini_file(group->argv[1]);
init_results_data(&results, config_file->resizes, config_file->iters[group->grp]);
if(config_file->sdr > 0) {
results = malloc(sizeof(results_data));
init_results_data(results, config_file->resizes, config_file->iters[group->grp]);
if(config_file->comm_tam) {
group->compute_comm_array = malloc(config_file->comm_tam * sizeof(char));
}
if(config_file->sdr) {
malloc_comm_array(&(group->sync_array), config_file->sdr , group->myId, group->numP);
}
if(config_file->adr > 0) {
if(config_file->adr) {
malloc_comm_array(&(group->async_array), config_file->adr , group->myId, group->numP);
}
obtain_op_times();
}
/*
* Obtiene cuanto tiempo es necesario para realizar una operacion de PI
*/
void obtain_op_times() {
double result, start_time = MPI_Wtime();
int i;
int i, qty = 20000;
result = 0;
for(i=0; i<20000; i++) {
for(i=0; i<qty; i++) {
result += computePiSerial(config_file->matrix_tam);
}
printf("Creado Top con valor %lf\n", result);
fflush(stdout);
//printf("Creado Top con valor %lf\n", result);
//fflush(stdout);
config_file->Top = (MPI_Wtime() - start_time) / 20000; //Tiempo de una iteracion en numero de iteraciones
MPI_Bcast(&(config_file->Top), 1, MPI_DOUBLE, ROOT, MPI_COMM_WORLD);
config_file->Top = (MPI_Wtime() - start_time) / qty; //Tiempo de una operacion
MPI_Bcast(&(config_file->Top), 1, MPI_DOUBLE, ROOT, comm);
}
/*
* Libera toda la memoria asociada con la aplicacion
*/
void free_application_data() {
if(config_file->sdr > 0) {
if(config_file->comm_tam) {
free(group->compute_comm_array);
}
if(config_file->sdr) {
free(group->sync_array);
}
if(config_file->adr > 0) {
if(config_file->adr) {
free(group->async_array);
}
free(group);
free_malleability();
free_config(config_file);
free_results_data(&results);
if(group->grp == 0) { //FIXME Revisar porque cuando es diferente a 0 no funciona
free_results_data(results);
free(results);
}
free(group);
}
......
......@@ -102,15 +102,11 @@ void node_dist(slurm_job_info_t job_record, int type, int total_procs, int **qty
procs[i] += total_procs - asigCores;
(*used_nodes)++;
}
if(*used_nodes > job_record.num_nodes) *used_nodes = job_record.num_nodes;
if(*used_nodes > job_record.num_nodes) *used_nodes = job_record.num_nodes; //FIXME Si ocurre esto no es un error?
}
*used_nodes=job_record.num_nodes;
for(i=0; i<*used_nodes; i++) {
if(procs[i] == 0){
procs[i]++;
}
}
// Antes se ponia aqui todos los nodos sin cpus a 1
*qty = procs;
}
......@@ -153,6 +149,7 @@ void fill_hostfile(slurm_job_info_t job_record, int ptr, int *qty, int used_node
hostlist = slurm_hostlist_create(job_record.nodes);
while ( (host = slurm_hostlist_shift(hostlist)) && i < used_nodes) {
if(qty[i] != 0)
write_hostfile_node(ptr, qty[i], host);
i++;
free(host);
......
module load mpich-3.4.1-noucx
mpicc -Wall Main/Main.c Main/computing_func.c IOcodes/results.c IOcodes/read_ini.c IOcodes/ini.c malleability/ProcessDist.c malleability/CommDist.c -pthread -lslurm -lm
#mpicc -Wall Main/Main.c Main/computing_func.c IOcodes/results.c IOcodes/read_ini.c IOcodes/ini.c malleability/ProcessDist.c malleability/CommDist.c -pthread -lslurm -lm
mpicc -Wall Main/Main.c Main/computing_func.c IOcodes/results.c IOcodes/read_ini.c IOcodes/ini.c malleability/malleabilityManager.c malleability/malleabilityTypes.c malleability/malleabilityZombies.c malleability/ProcessDist.c malleability/CommDist.c -pthread -lslurm -lm
if [ $# -gt 0 ]
then
if [ $1 = "-e" ]
then
cp a.out benchm.out
echo "Creado ejecutable para ejecuciones"
cp a.out bench.out
fi
fi
#include <math.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <fcntl.h>
#include <pthread.h>
#include <sys/stat.h>
#include <unistd.h>
#include <mpi.h>
#include <slurm/slurm.h>
#include "ProcessDist.h"
/*
* ESTE CODIGO ES PARA COMPROBAR EL FUNCIONAMIENTO DEL FICHERO ProcessDist.h
* NO TIENE QUE VER CON EL BENCHMARK DE MALEABILIDAD
*/
#define ROOT 0
#define MAXGRP 3
#define TYPE_D 1
// 1 Es nodos
// 2 Es por nucleos
// Creates (or appends to) a file named GxNPyIDz.o{jobId} and makes it the
// standard output of the calling process.
//
// Returns 0 on success, -2 if the file name could not be built, -3 if the
// file could not be opened and -4 if the standard output could not be
// redirected.
int create_out_file(int myId, int numP, int grp, char *jobId);
int create_out_file(int myId, int numP, int grp, char *jobId) {
  char file_name[40]; // Fixed-size buffer: nothing to allocate or release
  int ptr, err;

  err = snprintf(file_name, sizeof file_name, "G%dNP%dID%d.o%s", grp, numP, myId, jobId);
  if(err < 0) return -2; // The file name could not be built

  ptr = open(file_name, O_WRONLY | O_CREAT | O_APPEND, 0644);
  if(ptr < 0) return -3; // The file could not be created

  // If stdout was already closed, open() may have returned descriptor 1 and
  // there is nothing left to redirect
  if(ptr != 1) {
    err = dup2(ptr, 1);
    close(ptr); // Descriptor 1 now refers to the file; release the extra one
    if(err < 0) return -4; // The standard output could not be modified
  }

  return 0;
}
// Runs several bandwidth tests in which every even process sends N chars to
// the odd process that immediately follows it, and the odd process then
// sends the N chars back to the even one.
//
// After the tests, every even process prints the bandwidth, the total time
// needed for all the tests and the mean time per test (with the latency
// subtracted).
//
// NOTE(review): every even rank assumes that rank myId+1 exists, so this
// presumably requires an even number of processes -- confirm with callers.
void bandwidth(int myId, double latency, int n);
void bandwidth(int myId, double latency, int n) {
  int i, loop_count = 100, n_bytes;
  double start_time, stop_time, elapsed_time, bw, time;
  char *aux;

  n_bytes = n * sizeof(char);
  aux = malloc(n_bytes);
  if(aux == NULL) { // The buffer can be very large; do not communicate through NULL
    fprintf(stderr, "Fatal error - No se ha podido alojar la memoria para la prueba de ancho de banda\n");
    MPI_Abort(MPI_COMM_WORLD, -1);
  }

  elapsed_time = 0;
  for(i=0; i<loop_count; i++){
    MPI_Barrier(MPI_COMM_WORLD);
    start_time = MPI_Wtime();
    if(myId %2 == 0){
      MPI_Ssend(aux, n, MPI_CHAR, myId+1, 99, MPI_COMM_WORLD);
      MPI_Recv(aux, n, MPI_CHAR, myId+1, 99, MPI_COMM_WORLD, MPI_STATUS_IGNORE);
    }
    else if(myId %2 == 1){
      MPI_Recv(aux, n, MPI_CHAR, myId-1, 99, MPI_COMM_WORLD, MPI_STATUS_IGNORE);
      MPI_Ssend(aux, n, MPI_CHAR, myId-1, 99, MPI_COMM_WORLD);
    }
    MPI_Barrier(MPI_COMM_WORLD);
    stop_time = MPI_Wtime();
    elapsed_time += stop_time - start_time;
  }

  if(myId %2 == 0) {
    time = elapsed_time / loop_count - latency;
    bw = ((double)n_bytes * 2) / time; // The data travels in both directions
    printf("MyId %d Bw=%lf GB/s\nTot time=%lf\nTime=%lf\n", myId, bw/ 1000000000.0, elapsed_time, time);
  }

  free(aux); // Release the test buffer, which was previously leaked
}
// Runs several latency tests in which every even process sends a single
// CHAR to the odd process that immediately follows it, and the odd process
// then sends it back to the even one.
//
// When "start" is not 0, every even process prints the time needed to run
// ALL the tests. The value returned on every process is the mean time per
// test (latency) measured by the ROOT process.
double ping_pong(int myId, int start);
double ping_pong(int myId, int start) {
  int i, loop_count = 100;
  double start_time, stop_time, elapsed_time;
  char aux;

  aux = '0';
  elapsed_time = 0;
  for(i=0; i<loop_count; i++){
    MPI_Barrier(MPI_COMM_WORLD);
    start_time = MPI_Wtime();
    if(myId % 2 == 0){
      MPI_Ssend(&aux, 1, MPI_CHAR, myId+1, 99, MPI_COMM_WORLD);
      MPI_Recv(&aux, 1, MPI_CHAR, myId+1, 99, MPI_COMM_WORLD, MPI_STATUS_IGNORE);
    }
    else if(myId % 2 == 1){
      MPI_Recv(&aux, 1, MPI_CHAR, myId-1, 99, MPI_COMM_WORLD, MPI_STATUS_IGNORE);
      MPI_Ssend(&aux, 1, MPI_CHAR, myId-1, 99, MPI_COMM_WORLD);
    }
    MPI_Barrier(MPI_COMM_WORLD);
    stop_time = MPI_Wtime();
    elapsed_time += stop_time - start_time;
  }

  if(myId %2 == 0 && start != 0) {
    printf("MyId %d Ping=%lf\n", myId, elapsed_time);
  }

  // Always turn the accumulated time into a mean, so that the returned value
  // is a latency regardless of "start" (it used to be the total time when
  // "start" was 0)
  elapsed_time/=loop_count;

  MPI_Bcast(&elapsed_time, 1, MPI_DOUBLE, ROOT, MPI_COMM_WORLD);
  return elapsed_time;
}
// Work common to all the groups of processes.
//
// The group number is obtained from the parents (0 when there are no
// parents), the latency and bandwidth tests are run and, unless this group
// is number MAXGRP, a new group of processes is created.
//
// Returns the group number of the calling process.
int work(int myId, int numP, char **argv, char *job_id) {
int grp, n_value, aux=0;
double latency;
MPI_Comm comm = MPI_COMM_NULL, comm_par= MPI_COMM_NULL;
// Root argument for intercommunicator broadcasts issued from this group:
// MPI_ROOT on the ROOT process, MPI_PROC_NULL on the rest
int rootBcast = MPI_PROC_NULL;
if(myId == ROOT) rootBcast = MPI_ROOT;
// Original note: 1.000.000.00 1GB
// Number of chars exchanged in every bandwidth test
n_value = 400000000;
grp = 0;
// Find out from the parents which group of processes this one is
MPI_Comm_get_parent(&comm_par);
if(comm_par != MPI_COMM_NULL) {
MPI_Bcast(&grp, 1, MPI_INT, ROOT, comm_par);
grp+=1;
MPI_Barrier(comm_par);
// Broadcast in the opposite direction: from this group to the parents
MPI_Bcast(&aux, 1, MPI_INT, rootBcast, comm_par);
//MPI_Comm_free(&comm_par);
MPI_Comm_disconnect(&comm_par);
}
// Split the results by process
//create_out_file(myId, numP, grp, job_id);
/*----- PERFORMANCE TESTS -----*/
// Make sure that the MPI communication has been initialized
ping_pong(myId, 0);
MPI_Barrier(MPI_COMM_WORLD);
// Obtain the latency of the network
latency = ping_pong(myId, 1);
// Obtain the bandwidth
bandwidth(myId, latency, n_value);
/*----- PROCESS CREATION -----*/
// Creation of a new group of processes
// To prevent more groups from being created, assign
// the value 0 to MAXGRP
if(grp != MAXGRP) {
// Start the communication with SLURM
// NOTE: this "aux" shadows the one declared at the top of the function
int aux = numP;
init_slurm_comm(argv, myId, aux, ROOT, TYPE_D, COMM_SPAWN_SERIAL);
// Wait until the communication and the creation of processes
// have finished
int test = -1;
while(test != MPI_SUCCESS) {
test = check_slurm_comm(myId, ROOT, MPI_COMM_WORLD, &comm);
}
// Tell the children which group of processes they are
MPI_Bcast(&grp, 1, MPI_INT, rootBcast, comm);
MPI_Barrier(comm);
// Counterpart of the broadcast the children issue towards their parents
MPI_Bcast(&aux, 1, MPI_INT, ROOT, comm);
// Disconnect the intercommunicator with the children
MPI_Comm_disconnect(&comm);
//MPI_Comm_free(&comm);
} //IF GRP
// Both communicators are expected to be null after being disconnected
if(comm != MPI_COMM_NULL || comm_par != MPI_COMM_NULL) {
printf("GRP=%d || El comunicador no esta a NULO\n", grp);
fflush(stdout);
}
return grp;
}
// Program entry point: initialises MPI, prints where each process is running
// (rank, processor name and PID), runs the common work() routine and
// finalises MPI. Always returns 0.
int main(int argc, char ** argv) {
  int rank, numP, len, pid;
  char *tmp;
  // MPI_Get_processor_name needs room for MPI_MAX_PROCESSOR_NAME chars; a
  // stack buffer avoids the unchecked, never-freed heap allocation.
  char name[MPI_MAX_PROCESSOR_NAME];

  MPI_Init(&argc, &argv);
  MPI_Comm_rank(MPI_COMM_WORLD, &rank);
  MPI_Comm_size(MPI_COMM_WORLD, &numP);
  pid = getpid();

  // Job identifier as exported in the environment (NULL when the variable is
  // not set); it is only forwarded to work().
  tmp = getenv("SLURM_JOB_ID");

  if(rank == ROOT) {
    printf("DATA\n");
  }

  // Print the name of the node this process is running on.
  MPI_Get_processor_name(name, &len);
  printf("ID=%d Name %s PID=%d\n", rank, name, pid);
  fflush(stdout);
  MPI_Barrier(MPI_COMM_WORLD);

  // Run the work shared by all groups; the returned group number is not
  // needed here.
  (void) work(rank, numP, argv, tmp);

  fflush(stdout);
  MPI_Barrier(MPI_COMM_WORLD);
  MPI_Finalize();
  return 0;
}
......@@ -28,6 +28,9 @@ void recv_sync_arrays(struct Dist_data dist_data, char *array, int root, int num
void send_async_arrays(struct Dist_data dist_data, char *array, int root, int numP_child, int idI, int idE, struct Counts counts, MPI_Request *comm_req);
void recv_async_arrays(struct Dist_data dist_data, char *array, int root, int numP_parents, int idI, int idE, struct Counts counts, MPI_Request *comm_req);
void send_async_point_arrays(struct Dist_data dist_data, char *array, int rootBcast, int numP_child, int idI, int idE, struct Counts counts, MPI_Request *comm_req);
void recv_async_point_arrays(struct Dist_data dist_data, char *array, int root, int numP_parents, int idI, int idE, struct Counts counts, MPI_Request *comm_req);
// DIST FUNCTIONS
void get_dist(int qty, int id, int numP, struct Dist_data *dist_data);
void set_counts(int id, int numP, struct Dist_data data_dist, int *sendcounts);
......@@ -63,7 +66,7 @@ void malloc_comm_array(char **array, int qty, int myId, int numP) {
//================================================================================
//================================================================================
//========================SINCHRONOUS FUNCTIONS===================================
//========================SYNCHRONOUS FUNCTIONS===================================
//================================================================================
//================================================================================
......@@ -136,7 +139,6 @@ void recv_sync(char **array, int qty, int myId, int numP, int root, MPI_Comm int
void send_sync_arrays(struct Dist_data dist_data, char *array, int rootBcast, int numP_child, int idI, int idE, struct Counts counts) {
int i;
// PREPARAR ENVIO DEL VECTOR
if(idI == 0) {
set_counts(0, numP_child, dist_data, counts.counts);
......@@ -147,10 +149,8 @@ void send_sync_arrays(struct Dist_data dist_data, char *array, int rootBcast, in
counts.displs[i] = counts.displs[i-1] + counts.counts[i-1];
}
//print_counts(dist_data, counts.counts, counts.displs, numP_child, "Padres");
/* COMUNICACION DE DATOS */
MPI_Alltoallv(array, counts.counts, counts.displs, MPI_CHAR, NULL, counts.zero_arr, counts.zero_arr, MPI_CHAR, dist_data.intercomm);
}
/*
......@@ -161,7 +161,7 @@ void send_sync_arrays(struct Dist_data dist_data, char *array, int rootBcast, in
void recv_sync_arrays(struct Dist_data dist_data, char *array, int root, int numP_parents, int idI, int idE, struct Counts counts) {
int i;
char *aux = malloc(1);
char aux;
// Ajustar los valores de recepcion
if(idI == 0) {
......@@ -175,14 +175,13 @@ void recv_sync_arrays(struct Dist_data dist_data, char *array, int root, int num
//print_counts(dist_data, counts.counts, counts.displs, numP_parents, "Hijos");
/* COMUNICACION DE DATOS */
MPI_Alltoallv(aux, counts.zero_arr, counts.zero_arr, MPI_CHAR, array, counts.counts, counts.displs, MPI_CHAR, dist_data.intercomm);
free(aux);
MPI_Alltoallv(&aux, counts.zero_arr, counts.zero_arr, MPI_CHAR, array, counts.counts, counts.displs, MPI_CHAR, dist_data.intercomm);
}
//================================================================================
//================================================================================
//========================ASINCHRONOUS FUNCTIONS==================================
//========================ASYNCHRONOUS FUNCTIONS==================================
//================================================================================
//================================================================================
......@@ -196,7 +195,7 @@ void recv_sync_arrays(struct Dist_data dist_data, char *array, int root, int num
* El vector array no se modifica en esta funcion.
*/
int send_async(char *array, int qty, int myId, int numP, int root, MPI_Comm intercomm, int numP_child, MPI_Request **comm_req, int parents_wait) {
int rootBcast = MPI_PROC_NULL;
int i, rootBcast = MPI_PROC_NULL;
int *idS = NULL;
struct Counts counts;
struct Dist_data dist_data;
......@@ -211,17 +210,25 @@ int send_async(char *array, int qty, int myId, int numP, int root, MPI_Comm inte
getIds_intercomm(dist_data, numP_child, &idS); // Obtener rango de Id hijos a los que este proceso manda datos
// MAL_USE_THREAD sigue el camino sincrono
if(parents_wait == MAL_USE_NORMAL) {
*comm_req = (MPI_Request *) malloc(sizeof(MPI_Request));
//*comm_req = (MPI_Request *) malloc(sizeof(MPI_Request));
*comm_req[0] = MPI_REQUEST_NULL;
send_async_arrays(dist_data, array, rootBcast, numP_child, idS[0], idS[1], counts, &(*comm_req[0]));
} else {
*comm_req = (MPI_Request *) malloc(2 * sizeof(MPI_Request));
(*comm_req)[0] = MPI_REQUEST_NULL;
(*comm_req)[1] = MPI_REQUEST_NULL;
} else if (parents_wait == MAL_USE_IBARRIER){
//*comm_req = (MPI_Request *) malloc(2 * sizeof(MPI_Request));
*comm_req[0] = MPI_REQUEST_NULL;
*comm_req[1] = MPI_REQUEST_NULL;
send_async_arrays(dist_data, array, rootBcast, numP_child, idS[0], idS[1], counts, &((*comm_req)[1]));
MPI_Ibarrier(intercomm, &((*comm_req)[0]) );
} else if (parents_wait == MAL_USE_POINT){
//*comm_req = (MPI_Request *) malloc(numP_child * sizeof(MPI_Request));
for(i=0; i<numP_child; i++){
(*comm_req)[i] = MPI_REQUEST_NULL;
}
send_async_point_arrays(dist_data, array, rootBcast, numP_child, idS[0], idS[1], counts, *comm_req);
} else if (parents_wait == MAL_USE_THREAD) { //TODO
}
freeCounts(&counts);
......@@ -242,15 +249,14 @@ int send_async(char *array, int qty, int myId, int numP, int root, MPI_Comm inte
*/
void recv_async(char **array, int qty, int myId, int numP, int root, MPI_Comm intercomm, int numP_parents, int parents_wait) {
int *idS = NULL;
int wait_err;
int wait_err, i;
struct Counts counts;
struct Dist_data dist_data;
MPI_Request comm_req, aux;
MPI_Request *comm_req, aux;
// Obtener distribución para este hijo
get_dist(qty, myId, numP, &dist_data);
*array = malloc(dist_data.tamBl * sizeof(char));
//(*array)[dist_data.tamBl] = '\0';
dist_data.intercomm = intercomm;
/* PREPARAR DATOS DE RECEPCION SOBRE VECTOR*/
......@@ -258,14 +264,28 @@ void recv_async(char **array, int qty, int myId, int numP, int root, MPI_Comm in
getIds_intercomm(dist_data, numP_parents, &idS); // Obtener el rango de Ids de padres del que este proceso recibira datos
recv_async_arrays(dist_data, *array, root, numP_parents, idS[0], idS[1], counts, &comm_req);
// MAL_USE_THREAD sigue el camino sincrono
if(parents_wait == MAL_USE_POINT) {
comm_req = (MPI_Request *) malloc(numP_parents * sizeof(MPI_Request));
for(i=0; i<numP_parents; i++){
comm_req[i] = MPI_REQUEST_NULL;
}
recv_async_point_arrays(dist_data, *array, root, numP_parents, idS[0], idS[1], counts, comm_req);
wait_err = MPI_Waitall(numP_parents, comm_req, MPI_STATUSES_IGNORE);
} else if (parents_wait == MAL_USE_NORMAL || parents_wait == MAL_USE_IBARRIER) {
comm_req = (MPI_Request *) malloc(sizeof(MPI_Request));
*comm_req = MPI_REQUEST_NULL;
recv_async_arrays(dist_data, *array, root, numP_parents, idS[0], idS[1], counts, comm_req);
wait_err = MPI_Wait(comm_req, MPI_STATUS_IGNORE);
} else if (parents_wait == MAL_USE_THREAD) { //TODO
}
wait_err = MPI_Wait(&comm_req, MPI_STATUS_IGNORE);
if(wait_err != MPI_SUCCESS) {
MPI_Abort(MPI_COMM_WORLD, wait_err);
}
if(parents_wait == MAL_USE_IBARRIER) {
if(parents_wait == MAL_USE_IBARRIER) { //MAL USE IBARRIER END
MPI_Ibarrier(intercomm, &aux);
MPI_Wait(&aux, MPI_STATUS_IGNORE); //Es necesario comprobar que la comunicación ha terminado para desconectar los grupos de procesos
}
......@@ -273,12 +293,15 @@ void recv_async(char **array, int qty, int myId, int numP, int root, MPI_Comm in
//printf("S%d Tam %d String: %s END\n", myId, dist_data.tamBl, *array);
freeCounts(&counts);
free(idS);
free(comm_req);
}
/*
* Envia a los hijos un vector que es redistribuido a los procesos
* hijos. Antes de realizar la comunicacion, cada proceso padre calcula sobre que procesos
* del otro grupo se transmiten elementos.
*
* El envio se realiza a partir de una comunicación colectiva.
*/
void send_async_arrays(struct Dist_data dist_data, char *array, int rootBcast, int numP_child, int idI, int idE, struct Counts counts, MPI_Request *comm_req) {
int i;
......@@ -298,10 +321,36 @@ void send_async_arrays(struct Dist_data dist_data, char *array, int rootBcast, i
MPI_Ialltoallv(array, counts.counts, counts.displs, MPI_CHAR, NULL, counts.zero_arr, counts.zero_arr, MPI_CHAR, dist_data.intercomm, comm_req);
}
/*
 * Sends to the children an array that is redistributed among the child
 * processes. For every child rank in [idI, idE) the amount to send is
 * obtained with set_counts() and a non-blocking send is started.
 *
 * The transfer is done with several point-to-point communications; the
 * request of the send towards child "i" is stored in comm_req[i].
 *
 * NOTE(review): when idI > 0 the first displacement is derived from
 * counts.displs[idI-1] and counts.counts[idI-1], which this function does
 * not write itself -- presumably prepared by the caller or by set_counts();
 * confirm.
 */
void send_async_point_arrays(struct Dist_data dist_data, char *array, int rootBcast, int numP_child, int idI, int idE, struct Counts counts, MPI_Request *comm_req) {
  int target = idI;

  // Child 0 is handled apart: its data starts at the beginning of "array".
  if (target == 0) {
    set_counts(0, numP_child, dist_data, counts.counts);
    MPI_Isend(array, counts.counts[0], MPI_CHAR, 0, 99, dist_data.intercomm, &(comm_req[0]));
    target = 1;
  }

  // Remaining children: each displacement follows the previous block.
  while (target < idE) {
    set_counts(target, numP_child, dist_data, counts.counts);
    counts.displs[target] = counts.displs[target-1] + counts.counts[target-1];
    MPI_Isend(array + counts.displs[target], counts.counts[target], MPI_CHAR, target, 99, dist_data.intercomm, &(comm_req[target]));
    target++;
  }
}
/*
* Recibe de los padres un vector que es redistribuido a los procesos
* de este grupo. Antes de realizar la comunicacion cada hijo calcula sobre que procesos
* del otro grupo se transmiten elementos.
*
* La recepcion se realiza a partir de una comunicacion colectiva.
*/
void recv_async_arrays(struct Dist_data dist_data, char *array, int root, int numP_parents, int idI, int idE, struct Counts counts, MPI_Request *comm_req) {
int i;
......@@ -323,6 +372,30 @@ void recv_async_arrays(struct Dist_data dist_data, char *array, int root, int nu
free(aux);
}
/*
 * Receives from the parents an array that is redistributed among the
 * processes of this group. For every parent rank in [idI, idE) the amount to
 * receive is obtained with set_counts() and a non-blocking receive is
 * started.
 *
 * The transfer is done with several point-to-point communications; the
 * request of the receive from parent "i" is stored in comm_req[i].
 *
 * NOTE(review): when idI > 0 the first displacement is derived from
 * counts.displs[idI-1] and counts.counts[idI-1], which this function does
 * not write itself -- presumably prepared by the caller or by set_counts();
 * confirm.
 */
void recv_async_point_arrays(struct Dist_data dist_data, char *array, int root, int numP_parents, int idI, int idE, struct Counts counts, MPI_Request *comm_req) {
  int source = idI;

  // Parent 0 is handled apart: its data lands at the beginning of "array".
  if (source == 0) {
    set_counts(0, numP_parents, dist_data, counts.counts);
    // FIXME (original author): receive buffer
    MPI_Irecv(array, counts.counts[0], MPI_CHAR, 0, 99, dist_data.intercomm, &(comm_req[0]));
    source = 1;
  }

  // Remaining parents: each displacement follows the previous block.
  while (source < idE) {
    set_counts(source, numP_parents, dist_data, counts.counts);
    counts.displs[source] = counts.displs[source-1] + counts.counts[source-1];
    // FIXME (original author): receive buffer
    MPI_Irecv(array + counts.displs[source], counts.counts[source], MPI_CHAR, source, 99, dist_data.intercomm, &(comm_req[source]));
    source++;
  }
}
/*
* ========================================================================================
* ========================================================================================
......@@ -477,8 +550,8 @@ void print_counts(struct Dist_data data_dist, int *xcounts, int *xdispls, int si
int i;
for(i=0; i < size; i++) {
if(xcounts[i] != 0) {
//if(xcounts[i] != 0) {
printf("P%d of %d | %scounts[%d]=%d disp=%d\n", data_dist.myId, data_dist.numP, name, i, xcounts[i], xdispls[i]);
}
//}
}
}
......@@ -2,13 +2,16 @@
#include <stdlib.h>
#include <mpi.h>
#include <string.h>
#include "malleabilityStates.h"
#define MAL_COMM_COMPLETED 0
#define MAL_COMM_UNINITIALIZED 2
#define MAL_ASYNC_PENDING 1
//#define MAL_COMM_COMPLETED 0
//#define MAL_COMM_UNINITIALIZED 2
//#define MAL_ASYNC_PENDING 1
#define MAL_USE_NORMAL 0
#define MAL_USE_IBARRIER 1
//#define MAL_USE_NORMAL 0
//#define MAL_USE_IBARRIER 1
//#define MAL_USE_POINT 2
//#define MAL_USE_THREAD 3
int send_sync(char *array, int qty, int myId, int numP, int root, MPI_Comm intercomm, int numP_child);
void recv_sync(char **array, int qty, int myId, int numP, int root, MPI_Comm intercomm, int numP_parents);
......
......@@ -8,43 +8,53 @@
#include <slurm/slurm.h>
#include "ProcessDist.h"
#define ROOT 0
int commSlurm = COMM_UNRESERVED;
int commState = MAL_NOT_STARTED;
struct Slurm_data *slurm_data;
pthread_t slurm_thread;
pthread_t spawn_thread;
pthread_mutex_t spawn_mutex;
MPI_Comm *returned_comm;
double end_time; //FIXME REFACTOR
struct Slurm_data {
char *cmd; // Executable name
int qty_procs;
char *nodelist;
int num_cpus, num_nodes;
int qty_procs, result_procs;
MPI_Info info;
int type_creation;
int spawn_is_single;
};
struct Creation_data {
char **argv;
int numP_childs, type_dist;
};
typedef struct {
char *argv;
int numP_childs, myId, root, already_created;
int type_dist;
int spawn_is_single;
int spawn_method;
MPI_Comm comm;
}Creation_data;
//--------------PRIVATE SPAWN TYPE DECLARATIONS---------------//
void* thread_work(void* creation_data_arg);
//--------------PRIVATE DECLARATIONS---------------//
void processes_dist(char *argv, int numP_childs, int already_created, int type_dist);
void processes_dist(char *argv[], int numP_childs, int type_dist);
void generic_spawn(int myId, int root, int is_single, MPI_Comm *child, MPI_Comm comm);
void single_spawn_connection(int myId, int root, MPI_Comm comm, MPI_Comm *child);
int create_processes(int myId, int root, MPI_Comm *child, MPI_Comm comm);
void node_dist(slurm_job_info_t job_record, int type, int total_procs, int **qty, int *used_nodes);
int create_hostfile(char *jobId, char **file_name);
int write_hostfile_node(int ptr, int qty, char *node_name);
void fill_hostfile(slurm_job_info_t job_record, int ptr, int *qty, int used_nodes);
void node_dist(int type, int total_procs, int already_created, int **qty, int *used_nodes);
//TESTS
void fill_str_hostfile(slurm_job_info_t job_record, int *qty, int used_nodes, char **hostfile_str);
void fill_str_hostfile(int *qty, int used_nodes, char **hostfile_str);
int write_str_node(char **hostfile_str, int len_og, int qty, char *node_name);
//
void print_Info(MPI_Info info);
//@deprecated functions
int create_hostfile(char *jobId, char **file_name);
int write_hostfile_node(int ptr, int qty, char *node_name);
void fill_hostfile(slurm_job_info_t job_record, int ptr, int *qty, int used_nodes);
//--------------PUBLIC FUNCTIONS---------------//
......@@ -60,64 +70,203 @@ void print_Info(MPI_Info info);
*
* Si se pide en segundo plano, llamar a "check_slurm_comm()" comprobara si la configuracion para
* crearlos esta lista, y si es asi, los crea.
*
* Devuelve el estado de el procedimiento. Si no devuelve "COMM_FINISHED", es necesario llamar a
* "check_slurm_comm()".
*/
int init_slurm_comm(char **argv, int myId, int numP, int root, int type_dist, int type_creation) {
int init_slurm_comm(char *argv, int num_cpus, int num_nodes, char *nodelist, int myId, int numP, int numC, int root, int type_dist, int type_creation, int spawn_is_single, MPI_Comm comm, MPI_Comm *child) {
int spawn_qty, already_created = 0;
slurm_data = malloc(sizeof(struct Slurm_data));
if(myId == root) {
spawn_thread = pthread_self();
slurm_data->type_creation = type_creation;
if(type_creation == COMM_SPAWN_SERIAL) {
slurm_data->spawn_is_single = spawn_is_single;
slurm_data->result_procs = numC;
slurm_data->num_cpus = num_cpus;
slurm_data->num_nodes = num_nodes;
slurm_data->nodelist = nodelist;
spawn_qty = numC;
if(type_creation == COMM_SPAWN_MERGE || type_creation == COMM_SPAWN_MERGE_PTHREAD) {
if (numP < slurm_data->result_procs) {
spawn_qty = slurm_data->result_procs - numP;
already_created = numP;
}
}
pthread_mutex_init(&spawn_mutex,NULL);
processes_dist(argv, numP, type_dist);
commSlurm = COMM_FINISHED;
if(type_creation == COMM_SPAWN_SERIAL || slurm_data->type_creation == COMM_SPAWN_MERGE) {
} else if(type_creation == COMM_SPAWN_PTHREAD) {
commSlurm = COMM_IN_PROGRESS;
if(myId == root) {
processes_dist(argv, spawn_qty, already_created, type_dist);
} else {
slurm_data->cmd = malloc(1 * sizeof(char));
slurm_data->info = MPI_INFO_NULL;
}
// WORK
generic_spawn(myId, root, slurm_data->spawn_is_single, child, comm);
// END WORK
if(myId == root && slurm_data->info != MPI_INFO_NULL) {
MPI_Info_free(&(slurm_data->info));
}
pthread_mutex_destroy(&spawn_mutex);
free(slurm_data->cmd);
free(slurm_data);
} else if(type_creation == COMM_SPAWN_PTHREAD || slurm_data->type_creation == COMM_SPAWN_MERGE_PTHREAD) {
commState = MAL_SPAWN_PENDING;
struct Creation_data *creation_data = malloc(sizeof(struct Creation_Data*));
if((spawn_is_single && myId == root) || !spawn_is_single || (slurm_data->type_creation == COMM_SPAWN_MERGE_PTHREAD && numP > slurm_data->result_procs)) {
Creation_data *creation_data = (Creation_data *) malloc(sizeof(Creation_data));
creation_data->argv = argv;
creation_data->numP_childs = numP;
creation_data->numP_childs = spawn_qty;
creation_data->already_created = already_created;
creation_data->myId = myId;
creation_data->root = root;
creation_data->type_dist = type_dist;
creation_data->comm = comm;
if(pthread_create(&slurm_thread, NULL, thread_work, creation_data)) {
if(pthread_create(&spawn_thread, NULL, thread_work, (void *)creation_data)) {
printf("Error al crear el hilo de contacto con SLURM\n");
MPI_Abort(MPI_COMM_WORLD, -1);
return -1;
}
}
}
return 0;
return commState;
}
/*
* Comprueba si una configuracion para crear un nuevo grupo de procesos esta lista,
* y en caso de que lo este, se crea un nuevo grupo de procesos con esa configuracion.
* y en caso de que lo este, se devuelve el communicador a estos nuevos procesos.
*/
int check_slurm_comm(int myId, int root, MPI_Comm comm, MPI_Comm *child) {
int spawn_err = COMM_IN_PROGRESS;
int check_slurm_comm(int myId, int root, int numP, MPI_Comm *child, MPI_Comm comm, MPI_Comm comm_thread, double *real_time) {
if(slurm_data->type_creation == COMM_SPAWN_PTHREAD || slurm_data->type_creation == COMM_SPAWN_MERGE_PTHREAD) {
if (slurm_data->type_creation == COMM_SPAWN_MERGE_PTHREAD && numP > slurm_data->result_procs) { //TODO REFACTOR
printf("Error Check spawn: Configuracion invalida\nSe intenta usar el método Spawn junto a un Shrink merge\n");
MPI_Abort(MPI_COMM_WORLD, -1);
return -10;
}
if(!slurm_data->spawn_is_single || commState == MAL_SPAWN_SINGLE_PENDING || commState == MAL_SPAWN_COMPLETED) {
int state=-10;
//printf("[%d][3] Test min\n", myId); fflush(stdout);
//pthread_mutex_lock(&spawn_mutex); // TODO Descomentar
MPI_Allreduce(&commState, &state, 1, MPI_INT, MPI_MIN, comm);
//pthread_mutex_unlock(&spawn_mutex);
if(myId == root && commSlurm == COMM_FINISHED && slurm_data->type_creation == COMM_SPAWN_PTHREAD) {
if(pthread_join(slurm_thread, NULL)) {
if(state != MAL_SPAWN_COMPLETED) return state; // Continue only if asynchronous process creation has ended
//printf("[%d][5] Test Passed-----------\n", myId); fflush(stdout);
if(pthread_join(spawn_thread, NULL)) {
printf("Error al esperar al hilo\n");
MPI_Abort(MPI_COMM_WORLD, -1);
return -2;
return -10;
}
*child = *returned_comm;
} else if (slurm_data->spawn_is_single) {
//pthread_mutex_lock(&spawn_mutex); // TODO Descomentar
MPI_Bcast(&commState, 1, MPI_INT, root, comm);
//pthread_mutex_unlock(&spawn_mutex);
int threads_not_spawned = pthread_equal(pthread_self(), spawn_thread);
// Non-root processes join root to finalize the spawn
// They also must join if the application has ended its work
if(commState == MAL_SPAWN_SINGLE_START) {
commState = MAL_SPAWN_SINGLE_PENDING;
if(myId != root && threads_not_spawned) {
Creation_data *creation_data = (Creation_data *) malloc(sizeof(Creation_data));
creation_data->argv = NULL;
creation_data->numP_childs = -1;
creation_data->already_created = -1;
creation_data->myId = myId;
creation_data->root = root;
creation_data->type_dist = -1;
creation_data->comm = comm_thread;
if(pthread_create(&spawn_thread, NULL, thread_work, (void *)creation_data)) {
printf("Error al crear el hilo de apoyo\n");
MPI_Abort(MPI_COMM_WORLD, -1);
return -1;
}
}
}
MPI_Bcast(&commSlurm, 1, MPI_INT, root, comm);
// Continue only if asynchronous process creation has ended or application does not have more work
if(commState != MAL_SPAWN_COMPLETED) return commState;
if(commSlurm == COMM_FINISHED) {
spawn_err = create_processes(myId, root, child, comm);
//printf("[%d][4] Test Passed-----------\n", myId); fflush(stdout);
//Asegurar que los hilos han terminado
if(pthread_join(spawn_thread, NULL)) {
printf("Error al esperar al hilo\n");
MPI_Abort(MPI_COMM_WORLD, -1);
return -10;
}
*child = *returned_comm;
} else {
printf("Error Check spawn: Configuracion invalida\n");
MPI_Abort(MPI_COMM_WORLD, -1);
return -10;
}
} else {
return commState;
}
//Free memory
if(myId == root && slurm_data->info != MPI_INFO_NULL) {
MPI_Info_free(&(slurm_data->info));
}
free(slurm_data->cmd);
free(slurm_data);
pthread_mutex_destroy(&spawn_mutex);
spawn_thread = pthread_self();
*real_time=end_time;
return commState;
}
/*
* Conectar grupo de hijos con grupo de padres
* Devuelve un intercomunicador para hablar con los padres
*
* Solo se utiliza cuando la creación de los procesos ha sido
* realizada por un solo proceso padre
*/
void malleability_establish_connection(int myId, int root, MPI_Comm *intercomm) {
char *port_name;
MPI_Comm newintercomm;
if(myId == root) {
port_name = (char *) malloc(MPI_MAX_PORT_NAME * sizeof(char));
MPI_Open_port(MPI_INFO_NULL, port_name);
MPI_Send(port_name, MPI_MAX_PORT_NAME, MPI_CHAR, root, 130, *intercomm);
} else {
port_name = malloc(1);
}
return spawn_err;
MPI_Comm_accept(port_name, MPI_INFO_NULL, root, MPI_COMM_WORLD, &newintercomm);
if(myId == root) {
MPI_Close_port(port_name);
}
free(port_name);
MPI_Comm_free(intercomm);
*intercomm = newintercomm;
}
//--------------PRIVATE SPAWN TYPE FUNCTIONS---------------//
//--------------PRIVATE THREAD FUNCTIONS---------------//
/*
* Funcion llamada por un hilo para que este se encarge
......@@ -127,10 +276,16 @@ int check_slurm_comm(int myId, int root, MPI_Comm comm, MPI_Comm *child) {
* se avisa al hilo maestro.
*/
void* thread_work(void* creation_data_arg) {
struct Creation_data *creation_data = (struct Creation_data*) creation_data_arg;
processes_dist(creation_data->argv, creation_data->numP_childs, creation_data->type_dist);
commSlurm = COMM_FINISHED;
Creation_data *creation_data = (Creation_data*) creation_data_arg;
returned_comm = (MPI_Comm *) malloc(sizeof(MPI_Comm));
if(creation_data->myId == creation_data->root) {
processes_dist(creation_data->argv, creation_data->numP_childs, creation_data->already_created, creation_data->type_dist);
} else {
slurm_data->cmd = malloc(1 * sizeof(char));
slurm_data->info = MPI_INFO_NULL;
}
generic_spawn(creation_data->myId, creation_data->root, slurm_data->spawn_is_single, returned_comm, creation_data->comm);
free(creation_data);
pthread_exit(NULL);
......@@ -138,37 +293,150 @@ void* thread_work(void* creation_data_arg) {
//--------------PRIVATE SPAWN CREATION FUNCTIONS---------------//
/*
 * Generic entry point for process creation. Depending on "spawn_is_single"
 * it either delegates to single_spawn_connection() or creates the processes
 * with create_processes() and then broadcasts "spawn_is_single" over the
 * resulting intercommunicator.
 *
 * Once done, it updates the global state (commState and end_time) while
 * holding spawn_mutex.
 */
void generic_spawn(int myId, int root, int spawn_is_single, MPI_Comm *child, MPI_Comm comm) {
  if (!spawn_is_single) {
    // Root argument for a broadcast sent from this group over "*child".
    int rootBcast = (myId == root) ? MPI_ROOT : MPI_PROC_NULL;

    create_processes(myId, root, child, comm);
    MPI_Bcast(&spawn_is_single, 1, MPI_INT, rootBcast, *child);
  } else {
    single_spawn_connection(myId, root, comm, child);
  }

  // Publish completion and the time at which it happened.
  pthread_mutex_lock(&spawn_mutex);
  commState = MAL_SPAWN_COMPLETED;
  end_time = MPI_Wtime();
  pthread_mutex_unlock(&spawn_mutex);
}
/*
 * Creates a group of processes with MPI_Comm_spawn, using the command,
 * process count and info object stored in the global "slurm_data" (filled in
 * by "processes_dist()").
 *
 * Returns the code given by MPI_Comm_spawn; a message is printed when it is
 * not MPI_SUCCESS.
 */
int create_processes(int myId, int root, MPI_Comm *child, MPI_Comm comm) {
  int rc;

  rc = MPI_Comm_spawn(slurm_data->cmd, MPI_ARGV_NULL, slurm_data->qty_procs,
                      slurm_data->info, root, comm, child, MPI_ERRCODES_IGNORE);
  if (rc == MPI_SUCCESS) {
    return rc;
  }

  printf("Error creating new set of %d procs.\n", slurm_data->qty_procs);
  return rc;
}
/*
 * Process creation driven by the root process alone.
 *
 * Root spawns the children over MPI_COMM_SELF, broadcasts COMM_SPAWN_SINGLE
 * to them, receives a port name from them (tag 130) and sets commState to
 * MAL_SPAWN_SINGLE_START. Every process of "comm" then calls
 * MPI_Comm_connect on that port, and "*child" is replaced by the resulting
 * intercommunicator (root frees its temporary one first).
 */
void single_spawn_connection(int myId, int root, MPI_Comm comm, MPI_Comm *child){
  const int is_root = (myId == root);
  int auxiliar_conf = COMM_SPAWN_SINGLE;
  MPI_Comm newintercomm;
  char *port_name;

  if (!is_root) {
    // Placeholder buffer for the processes that do not hold the port name.
    port_name = malloc(1);
  } else {
    create_processes(myId, root, child, MPI_COMM_SELF);
    MPI_Bcast(&auxiliar_conf, 1, MPI_INT, MPI_ROOT, *child);

    port_name = (char *) malloc(MPI_MAX_PORT_NAME * sizeof(char));
    MPI_Recv(port_name, MPI_MAX_PORT_NAME, MPI_CHAR, root, 130, *child, MPI_STATUS_IGNORE);

    // Tell the other processes to join root to finish the spawn procedure.
    commState = MAL_SPAWN_SINGLE_START;
  }

  MPI_Comm_connect(port_name, MPI_INFO_NULL, root, comm, &newintercomm);

  if (is_root) {
    MPI_Comm_free(child);
  }
  free(port_name);
  *child = newintercomm;
}
//--------------PRIVATE MERGE TYPE FUNCTIONS---------------//
/*
 * Puts the resulting group of processes into a single intracommunicator by
 * merging parents and children.
 *
 * Called before data redistribution.
 *
 * On return "*numP" holds numC and "*comm" holds the merged communicator;
 * the previous "*comm" is freed unless it was MPI_COMM_WORLD or
 * MPI_COMM_NULL. "intercomm" itself is not freed here.
 *
 * TODO REFACTOR
 */
void proc_adapt_expand(int *numP, int numC, MPI_Comm intercomm, MPI_Comm *comm, int is_children_group) {
  MPI_Comm merged = MPI_COMM_NULL;
  int must_free;

  // The group that passes 0 as "is_children_group" is ordered first.
  MPI_Intercomm_merge(intercomm, is_children_group, &merged);
  // TODO (original author): new redistribution for these cases, and free
  // "intercomm" here.

  *numP = numC;

  must_free = !(*comm == MPI_COMM_WORLD || *comm == MPI_COMM_NULL);
  if (must_free) {
    MPI_Comm_free(comm);
  }
  *comm = merged;
}
/*
 * Removes from the resulting group the processes that are no longer needed.
 * According to the original author's note, discarded processes are left as
 * zombies.
 *
 * Called once data redistribution has finished.
 *
 * Processes with myId < numC take part in the split with color 1; the rest
 * use MPI_UNDEFINED. On return "*comm" holds the communicator produced by
 * MPI_Comm_split.
 */
void proc_adapt_shrink(int numC, MPI_Comm *comm, int myId) {
  MPI_Comm new_comm = MPI_COMM_NULL;
  int color = (myId < numC) ? 1 : MPI_UNDEFINED;

  MPI_Comm_split(*comm, color, myId, &new_comm);

  // FIXME (original author): freeing the previous communicator is disabled.
  // The assignment below must not be guarded by the check that used to
  // protect that free; otherwise a caller holding MPI_COMM_WORLD never
  // receives the shrunk communicator.
  *comm = new_comm;
}
/*
* Configura la creacion de un nuevo grupo de procesos, reservando la memoria
* para una llamada a MPI_Comm_spawn, obteniendo una distribucion fisica
* para los procesos y creando un fichero hostfile.
*/
void processes_dist(char *argv[], int numP_childs, int type) {
int jobId, ptr;
char *tmp;
job_info_msg_t *j_info;
slurm_job_info_t last_record;
void processes_dist(char *argv, int numP_childs, int already_created, int type) {
//int jobId;
//char *tmp;
//job_info_msg_t *j_info;
//slurm_job_info_t last_record;
int used_nodes=0;
int *procs_array;
char *hostfile;
// Get Slurm job info
tmp = getenv("SLURM_JOB_ID");
jobId = atoi(tmp);
slurm_load_job(&j_info, jobId, 1);
last_record = j_info->job_array[j_info->record_count - 1];
//tmp = getenv("SLURM_JOB_ID");
//jobId = atoi(tmp);
//slurm_load_job(&j_info, jobId, 1);
//last_record = j_info->job_array[j_info->record_count - 1];
//COPY PROGRAM NAME
slurm_data->cmd = malloc(strlen(argv[0]) * sizeof(char));
strcpy(slurm_data->cmd, argv[0]);
slurm_data->cmd = malloc(strlen(argv) * sizeof(char));
strcpy(slurm_data->cmd, argv);
// GET NEW DISTRIBUTION
node_dist(last_record, type, numP_childs, &procs_array, &used_nodes);
node_dist(type, numP_childs, already_created, &procs_array, &used_nodes);
slurm_data->qty_procs = numP_childs;
/*
// CREATE/UPDATE HOSTFILE
int ptr;
ptr = create_hostfile(tmp, &hostfile);
MPI_Info_create(&(slurm_data->info));
MPI_Info_set(slurm_data->info, "hostfile", hostfile);
......@@ -177,36 +445,18 @@ void processes_dist(char *argv[], int numP_childs, int type) {
// SET NEW DISTRIBUTION
fill_hostfile(last_record, ptr, procs_array, used_nodes);
close(ptr);
*/
// TEST
/*
fill_str_hostfile(last_record, procs_array, used_nodes, &hostfile);
// CREATE AND SET STRING HOSTFILE
fill_str_hostfile(procs_array, used_nodes, &hostfile);
MPI_Info_create(&(slurm_data->info));
MPI_Info_set(slurm_data->info, "hosts", hostfile);
*/
// Free JOB INFO
slurm_free_job_info_msg(j_info);
}
/*
* Crea un grupo de procesos segun la configuracion indicada por la funcion
* "processes_dist()".
*/
int create_processes(int myId, int root, MPI_Comm *child, MPI_Comm comm) {
int spawn_err = MPI_Comm_spawn(slurm_data->cmd, MPI_ARGV_NULL, slurm_data->qty_procs, slurm_data->info, root, comm, child, MPI_ERRCODES_IGNORE);
if(spawn_err != MPI_SUCCESS) {
printf("Error creating new set of %d procs.\n", slurm_data->qty_procs);
}
free(hostfile);
free(procs_array);
if(myId == root) {
MPI_Info_free(&(slurm_data->info));
free(slurm_data->cmd);
}
return spawn_err;
// Free JOB INFO
//slurm_free_job_info_msg(j_info);
}
/*
......@@ -221,41 +471,51 @@ int create_processes(int myId, int root, MPI_Comm *child, MPI_Comm comm) {
* COMM_PHY_CPU (2): Orientada a completar la capacidad de un nodo antes de
* ocupar otro nodo.
*/
void node_dist(slurm_job_info_t job_record, int type, int total_procs, int **qty, int *used_nodes) {
void node_dist(int type, int total_procs, int already_created, int **qty, int *used_nodes) {
int i, asigCores;
int tamBl, remainder;
int *procs;
procs = calloc(job_record.num_nodes, sizeof(int)); // Numero de procesos por nodo
procs = calloc(slurm_data->num_nodes, sizeof(int)); // Numero de procesos por nodo
/* GET NEW DISTRIBUTION */
if(type == 1) { // DIST NODES
*used_nodes = job_record.num_nodes;
tamBl = total_procs / job_record.num_nodes;
remainder = total_procs % job_record.num_nodes;
*used_nodes = slurm_data->num_nodes;
tamBl = total_procs / slurm_data->num_nodes;
remainder = total_procs % slurm_data->num_nodes;
for(i=0; i<remainder; i++) {
procs[i] = tamBl + 1;
}
for(i=remainder; i<job_record.num_nodes; i++) {
for(i=remainder; i<slurm_data->num_nodes; i++) {
procs[i] = tamBl;
}
} else if (type == 2) { // DIST CPUs
tamBl = job_record.num_cpus / job_record.num_nodes;
tamBl = slurm_data->num_cpus / slurm_data->num_nodes;
asigCores = 0;
i = 0;
*used_nodes = 0;
i = *used_nodes = already_created / tamBl;
remainder = already_created % tamBl;
//First node could already have existing procs
if (remainder) {
procs[i] = asigCores = tamBl - remainder;
i = (i+1) % slurm_data->num_nodes;
(*used_nodes)++;
}
//Assign tamBl to each node
while(asigCores+tamBl <= total_procs) {
asigCores += tamBl;
procs[i] += tamBl;
i = (i+1) % job_record.num_nodes;
i = (i+1) % slurm_data->num_nodes;
(*used_nodes)++;
}
//Last node could have less procs than tamBl
if(asigCores < total_procs) {
procs[i] += total_procs - asigCores;
(*used_nodes)++;
}
if(*used_nodes > job_record.num_nodes) *used_nodes = job_record.num_nodes;
if(*used_nodes > slurm_data->num_nodes) *used_nodes = slurm_data->num_nodes; //FIXME Si ocurre esto no es un error?
}
*qty = calloc(*used_nodes, sizeof(int)); // Numero de procesos por nodo
......@@ -263,9 +523,75 @@ void node_dist(slurm_job_info_t job_record, int type, int total_procs, int **qty
(*qty)[i] = procs[i];
}
free(procs);
}
/*
 * Builds the string to be used as the value of the "hosts" info key when
 * spawning processes, so that it states where each process must be created.
 *
 * The node names are taken, in order, from slurm_data->nodelist. Node "i"
 * contributes qty[i] entries; nodes with qty[i] == 0 are skipped.
 *
 * Parameters:
 *   qty           Number of processes per node; at least "used_nodes" items.
 *   used_nodes    Number of leading nodes of the nodelist to consider.
 *   hostfile_str  Output: receives the string allocated by write_str_node().
 *                 It is left untouched when no node contributes an entry.
 *                 The caller owns the string and must free() it.
 */
void fill_str_hostfile(int *qty, int used_nodes, char **hostfile_str) {
    int i = 0, len = 0;
    char *host;
    hostlist_t hostlist;

    hostlist = slurm_hostlist_create(slurm_data->nodelist);
    if (hostlist == NULL) {
        return; // The node list could not be parsed or allocated
    }

    // The node budget is tested BEFORE shifting: slurm_hostlist_shift()
    // returns a string owned by the caller, so shifting one host too many
    // and then leaving the loop would leak it. The loop also stops as soon
    // as write_str_node() reports an error (negative value), instead of
    // feeding that error code back as a length.
    while (i < used_nodes && len >= 0
           && (host = slurm_hostlist_shift(hostlist)) != NULL) {
        if (qty[i] != 0) {
            len = write_str_node(hostfile_str, len, qty[i], host);
        }
        i++;
        free(host);
    }

    slurm_hostlist_destroy(hostlist);
}
/*
 * Appends "qty" entries of "node_name" to the comma-separated list stored in
 * "*hostfile_str". The memory is allocated on the first call and grown on
 * the following ones.
 *
 * Parameters:
 *   hostfile_str  In/out. Address of the string. When len_og == 0 its
 *                 current value is ignored and a new buffer is allocated;
 *                 otherwise it must be the buffer produced by earlier calls.
 *   len_og        0 on the first call; afterwards, the value returned by the
 *                 previous call (size in bytes of the string, terminator
 *                 included). A negative value (earlier error) is returned
 *                 unchanged without touching the string.
 *   qty           Number of entries to add. Nothing is done if qty <= 0.
 *   node_name     Name to add.
 *
 * Returns the accumulated size, len_og + qty * (strlen(node_name) + 1),
 * which equals strlen(*hostfile_str) + 1; or -1 if the memory could not be
 * allocated. When growing fails the previous string is kept intact. (-2 was
 * formerly returned on a formatting error; that path no longer exists.)
 */
int write_str_node(char **hostfile_str, int len_og, int qty, char *node_name) {
    size_t len_node, len, total;
    char *buffer, *cursor;
    int i;

    if (hostfile_str == NULL || node_name == NULL) return -1;
    if (len_og < 0) return len_og; // A previous call already failed
    if (qty <= 0) return len_og;   // Nothing to append

    len_node = strlen(node_name);
    len = (size_t) qty * (len_node + 1); // Each entry: name + one separator
    // On the first call the missing leading separator pays for the
    // terminator; on later calls the terminator is already counted in
    // len_og. Either way "total" bytes hold the whole string.
    total = (size_t) len_og + len;

    if (len_og == 0) { // Memory not reserved yet
        buffer = malloc(total);
        if (buffer == NULL) {
            *hostfile_str = NULL;
            return -1;
        }
        cursor = buffer;
    } else { // String already holds data
        // Keep the old pointer until realloc succeeds so it is not lost.
        buffer = realloc(*hostfile_str, total);
        if (buffer == NULL) return -1;
        cursor = buffer + len_og - 1; // Overwrite the old terminator
    }
    *hostfile_str = buffer;

    for (i = 0; i < qty; i++) {
        // Only the very first entry of the whole string has no separator
        if (i > 0 || len_og != 0) *cursor++ = ',';
        memcpy(cursor, node_name, len_node);
        cursor += len_node;
    }
    *cursor = '\0';

    return (int) total;
}
//====================================================
//====================================================
//============DEPRECATED FUNCTIONS====================
//====================================================
//====================================================
/*
* @deprecated
* Crea un fichero que se utilizara como hostfile
* para un nuevo grupo de procesos.
*
......@@ -293,6 +619,7 @@ int create_hostfile(char *jobId, char **file_name) {
}
/*
* @deprecated
* Rellena un fichero hostfile indicado por ptr con los nombres
* de los nodos a utilizar indicados por "job_record" y la cantidad
* de procesos que alojara cada nodo indicado por "qty".
......@@ -312,6 +639,7 @@ void fill_hostfile(slurm_job_info_t job_record, int ptr, int *qty, int used_node
}
/*
* @deprecated
* Escribe en el fichero hostfile indicado por ptr una nueva linea.
*
* Esta linea indica el nombre de un nodo y la cantidad de procesos a
......@@ -336,51 +664,3 @@ int write_hostfile_node(int ptr, int qty, char *node_name) {
return 0;
}
/*
 * Builds a comma-separated string with the names of the nodes to use, taken
 * in order from job_record.nodes. Node "i" contributes qty[i] entries.
 *
 * Parameters:
 *   job_record    Job description; only its "nodes" field is read.
 *   qty           Number of processes per node; at least "used_nodes" items.
 *   used_nodes    Number of leading nodes of the list to consider.
 *   hostfile_str  Output: receives the string allocated by write_str_node().
 *                 It is left untouched when no node contributes an entry.
 *                 The caller owns the string and must free() it.
 */
void fill_str_hostfile(slurm_job_info_t job_record, int *qty, int used_nodes, char **hostfile_str) {
    int i = 0, len = 0;
    char *host;
    hostlist_t hostlist;

    hostlist = slurm_hostlist_create(job_record.nodes);
    if (hostlist == NULL) {
        return; // The node list could not be parsed or allocated
    }

    // Check the node budget before shifting: the string returned by
    // slurm_hostlist_shift() belongs to the caller, so taking one host more
    // than needed and then leaving the loop would leak it. A negative value
    // from write_str_node() is an error and also ends the loop.
    while (i < used_nodes && len >= 0
           && (host = slurm_hostlist_shift(hostlist)) != NULL) {
        // A node without processes must not appear in the list
        if (qty[i] != 0) {
            len = write_str_node(hostfile_str, len, qty[i], host);
        }
        i++;
        free(host);
    }

    slurm_hostlist_destroy(hostlist);
}
/*
 * Appends "qty" entries of the form "<node_name>," to the string stored in
 * "*hostfile_str" (every entry, including the last one, is followed by a
 * comma). The memory is allocated on the first call and grown afterwards.
 *
 * Parameters:
 *   hostfile_str  In/out. Address of the string. When len_og == 0 its
 *                 current value is ignored and a new buffer is allocated;
 *                 otherwise it must be the buffer produced by earlier calls.
 *   len_og        0 on the first call; afterwards, the value returned by the
 *                 previous call (characters already stored). A negative
 *                 value (earlier error) is returned unchanged.
 *   qty           Number of entries to add. Nothing is done if qty <= 0.
 *   node_name     Name to add.
 *
 * Returns the accumulated number of characters stored in the string
 * (len_og + qty * (strlen(node_name) + 1)), so the result can be passed back
 * as "len_og" for any number of calls; or -1 if the memory could not be
 * allocated, in which case a previously built string is kept intact.
 */
int write_str_node(char **hostfile_str, int len_og, int qty, char *node_name) {
    size_t name_len, added, total;
    char *buffer, *cursor;
    int i;

    if (hostfile_str == NULL || node_name == NULL) return -1;
    if (len_og < 0) return len_og; // A previous call already failed
    if (qty <= 0) return len_og;   // Nothing to append

    name_len = strlen(node_name);
    added = (size_t) qty * (name_len + 1); // Each entry: name + comma
    total = (size_t) len_og + added;       // Characters, terminator excluded

    if (len_og == 0) { // Memory not reserved yet
        buffer = malloc(total + 1);
        if (buffer == NULL) {
            *hostfile_str = NULL;
            return -1;
        }
    } else { // String already holds data
        // Keep the old pointer until realloc succeeds so it is not lost.
        buffer = realloc(*hostfile_str, total + 1);
        if (buffer == NULL) return -1;
    }
    *hostfile_str = buffer;

    cursor = buffer + len_og; // Start at the old terminator (or at offset 0)
    for (i = 0; i < qty; i++) {
        memcpy(cursor, node_name, name_len);
        cursor += name_len;
        *cursor++ = ',';
    }
    *cursor = '\0';

    return (int) total;
}
Supports Markdown
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment