Commit fca86a9b authored by iker_martin

Refactored Manager and CommDist for non-blocking communications and MPI_Request usage. Two minor bug fixes. The asynchronous RMA and Ibarrier strategies are the next steps to develop.
parent 95b08697
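
For orientation, the call pattern this refactor converges on looks roughly like the following. This is a minimal sketch, not code from this commit; send, qty, myId, numP, numO, red_strategies and intercomm are assumed to be set up by the caller, as send_data in the Manager does:

    // The request array starts empty; async_communication sizes it itself
    // through check_requests and fills it with the pending operations.
    MPI_Request *requests = NULL;
    size_t request_qty = 0;
    char *recv = NULL;
    int completed = 0;

    async_communication(send, &recv, qty, myId, numP, numO, MALLEABILITY_NOT_CHILDREN,
                        MALL_RED_POINT, red_strategies, intercomm, &requests, &request_qty);

    // Parents return immediately and poll, overlapping useful work.
    while(!completed) {
      MPI_Testall((int)request_qty, requests, &completed, MPI_STATUSES_IGNORE);
      /* ... computation to overlap ... */
    }
    free(requests);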
@@ -66,6 +66,7 @@ int main(int argc, char *argv[]) {
   set_benchmark_configuration(config_file);
   set_benchmark_results(results);
+  set_children_number(config_file->groups[group->grp+1].procs); // TODO TO BE DEPRECATED
   set_malleability_configuration(config_file->groups[group->grp+1].sm, config_file->groups[group->grp+1].ss,
                                  config_file->groups[group->grp+1].phy_dist, config_file->groups[group->grp+1].rm, config_file->groups[group->grp+1].rs);
...
@@ -6,16 +6,17 @@
 #include "CommDist.h"

 void prepare_redistribution(int qty, int myId, int numP, int numO, int is_children_group, int is_intercomm, char **recv, struct Counts *s_counts, struct Counts *r_counts);
+void check_requests(struct Counts s_counts, struct Counts r_counts, MPI_Request **requests, size_t *request_qty);

+void sync_point2point(char *send, char *recv, int is_intercomm, int myId, struct Counts s_counts, struct Counts r_counts, MPI_Comm comm);
 void sync_rma(char *send, char *recv, struct Counts r_counts, int tamBl, MPI_Comm comm, int red_method);
 void sync_rma_lock(char *recv, struct Counts r_counts, MPI_Win win);
 void sync_rma_lockall(char *recv, struct Counts r_counts, MPI_Win win);

-//////////////////////////
-void send_async_arrays(struct Dist_data dist_data, char *array, int numP_child, struct Counts *counts, MPI_Request *comm_req);
-void recv_async_arrays(struct Dist_data dist_data, char *array, int numP_parents, struct Counts *counts, MPI_Request *comm_req);
-void send_async_point_arrays(struct Dist_data dist_data, char *array, int numP_child, struct Counts *counts, MPI_Request *comm_req);
-void recv_async_point_arrays(struct Dist_data dist_data, char *array, int numP_parents, struct Counts *counts, MPI_Request *comm_req);
+void async_point2point(char *send, char *recv, struct Counts s_counts, struct Counts r_counts, MPI_Comm comm, MPI_Request *requests);
+void perform_manual_communication(char *send, char *recv, int myId, struct Counts s_counts, struct Counts r_counts);

 /*
  * Allocates memory for a vector of up to "qty" elements.
@@ -94,7 +95,8 @@ int sync_communication(char *send, char **recv, int qty, int myId, int numP, int
       break;
     case MALL_RED_POINT:
-      //TODO
+      sync_point2point(send, *recv, is_intercomm, myId, s_counts, r_counts, comm);
+      break;
     case MALL_RED_BASELINE:
     default:
       MPI_Alltoallv(send, s_counts.counts, s_counts.displs, MPI_CHAR, *recv, r_counts.counts, r_counts.displs, MPI_CHAR, comm);
@@ -109,6 +111,49 @@ int sync_communication(char *send, char **recv, int qty, int myId, int numP, int
   return 1; //FIXME In this case it is always true...
 }
+/*
+ * Performs a series of blocking point2point communications to redistribute an array in a block distribution.
+ * It should be called after calculating how data should be redistributed.
+ *
+ * - send (IN): Array with the data to send. This value cannot be NULL for parents.
+ * - recv (OUT): Array where data will be written. A NULL value is allowed if the process is not going to
+ *   receive data. If the process receives data and recv is NULL, the behaviour is undefined.
+ * - is_intercomm (IN): Indicates whether the communicator is an intercommunicator (TRUE) or an
+ *   intracommunicator (FALSE).
+ * - myId (IN): Rank of the MPI process in the local communicator. For the parents it is not the rank obtained from "comm".
+ * - s_counts (IN): Struct describing how many elements this process will send to each child, and
+ *   the displacements.
+ * - r_counts (IN): Struct describing how many elements this process will receive from each parent,
+ *   and the displacements.
+ * - comm (IN): Communicator to use to perform the redistribution.
+ *
+ */
+void sync_point2point(char *send, char *recv, int is_intercomm, int myId, struct Counts s_counts, struct Counts r_counts, MPI_Comm comm) {
+  int i, init, end;
+
+  // If the communicator is an intracommunicator and this process appears in its own
+  // send range, copy the self-addressed block manually and exclude that rank from
+  // the Send/Recv loops below to avoid a blocking send to itself.
+  init = s_counts.idI;
+  end = s_counts.idE;
+  if(!is_intercomm && (s_counts.idI == myId || s_counts.idE == myId + 1)) {
+    perform_manual_communication(send, recv, myId, s_counts, r_counts);
+
+    if(s_counts.idI == myId) init = s_counts.idI+1;
+    else end = s_counts.idE-1;
+  }
+
+  for(i=init; i<end; i++) {
+    MPI_Send(send+s_counts.displs[i], s_counts.counts[i], MPI_CHAR, i, 99, comm);
+  }
+
+  init = r_counts.idI;
+  end = r_counts.idE;
+  if(!is_intercomm) {
+    if(r_counts.idI == myId) init = r_counts.idI+1;
+    else if(r_counts.idE == myId + 1) end = r_counts.idE-1;
+  }
+
+  for(i=init; i<end; i++) {
+    MPI_Recv(recv+r_counts.displs[i], r_counts.counts[i], MPI_CHAR, i, 99, comm, MPI_STATUS_IGNORE);
+  }
+}
 /*
  * Performs synchronous MPI-RMA operations to redistribute an array in a block distribution. It should be called after calculating
@@ -131,7 +176,7 @@ void sync_rma(char *send, char *recv, struct Counts r_counts, int tamBl, MPI_Com
   aux_array_used = 0;
   if(send == NULL) {
     tamBl = 1;
-    send = malloc(tamBl*sizeof(char));
+    send = malloc(tamBl*sizeof(char)); //TODO Check if the value can be NULL at WIN_create
     aux_array_used = 1;
   }
   MPI_Win_create(send, (MPI_Aint)tamBl, sizeof(char), MPI_INFO_NULL, comm, &win);
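
On the TODO above: the MPI standard permits a process to contribute a zero-size window, and a zero-size contribution is never dereferenced, so the dummy 1-byte buffer could likely be dropped. A hedged sketch of that alternative (not what this commit does; whether a NULL base is accepted together with size 0 should be verified against the target MPI implementation):

    // Sketch: expose nothing instead of allocating an auxiliary buffer.
    if(send == NULL) {
      MPI_Win_create(NULL, 0, sizeof(char), MPI_INFO_NULL, comm, &win);
    } else {
      MPI_Win_create(send, (MPI_Aint)tamBl, sizeof(char), MPI_INFO_NULL, comm, &win);
    }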
@@ -204,179 +249,101 @@ void sync_rma_lockall(char *recv, struct Counts r_counts, MPI_Win win) {
 //================================================================================
-/*
- * Performs an asynchronous send of the array from this group of processes to the group
- * linked by the intercommunicator intercomm.
- *
- * The MPI_Request object is returned as a handle to check whether the communication
- * has finished.
- *
- * The array is not modified in this function.
- */
-int send_async(char *array, int qty, int myId, int numP, MPI_Comm intercomm, int numP_child, MPI_Request **comm_req, int red_method, int red_strategies) {
-  int i, is_intercomm;
-  struct Counts s_counts, r_counts;
-  struct Dist_data dist_data;
-
-  get_block_dist(qty, myId, numP, &dist_data); // Distribution of this process within its group
-  dist_data.intercomm = intercomm;
-
-  /* PREPARE COMMUNICATION */
-  MPI_Comm_test_inter(intercomm, &is_intercomm);
-  prepare_redistribution(qty, myId, numP, numP_child, MALLEABILITY_NOT_CHILDREN, is_intercomm, NULL, &s_counts, &r_counts);
-
-  // MAL_USE_THREAD follows the synchronous path
-  if(red_method == MALL_RED_BASELINE) {
-    //*comm_req = (MPI_Request *) malloc(sizeof(MPI_Request));
-    *comm_req[0] = MPI_REQUEST_NULL;
-    send_async_arrays(dist_data, array, numP_child, &s_counts, &(*comm_req[0]));
-  } else if (red_method == MALL_RED_IBARRIER){ //FIXME Not a method
-    //*comm_req = (MPI_Request *) malloc(2 * sizeof(MPI_Request));
-    *comm_req[0] = MPI_REQUEST_NULL;
-    *comm_req[1] = MPI_REQUEST_NULL;
-    send_async_arrays(dist_data, array, numP_child, &s_counts, &((*comm_req)[1]));
-    MPI_Ibarrier(intercomm, &((*comm_req)[0]) );
-  } else if (red_method == MALL_RED_POINT){
-    //*comm_req = (MPI_Request *) malloc(numP_child * sizeof(MPI_Request));
-    for(i=0; i<numP_child; i++){
-      (*comm_req)[i] = MPI_REQUEST_NULL;
-    }
-    send_async_point_arrays(dist_data, array, numP_child, &s_counts, *comm_req);
-  }
-
-  freeCounts(&s_counts);
-  freeCounts(&r_counts);
-  return 1;
-}
-
-/*
- * Performs an asynchronous reception of the array into this group of processes from
- * the group linked by the intercommunicator intercomm.
- *
- * The array is allocated inside the function and returned through the same argument.
- * It has to be freed afterwards by the user.
- *
- * The "parents_wait" argument indicates whether to use the version in which the parents
- * wait until they finish sending, or the one in which they wait until the children
- * finish receiving.
- */
-void recv_async(char **array, int qty, int myId, int numP, MPI_Comm intercomm, int numP_parents, int red_method, int red_strategies) {
-  int wait_err, i;
-  struct Counts counts;
-  struct Dist_data dist_data;
-  MPI_Request *comm_req, aux;
-
-  // Obtain the distribution for this child
-  get_block_dist(qty, myId, numP, &dist_data);
-  *array = malloc( dist_data.tamBl * sizeof(char));
-  dist_data.intercomm = intercomm;
-
-  /* PREPARE RECEPTION DATA FOR THE VECTOR */
-  //mallocCounts(&counts, numP_parents);
-
-  // MAL_USE_THREAD follows the synchronous path
-  if(red_method == MALL_RED_POINT) {
-    comm_req = (MPI_Request *) malloc(numP_parents * sizeof(MPI_Request));
-    for(i=0; i<numP_parents; i++){
-      comm_req[i] = MPI_REQUEST_NULL;
-    }
-    recv_async_point_arrays(dist_data, *array, numP_parents, &counts, comm_req);
-    wait_err = MPI_Waitall(numP_parents, comm_req, MPI_STATUSES_IGNORE);
-  } else if (red_method == MALL_RED_BASELINE || red_method == MALL_RED_IBARRIER) { //FIXME IBarrier is not a method
-    comm_req = (MPI_Request *) malloc(sizeof(MPI_Request));
-    *comm_req = MPI_REQUEST_NULL;
-    recv_async_arrays(dist_data, *array, numP_parents, &counts, comm_req);
-    wait_err = MPI_Wait(comm_req, MPI_STATUS_IGNORE);
-  }
-  if(wait_err != MPI_SUCCESS) {
-    MPI_Abort(MPI_COMM_WORLD, wait_err);
-  }
-
-  if(red_method == MALL_RED_IBARRIER) { //MAL USE IBARRIER END //FIXME IBarrier is not a method
-    MPI_Ibarrier(intercomm, &aux);
-    MPI_Wait(&aux, MPI_STATUS_IGNORE); //It is necessary to check that the communication has finished before disconnecting the process groups
-  }
-
-  //printf("S%d Tam %d String: %s END\n", myId, dist_data.tamBl, *array);
-  freeCounts(&counts);
-  free(comm_req);
-}
-
-/*
- * Sends to the children a vector that is redistributed among the child processes.
- * Before performing the communication, each parent process computes to which
- * processes of the other group elements are transmitted.
- *
- * The send is performed through a collective communication.
- */
-void send_async_arrays(struct Dist_data dist_data, char *array, int numP_child, struct Counts *counts, MPI_Request *comm_req) {
-
-  //prepare_comm_alltoall(dist_data.myId, dist_data.numP, numP_child, dist_data.qty, counts);
-
-  /* DATA COMMUNICATION */
-  MPI_Ialltoallv(array, counts->counts, counts->displs, MPI_CHAR, NULL, counts->zero_arr, counts->zero_arr, MPI_CHAR, dist_data.intercomm, comm_req);
-}
-
-/*
- * Sends to the children a vector that is redistributed among the child processes.
- * Before performing the communication, each parent process computes to which
- * processes of the other group elements are transmitted.
- *
- * The send is performed through several point-to-point communications.
- */
-void send_async_point_arrays(struct Dist_data dist_data, char *array, int numP_child, struct Counts *counts, MPI_Request *comm_req) {
-  int i;
-
-  // PREPARE SENDING THE VECTOR
-  prepare_comm_alltoall(dist_data.myId, dist_data.numP, numP_child, dist_data.qty, counts);
-
-  for(i=0; i<numP_child; i++) { //TODO This proposal no longer uses idI and idE
-    if(counts->counts[0] != 0) {
-      MPI_Isend(array+counts->displs[i], counts->counts[i], MPI_CHAR, i, 99, dist_data.intercomm, &(comm_req[i]));
-    }
-  }
-  //print_counts(dist_data, counts.counts, counts.displs, numP_child, "Padres");
-}
+/*
+ * //TODO Add IBARRIER strategy
+ * Performs a communication to redistribute an array in a block distribution with non-blocking MPI functions.
+ * The redistribution distinguishes the parent group from the children, and the values each group indicates can
+ * differ.
+ *
+ * - send (IN): Array with the data to send. This data cannot be NULL for parents.
+ * - recv (OUT): Array where data will be written. A NULL value is allowed if the process is not going to receive data.
+ *   If the process receives data and recv is NULL, the behaviour is undefined.
+ * - qty (IN): Sum of elements shared by all processes that will send data.
+ * - myId (IN): Rank of the MPI process in the local communicator. For the parents it is not the rank obtained from "comm".
+ * - numP (IN): Size of the local group. If it is a children group, this parameter must match
+ *   "MPI_Comm_size(comm)". For the parents it is not always the size obtained from "comm".
+ * - numO (IN): Amount of processes in the remote group. For the parents it is the target quantity of processes after the
+ *   resize, while for the children it is the amount of parents.
+ * - is_children_group (IN): Indicates whether this MPI rank is a child (TRUE) or a parent (FALSE).
+ * - comm (IN): Communicator to use to perform the redistribution.
+ * - requests (OUT): Pointer to an array of requests used to determine whether the communication has ended. If the pointer
+ *   is NULL or not enough space has been reserved, the array is allocated/reallocated.
+ * - request_qty (OUT): Quantity of requests to be used. If a process both sends and receives data, this value is
+ *   updated to the expected value.
+ *
+ * returns: An integer indicating whether the operation has completed (TRUE) or not (FALSE). //FIXME In this case it is always false...
+ */
+int async_communication(char *send, char **recv, int qty, int myId, int numP, int numO, int is_children_group, int red_method, int red_strategies, MPI_Comm comm, MPI_Request **requests, size_t *request_qty) {
+  int is_intercomm, aux_comm_used = 0;
+  struct Counts s_counts, r_counts;
+  MPI_Comm aux_comm = MPI_COMM_NULL;
+
+  /* PREPARE COMMUNICATION */
+  MPI_Comm_test_inter(comm, &is_intercomm);
+  prepare_redistribution(qty, myId, numP, numO, is_children_group, is_intercomm, recv, &s_counts, &r_counts);
+  check_requests(s_counts, r_counts, requests, request_qty);
+
+  /* PERFORM COMMUNICATION */
+  switch(red_method) {
+    case MALL_RED_RMA_LOCKALL:
+    case MALL_RED_RMA_LOCK:
+      return MALL_DENIED; //TODO Implement asynchronous versions
+    case MALL_RED_POINT:
+      async_point2point(send, *recv, s_counts, r_counts, comm, *requests);
+      break;
+    case MALL_RED_BASELINE:
+    default:
+      MPI_Ialltoallv(send, s_counts.counts, s_counts.displs, MPI_CHAR, *recv, r_counts.counts, r_counts.displs, MPI_CHAR, comm, &((*requests)[0]));
+      break;
+  }
+
+  /* POST REQUESTS CHECKS */
+  if(is_children_group) {
+    MPI_Waitall(*request_qty, *requests, MPI_STATUSES_IGNORE);
+  }
+  if(malleability_red_contains_strat(red_strategies, MALL_RED_IBARRIER, NULL)) { //FIXME Strategy not fully implemented
+    MPI_Ibarrier(comm, &((*requests)[*request_qty-1]) ); //FIXME Not easy to read...
+    if(is_children_group) {
+      MPI_Wait(&((*requests)[*request_qty-1]), MPI_STATUS_IGNORE); //FIXME Not easy to read...
+    }
+  }
+
+  if(aux_comm_used) {
+    MPI_Comm_free(&aux_comm);
+  }
+  freeCounts(&s_counts);
+  freeCounts(&r_counts);
+  return 0; //FIXME In this case it is always false...
+}
-/*
- * Receives from the parents a vector that is redistributed among the processes
- * of this group. Before performing the communication, each child computes from
- * which processes of the other group elements are transmitted.
- *
- * The reception is performed through a collective communication.
- */
-void recv_async_arrays(struct Dist_data dist_data, char *array, int numP_parents, struct Counts *counts, MPI_Request *comm_req) {
-  char *aux = malloc(1);
-
-  // Adjust the reception values
-  prepare_comm_alltoall(dist_data.myId, dist_data.numP, numP_parents, dist_data.qty, counts);
-  //print_counts(dist_data, counts->counts, counts->displs, numP_parents, 1, "Children");
-
-  /* DATA COMMUNICATION */
-  MPI_Ialltoallv(aux, counts->zero_arr, counts->zero_arr, MPI_CHAR, array, counts->counts, counts->displs, MPI_CHAR, dist_data.intercomm, comm_req);
-  free(aux);
-}
-
-/*
- * Receives from the parents a vector that is redistributed among the processes
- * of this group. Before performing the communication, each child computes from
- * which processes of the other group elements are transmitted.
- *
- * The reception is performed through several point-to-point communications.
- */
-void recv_async_point_arrays(struct Dist_data dist_data, char *array, int numP_parents, struct Counts *counts, MPI_Request *comm_req) {
-  int i;
-
-  // Adjust the reception values
-  prepare_comm_alltoall(dist_data.myId, dist_data.numP, numP_parents, dist_data.qty, counts);
-
-  for(i=0; i<numP_parents; i++) { //TODO This proposal no longer uses idI and idE
-    if(counts->counts[0] != 0) {
-      MPI_Irecv(array+counts->displs[i], counts->counts[i], MPI_CHAR, i, 99, dist_data.intercomm, &(comm_req[i])); //FIXME Recv buffer
-    }
-  }
-  //print_counts(dist_data, counts.counts, counts.displs, numP_parents, "Hijos");
-}
+/*
+ * Performs a series of non-blocking point2point communications to redistribute an array in a block distribution.
+ * It should be called after calculating how data should be redistributed.
+ *
+ * - send (IN): Array with the data to send. This value cannot be NULL for parents.
+ * - recv (OUT): Array where data will be written. A NULL value is allowed if the process is not going to
+ *   receive data. If the process receives data and recv is NULL, the behaviour is undefined.
+ * - s_counts (IN): Struct describing how many elements this process will send to each child, and
+ *   the displacements.
+ * - r_counts (IN): Struct describing how many elements this process will receive from each parent,
+ *   and the displacements.
+ * - comm (IN): Communicator to use to perform the redistribution.
+ * - requests (OUT): Array of requests used to determine whether the communication has ended.
+ *
+ */
+void async_point2point(char *send, char *recv, struct Counts s_counts, struct Counts r_counts, MPI_Comm comm, MPI_Request *requests) {
+  int i, j = 0;
+
+  for(i=s_counts.idI; i<s_counts.idE; i++) {
+    MPI_Isend(send+s_counts.displs[i], s_counts.counts[i], MPI_CHAR, i, 99, comm, &(requests[j]));
+    j++;
+  }
+
+  for(i=r_counts.idI; i<r_counts.idE; i++) {
+    MPI_Irecv(recv+r_counts.displs[i], r_counts.counts[i], MPI_CHAR, i, 99, comm, &(requests[j]));
+    j++;
+  }
+}
 /*
@@ -437,6 +404,63 @@ print_counts(dist_data, s_counts->counts, s_counts->displs, numO, 1, "Parents ")
   }
 }
+/*
+ * Ensures that a process's array of requests has as many elements as the number of communication
+ * calls the process will perform. If the array is not initialized or does not have enough space, it is
+ * allocated/reallocated to the minimum amount of space needed.
+ *
+ * - s_counts (IN): Struct indicating how many elements this process sends to processes in the new group.
+ * - r_counts (IN): Struct indicating how many elements this process receives from other processes in the previous group.
+ * - requests (OUT): Pointer to an array of requests used to determine whether the communication has ended. If the pointer
+ *   is NULL or not enough space has been reserved, the array is allocated/reallocated.
+ * - request_qty (OUT): Quantity of requests to be used. If the value is smaller than the number of communication
+ *   calls to perform, it is raised to that minimum value.
+ */
+void check_requests(struct Counts s_counts, struct Counts r_counts, MPI_Request **requests, size_t *request_qty) {
+  size_t i, sum;
+  MPI_Request *aux;
+
+  sum = (size_t) s_counts.idE - s_counts.idI;
+  sum += (size_t) r_counts.idE - r_counts.idI;
+
+  if (*requests != NULL && sum <= *request_qty) return; // Expected amount of requests
+  // FIXME If the Ibarrier strategy is used, how is it accounted for in the total??
+
+  if (*requests == NULL) {
+    *requests = (MPI_Request *) malloc(sum * sizeof(MPI_Request));
+  } else { // Array exists, but is too small
+    aux = (MPI_Request *) realloc(*requests, sum * sizeof(MPI_Request));
+    *requests = aux;
+  }
+
+  if (*requests == NULL) {
+    fprintf(stderr, "Fatal error - It was not possible to allocate/reallocate memory for the MPI_Requests before the redistribution\n");
+    MPI_Abort(MPI_COMM_WORLD, 1);
+  }
+
+  for(i=0; i < sum; i++) {
+    (*requests)[i] = MPI_REQUEST_NULL;
+  }
+  *request_qty = sum;
+}
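
One possible answer to the FIXME above is to let check_requests see the chosen strategies and reserve one extra slot; the red_strategies parameter in this sketch is hypothetical, not part of this commit:

    // Sketch: reserve a trailing slot for the MPI_Ibarrier request, so the
    // (*requests)[*request_qty-1] accesses in async_communication do not
    // overwrite the request of a real send or receive.
    sum = (size_t) s_counts.idE - s_counts.idI;
    sum += (size_t) r_counts.idE - r_counts.idI;
    if(malleability_red_contains_strat(red_strategies, MALL_RED_IBARRIER, NULL)) {
      sum += 1;
    }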
+/*
+ * Special case that performs a manual copy of data when a process has to send data to itself. Only used
+ * when the MPI communication cannot handle this situation. An example is when using point-to-point
+ * communications and the process has to perform a Send and a Recv to itself.
+ *
+ * - send (IN): Array with the data to send. This value cannot be NULL.
+ * - recv (OUT): Array where data will be written. This value cannot be NULL.
+ * - myId (IN): Rank of the MPI process in the local communicator. For the parents it is not the rank obtained from "comm".
+ * - s_counts (IN): Struct indicating how many elements this process sends to processes in the new group.
+ * - r_counts (IN): Struct indicating how many elements this process receives from other processes in the previous group.
+ */
+void perform_manual_communication(char *send, char *recv, int myId, struct Counts s_counts, struct Counts r_counts) {
+  int i;
+  for(i=0; i<s_counts.counts[myId]; i++) {
+    recv[i+r_counts.displs[myId]] = send[i+s_counts.displs[myId]];
+  }
+}
 /*
  * Function to determine whether, among the chosen strategies, use is made of
...
@@ -17,6 +17,7 @@
 //#define MAL_USE_THREAD 3

 int sync_communication(char *send, char **recv, int qty, int myId, int numP, int numO, int is_children_group, int comm_type, MPI_Comm comm);
+int async_communication(char *send, char **recv, int qty, int myId, int numP, int numO, int is_children_group, int red_method, int red_strategies, MPI_Comm comm, MPI_Request **requests, size_t *request_qty);
 int send_async(char *array, int qty, int myId, int numP, MPI_Comm intercomm, int numP_child, MPI_Request **comm_req, int red_method, int red_strategies);
 void recv_async(char **array, int qty, int myId, int numP, MPI_Comm intercomm, int numP_parents, int red_method, int red_strategies);
...
@@ -23,7 +23,7 @@ void prepare_comm_alltoall(int myId, int numP, int numP_other, int n, struct Cou
   get_util_ids(dist_data, numP_other, &idS);

   counts->idI = idS[0];
-  counts->idE = idS[0];
+  counts->idE = idS[1];

   get_block_dist(n, idS[0], numP_other, &dist_target); // RMA Specific operation
   counts->first_target_displs = dist_data.ini - dist_target.ini; // RMA Specific operation
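
This one-character change is one of the two bug fixes mentioned in the commit message: idI and idE delimit the half-open range [idI, idE) of peer ranks that the point-to-point loops iterate over, so copying idS[0] into idE left the range empty and no operation was ever posted. Illustrative only, assuming get_util_ids returns the first peer rank in idS[0] and the last-plus-one in idS[1]:

    // With idE = idS[1], a process posts one operation per peer rank;
    // with the old idE = idS[0], idI == idE and this loop never ran.
    for(i = counts->idI; i < counts->idE; i++) {
      /* MPI_Isend / MPI_Irecv to peer i */
    }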
...
@@ -437,7 +437,8 @@ void send_data(int numP_children, malleability_data_t *data_struct, int is_async
     for(i=0; i < data_struct->entries; i++) {
       aux_send = (char *) data_struct->arrays[i]; //TODO Check that it really is a char
       aux_recv = NULL;
-      send_async(aux_send, data_struct->qty[i], mall->myId, mall->numP, mall->intercomm, numP_children, data_struct->requests, mall_conf->red_method, mall_conf->red_strategies);
+      async_communication(aux_send, &aux_recv, data_struct->qty[i], mall->myId, mall->numP, numP_children, MALLEABILITY_NOT_CHILDREN, mall_conf->red_method, mall_conf->red_strategies, mall->intercomm,
+                          &(data_struct->requests[i]), &(data_struct->request_qty[i]));
       if(aux_recv != NULL) data_struct->arrays[i] = (void *) aux_recv;
     }
   } else {
@@ -462,7 +463,8 @@ void recv_data(int numP_parents, malleability_data_t *data_struct, int is_asynch
   if(is_asynchronous) {
     for(i=0; i < data_struct->entries; i++) {
       aux = (char *) data_struct->arrays[i]; //TODO Check that it really is a char
-      recv_async(&aux, data_struct->qty[i], mall->myId, mall->numP, mall->intercomm, numP_parents, mall_conf->red_method, mall_conf->red_strategies);
+      async_communication(&aux_s, &aux, data_struct->qty[i], mall->myId, mall->numP, numP_parents, MALLEABILITY_CHILDREN, mall_conf->red_method, mall_conf->red_strategies, mall->intercomm,
+                          &(data_struct->requests[i]), &(data_struct->request_qty[i]));
       data_struct->arrays[i] = (void *) aux;
     }
   } else {
@@ -641,21 +643,16 @@ int start_redistribution() {
  * the children have finished receiving.
  */
 int check_redistribution() {
-  int is_intercomm, completed, all_completed, test_err;
+  int is_intercomm, req_qty, completed, all_completed, test_err;
   MPI_Request *req_completed;
-  //dist_a_data->requests[0][X] //FIXME Magic number 0 -- Change it into a for loop?
-  //TODO Change to a switch-case
-  if (mall_conf->red_method == MALL_RED_POINT) {
-    test_err = MPI_Testall(mall->numC, dist_a_data->requests[0], &completed, MPI_STATUSES_IGNORE);
+  //FIXME Change this into a for loop
+  req_completed = dist_a_data->requests[0]; //FIXME Magic number
+  req_qty = dist_a_data->request_qty[0]; //FIXME Magic number
+
+  if(malleability_red_contains_strat(mall_conf->red_strategies, MALL_RED_IBARRIER, NULL)) { //FIXME Strategy not fully implemented
+    test_err = MPI_Test(&(req_completed[req_qty-1]), &completed, MPI_STATUS_IGNORE);
   } else {
-    if(mall_conf->red_method == MALL_RED_BASELINE) {
-      req_completed = &(dist_a_data->requests[0][0]);
-    } else if (mall_conf->red_method == MALL_RED_IBARRIER) { //FIXME Not a method
-      req_completed = &(dist_a_data->requests[0][1]);
-    }
-    test_err = MPI_Test(req_completed, &completed, MPI_STATUS_IGNORE);
+    test_err = MPI_Testall(req_qty, req_completed, &completed, MPI_STATUSES_IGNORE);
   }

   if (test_err != MPI_SUCCESS && test_err != MPI_ERR_PENDING) {
@@ -663,12 +660,11 @@ int check_redistribution() {
     MPI_Abort(MPI_COMM_WORLD, test_err);
   }

-  MPI_Wait(req_completed, MPI_STATUS_IGNORE);
+  completed=1;
   MPI_Allreduce(&completed, &all_completed, 1, MPI_INT, MPI_MIN, mall->comm);
   if(!all_completed) return MALL_DIST_PENDING; // Continue only if asynchronous send has ended

-  if(mall_conf->red_method == MALL_RED_IBARRIER) { //FIXME Not a method
-    MPI_Wait(&(dist_a_data->requests[0][0]), MPI_STATUS_IGNORE); // Mark the asynchronous send as completed
+  if(malleability_red_contains_strat(mall_conf->red_strategies, MALL_RED_IBARRIER, NULL)) { //FIXME Strategy not fully implemented
+    MPI_Waitall(req_qty, req_completed, MPI_STATUSES_IGNORE);
     //For the disconnection of both process groups it is necessary to inform MPI that this comm
     //has finished, even though this point can only be reached once it has finished
   }
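
For reference, the Ibarrier strategy these FIXMEs track boils down to the following handshake; this is a condensed restatement of the logic already spread across async_communication and check_redistribution, not new behaviour, assuming an int request_qty and the requests array sized by check_requests:

    // Children: finish all receives, then join the barrier and block on it.
    // Parents: post the Isends plus the Ibarrier, and later test only the
    // barrier request; it can complete only once every child is done.
    if(is_children_group) {
      MPI_Waitall(request_qty, requests, MPI_STATUSES_IGNORE);
      MPI_Ibarrier(comm, &requests[request_qty-1]);
      MPI_Wait(&requests[request_qty-1], MPI_STATUS_IGNORE);
    } else {
      MPI_Ibarrier(comm, &requests[request_qty-1]);
      /* later, in check_redistribution: */
      MPI_Test(&requests[request_qty-1], &completed, MPI_STATUS_IGNORE);
    }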
...
@@ -147,8 +147,6 @@ void init_malleability_data_struct(malleability_data_t *data_struct, size_t size
   data_struct->requests = (MPI_Request **) malloc(size * sizeof(MPI_Request *));
   data_struct->arrays = (void **) malloc(size * sizeof(void *));
-  data_struct->request_ibarrier = MPI_REQUEST_NULL;

   for(i=0; i<size; i++) { //calloc and memset do not ensure a NULL value
     data_struct->requests[i] = NULL;
     data_struct->arrays[i] = NULL;
...
@@ -13,7 +13,6 @@
 typedef struct {
   size_t entries; // Indicates the number of vectors to communicate (replicated data)
   size_t max_entries;
-  MPI_Request request_ibarrier; // Request used to indicate that the parents wait until the children finish receiving
   size_t *qty; // Indicates the number of elements in each subvector of sync_array
   int *types;
...