Skip to content
GitLab
Menu
Projects
Groups
Snippets
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
Iker Martín Álvarez
Proteo
Commits
241e098e
Commit
241e098e
authored
Jun 04, 2024
by
Iker Martín Álvarez
Browse files
WIP. Modified all compilation constants to start with MAM
parent
33fb8b86
Changes
8
Show whitespace changes
Inline
Side-by-side
Codes/Makefile
View file @
241e098e
...
...
@@ -4,14 +4,14 @@ MCC = mpicc
C_FLAGS
=
-Wall
-Wextra
-Wshadow
-Wfatal-errors
LD_FLAGS
=
-lm
-pthread
USE_MAL
_SLURM
?=
0
USE_MAL
_BARRIERS
?=
0
USE_
MA
L
_DEBUG
?=
0
MAM_USE
_SLURM
?=
0
MAM_USE
_BARRIERS
?=
0
MA
M
_DEBUG
?=
0
ifeq
($(
USE_MAL
_SLURM),1)
ifeq
($(
MAM_USE
_SLURM),1)
LD_FLAGS
+=
-lslurm
endif
DEF
=
-D
USE_MAL
_SLURM
=
$(
USE_MAL
_SLURM)
-D
USE_MAL
_BARRIERS
=
$(
USE_MAL
_BARRIERS)
-D
USE_
MA
L
_DEBUG
=
$(
USE_
MA
L
_DEBUG)
DEF
=
-D
MAM_USE
_SLURM
=
$(
MAM_USE
_SLURM)
-D
MAM_USE
_BARRIERS
=
$(
MAM_USE
_BARRIERS)
-DMA
M
_DEBUG
=
$(MA
M
_DEBUG)
.PHONY
:
clean clear install
...
...
Codes/malleability/MAM_Configuration.c
View file @
241e098e
...
...
@@ -185,7 +185,7 @@ void MAM_Set_initial_configuration() {
MPI_Abort
(
mall
->
comm
,
-
50
);
}
#if
USE_
MA
L
_DEBUG >= 2
#if MA
M
_DEBUG >= 2
if
(
mall
->
myId
==
mall
->
root
)
{
DEBUG_FUNC
(
"Initial configuration settled"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
...
...
Codes/malleability/MAM_Manager.c
View file @
241e098e
...
...
@@ -75,7 +75,7 @@ int MAM_Init(int root, MPI_Comm *comm, char *name_exec, void (*user_function)(vo
MPI_Comm_rank
(
*
comm
,
&
(
mall
->
myId
));
MPI_Comm_size
(
*
comm
,
&
(
mall
->
numP
));
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
DEBUG_FUNC
(
"Initializing MaM"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
*
comm
);
#endif
...
...
@@ -128,12 +128,12 @@ int MAM_Init(int root, MPI_Comm *comm, char *name_exec, void (*user_function)(vo
mall
->
internode_group
=
MAM_Is_internode_group
();
MAM_Set_initial_configuration
();
#if
USE_MAL
_BARRIERS &&
USE_
MA
L
_DEBUG
#if
MAM_USE
_BARRIERS && MA
M
_DEBUG
if
(
mall
->
myId
==
mall
->
root
)
printf
(
"MaM: Using barriers to record times.
\n
"
);
#endif
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
DEBUG_FUNC
(
"MaM has been initialized correctly as parents"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
*
comm
);
#endif
...
...
@@ -253,7 +253,7 @@ void MAM_Resume_redistribution(int *mam_state) {
*/
void
MAM_Commit
(
int
*
mam_state
)
{
int
request_abort
;
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
if
(
mall
->
myId
==
mall
->
root
){
DEBUG_FUNC
(
"Trying to commit"
,
mall
->
myId
,
mall
->
numP
);
}
fflush
(
stdout
);
#endif
...
...
@@ -270,7 +270,7 @@ void MAM_Commit(int *mam_state) {
// Zombies Treatment
MAM_Zombies_update
();
if
(
mall
->
zombie
)
{
#if
USE_
MA
L
_DEBUG >= 1
#if MA
M
_DEBUG >= 1
DEBUG_FUNC
(
"Is terminating as zombie"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
#endif
request_abort
=
MAM_Finalize
();
...
...
@@ -294,11 +294,11 @@ void MAM_Commit(int *mam_state) {
MPI_Comm_dup
(
mall
->
comm
,
mall
->
user_comm
);
//if(mall_conf->spawn_method == MAM_SPAWN_BASELINE) { *(mall->user_comm) = MPI_COMM_WORLD; }
//else if(mall_conf->spawn_method == MAM_SPAWN_MERGE) { MPI_Comm_dup(mall->comm, mall->user_comm); }
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
if
(
mall
->
myId
==
mall
->
root
)
DEBUG_FUNC
(
"Reconfiguration has been commited"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
#endif
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
comm
);
#endif
mall_conf
->
times
->
malleability_end
=
MPI_Wtime
();
...
...
@@ -546,7 +546,7 @@ void recv_data(int numP_parents, malleability_data_t *data_struct, int is_asynch
int
MAM_St_rms
(
int
*
mam_state
)
{
reset_malleability_times
();
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
comm
);
#endif
mall_conf
->
times
->
malleability_start
=
MPI_Wtime
();
...
...
@@ -576,7 +576,7 @@ int MAM_St_spawn_start() {
int
MAM_St_spawn_pending
(
int
wait_completed
)
{
state
=
check_spawn_state
(
&
(
mall
->
intercomm
),
mall
->
comm
,
wait_completed
);
if
(
state
==
MAM_I_SPAWN_COMPLETED
||
state
==
MAM_I_SPAWN_ADAPTED
)
{
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
comm
);
#endif
mall_conf
->
times
->
spawn_time
=
MPI_Wtime
()
-
mall_conf
->
times
->
malleability_start
;
...
...
@@ -611,7 +611,7 @@ int MAM_St_red_pending(int wait_completed) {
}
int
MAM_St_user_start
(
int
*
mam_state
)
{
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
mall_conf
->
times
->
user_start
=
MPI_Wtime
();
// Obtener timestamp de cuando termina user redist
...
...
@@ -627,7 +627,7 @@ int MAM_St_user_start(int *mam_state) {
}
int
MAM_St_user_pending
(
int
*
mam_state
,
int
wait_completed
,
void
(
*
user_function
)(
void
*
),
void
*
user_args
)
{
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
if
(
mall
->
myId
==
mall
->
root
)
DEBUG_FUNC
(
"Starting USER redistribution"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
#endif
if
(
user_function
!=
NULL
)
{
...
...
@@ -640,11 +640,11 @@ int MAM_St_user_pending(int *mam_state, int wait_completed, void (*user_function
}
if
(
state
!=
MAM_I_USER_PENDING
)
{
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
if
(
mall_conf
->
spawn_method
==
MAM_SPAWN_MERGE
)
mall_conf
->
times
->
user_end
=
MPI_Wtime
();
// Obtener timestamp de cuando termina user redist
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
if
(
mall
->
myId
==
mall
->
root
)
DEBUG_FUNC
(
"Ended USER redistribution"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
#endif
return
1
;
...
...
@@ -659,7 +659,7 @@ int MAM_St_user_completed() {
int
MAM_St_spawn_adapt_pending
(
int
wait_completed
)
{
wait_completed
=
MAM_WAIT_COMPLETION
;
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
comm
);
#endif
mall_conf
->
times
->
spawn_start
=
MPI_Wtime
();
...
...
@@ -670,7 +670,7 @@ int MAM_St_spawn_adapt_pending(int wait_completed) {
* NO es posible debido a que solo se puede hacer tras enviar los datos variables
* y por tanto pierden validez dichos datos
if(!MAM_Contains_strat(MAM_SPAWN_STRATEGIES, MAM_STRAT_SPAWN_PTHREAD, NULL)) {
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier(mall->comm);
#endif
mall_conf->times->spawn_time = MPI_Wtime() - mall_conf->times->spawn_start;
...
...
@@ -678,7 +678,7 @@ int MAM_St_spawn_adapt_pending(int wait_completed) {
}
return 0;
*/
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
comm
);
#endif
mall_conf
->
times
->
spawn_time
=
MPI_Wtime
()
-
mall_conf
->
times
->
spawn_start
;
...
...
@@ -709,7 +709,7 @@ int MAM_St_completed(int *mam_state) {
void
Children_init
(
void
(
*
user_function
)(
void
*
),
void
*
user_args
)
{
size_t
i
;
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
DEBUG_FUNC
(
"MaM will now initialize spawned processes"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
...
...
@@ -726,16 +726,16 @@ void Children_init(void (*user_function)(void *), void *user_args) {
mall
->
internode_group
=
MAM_Is_internode_group
();
}
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
DEBUG_FUNC
(
"Spawned have completed spawn step"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
comm_data_info
(
rep_a_data
,
dist_a_data
,
MAM_TARGETS
);
if
(
dist_a_data
->
entries
||
rep_a_data
->
entries
)
{
// Recibir datos asincronos
#if
USE_
MA
L
_DEBUG >= 2
#if MA
M
_DEBUG >= 2
DEBUG_FUNC
(
"Spawned start asynchronous redistribution"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
...
...
@@ -750,7 +750,7 @@ void Children_init(void (*user_function)(void *), void *user_args) {
for
(
i
=
0
;
i
<
rep_a_data
->
entries
;
i
++
)
{
MPI_Ibcast
(
rep_a_data
->
arrays
[
i
],
rep_a_data
->
qty
[
i
],
rep_a_data
->
types
[
i
],
mall
->
root_collectives
,
mall
->
intercomm
,
&
(
rep_a_data
->
requests
[
i
][
0
]));
}
#if
USE_
MA
L
_DEBUG >= 2
#if MA
M
_DEBUG >= 2
DEBUG_FUNC
(
"Spawned started asynchronous redistribution"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
...
...
@@ -766,7 +766,7 @@ void Children_init(void (*user_function)(void *), void *user_args) {
MPI_Wait
(
&
mall
->
wait_targets
,
MPI_STATUS_IGNORE
);
}
#if
USE_
MA
L
_DEBUG >= 2
#if MA
M
_DEBUG >= 2
DEBUG_FUNC
(
"Spawned waited for all asynchronous redistributions"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
for
(
i
=
0
;
i
<
dist_a_data
->
entries
;
i
++
)
{
...
...
@@ -777,16 +777,16 @@ void Children_init(void (*user_function)(void *), void *user_args) {
}
}
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
mall_conf
->
times
->
async_end
=
MPI_Wtime
();
// Obtener timestamp de cuando termina comm asincrona
}
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
DEBUG_FUNC
(
"Spawned have completed asynchronous data redistribution step"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
if
(
MAM_Contains_strat
(
MAM_SPAWN_STRATEGIES
,
MAM_STRAT_SPAWN_INTERCOMM
,
NULL
))
{
...
...
@@ -800,14 +800,14 @@ void Children_init(void (*user_function)(void *), void *user_args) {
MAM_I_create_user_struct
(
MAM_TARGETS
);
user_function
(
user_args
);
}
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
mall_conf
->
times
->
user_end
=
MPI_Wtime
();
// Obtener timestamp de cuando termina user redist
comm_data_info
(
rep_s_data
,
dist_s_data
,
MAM_TARGETS
);
if
(
dist_s_data
->
entries
||
rep_s_data
->
entries
)
{
// Recibir datos sincronos
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
recv_data
(
mall
->
num_parents
,
dist_s_data
,
MAM_USE_SYNCHRONOUS
);
...
...
@@ -815,18 +815,18 @@ void Children_init(void (*user_function)(void *), void *user_args) {
for
(
i
=
0
;
i
<
rep_s_data
->
entries
;
i
++
)
{
MPI_Bcast
(
rep_s_data
->
arrays
[
i
],
rep_s_data
->
qty
[
i
],
rep_s_data
->
types
[
i
],
mall
->
root_collectives
,
mall
->
intercomm
);
}
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
mall_conf
->
times
->
sync_end
=
MPI_Wtime
();
// Obtener timestamp de cuando termina comm sincrona
}
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
DEBUG_FUNC
(
"Targets have completed synchronous data redistribution step"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
MAM_Commit
(
NULL
);
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
DEBUG_FUNC
(
"MaM has been initialized correctly for new ranks"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
}
...
...
@@ -844,7 +844,7 @@ void Children_init(void (*user_function)(void *), void *user_args) {
* Si se pide en segundo plano devuelve el estado actual.
*/
int
spawn_step
(){
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
comm
);
#endif
mall_conf
->
times
->
spawn_start
=
MPI_Wtime
();
...
...
@@ -852,7 +852,7 @@ int spawn_step(){
state
=
init_spawn
(
mall
->
thread_comm
,
&
(
mall
->
intercomm
));
if
(
!
MAM_Contains_strat
(
MAM_SPAWN_STRATEGIES
,
MAM_STRAT_SPAWN_PTHREAD
,
NULL
))
{
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
comm
);
#endif
mall_conf
->
times
->
spawn_time
=
MPI_Wtime
()
-
mall_conf
->
times
->
malleability_start
;
...
...
@@ -886,7 +886,7 @@ int start_redistribution() {
comm_data_info
(
rep_a_data
,
dist_a_data
,
MAM_SOURCES
);
if
(
dist_a_data
->
entries
||
rep_a_data
->
entries
)
{
// Enviar datos asincronos
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
mall_conf
->
times
->
async_start
=
MPI_Wtime
();
...
...
@@ -929,7 +929,7 @@ int check_redistribution(int wait_completed) {
MPI_Request
*
req_completed
;
MPI_Win
window
;
local_completed
=
1
;
#if
USE_
MA
L
_DEBUG >= 2
#if MA
M
_DEBUG >= 2
DEBUG_FUNC
(
"Sources are testing for all asynchronous redistributions"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
...
...
@@ -973,7 +973,7 @@ int check_redistribution(int wait_completed) {
MPI_Test
(
&
mall
->
wait_targets
,
&
local_completed
,
MPI_STATUS_IGNORE
);
//TODO - Figure out if last process takes profit from calling here
}
}
#if
USE_
MA
L
_DEBUG >= 2
#if MA
M
_DEBUG >= 2
DEBUG_FUNC
(
"Sources will now check a global decision"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
...
...
@@ -981,7 +981,7 @@ int check_redistribution(int wait_completed) {
if
(
!
all_completed
)
return
MAM_I_DIST_PENDING
;
// Continue only if asynchronous send has ended
}
#if
USE_
MA
L
_DEBUG >= 2
#if MA
M
_DEBUG >= 2
DEBUG_FUNC
(
"Sources sent asynchronous redistributions"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
...
...
@@ -998,7 +998,7 @@ int check_redistribution(int wait_completed) {
async_communication_end
(
req_completed
,
req_qty
,
&
window
);
}
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
if
(
mall_conf
->
spawn_method
==
MAM_SPAWN_MERGE
)
mall_conf
->
times
->
async_end
=
MPI_Wtime
();
// Merge method only
...
...
@@ -1019,7 +1019,7 @@ int end_redistribution() {
comm_data_info
(
rep_s_data
,
dist_s_data
,
MAM_SOURCES
);
if
(
dist_s_data
->
entries
||
rep_s_data
->
entries
)
{
// Enviar datos sincronos
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
mall_conf
->
times
->
sync_start
=
MPI_Wtime
();
...
...
@@ -1029,7 +1029,7 @@ int end_redistribution() {
MPI_Bcast
(
rep_s_data
->
arrays
[
i
],
rep_s_data
->
qty
[
i
],
rep_s_data
->
types
[
i
],
mall
->
root_collectives
,
mall
->
intercomm
);
}
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
if
(
mall_conf
->
spawn_method
==
MAM_SPAWN_MERGE
)
mall_conf
->
times
->
sync_end
=
MPI_Wtime
();
// Merge method only
...
...
@@ -1092,7 +1092,7 @@ int thread_check(int wait_completed) {
return
-
2
;
}
#if
USE_MAL
_BARRIERS
#if
MAM_USE
_BARRIERS
MPI_Barrier
(
mall
->
intercomm
);
#endif
if
(
mall_conf
->
spawn_method
==
MAM_SPAWN_MERGE
)
mall_conf
->
times
->
async_end
=
MPI_Wtime
();
// Merge method only
...
...
Codes/malleability/MAM_RMS.c
View file @
241e098e
...
...
@@ -9,7 +9,7 @@
#include "MAM_DataStructures.h"
#if
USE_MAL
_SLURM
#if
MAM_USE
_SLURM
#include <slurm/slurm.h>
int
MAM_I_slurm_getenv_hosts_info
();
int
MAM_I_slurm_getjob_hosts_info
();
...
...
@@ -21,7 +21,7 @@ int GetCPUCount();
void
MAM_check_hosts
()
{
int
not_filled
=
1
;
#if
USE_MAL
_SLURM
#if
MAM_USE
_SLURM
not_filled
=
MAM_I_slurm_getenv_hosts_info
();
if
(
not_filled
)
{
if
(
mall
->
nodelist
!=
NULL
)
{
...
...
@@ -48,7 +48,7 @@ void MAM_check_hosts() {
MPI_Abort
(
mall
->
comm
,
-
50
);
}
#if
USE_
MA
L
_DEBUG >= 2
#if MA
M
_DEBUG >= 2
if
(
mall
->
myId
==
mall
->
root
)
{
DEBUG_FUNC
(
"Obtained Nodelist"
,
mall
->
myId
,
mall
->
numP
);
printf
(
"NODELIST: %s
\n
NODE_COUNT: %d NUM_CPUS_PER_NODE: %d
\n
"
,
mall
->
nodelist
,
mall
->
num_nodes
,
mall
->
num_cpus
);
...
...
@@ -196,7 +196,7 @@ int GetCPUCount() {
return
count
;
}
#if
USE_MAL
_SLURM
#if
MAM_USE
_SLURM
/*
* TODO
*/
...
...
Codes/malleability/MAM_Times.c
View file @
241e098e
...
...
@@ -4,7 +4,7 @@
void
def_malleability_times
(
MPI_Datatype
*
new_type
);
void
init_malleability_times
()
{
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
DEBUG_FUNC
(
"Initializing recording structure"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
mall
->
comm
);
#endif
...
...
@@ -17,7 +17,7 @@ void init_malleability_times() {
reset_malleability_times
();
def_malleability_times
(
&
mall_conf
->
times
->
times_type
);
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
DEBUG_FUNC
(
"Initialized recording structure"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
mall
->
comm
);
#endif
}
...
...
@@ -31,7 +31,7 @@ void reset_malleability_times() {
}
void
free_malleability_times
()
{
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
DEBUG_FUNC
(
"Freeing recording structure"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
#endif
if
(
mall_conf
->
times
!=
NULL
)
{
...
...
@@ -41,7 +41,7 @@ void free_malleability_times() {
}
free
(
mall_conf
->
times
);
}
#if
USE_
MA
L
_DEBUG
#if MA
M
_DEBUG
DEBUG_FUNC
(
"Freed recording structure"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
#endif
}
...
...
Codes/malleability/MAM_Zombies.c
View file @
241e098e
...
...
@@ -65,7 +65,7 @@ void MAM_I_zombies_collect(int new_zombies) {
pids_counts
=
(
int
*
)
malloc
(
numP
*
sizeof
(
int
));
pids_displs
=
(
int
*
)
malloc
(
numP
*
sizeof
(
int
));
#if
USE_
MA
L
_DEBUG > 2
#if MA
M
_DEBUG > 2
if
(
myId
==
MAM_ROOT
){
DEBUG_FUNC
(
"Collecting zombies"
,
mall
->
myId
,
mall
->
numP
);
}
fflush
(
stdout
);
#endif
...
...
Codes/malleability/distribution_methods/Distributed_CommDist.c
View file @
241e098e
...
...
@@ -186,7 +186,7 @@ void sync_rma(void *send, void *recv, MPI_Datatype datatype, struct Counts r_cou
MPI_Type_size
(
datatype
,
&
datasize
);
MPI_Win_create
(
send
,
(
MPI_Aint
)
tamBl
*
datasize
,
datasize
,
MPI_INFO_NULL
,
comm
,
&
win
);
#if
USE_
MA
L
_DEBUG >= 3
#if MA
M
_DEBUG >= 3
DEBUG_FUNC
(
"Created Window for synchronous RMA communication"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
comm
);
#endif
switch
(
mall_conf
->
red_method
)
{
...
...
@@ -197,7 +197,7 @@ void sync_rma(void *send, void *recv, MPI_Datatype datatype, struct Counts r_cou
sync_rma_lock
(
recv
,
datatype
,
r_counts
,
win
);
break
;
}
#if
USE_
MA
L
_DEBUG >= 3
#if MA
M
_DEBUG >= 3
DEBUG_FUNC
(
"Completed synchronous RMA communication"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
comm
);
#endif
MPI_Win_free
(
&
win
);
...
...
@@ -357,7 +357,7 @@ int async_communication_check(int is_children_group, MPI_Request *requests, size
*/
void
async_communication_wait
(
MPI_Request
*
requests
,
size_t
request_qty
)
{
MPI_Waitall
(
request_qty
,
requests
,
MPI_STATUSES_IGNORE
);
#if
USE_
MA
L
_DEBUG >= 3
#if MA
M
_DEBUG >= 3
DEBUG_FUNC
(
"Processes Waitall completed"
,
mall
->
myId
,
mall
->
numP
);
fflush
(
stdout
);
MPI_Barrier
(
MPI_COMM_WORLD
);
#endif
}
...
...
@@ -545,12 +545,12 @@ void prepare_redistribution(int qty, MPI_Datatype datatype, int numP, int numO,
get_block_dist
(
qty
,
mall
->
myId
,
numP
,
&
dist_data
);
*
recv
=
malloc
(
dist_data
.
tamBl
*
datasize
);
#if
USE_
MA
L
_DEBUG >= 4
#if MA
M
_DEBUG >= 4
get_block_dist
(
qty
,
mall
->
myId
,
numP
,
&
dist_data
);
print_counts
(
dist_data
,
r_counts
->
counts
,
r_counts
->
displs
,
numO
+
offset_ids
,
0
,
"Targets Recv"
);
#endif
}
else
{
#if
USE_
MA
L
_DEBUG >= 4
#if MA
M
_DEBUG >= 4
get_block_dist
(
qty
,
mall
->
myId
,
numP
,
&
dist_data
);
#endif
...
...
@@ -560,11 +560,11 @@ void prepare_redistribution(int qty, MPI_Datatype datatype, int numP, int numO,
// Obtener distribución para este hijo y reservar vector de recibo
get_block_dist
(
qty
,
mall
->
myId
,
numO
,
&
dist_data
);
*
recv
=
malloc
(
dist_data
.
tamBl
*
datasize
);
#if
USE_
MA
L
_DEBUG >= 4
#if MA
M
_DEBUG >= 4
print_counts
(
dist_data
,
r_counts
->
counts
,
r_counts
->
displs
,
array_size
,
0
,
"Sources&Targets Recv"
);
#endif
}
#if
USE_
MA
L
_DEBUG >= 4
#if MA
M
_DEBUG >= 4
print_counts
(
dist_data
,
s_counts
->
counts
,
s_counts
->
displs
,
numO
+
offset_ids
,
0
,
"Sources Send"
);
#endif
}
...
...
Codes/malleability/spawn_methods/ProcessDist.c
View file @
241e098e
...
...
@@ -22,7 +22,7 @@ void set_mapping_host(int qty, char *host, size_t index, Spawn_data *spawn_data)
void
fill_str_hosts
(
char
*
nodelist
,
int
*
qty
,
size_t
used_nodes
,
char
**
hostlist_str
);
int
write_str_node
(
char
**
hostlist_str
,
size_t
len_og
,
size_t
qty
,
char
*
node_name
);
//--------------------------------SLURM USAGE-------------------------------------//
#if
USE_MAL
_SLURM
#if
MAM_USE
_SLURM
#include <slurm/slurm.h>
void
generate_info_string_slurm
(
char
*
nodelist
,
int
*
procs_array
,
size_t
nodes
,
Spawn_data
*
spawn_data
);
void
generate_multiple_info_string_slurm
(
char
*
nodelist
,
int
*
procs_array
,
size_t
nodes
,
Spawn_data
*
spawn_data
);
...
...
@@ -52,7 +52,7 @@ void processes_dist(Spawn_data *spawn_data) {
// GET NEW DISTRIBUTION
node_dist
(
*
spawn_data
,
&
procs_array
,
&
used_nodes
,
&
spawn_data
->
total_spawns
);
spawn_data
->
sets
=
(
Spawn_set
*
)
malloc
(
spawn_data
->
total_spawns
*
sizeof
(
Spawn_set
));
#if
USE_MAL
_SLURM
#if
MAM_USE
_SLURM
switch
(
spawn_data
->
mapping_fill_method
)
{
case
MAM_PHY_TYPE_STRING
:
// if(MAM_Contains_strat(MAM_SPAWN_STRATEGIES, MAM_STRAT_SPAWN_MULTIPLE, NULL) ) {
...
...
@@ -323,7 +323,7 @@ int write_str_node(char **hostlist_str, size_t len_og, size_t qty, char *node_na
}
//--------------------------------SLURM USAGE-------------------------------------//
#if
USE_MAL
_SLURM
#if
MAM_USE
_SLURM
/*
* Crea y devuelve un objeto MPI_Info con un par hosts/mapping
* en el que se indica el mappeado a utilizar en los nuevos
...
...
Write
Preview
Supports
Markdown
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment