Skip to content
Snippets Groups Projects
Commit c22d753d authored by Pat Alt
Browse files

another attempt

parent 0cc0216b
No related branches found
No related tags found
1 merge request: !7669 initial run including fmnist lenet and new method
...@@ -11,4 +11,4 @@ ...@@ -11,4 +11,4 @@
module load 2023r1 openmpi module load 2023r1 openmpi
srun julia --project=experiments experiments/run_experiments.jl -- data=mnist output_path=results mpi > experiments/mnist.log srun julia --project=experiments experiments/run_experiments.jl -- data=mnist output_path=results mpi retrain > experiments/mnist.log
...@@ -47,20 +47,9 @@ function prepare_models(exper::Experiment) ...@@ -47,20 +47,9 @@ function prepare_models(exper::Experiment)
@info "Training models." @info "Training models."
model_dict = train_models(models, X, labels; parallelizer=exper.parallelizer, train_parallel=exper.train_parallel, cov=exper.coverage) model_dict = train_models(models, X, labels; parallelizer=exper.parallelizer, train_parallel=exper.train_parallel, cov=exper.coverage)
else else
# Pre-trained models: # Load models on root process:
if !(is_multi_processed(exper) && MPI.Comm_rank(exper.parallelizer.comm) != 0) @info "Loading pre-trained models."
# Load models on root process: model_dict = Serialization.deserialize(joinpath(pretrained_path(exper), "$(exper.save_name)_models.jls"))
@info "Loading pre-trained models."
model_dict = Serialization.deserialize(joinpath(pretrained_path(exper), "$(exper.save_name)_models.jls"))
else
# Dummy model on other processes:
model_dict = nothing
end
# Broadcast models:
if is_multi_processed(exper)
model_dict = MPI.bcast(model_dict, exper.parallelizer.comm; root=0)
MPI.Barrier(exper.parallelizer.comm)
end
end end
# Save models: # Save models:
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment