dynare/matlab/parallel/slaveParallel.m

188 lines
6.5 KiB
Matlab
Raw Normal View History

function slaveParallel(whoiam,ThisMatlab)
% PARALLEL CONTEXT
% In a parallelization context, this function is launched on slave
% machines to initialize the MATLAB and DYNARE environment; it then waits
% for instructions sent by the Master.
% This function is invoked by masterParallel only when strategy (1),
% i.e. always open, is active.
%
% The slave polls its working directory once per second:
%   - slaveParallel_input<whoiam>.mat : initial data; the slave keeps
%                                       running while this file exists.
%   - stayalive<whoiam>.txt           : resets the 20 minute idle timer.
%   - slaveJob<whoiam>.mat            : a job to run (fname, fInputVar,
%                                       fblck, nblck, optionally fGlobalVar).
%
% INPUTS
%  o whoiam     [int]  index number of this CPU among all CPUs in the
%                      cluster.
%  o ThisMatlab [int]  index number of this slave machine in the cluster
%                      (used to index the Parallel structure).
%
% OUTPUTS
%   None. Results are written to <fname>_output_<whoiam>.mat and the
%   session is terminated with exit when the loop ends.

% Copyright © 2006-2017 Dynare Team
%
% This file is part of Dynare.
%
% Dynare is free software: you can redistribute it and/or modify
% it under the terms of the GNU General Public License as published by
% the Free Software Foundation, either version 3 of the License, or
% (at your option) any later version.
%
% Dynare is distributed in the hope that it will be useful,
% but WITHOUT ANY WARRANTY; without even the implied warranty of
% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
% GNU General Public License for more details.
%
% You should have received a copy of the GNU General Public License
% along with Dynare. If not, see <https://www.gnu.org/licenses/>.

% NOTE: the bare load() calls below inject arbitrary variables into this
% workspace, so no additional helper locals are introduced here (file names
% are rebuilt inline) to avoid clashing with loaded variable names.

global funcName

warning off;
diary off;
delete(['slaveParallel_',int2str(whoiam),'.log']);
diary(['slaveParallel_',int2str(whoiam),'.log']);

% Configure dynare environment
dynareroot = dynare_config();

% Load input data.
load(['slaveParallel_input',int2str(whoiam)]);

% Load the global variables shipped by the master (fGlobalVar), if any.
if exist('fGlobalVar','var')
    globalVars = fieldnames(fGlobalVar);
    for j=1:length(globalVars)
        % NOTE(review): eval on names read from the input file; the file is
        % assumed to be produced by the trusted master process.
        eval(['global ',globalVars{j},';']);
        evalin('base',['global ',globalVars{j},';']);
    end
    struct2local(fGlobalVar);
    clear fGlobalVar
    % create global variables in the base workspace as well
    evalin('base',['load( [''slaveParallel_input',int2str(whoiam),'''],''fGlobalVar'')']) ;
    evalin('base','struct2local(fGlobalVar)');
    evalin('base','clear fGlobalVar');
end

t0=clock;
fslave = dir(['slaveParallel_input',int2str(whoiam),'.mat']);

% Keep running while the master has not removed the input file and fewer
% than 20 minutes (1200 s) have elapsed since the last activity, or while a
% stayalive request is pending.
while (etime(clock,t0)<1200 && ~isempty(fslave)) || ~isempty(dir(['stayalive',int2str(whoiam),'.txt']))
    if ~isempty(dir(['stayalive',int2str(whoiam),'.txt']))
        % The master asked to stay alive: restart the idle timer and
        % consume the request.
        t0=clock;
        delete(['stayalive',int2str(whoiam),'.txt']);
    end

    pause(1)

    fjob = dir(['slaveJob',int2str(whoiam),'.mat']);

    if ~isempty(fjob)
        % Drop everything left over from the previous job, including its
        % output, so that a failing job cannot report stale results.
        clear fGlobalVar fInputVar fblck nblck fname fOutputVar

        % Wait until the job file can actually be opened (the master may
        % still be writing it), then load it.
        while(1)
            Go=fopen(['slaveJob',int2str(whoiam),'.mat']);
            if Go>0
                fclose(Go);
                pause(1)
                load(['slaveJob',int2str(whoiam),'.mat']);
                break
            else
                % File not readable yet: back off briefly instead of
                % spinning at full CPU.
                pause(0.1)
            end
        end

        funcName=fname; % Update global job name.

        if exist('fGlobalVar','var') && ~isempty(fGlobalVar)
            globalVars = fieldnames(fGlobalVar);
            for j=1:length(globalVars)
                % Only declare as global the variables that are not
                % already global in this workspace.
                info_whos = whos(globalVars{j});
                if isempty(info_whos) || ~info_whos.global
                    eval(['global ',globalVars{j},';']);
                    evalin('base',['global ',globalVars{j},';']);
                end
            end
            struct2local(fGlobalVar);
            evalin('base',['load( [''slaveJob',int2str(whoiam),'''],''fGlobalVar'')']);
            evalin('base','struct2local(fGlobalVar)');
            evalin('base','clear fGlobalVar');
        end

        % The job has been read: remove the job file.
        delete(['slaveJob',int2str(whoiam),'.mat']);
        fInputVar.Parallel = Parallel;

        % Launch the routine to be run in parallel.
        try
            tic
            fOutputVar = feval(fname, fInputVar ,fblck, nblck, whoiam, ThisMatlab);
            toc
            if isfield(fOutputVar,'OutputFileName')
                OutputFileName = fOutputVar.OutputFileName;
            else
                OutputFileName = '';
            end
            if(whoiam)
                % The CloseAllSlaves flag is reported through a separate
                % status file and stripped from the saved output.
                closeRequested = isfield(fOutputVar,'CloseAllSlaves');
                if closeRequested
                    CloseAllSlaves = 1;
                    fOutputVar = rmfield(fOutputVar,'CloseAllSlaves');
                end
                % Save the output result.
                save([ fname,'_output_',int2str(whoiam),'.mat'],'fOutputVar' );
                if closeRequested
                    save(['comp_status_',funcName,int2str(whoiam),'.mat'],'CloseAllSlaves');
                end
                % Inform the master that the job is finished, and transfer the output data
                delete(['P_',fname,'_',int2str(whoiam),'End.txt']);
            end
            disp(['Job ',fname,' on CPU ',int2str(whoiam),' completed.']);
            t0 =clock; % Re-set waiting time of 20 mins
        catch
            theerror = lasterror;
            if ~isempty(strfind(theerror.message,'Master asked to break the job'))
                % The master interrupted the job: report it and keep
                % waiting for further jobs.
                disp(['Job ',fname,' on CPU ',int2str(whoiam),' broken from master.']);
                fOutputVar.message = theerror;
                save([ fname,'_output_',int2str(whoiam),'.mat'],'fOutputVar' )
                delete(['P_',fname,'_',int2str(whoiam),'End.txt']);
            else
                % Genuine failure: save the error, notify the master and
                % leave the polling loop.
                disp(['Job ',fname,' on CPU ',int2str(whoiam),' crashed.']);
                fOutputVar.error = theerror;
                save([ fname,'_output_',int2str(whoiam),'.mat'],'fOutputVar' );
                waitbarString = fOutputVar.error.message;
                if Parallel(ThisMatlab).Local
                    waitbarTitle='Local ';
                else
                    waitbarTitle=[Parallel(ThisMatlab).ComputerName];
                end
                fMessageStatus(NaN,whoiam,waitbarString, waitbarTitle, Parallel(ThisMatlab));
                delete(['P_',fname,'_',int2str(whoiam),'End.txt']);
                break
            end
        end
    end

    % Check if Master asks to exit (i.e. it removed the input file).
    fslave = dir(['slaveParallel_input',int2str(whoiam),'.mat']);
end

disp(['slaveParallel on CPU ',int2str(whoiam),' completed.']);
diary off;
delete(['P_slave_',int2str(whoiam),'End.txt']);
exit;