dynare/matlab/ols/pooled_ols.m

205 lines
7.3 KiB
Matlab
Raw Normal View History

2017-10-23 15:55:01 +02:00
function pooled_ols(ds, param_common, param_regex)
% function pooled_ols(ds, param_common, param_regex)
% Run Pooled OLS
% Apply parameter values found to corresponding parameter values in the
% other blocks of the model
%
% INPUTS
%   ds            [dseries]   data to use in estimation
%   param_common  [cellstr]   List of values to insert into param_regex,
%                             e.g. country codes {'FR', 'DE', 'IT'}
%   param_regex   [cellstr]   Parameter name templates where '*' stands for
%                             an element of param_common. In the equations,
%                             every occurrence built from param_common(2:end)
%                             is replaced by the one built from the first
%                             value in param_common before estimation.
%
% OUTPUTS
%   none. Results are written to the globals:
%     oo_.pooled_ols.beta      estimated coefficients
%     oo_.pooled_ols.resid     residuals, one field per residual name
%     oo_.pooled_ols.varcovar  one field ('eq<i>') per equation
%     M_.params                estimated values assigned to the parameters
%     M_.Sigma_e               diagonal entries of the equations' residuals
%
% SPECIAL REQUIREMENTS
%   dynare must be run with the option: json=parse

% Copyright (C) 2017 Dynare Team
%
% This file is part of Dynare.
%
% Dynare is free software: you can redistribute it and/or modify
% it under the terms of the GNU General Public License as published by
% the Free Software Foundation, either version 3 of the License, or
% (at your option) any later version.
%
% Dynare is distributed in the hope that it will be useful,
% but WITHOUT ANY WARRANTY; without even the implied warranty of
% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
% GNU General Public License for more details.
%
% You should have received a copy of the GNU General Public License
% along with Dynare. If not, see <http://www.gnu.org/licenses/>.

global M_ oo_

%% Check input arguments
assert(~isempty(ds) && isdseries(ds), 'The first argument must be a dseries');

if isempty(param_common) && isempty(param_regex)
    % Nothing to pool over: fall back to equation-by-equation OLS
    disp('Performing OLS instead of Pooled OLS...')
    dyn_ols(ds);
    return;
end

assert(~isempty(param_common) && iscellstr(param_common), 'The second argument must be a cellstr');
assert(~isempty(param_regex) && iscellstr(param_regex), 'The third argument must be a cellstr');

jsonfile = [M_.fname '_original.json'];
if exist(jsonfile, 'file') ~= 2
    error('Could not find %s! Please use the json=parse option (See the Dynare invocation section in the reference manual).', jsonfile);
end

%% Read JSON
jsonmodel = loadjson(jsonfile);
jsonmodel = jsonmodel.model;
[lhs, rhs, lineno] = getEquationsByTags(jsonmodel);

%% Replace parameter names in equations
% Every pooled parameter is renamed to the name it has for the first element
% of param_common, so that all equations share one coefficient.
country_name = param_common{1};
other_countries = param_common(2:end);
regexcountries = ['(' strjoin(other_countries, '|') ')'];
for i = 1:length(param_regex)
    splitp = strsplit(param_regex{i}, '*');
    assert(length(splitp) >= 2);
    if ~isempty(other_countries)
        % Word boundaries keep the substitution from touching longer
        % identifiers that merely contain the parameter name. With a single
        % element in param_common there is nothing to rename (and an empty
        % alternation group would match the empty string).
        rhs = regexprep(rhs, ...
                        ['\<' strjoin(splitp, regexcountries) '\>'], ...
                        strjoin(splitp, country_name));
    end
end

%% Find parameters and variable names in every equation & Setup estimation matrices
M_exo_names_trim = cellstr(M_.exo_names);
M_endo_exo_names_trim = [cellstr(M_.endo_names); M_exo_names_trim];
M_param_names = cellstr(M_.param_names);
% Pattern used to prefix variable names with 'ds.' before calling eval.
% Anchored on word boundaries so that a name that is a substring of another
% identifier is not prefixed in the middle of that identifier.
regex = ['\<(' strjoin(M_endo_exo_names_trim(:,1), '|') ')\>'];
mathops = '[\+\*\^\-\/]';
pbeta = {};
Y = [];
X = [];
startidxs = zeros(length(lhs), 1);
residnames = cell(length(lhs), 1);
for i = 1:length(lhs)
    % Tokenize the right-hand side; purely numeric (and empty) tokens are dropped
    rhs_ = strsplit(rhs{i}, {'+','-','*','/','^','log(','ln(','log10(','exp(','(',')','diff('});
    rhs_(cellfun(@(x) all(isstrprop(x, 'digit')), rhs_)) = [];

    % Reject leads: any non-parameter token directly followed by '(<digits>)'.
    % The '(<digits>)' suffix is applied to the whole alternation so that
    % every name, including the last one, is checked.
    vnames = setdiff(rhs_, M_param_names);
    if ~isempty(vnames) ...
            && ~isempty(regexp(rhs{i}, ['(' strjoin(vnames, '|') ')\(\d+\)'], 'once'))
        error(['pooled_ols: you cannot have leads in equation on line ' ...
               lineno{i} ': ' lhs{i} ' = ' rhs{i}]);
    end

    % Find parameters and associated variables
    pnames = intersect(rhs_, M_param_names);
    pidxs = zeros(length(pnames), 1);
    vnames = cell(1, length(pnames));
    xjdata = dseries;
    for j = 1:length(pnames)
        createdvar = false;

        % Column of X associated with this parameter (shared across equations)
        idx = find(strcmp(pbeta, pnames{j}));
        if isempty(idx)
            pbeta = [pbeta; pnames{j}];
            pidxs(j) = length(pbeta);
        else
            pidxs(j) = idx;
        end

        % Locate the parameter together with its neighbouring operator(s)
        pregex = [...
            mathops pnames{j} mathops ...
            '|^' pnames{j} mathops ...
            '|' mathops pnames{j} '$' ...
                 ];
        [startidx, endidx] = regexp(rhs{i}, pregex, 'start', 'end');
        assert(length(startidx) == 1);
        if rhs{i}(startidx) == '*'
            % regressor is on the left of the parameter
            vnames{j} = getStrMoveLeft(rhs{i}(1:startidx-1));
        elseif rhs{i}(endidx) == '*'
            % regressor is on the right of the parameter
            vnames{j} = getStrMoveRight(rhs{i}(endidx+1:end));
        elseif rhs{i}(startidx) == '+' ...
                || rhs{i}(startidx) == '-' ...
                || rhs{i}(endidx) == '+' ...
                || rhs{i}(endidx) == '-'
            % intercept
            createdvar = true;
            if any(strcmp(M_endo_exo_names_trim, 'intercept'))
                % 'intercept' is already a model variable: build a unique name
                [~, vnames{j}] = fileparts(tempname);
                vnames{j} = ['intercept_' vnames{j}];
                assert(~any(strcmp(M_endo_exo_names_trim, vnames{j})));
            else
                vnames{j} = 'intercept';
            end
        else
            error('pooled_ols: Shouldn''t arrive here');
        end

        if createdvar
            xjdatatmp = dseries(ones(ds.nobs, 1), ds.firstdate, vnames{j});
        else
            xjdatatmp = eval(regexprep(vnames{j}, regex, 'ds.$&'));
            xjdatatmp.rename_(vnames{j});
        end
        % Name the regressor after its position so that columns line up with pidxs
        xjdatatmp.rename_(num2str(j));
        xjdata = [xjdata xjdatatmp];
    end

    % The residual is the only exogenous variable not used as a regressor
    residuals = intersect(rhs_, M_exo_names_trim);
    for j = 1:length(residuals)
        if any(strcmp(residuals{j}, vnames))
            residuals{j} = [];
        end
    end
    idx = ~cellfun(@isempty, residuals);
    assert(sum(idx) == 1, ...
           ['Expected exactly one residual in equation ' num2str(i) ...
            ', found ' num2str(sum(idx))]);
    residnames{i} = residuals{idx};

    % Stack this equation's observations below the previous ones
    ydata = eval(regexprep(lhs{i}, regex, 'ds.$&'));
    fp = max(ydata.firstobservedperiod, xjdata.firstobservedperiod);
    lp = min(ydata.lastobservedperiod, xjdata.lastobservedperiod);
    startidxs(i) = length(Y) + 1;
    Y(startidxs(i):startidxs(i)+lp-fp, 1) = ydata(fp:lp).data;
    X(startidxs(i):startidxs(i)+lp-fp, pidxs) = xjdata(fp:lp).data;
end

%% Estimation
% Estimated Parameters
[q, r] = qr(X, 0);
oo_.pooled_ols.beta = r\(q'*Y);

% Assign parameter values back to parameters using param_regex & param_common
param_names_trim = cellfun(@strtrim, num2cell(M_.param_names(:,:),2), 'Uniform', 0);
regexcountries = ['(' strjoin(param_common(1:end),'|') ')'];
assigned_idxs = false(size(pbeta));
for i = 1:length(param_regex)
    beta_idx = strcmp(pbeta, strrep(param_regex{i}, '*', country_name));
    assigned_idxs = assigned_idxs | beta_idx;
    value = oo_.pooled_ols.beta(beta_idx);
    assert(~isempty(value));
    % Anchor the pattern: only parameters whose full name matches the
    % template receive the pooled value.
    pattern = ['^' strrep(param_regex{i}, '*', regexcountries) '$'];
    M_.params(~cellfun(@isempty, regexp(param_names_trim, pattern))) = value;
end

% Remaining estimated parameters (not pooled) are assigned by exact name
idxs = find(assigned_idxs == 0);
values = oo_.pooled_ols.beta(idxs);
names = pbeta(idxs);
assert(length(values) == length(names));
for i = 1:length(idxs)
    M_.params(strcmp(param_names_trim, names{i})) = values(i);
end

%% Residuals
residuals = Y - X * oo_.pooled_ols.beta;
for i = 1:length(lhs)
    % Slice the stacked residual vector back into per-equation pieces
    if i == length(lhs)
        oo_.pooled_ols.resid.(residnames{i}) = residuals(startidxs(i):end);
    else
        oo_.pooled_ols.resid.(residnames{i}) = residuals(startidxs(i):startidxs(i+1)-1);
    end
    oo_.pooled_ols.varcovar.(['eq' num2str(i)]) = oo_.pooled_ols.resid.(residnames{i})*oo_.pooled_ols.resid.(residnames{i})';
    idx = find(strcmp(residnames{i}, M_exo_names_trim));
    M_.Sigma_e(idx, idx) = var(oo_.pooled_ols.resid.(residnames{i}));
end
end