diff --git a/core/checkModelStruct.m b/core/checkModelStruct.m
index 7526d590..1ba21cb0 100755
--- a/core/checkModelStruct.m
+++ b/core/checkModelStruct.m
@@ -120,6 +120,21 @@ function checkModelStruct(model,throwErrors,trimWarnings)
         EM='The "grRules" field must be a cell array of strings';
         dispEM(EM,throwErrors);
     end
+    if ~isfield(model,'genes')
+        EM='If "grRules" field exists, the model should also contain a "genes" field';
+        dispEM(EM,throwErrors);
+    else
+        geneList = strjoin(model.grRules); % Pool all rules into one space-separated string
+        geneList = regexp(geneList,'[\s()]+','split'); % Tokenize on whitespace and parentheses only, so gene IDs containing "and"/"or" stay intact
+        geneList = geneList(~cellfun(@isempty,geneList) & ~ismember(geneList,{'and','or'})); % Drop empty tokens and the logical operators
+        geneList = setdiff(unique(geneList),model.genes); % Genes used in grRules but absent from model.genes
+        if ~isempty(geneList)
+            problemGrRules = model.rxns(contains(model.grRules,geneList)); % Reactions whose rule mentions any unknown gene (substring match)
+            problemGrRules = strjoin(problemGrRules(:),'; ');
+            EM=['The reaction(s) "' problemGrRules '" contain the following genes in its "grRules" field, but these are not in the "genes" field:'];
+            dispEM(EM,throwErrors,geneList);
+        end
+    end
 end
 if isfield(model,'rxnComps')
     if ~isnumeric(model.rxnComps)
@@ -262,7 +277,10 @@ function checkModelStruct(model,throwErrors,trimWarnings)
 EM='The following reactions have contradicting bounds:';
 dispEM(EM,throwErrors,model.rxns(model.lb>model.ub),trimWarnings);
 EM='The following reactions have bounds contradicting their reversibility:';
-dispEM(EM,throwErrors,model.rxns(model.lb<0 & model.rev==0),trimWarnings);
+crossesZero = model.lb < 0 & model.ub > 0; % Bounds allow flux in both directions
+oneWayOnly = (model.lb < 0 & model.ub <= 0) | (model.lb >= 0 & model.ub > 0); % Bounds allow flux in a single direction only
+contradictBound = (crossesZero & model.rev==0) | (oneWayOnly & model.rev==1); % Bounds disagree with the reversibility label
+dispEM(EM,throwErrors,model.rxns(contradictBound),trimWarnings);
 
 %Multiple or no objective functions not allowed in SBML L3V1 FBCv2
 if numel(find(model.c))>1
diff --git a/core/constructS.m b/core/constructS.m
index 87ac8c89..5412cf24 100755
--- a/core/constructS.m
+++ b/core/constructS.m
@@ -152,7 +152,8 @@
         strjoin(unique(metsToS(~metsPresent)),', ')],'')
     else
         missingMet = find(~metsPresent);
-        missingMet = char(strcat(metsToS(missingMet),' (reaction:',rxns(rxnsToS(missingMet)),')\n'));
+        % Build one "<met> (reaction:<rxn>)\n" entry per missing metabolite and glue them into a single char row; the literal \n is expanded by the error() call below
+        missingMet = strjoin(strcat(metsToS(missingMet),' (reaction:',rxns(rxnsToS(missingMet)),')\n'),'');
         error(['Could not find the following metabolites (reaction indicated) in the metabolite list: \n' ...
             missingMet '%s'],'');
     end
diff --git a/core/getExchangeRxns.m b/core/getExchangeRxns.m
index 459bc095..6433a4e6 100755
--- a/core/getExchangeRxns.m
+++ b/core/getExchangeRxns.m
@@ -1,47 +1,82 @@
 function [exchangeRxns, exchangeRxnsIndexes]=getExchangeRxns(model,reactionType)
 % getExchangeRxns
-%   Retrieves the exchange reactions from a model
+%   Retrieves the exchange reactions from a model. Exchange reactions have
+%   no substrates or no products, or involve "unconstrained" metabolites if that field exists.
 %
+% Input:
 %   model               a model structure
-%   reactionType        retrieve all reactions ('both'), only production
-%                       ('out'), or only consumption ('in') (optional, default
-%                       'both')
+%   reactionType        which exchange reactions to return (optional, default 'all')
+%                       'all'     all exchange reactions, irrespective of their
+%                                 bounds ('both' is accepted as a legacy alias)
+%                       'uptake'  reactions with bounds that imply that
+%                                 only uptake is allowed. Reaction
+%                                 direction, upper and lower bounds are
+%                                 all considered
+%                       'excrete' reactions with bounds that imply that
+%                                 only excretion is allowed. Reaction
+%                                 direction, upper and lower bounds are
+%                                 all considered
+%                       'reverse' reactions with non-zero upper and lower
+%                                 bounds that imply that both uptake and
+%                                 excretion are allowed
+%                       'blocked' reactions that have zero upper and lower
+%                                 bounds, not allowing any flux
+%                       'in'      reactions where the boundary metabolite
+%                                 is the substrate of the reaction, a
+%                                 positive flux value would imply uptake,
+%                                 but reaction bounds are not considered
+%                       'out'     reactions where the boundary metabolite
+%                                 is the product of the reaction, a
+%                                 positive flux value would imply excretion,
+%                                 but reaction bounds are not considered.
 %
+% Output:
 %   exchangeRxns        cell array with the IDs of the exchange reactions
 %   exchangeRxnsIndexes vector with the indexes of the exchange reactions
 %
-%   Exchange reactions are defined as reactions which involve only products
-%   or only reactants. If the unconstrained field is present, then that is
-%   used instead.
+% Note:
+%   The union of 'in' and 'out' equals 'all'. Also, the union of 'uptake',
+%   'excrete', 'reverse' and 'blocked' equals 'all' (given that lb<=ub).
 %
 % Usage: [exchangeRxns,exchangeRxnsIndexes]=getExchangeRxns(model,reactionType)
 
 if nargin<2
-    reactionType='both';
+    reactionType='all';
 else
     reactionType=char(reactionType);
 end
 
-hasNoProducts=sparse(numel(model.rxns),1);
-hasNoReactants=sparse(numel(model.rxns),1);
-
-if isfield(model,'unconstrained')
-    if strcmpi(reactionType,'both') || strcmpi(reactionType,'out')
-        [~, I]=find(model.S(model.unconstrained~=0,:)>0);
-        hasNoProducts(I)=true;
-    end
-    if strcmpi(reactionType,'both') || strcmpi(reactionType,'in')
-        [~, I]=find(model.S(model.unconstrained~=0,:)<0);
-        hasNoReactants(I)=true;
-    end
+% Find exchange reactions; both lists are column vectors of reaction indexes
+if isfield(model, 'unconstrained')
+    [~, I]=find(model.S(model.unconstrained~=0,:)>0); % Reactions producing an unconstrained metabolite
+    hasNoProd = unique(I(:)); % Index column (not a flag vector), same shape as in the else-branch
+    [~, I]=find(model.S(model.unconstrained~=0,:)<0); % Reactions consuming an unconstrained metabolite
+    hasNoSubs = unique(I(:));
 else
-    if strcmpi(reactionType,'both') || strcmpi(reactionType,'out')
-        hasNoProducts=sum((model.S>0))==0;
-    end
-    if strcmpi(reactionType,'both') || strcmpi(reactionType,'in')
-        hasNoReactants=sum((model.S<0))==0;
-    end
+    hasNoProd = transpose(find(sum(model.S>0,1)==0)); % Explicit dimension keeps this per-reaction when S has a single row
+    hasNoSubs = transpose(find(sum(model.S<0,1)==0));
+end
+allExch   = [hasNoProd; hasNoSubs]; % Masks built below must follow this same order
+switch lower(reactionType) % Case-insensitive, as the former strcmpi-based checks were
+    case {'both','all'} % For legacy reasons, 'both' is also allowed
+        exchangeRxnsIndexes = allExch;
+    case 'in'
+        exchangeRxnsIndexes = hasNoSubs;
+    case 'out'
+        exchangeRxnsIndexes = hasNoProd;
+    case 'blocked'
+        exchangeRxnsIndexes = allExch(model.lb(allExch) == 0 & model.ub(allExch) == 0);
+    case 'reverse'
+        exchangeRxnsIndexes = allExch(model.lb(allExch) < 0 & model.ub(allExch) > 0);
+    case 'uptake' % 'out'-type reactions running backwards, or 'in'-type reactions running forwards
+        exchangeRxnsIndexes = allExch([(model.lb(hasNoProd) < 0 & model.ub(hasNoProd) <= 0); ...
+                              (model.lb(hasNoSubs) >= 0 & model.ub(hasNoSubs) > 0)]);
+    case 'excrete' % 'out'-type reactions running forwards, or 'in'-type reactions running backwards
+        exchangeRxnsIndexes = allExch([(model.lb(hasNoProd) >= 0 & model.ub(hasNoProd) > 0); ...
+                              (model.lb(hasNoSubs) < 0 & model.ub(hasNoSubs) <= 0)]);
+    otherwise
+        error('Invalid reactionType specified')
 end
-exchangeRxnsIndexes=find(hasNoProducts(:) | hasNoReactants(:));
-exchangeRxns=model.rxns(exchangeRxnsIndexes);
+exchangeRxnsIndexes = unique(exchangeRxnsIndexes); % Sorted and duplicate-free, like the former find()-based result
+exchangeRxns = model.rxns(exchangeRxnsIndexes);
 end
diff --git a/doc/core/checkModelStruct.html b/doc/core/checkModelStruct.html
index 2b49a88b..7cc327fe 100644
--- a/doc/core/checkModelStruct.html
+++ b/doc/core/checkModelStruct.html
@@ -179,305 +179,323 @@ <h2><a name="_source"></a>SOURCE CODE <a href="#_top"><img alt="^" border="0" sr
 0120         EM=<span class="string">'The &quot;grRules&quot; field must be a cell array of strings'</span>;
 0121         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
 0122     <span class="keyword">end</span>
-0123 <span class="keyword">end</span>
-0124 <span class="keyword">if</span> isfield(model,<span class="string">'rxnComps'</span>)
-0125     <span class="keyword">if</span> ~isnumeric(model.rxnComps)
-0126         EM=<span class="string">'The &quot;rxnComps&quot; field must be of type &quot;double&quot;'</span>;
-0127         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0128     <span class="keyword">end</span>
-0129 <span class="keyword">end</span>
-0130 <span class="keyword">if</span> isfield(model,<span class="string">'inchis'</span>)
-0131     <span class="keyword">if</span> ~iscellstr(model.inchis)
-0132         EM=<span class="string">'The &quot;inchis&quot; field must be a cell array of strings'</span>;
-0133         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0134     <span class="keyword">end</span>
-0135 <span class="keyword">end</span>
-0136 <span class="keyword">if</span> isfield(model,<span class="string">'metSmiles'</span>)
-0137     <span class="keyword">if</span> ~iscellstr(model.metSmiles)
-0138         EM=<span class="string">'The &quot;metSmiles&quot; field must be a cell array of strings'</span>;
-0139         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0140     <span class="keyword">end</span>
-0141 <span class="keyword">end</span>
-0142 <span class="keyword">if</span> isfield(model,<span class="string">'metFormulas'</span>)
-0143     <span class="keyword">if</span> ~iscellstr(model.metFormulas)
-0144         EM=<span class="string">'The &quot;metFormulas&quot; field must be a cell array of strings'</span>;
-0145         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0146     <span class="keyword">end</span>
-0147 <span class="keyword">end</span>
-0148 <span class="keyword">if</span> isfield(model,<span class="string">'metCharges'</span>)
-0149     <span class="keyword">if</span> ~isnumeric(model.metCharges)
-0150         EM=<span class="string">'The &quot;metCharges&quot; field must be a double'</span>;
-0151         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0152     <span class="keyword">end</span>
-0153 <span class="keyword">end</span>
-0154 <span class="keyword">if</span> isfield(model,<span class="string">'metDeltaG'</span>)
-0155     <span class="keyword">if</span> ~isnumeric(model.metDeltaG)
-0156         EM=<span class="string">'The &quot;metDeltaG&quot; field must be a double'</span>;
-0157         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0158     <span class="keyword">end</span>
-0159 <span class="keyword">end</span>
-0160 <span class="keyword">if</span> isfield(model,<span class="string">'subSystems'</span>)
-0161     <span class="keyword">for</span> i=1:numel(model.subSystems)
-0162         <span class="keyword">if</span> ~iscell(model.subSystems{i,1})
-0163             EM=<span class="string">'The &quot;subSystems&quot; field must be a cell array'</span>;
-0164             <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0165         <span class="keyword">end</span>
-0166     <span class="keyword">end</span>
-0167 <span class="keyword">end</span>
-0168 <span class="keyword">if</span> isfield(model,<span class="string">'eccodes'</span>)
-0169     <span class="keyword">if</span> ~iscellstr(model.eccodes)
-0170         EM=<span class="string">'The &quot;eccodes&quot; field must be a cell array of strings'</span>;
-0171         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0172     <span class="keyword">end</span>
-0173 <span class="keyword">end</span>
-0174 <span class="keyword">if</span> isfield(model,<span class="string">'unconstrained'</span>)
-0175     <span class="keyword">if</span> ~isnumeric(model.unconstrained)
-0176         EM=<span class="string">'The &quot;unconstrained&quot; field must be of type &quot;double&quot;'</span>;
-0177         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0178     <span class="keyword">end</span>
-0179 <span class="keyword">end</span>
-0180 <span class="keyword">if</span> isfield(model,<span class="string">'rxnNotes'</span>)
-0181     <span class="keyword">if</span> ~iscellstr(model.rxnNotes)
-0182         EM=<span class="string">'The &quot;rxnNotes&quot; field must be a cell array of strings'</span>;
-0183         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0184     <span class="keyword">end</span>
-0185 <span class="keyword">end</span>
-0186 <span class="keyword">if</span> isfield(model,<span class="string">'rxnReferences'</span>)
-0187     <span class="keyword">if</span> ~iscellstr(model.rxnReferences)
-0188         EM=<span class="string">'The &quot;rxnReferences&quot; field must be a cell array of strings'</span>;
-0189         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0190     <span class="keyword">end</span>
-0191 <span class="keyword">end</span>
-0192 <span class="keyword">if</span> isfield(model,<span class="string">'rxnConfidenceScores'</span>)
-0193     <span class="keyword">if</span> ~isnumeric(model.rxnConfidenceScores)
-0194         EM=<span class="string">'The &quot;rxnConfidenceScores&quot; field must be a double'</span>;
-0195         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0196     <span class="keyword">end</span>
-0197 <span class="keyword">end</span>
-0198 <span class="keyword">if</span> isfield(model,<span class="string">'rxnDeltaG'</span>)
-0199     <span class="keyword">if</span> ~isnumeric(model.rxnDeltaG)
-0200         EM=<span class="string">'The &quot;rxnDeltaG&quot; field must be a double'</span>;
-0201         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0202     <span class="keyword">end</span>
-0203 <span class="keyword">end</span>
-0204 
-0205 <span class="comment">%Empty strings</span>
-0206 <span class="keyword">if</span> isempty(model.id)
-0207     EM=<span class="string">'The &quot;id&quot; field cannot be empty'</span>;
-0208     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0209 <span class="keyword">end</span>
-0210 <span class="keyword">if</span> any(cellfun(@isempty,model.rxns))
-0211     EM=<span class="string">'The model contains empty reaction IDs'</span>;
-0212     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0213 <span class="keyword">end</span>
-0214 <span class="keyword">if</span> any(cellfun(@isempty,model.mets))
-0215     EM=<span class="string">'The model contains empty metabolite IDs'</span>;
-0216     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0217 <span class="keyword">end</span>
-0218 <span class="keyword">if</span> any(cellfun(@isempty,model.comps))
-0219     EM=<span class="string">'The model contains empty compartment IDs'</span>;
-0220     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0221 <span class="keyword">end</span>
-0222 EM=<span class="string">'The following metabolites have empty names:'</span>;
-0223 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.mets(cellfun(@isempty,model.metNames)),trimWarnings);
-0224 
-0225 <span class="keyword">if</span> isfield(model,<span class="string">'genes'</span>)
-0226     <span class="keyword">if</span> any(cellfun(@isempty,model.genes))
-0227         EM=<span class="string">'The model contains empty gene IDs'</span>;
-0228         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
-0229     <span class="keyword">end</span>
-0230 <span class="keyword">end</span>
-0231 
-0232 <span class="comment">%Duplicates</span>
-0233 EM=<span class="string">'The following reaction IDs are duplicates:'</span>;
-0234 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.rxns(<a href="#_sub1" class="code" title="subfunction I=duplicates(strings)">duplicates</a>(model.rxns)),trimWarnings);
-0235 EM=<span class="string">'The following metabolite IDs are duplicates:'</span>;
-0236 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.mets(<a href="#_sub1" class="code" title="subfunction I=duplicates(strings)">duplicates</a>(model.mets)),trimWarnings);
-0237 EM=<span class="string">'The following compartment IDs are duplicates:'</span>;
-0238 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.comps(<a href="#_sub1" class="code" title="subfunction I=duplicates(strings)">duplicates</a>(model.comps)),trimWarnings);
-0239 <span class="keyword">if</span> isfield(model,<span class="string">'genes'</span>)
-0240     EM=<span class="string">'The following genes are duplicates:'</span>;
-0241     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.genes(<a href="#_sub1" class="code" title="subfunction I=duplicates(strings)">duplicates</a>(model.genes)),trimWarnings);
-0242 <span class="keyword">end</span>
-0243 metInComp=strcat(model.metNames,<span class="string">'['</span>,model.comps(model.metComps),<span class="string">']'</span>);
-0244 EM=<span class="string">'The following metabolites already exist in the same compartment:'</span>;
-0245 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,metInComp(<a href="#_sub1" class="code" title="subfunction I=duplicates(strings)">duplicates</a>(metInComp)),trimWarnings);
+0123     <span class="keyword">if</span> ~isfield(model,<span class="string">'genes'</span>)
+0124         EM=<span class="string">'If &quot;grRules&quot; field exists, the model should also contain a &quot;genes&quot; field'</span>;
+0125         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0126     <span class="keyword">else</span>
+0127         geneList = strjoin(model.grRules);
+0128         geneList = regexp(geneList,<span class="string">' |)|(|and|or'</span>,<span class="string">'split'</span>); <span class="comment">% Remove all grRule punctuation</span>
+0129         geneList = geneList(~cellfun(@isempty,geneList));  <span class="comment">% Remove spaces and empty genes</span>
+0130         geneList = setdiff(unique(geneList),model.genes);
+0131         <span class="keyword">if</span> ~isempty(geneList)
+0132             problemGrRules = model.rxns(contains(model.grRules,geneList));
+0133             problemGrRules = strjoin(problemGrRules(:),<span class="string">'; '</span>);
+0134             EM=[<span class="string">'The reaction(s) &quot;'</span> problemGrRules <span class="string">'&quot; contain the following genes in its &quot;grRules&quot; field, but these are not in the &quot;genes&quot; field:'</span>];
+0135             <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,geneList);
+0136         <span class="keyword">end</span>
+0137     <span class="keyword">end</span>
+0138 <span class="keyword">end</span>
+0139 <span class="keyword">if</span> isfield(model,<span class="string">'rxnComps'</span>)
+0140     <span class="keyword">if</span> ~isnumeric(model.rxnComps)
+0141         EM=<span class="string">'The &quot;rxnComps&quot; field must be of type &quot;double&quot;'</span>;
+0142         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0143     <span class="keyword">end</span>
+0144 <span class="keyword">end</span>
+0145 <span class="keyword">if</span> isfield(model,<span class="string">'inchis'</span>)
+0146     <span class="keyword">if</span> ~iscellstr(model.inchis)
+0147         EM=<span class="string">'The &quot;inchis&quot; field must be a cell array of strings'</span>;
+0148         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0149     <span class="keyword">end</span>
+0150 <span class="keyword">end</span>
+0151 <span class="keyword">if</span> isfield(model,<span class="string">'metSmiles'</span>)
+0152     <span class="keyword">if</span> ~iscellstr(model.metSmiles)
+0153         EM=<span class="string">'The &quot;metSmiles&quot; field must be a cell array of strings'</span>;
+0154         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0155     <span class="keyword">end</span>
+0156 <span class="keyword">end</span>
+0157 <span class="keyword">if</span> isfield(model,<span class="string">'metFormulas'</span>)
+0158     <span class="keyword">if</span> ~iscellstr(model.metFormulas)
+0159         EM=<span class="string">'The &quot;metFormulas&quot; field must be a cell array of strings'</span>;
+0160         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0161     <span class="keyword">end</span>
+0162 <span class="keyword">end</span>
+0163 <span class="keyword">if</span> isfield(model,<span class="string">'metCharges'</span>)
+0164     <span class="keyword">if</span> ~isnumeric(model.metCharges)
+0165         EM=<span class="string">'The &quot;metCharges&quot; field must be a double'</span>;
+0166         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0167     <span class="keyword">end</span>
+0168 <span class="keyword">end</span>
+0169 <span class="keyword">if</span> isfield(model,<span class="string">'metDeltaG'</span>)
+0170     <span class="keyword">if</span> ~isnumeric(model.metDeltaG)
+0171         EM=<span class="string">'The &quot;metDeltaG&quot; field must be a double'</span>;
+0172         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0173     <span class="keyword">end</span>
+0174 <span class="keyword">end</span>
+0175 <span class="keyword">if</span> isfield(model,<span class="string">'subSystems'</span>)
+0176     <span class="keyword">for</span> i=1:numel(model.subSystems)
+0177         <span class="keyword">if</span> ~iscell(model.subSystems{i,1})
+0178             EM=<span class="string">'The &quot;subSystems&quot; field must be a cell array'</span>;
+0179             <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0180         <span class="keyword">end</span>
+0181     <span class="keyword">end</span>
+0182 <span class="keyword">end</span>
+0183 <span class="keyword">if</span> isfield(model,<span class="string">'eccodes'</span>)
+0184     <span class="keyword">if</span> ~iscellstr(model.eccodes)
+0185         EM=<span class="string">'The &quot;eccodes&quot; field must be a cell array of strings'</span>;
+0186         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0187     <span class="keyword">end</span>
+0188 <span class="keyword">end</span>
+0189 <span class="keyword">if</span> isfield(model,<span class="string">'unconstrained'</span>)
+0190     <span class="keyword">if</span> ~isnumeric(model.unconstrained)
+0191         EM=<span class="string">'The &quot;unconstrained&quot; field must be of type &quot;double&quot;'</span>;
+0192         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0193     <span class="keyword">end</span>
+0194 <span class="keyword">end</span>
+0195 <span class="keyword">if</span> isfield(model,<span class="string">'rxnNotes'</span>)
+0196     <span class="keyword">if</span> ~iscellstr(model.rxnNotes)
+0197         EM=<span class="string">'The &quot;rxnNotes&quot; field must be a cell array of strings'</span>;
+0198         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0199     <span class="keyword">end</span>
+0200 <span class="keyword">end</span>
+0201 <span class="keyword">if</span> isfield(model,<span class="string">'rxnReferences'</span>)
+0202     <span class="keyword">if</span> ~iscellstr(model.rxnReferences)
+0203         EM=<span class="string">'The &quot;rxnReferences&quot; field must be a cell array of strings'</span>;
+0204         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0205     <span class="keyword">end</span>
+0206 <span class="keyword">end</span>
+0207 <span class="keyword">if</span> isfield(model,<span class="string">'rxnConfidenceScores'</span>)
+0208     <span class="keyword">if</span> ~isnumeric(model.rxnConfidenceScores)
+0209         EM=<span class="string">'The &quot;rxnConfidenceScores&quot; field must be a double'</span>;
+0210         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0211     <span class="keyword">end</span>
+0212 <span class="keyword">end</span>
+0213 <span class="keyword">if</span> isfield(model,<span class="string">'rxnDeltaG'</span>)
+0214     <span class="keyword">if</span> ~isnumeric(model.rxnDeltaG)
+0215         EM=<span class="string">'The &quot;rxnDeltaG&quot; field must be a double'</span>;
+0216         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0217     <span class="keyword">end</span>
+0218 <span class="keyword">end</span>
+0219 
+0220 <span class="comment">%Empty strings</span>
+0221 <span class="keyword">if</span> isempty(model.id)
+0222     EM=<span class="string">'The &quot;id&quot; field cannot be empty'</span>;
+0223     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0224 <span class="keyword">end</span>
+0225 <span class="keyword">if</span> any(cellfun(@isempty,model.rxns))
+0226     EM=<span class="string">'The model contains empty reaction IDs'</span>;
+0227     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0228 <span class="keyword">end</span>
+0229 <span class="keyword">if</span> any(cellfun(@isempty,model.mets))
+0230     EM=<span class="string">'The model contains empty metabolite IDs'</span>;
+0231     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0232 <span class="keyword">end</span>
+0233 <span class="keyword">if</span> any(cellfun(@isempty,model.comps))
+0234     EM=<span class="string">'The model contains empty compartment IDs'</span>;
+0235     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0236 <span class="keyword">end</span>
+0237 EM=<span class="string">'The following metabolites have empty names:'</span>;
+0238 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.mets(cellfun(@isempty,model.metNames)),trimWarnings);
+0239 
+0240 <span class="keyword">if</span> isfield(model,<span class="string">'genes'</span>)
+0241     <span class="keyword">if</span> any(cellfun(@isempty,model.genes))
+0242         EM=<span class="string">'The model contains empty gene IDs'</span>;
+0243         <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors);
+0244     <span class="keyword">end</span>
+0245 <span class="keyword">end</span>
 0246 
-0247 <span class="comment">%Elements never used (print only as warnings</span>
-0248 EM=<span class="string">'The following reactions are empty (no involved metabolites):'</span>;
-0249 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.rxns(~any(model.S,1)),trimWarnings);
-0250 EM=<span class="string">'The following metabolites are never used in a reaction:'</span>;
-0251 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.mets(~any(model.S,2)),trimWarnings);
-0252 <span class="keyword">if</span> isfield(model,<span class="string">'genes'</span>)
-0253     EM=<span class="string">'The following genes are not associated to a reaction:'</span>;
-0254     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.genes(~any(model.rxnGeneMat,1)),trimWarnings);
-0255 <span class="keyword">end</span>
-0256 I=true(numel(model.comps),1);
-0257 I(model.metComps)=false;
-0258 EM=<span class="string">'The following compartments contain no metabolites:'</span>;
-0259 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.comps(I),trimWarnings);
-0260 
-0261 <span class="comment">%Contradicting bounds</span>
-0262 EM=<span class="string">'The following reactions have contradicting bounds:'</span>;
-0263 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.rxns(model.lb&gt;model.ub),trimWarnings);
-0264 EM=<span class="string">'The following reactions have bounds contradicting their reversibility:'</span>;
-0265 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.rxns(model.lb&lt;0 &amp; model.rev==0),trimWarnings);
-0266 
-0267 <span class="comment">%Multiple or no objective functions not allowed in SBML L3V1 FBCv2</span>
-0268 <span class="keyword">if</span> numel(find(model.c))&gt;1
-0269     EM=<span class="string">'Multiple objective functions found. This might be intended, but results in FBCv2 non-compliant SBML file when exported'</span>;
-0270     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.rxns(find(model.c)),trimWarnings);
-0271 <span class="keyword">elseif</span> ~any(model.c)
-0272     EM=<span class="string">'No objective function found. This might be intended, but results in FBCv2 non-compliant SBML file when exported'</span>;
-0273     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false);
-0274 <span class="keyword">end</span>
-0275     
-0276 EM=<span class="string">'The following reactions have contradicting bounds:'</span>;
-0277 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.rxns(model.lb&gt;model.ub),trimWarnings);
-0278 
-0279 <span class="comment">%Mapping of compartments</span>
-0280 <span class="keyword">if</span> isfield(model,<span class="string">'compOutside'</span>)
-0281     EM=<span class="string">'The following compartments are in &quot;compOutside&quot; but not in &quot;comps&quot;:'</span>;
-0282     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,setdiff(model.compOutside,[{<span class="string">''</span>};model.comps]),trimWarnings);
-0283 <span class="keyword">end</span>
+0247 <span class="comment">%Duplicates</span>
+0248 EM=<span class="string">'The following reaction IDs are duplicates:'</span>;
+0249 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.rxns(<a href="#_sub1" class="code" title="subfunction I=duplicates(strings)">duplicates</a>(model.rxns)),trimWarnings);
+0250 EM=<span class="string">'The following metabolite IDs are duplicates:'</span>;
+0251 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.mets(<a href="#_sub1" class="code" title="subfunction I=duplicates(strings)">duplicates</a>(model.mets)),trimWarnings);
+0252 EM=<span class="string">'The following compartment IDs are duplicates:'</span>;
+0253 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.comps(<a href="#_sub1" class="code" title="subfunction I=duplicates(strings)">duplicates</a>(model.comps)),trimWarnings);
+0254 <span class="keyword">if</span> isfield(model,<span class="string">'genes'</span>)
+0255     EM=<span class="string">'The following genes are duplicates:'</span>;
+0256     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.genes(<a href="#_sub1" class="code" title="subfunction I=duplicates(strings)">duplicates</a>(model.genes)),trimWarnings);
+0257 <span class="keyword">end</span>
+0258 metInComp=strcat(model.metNames,<span class="string">'['</span>,model.comps(model.metComps),<span class="string">']'</span>);
+0259 EM=<span class="string">'The following metabolites already exist in the same compartment:'</span>;
+0260 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,metInComp(<a href="#_sub1" class="code" title="subfunction I=duplicates(strings)">duplicates</a>(metInComp)),trimWarnings);
+0261 
+0262 <span class="comment">%Elements never used (print only as warnings)</span>
+0263 EM=<span class="string">'The following reactions are empty (no involved metabolites):'</span>;
+0264 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.rxns(~any(model.S,1)),trimWarnings);
+0265 EM=<span class="string">'The following metabolites are never used in a reaction:'</span>;
+0266 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.mets(~any(model.S,2)),trimWarnings);
+0267 <span class="keyword">if</span> isfield(model,<span class="string">'genes'</span>)
+0268     EM=<span class="string">'The following genes are not associated to a reaction:'</span>;
+0269     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.genes(~any(model.rxnGeneMat,1)),trimWarnings);
+0270 <span class="keyword">end</span>
+0271 I=true(numel(model.comps),1);
+0272 I(model.metComps)=false;
+0273 EM=<span class="string">'The following compartments contain no metabolites:'</span>;
+0274 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.comps(I),trimWarnings);
+0275 
+0276 <span class="comment">%Contradicting bounds</span>
+0277 EM=<span class="string">'The following reactions have contradicting bounds:'</span>;
+0278 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.rxns(model.lb&gt;model.ub),trimWarnings);
+0279 EM=<span class="string">'The following reactions have bounds contradicting their reversibility:'</span>;
+0280 contradictBound = (model.lb &lt; 0 &amp; model.ub &gt; 0 &amp; model.rev==0) | <span class="keyword">...</span><span class="comment"> % Reversible bounds, irreversible label</span>
+0281                   (model.lb &lt; 0 &amp; model.ub &lt;= 0 &amp; model.rev==1) | <span class="keyword">...</span><span class="comment"> % Negative bounds, reversible label</span>
+0282                   (model.lb &gt;= 0 &amp; model.ub &gt; 0 &amp; model.rev==1); <span class="comment">% Positive bounds, reversible label</span>
+0283 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.rxns(contradictBound),trimWarnings);
 0284 
-0285 <span class="comment">%Met names which start with number</span>
-0286 I=false(numel(model.metNames),1);
-0287 <span class="keyword">for</span> i=1:numel(model.metNames)
-0288     index=strfind(model.metNames{i},<span class="string">' '</span>);
-0289     <span class="keyword">if</span> any(index)
-0290         <span class="keyword">if</span> any(str2double(model.metNames{i}(1:index(1)-1)))
-0291             I(i)=true;
-0292         <span class="keyword">end</span>
-0293     <span class="keyword">end</span>
-0294 <span class="keyword">end</span>
-0295 EM=<span class="string">'The following metabolite IDs begin with a number directly followed by space:'</span>;
-0296 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.mets(I),trimWarnings);
-0297 
-0298 <span class="comment">%Non-parseable composition</span>
-0299 <span class="keyword">if</span> isfield(model,<span class="string">'metFormulas'</span>)
-0300     [~, ~, exitFlag]=<a href="parseFormulas.html" class="code" title="function [elements, useMat, exitFlag, MW]=parseFormulas(formulas, noPolymers,isInchi,ignoreRX)">parseFormulas</a>(model.metFormulas,true,false);
-0301     EM=<span class="string">'The composition for the following metabolites could not be parsed:'</span>;
-0302     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.mets(exitFlag==-1),trimWarnings);
-0303 <span class="keyword">end</span>
-0304 
-0305 <span class="comment">%Check if there are metabolites with different names but the same MIRIAM</span>
-0306 <span class="comment">%codes</span>
-0307 <span class="keyword">if</span> isfield(model,<span class="string">'metMiriams'</span>)
-0308     miriams=containers.Map();
-0309     <span class="keyword">for</span> i=1:numel(model.mets)
-0310         <span class="keyword">if</span> ~isempty(model.metMiriams{i})
-0311             <span class="comment">%Loop through and add for each miriam</span>
-0312             <span class="keyword">for</span> j=1:numel(model.metMiriams{i}.name)
-0313                 <span class="comment">%Get existing metabolite indexes</span>
-0314                 current=strcat(model.metMiriams{i}.name{j},<span class="string">'/'</span>,model.metMiriams{i}.value{j});
-0315                 <span class="keyword">if</span> isKey(miriams,current)
-0316                     existing=miriams(current);
-0317                 <span class="keyword">else</span>
-0318                     existing=[];
-0319                 <span class="keyword">end</span>
-0320                 miriams(current)=[existing;i];
-0321             <span class="keyword">end</span>
-0322         <span class="keyword">end</span>
-0323     <span class="keyword">end</span>
-0324     
-0325     <span class="comment">%Get all keys</span>
-0326     allMiriams=keys(miriams);
-0327     
-0328     hasMultiple=false(numel(allMiriams),1);
-0329     <span class="keyword">for</span> i=1:numel(allMiriams)
-0330         <span class="keyword">if</span> numel(miriams(allMiriams{i}))&gt;1
-0331             <span class="comment">%Check if they all have the same name</span>
-0332             <span class="keyword">if</span> numel(unique(model.metNames(miriams(allMiriams{i}))))&gt;1
-0333                 <span class="keyword">if</span> ~regexp(allMiriams{i},<span class="string">'^sbo\/SBO:'</span>) <span class="comment">% SBO terms are expected to be multiple</span>
-0334                     hasMultiple(i)=true;
-0335                 <span class="keyword">end</span>                
-0336             <span class="keyword">end</span>
-0337         <span class="keyword">end</span>
-0338     <span class="keyword">end</span>
-0339     
-0340     <span class="comment">%Print output</span>
-0341     EM=<span class="string">'The following MIRIAM strings are associated to more than one unique metabolite name:'</span>;
-0342     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,allMiriams(hasMultiple),trimWarnings);
-0343 <span class="keyword">end</span>
-0344 
-0345 <span class="comment">%Check if there are metabolites with different names but the same InChI</span>
-0346 <span class="comment">%codes</span>
-0347 <span class="keyword">if</span> isfield(model,<span class="string">'inchis'</span>)
-0348     inchis=containers.Map();
-0349     <span class="keyword">for</span> i=1:numel(model.mets)
-0350         <span class="keyword">if</span> ~isempty(model.inchis{i})
-0351             <span class="comment">%Get existing metabolite indexes</span>
-0352             <span class="keyword">if</span> isKey(inchis,model.inchis{i})
-0353                 existing=inchis(model.inchis{i});
-0354             <span class="keyword">else</span>
-0355                 existing=[];
-0356             <span class="keyword">end</span>
-0357             inchis(model.inchis{i})=[existing;i];
-0358         <span class="keyword">end</span>
-0359     <span class="keyword">end</span>
-0360     
-0361     <span class="comment">%Get all keys</span>
-0362     allInchis=keys(inchis);
-0363     
-0364     hasMultiple=false(numel(allInchis),1);
-0365     <span class="keyword">for</span> i=1:numel(allInchis)
-0366         <span class="keyword">if</span> numel(inchis(allInchis{i}))&gt;1
-0367             <span class="comment">%Check if they all have the same name</span>
-0368             <span class="keyword">if</span> numel(unique(model.metNames(inchis(allInchis{i}))))&gt;1
-0369                 hasMultiple(i)=true;
-0370             <span class="keyword">end</span>
-0371         <span class="keyword">end</span>
-0372     <span class="keyword">end</span>
-0373     
-0374     <span class="comment">%Print output</span>
-0375     EM=<span class="string">'The following InChI strings are associated to more than one unique metabolite name:'</span>;
-0376     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,allInchis(hasMultiple),trimWarnings);
-0377 <span class="keyword">end</span>
-0378 
-0379 <span class="comment">% %Check if there are metabolites with different names but the same SMILES</span>
-0380 <span class="comment">% if isfield(model,'metSmiles')</span>
-0381 <span class="comment">%     metSmiles=containers.Map();</span>
-0382 <span class="comment">%     for i=1:numel(model.mets)</span>
-0383 <span class="comment">%         if ~isempty(model.metSmiles{i})</span>
-0384 <span class="comment">%             %Get existing metabolite indexes</span>
-0385 <span class="comment">%             if isKey(metSmiles,model.metSmiles{i})</span>
-0386 <span class="comment">%                 existing=metSmiles(model.metSmiles{i});</span>
-0387 <span class="comment">%             else</span>
-0388 <span class="comment">%                 existing=[];</span>
-0389 <span class="comment">%             end</span>
-0390 <span class="comment">%             metSmiles(model.metSmiles{i})=[existing;i];</span>
-0391 <span class="comment">%         end</span>
-0392 <span class="comment">%     end</span>
-0393 <span class="comment">%</span>
-0394 <span class="comment">%     %Get all keys</span>
-0395 <span class="comment">%     allmetSmiles=keys(metSmiles);</span>
-0396 <span class="comment">%</span>
-0397 <span class="comment">%     hasMultiple=false(numel(metSmiles),1);</span>
-0398 <span class="comment">%     for i=1:numel(metSmiles)</span>
-0399 <span class="comment">%         if numel(metSmiles(metSmiles{i}))&gt;1</span>
-0400 <span class="comment">%             %Check if they all have the same name</span>
-0401 <span class="comment">%             if numel(unique(model.metNames(metSmiles(allmetSmiles{i}))))&gt;1</span>
-0402 <span class="comment">%                 hasMultiple(i)=true;</span>
-0403 <span class="comment">%             end</span>
-0404 <span class="comment">%         end</span>
-0405 <span class="comment">%     end</span>
-0406 <span class="comment">%</span>
-0407 <span class="comment">%     %Print output</span>
-0408 <span class="comment">%     EM='The following metSmiles strings are associated to more than one unique metabolite name:';</span>
-0409 <span class="comment">%     dispEM(EM,false,allmetSmiles(hasMultiple),trimWarnings);</span>
-0410 <span class="comment">% end</span>
-0411 <span class="keyword">end</span>
-0412 
-0413 <a name="_sub1" href="#_subfunctions" class="code">function I=duplicates(strings)</a>
-0414 I=false(numel(strings),1);
-0415 [J, K]=unique(strings);
-0416 <span class="keyword">if</span> numel(J)~=numel(strings)
-0417     L=1:numel(strings);
-0418     L(K)=[];
-0419     I(L)=true;
-0420 <span class="keyword">end</span>
-0421 <span class="keyword">end</span></pre></div>
+0285 <span class="comment">%Multiple or no objective functions not allowed in SBML L3V1 FBCv2</span>
+0286 <span class="keyword">if</span> numel(find(model.c))&gt;1
+0287     EM=<span class="string">'Multiple objective functions found. This might be intended, but results in FBCv2 non-compliant SBML file when exported'</span>;
+0288     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.rxns(find(model.c)),trimWarnings);
+0289 <span class="keyword">elseif</span> ~any(model.c)
+0290     EM=<span class="string">'No objective function found. This might be intended, but results in FBCv2 non-compliant SBML file when exported'</span>;
+0291     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false);
+0292 <span class="keyword">end</span>
+0293     
+0294 EM=<span class="string">'The following reactions have contradicting bounds:'</span>;
+0295 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.rxns(model.lb&gt;model.ub),trimWarnings);
+0296 
+0297 <span class="comment">%Mapping of compartments</span>
+0298 <span class="keyword">if</span> isfield(model,<span class="string">'compOutside'</span>)
+0299     EM=<span class="string">'The following compartments are in &quot;compOutside&quot; but not in &quot;comps&quot;:'</span>;
+0300     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,setdiff(model.compOutside,[{<span class="string">''</span>};model.comps]),trimWarnings);
+0301 <span class="keyword">end</span>
+0302 
+0303 <span class="comment">%Met names which start with number</span>
+0304 I=false(numel(model.metNames),1);
+0305 <span class="keyword">for</span> i=1:numel(model.metNames)
+0306     index=strfind(model.metNames{i},<span class="string">' '</span>);
+0307     <span class="keyword">if</span> any(index)
+0308         <span class="keyword">if</span> any(str2double(model.metNames{i}(1:index(1)-1)))
+0309             I(i)=true;
+0310         <span class="keyword">end</span>
+0311     <span class="keyword">end</span>
+0312 <span class="keyword">end</span>
+0313 EM=<span class="string">'The following metabolite IDs begin with a number directly followed by space:'</span>;
+0314 <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,throwErrors,model.mets(I),trimWarnings);
+0315 
+0316 <span class="comment">%Non-parseable composition</span>
+0317 <span class="keyword">if</span> isfield(model,<span class="string">'metFormulas'</span>)
+0318     [~, ~, exitFlag]=<a href="parseFormulas.html" class="code" title="function [elements, useMat, exitFlag, MW]=parseFormulas(formulas, noPolymers,isInchi,ignoreRX)">parseFormulas</a>(model.metFormulas,true,false);
+0319     EM=<span class="string">'The composition for the following metabolites could not be parsed:'</span>;
+0320     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,model.mets(exitFlag==-1),trimWarnings);
+0321 <span class="keyword">end</span>
+0322 
+0323 <span class="comment">%Check if there are metabolites with different names but the same MIRIAM</span>
+0324 <span class="comment">%codes</span>
+0325 <span class="keyword">if</span> isfield(model,<span class="string">'metMiriams'</span>)
+0326     miriams=containers.Map();
+0327     <span class="keyword">for</span> i=1:numel(model.mets)
+0328         <span class="keyword">if</span> ~isempty(model.metMiriams{i})
+0329             <span class="comment">%Loop through and add for each miriam</span>
+0330             <span class="keyword">for</span> j=1:numel(model.metMiriams{i}.name)
+0331                 <span class="comment">%Get existing metabolite indexes</span>
+0332                 current=strcat(model.metMiriams{i}.name{j},<span class="string">'/'</span>,model.metMiriams{i}.value{j});
+0333                 <span class="keyword">if</span> isKey(miriams,current)
+0334                     existing=miriams(current);
+0335                 <span class="keyword">else</span>
+0336                     existing=[];
+0337                 <span class="keyword">end</span>
+0338                 miriams(current)=[existing;i];
+0339             <span class="keyword">end</span>
+0340         <span class="keyword">end</span>
+0341     <span class="keyword">end</span>
+0342     
+0343     <span class="comment">%Get all keys</span>
+0344     allMiriams=keys(miriams);
+0345     
+0346     hasMultiple=false(numel(allMiriams),1);
+0347     <span class="keyword">for</span> i=1:numel(allMiriams)
+0348         <span class="keyword">if</span> numel(miriams(allMiriams{i}))&gt;1
+0349             <span class="comment">%Check if they all have the same name</span>
+0350             <span class="keyword">if</span> numel(unique(model.metNames(miriams(allMiriams{i}))))&gt;1
+0351                 <span class="keyword">if</span> ~regexp(allMiriams{i},<span class="string">'^sbo\/SBO:'</span>) <span class="comment">% SBO terms are expected to be multiple</span>
+0352                     hasMultiple(i)=true;
+0353                 <span class="keyword">end</span>                
+0354             <span class="keyword">end</span>
+0355         <span class="keyword">end</span>
+0356     <span class="keyword">end</span>
+0357     
+0358     <span class="comment">%Print output</span>
+0359     EM=<span class="string">'The following MIRIAM strings are associated to more than one unique metabolite name:'</span>;
+0360     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,allMiriams(hasMultiple),trimWarnings);
+0361 <span class="keyword">end</span>
+0362 
+0363 <span class="comment">%Check if there are metabolites with different names but the same InChI</span>
+0364 <span class="comment">%codes</span>
+0365 <span class="keyword">if</span> isfield(model,<span class="string">'inchis'</span>)
+0366     inchis=containers.Map();
+0367     <span class="keyword">for</span> i=1:numel(model.mets)
+0368         <span class="keyword">if</span> ~isempty(model.inchis{i})
+0369             <span class="comment">%Get existing metabolite indexes</span>
+0370             <span class="keyword">if</span> isKey(inchis,model.inchis{i})
+0371                 existing=inchis(model.inchis{i});
+0372             <span class="keyword">else</span>
+0373                 existing=[];
+0374             <span class="keyword">end</span>
+0375             inchis(model.inchis{i})=[existing;i];
+0376         <span class="keyword">end</span>
+0377     <span class="keyword">end</span>
+0378     
+0379     <span class="comment">%Get all keys</span>
+0380     allInchis=keys(inchis);
+0381     
+0382     hasMultiple=false(numel(allInchis),1);
+0383     <span class="keyword">for</span> i=1:numel(allInchis)
+0384         <span class="keyword">if</span> numel(inchis(allInchis{i}))&gt;1
+0385             <span class="comment">%Check if they all have the same name</span>
+0386             <span class="keyword">if</span> numel(unique(model.metNames(inchis(allInchis{i}))))&gt;1
+0387                 hasMultiple(i)=true;
+0388             <span class="keyword">end</span>
+0389         <span class="keyword">end</span>
+0390     <span class="keyword">end</span>
+0391     
+0392     <span class="comment">%Print output</span>
+0393     EM=<span class="string">'The following InChI strings are associated to more than one unique metabolite name:'</span>;
+0394     <a href="dispEM.html" class="code" title="function dispEM(string,throwErrors,toList,trimWarnings)">dispEM</a>(EM,false,allInchis(hasMultiple),trimWarnings);
+0395 <span class="keyword">end</span>
+0396 
+0397 <span class="comment">% %Check if there are metabolites with different names but the same SMILES</span>
+0398 <span class="comment">% if isfield(model,'metSmiles')</span>
+0399 <span class="comment">%     metSmiles=containers.Map();</span>
+0400 <span class="comment">%     for i=1:numel(model.mets)</span>
+0401 <span class="comment">%         if ~isempty(model.metSmiles{i})</span>
+0402 <span class="comment">%             %Get existing metabolite indexes</span>
+0403 <span class="comment">%             if isKey(metSmiles,model.metSmiles{i})</span>
+0404 <span class="comment">%                 existing=metSmiles(model.metSmiles{i});</span>
+0405 <span class="comment">%             else</span>
+0406 <span class="comment">%                 existing=[];</span>
+0407 <span class="comment">%             end</span>
+0408 <span class="comment">%             metSmiles(model.metSmiles{i})=[existing;i];</span>
+0409 <span class="comment">%         end</span>
+0410 <span class="comment">%     end</span>
+0411 <span class="comment">%</span>
+0412 <span class="comment">%     %Get all keys</span>
+0413 <span class="comment">%     allmetSmiles=keys(metSmiles);</span>
+0414 <span class="comment">%</span>
+0415 <span class="comment">%     hasMultiple=false(numel(metSmiles),1);</span>
+0416 <span class="comment">%     for i=1:numel(metSmiles)</span>
+0417 <span class="comment">%         if numel(metSmiles(metSmiles{i}))&gt;1</span>
+0418 <span class="comment">%             %Check if they all have the same name</span>
+0419 <span class="comment">%             if numel(unique(model.metNames(metSmiles(allmetSmiles{i}))))&gt;1</span>
+0420 <span class="comment">%                 hasMultiple(i)=true;</span>
+0421 <span class="comment">%             end</span>
+0422 <span class="comment">%         end</span>
+0423 <span class="comment">%     end</span>
+0424 <span class="comment">%</span>
+0425 <span class="comment">%     %Print output</span>
+0426 <span class="comment">%     EM='The following metSmiles strings are associated to more than one unique metabolite name:';</span>
+0427 <span class="comment">%     dispEM(EM,false,allmetSmiles(hasMultiple),trimWarnings);</span>
+0428 <span class="comment">% end</span>
+0429 <span class="keyword">end</span>
+0430 
+0431 <a name="_sub1" href="#_subfunctions" class="code">function I=duplicates(strings)</a>
+0432 I=false(numel(strings),1);
+0433 [J, K]=unique(strings);
+0434 <span class="keyword">if</span> numel(J)~=numel(strings)
+0435     L=1:numel(strings);
+0436     L(K)=[];
+0437     I(L)=true;
+0438 <span class="keyword">end</span>
+0439 <span class="keyword">end</span></pre></div>
 <hr><address>Generated by <strong><a href="http://www.artefact.tk/software/matlab/m2html/" title="Matlab Documentation in HTML">m2html</a></strong> &copy; 2005</address>
 </body>
 </html>
\ No newline at end of file
diff --git a/doc/core/constructS.html b/doc/core/constructS.html
index b61c0b0b..0ba99957 100644
--- a/doc/core/constructS.html
+++ b/doc/core/constructS.html
@@ -219,31 +219,32 @@ <h2><a name="_source"></a>SOURCE CODE <a href="#_top"><img alt="^" border="0" sr
 0152         strjoin(unique(metsToS(~metsPresent)),<span class="string">', '</span>)],<span class="string">''</span>)
 0153     <span class="keyword">else</span>
 0154         missingMet = find(~metsPresent);
-0155         missingMet = char(strcat(metsToS(missingMet),<span class="string">' (reaction:'</span>,rxns(rxnsToS(missingMet)),<span class="string">')\n'</span>));
-0156         error([<span class="string">'Could not find the following metabolites (reaction indicated) in the metabolite list: \n'</span> <span class="keyword">...</span>
-0157             missingMet <span class="string">'%s'</span>],<span class="string">''</span>);
-0158     <span class="keyword">end</span>
-0159 <span class="keyword">end</span>
-0160 linearIndices=sub2ind(size(S),metsLoc,rxnsToS);
-0161 S(linearIndices)=coefToS;
-0162 S=sparse(S);
-0163 <span class="keyword">end</span>
-0164 
-0165 <a name="_sub1" href="#_subfunctions" class="code">function equ=fixEquations(equ)</a>
-0166 <span class="comment">%If the equation starts with &quot;=&gt;&quot; or &quot;&lt;=&gt;&quot; then add a space again. This is</span>
-0167 <span class="comment">%an alternative way to represent uptake reactions. The opposite way for</span>
-0168 <span class="comment">%producing reactions</span>
-0169 equ=equ(:);
-0170 <span class="keyword">for</span> i=1:numel(equ)
-0171     <span class="keyword">if</span> strcmp(equ{i}(1:2),<span class="string">'=&gt;'</span>) || strcmp(equ{i}(1:3),<span class="string">'&lt;=&gt;'</span>)
-0172         equ{i}=[<span class="string">' '</span> equ{i}];
-0173     <span class="keyword">else</span>
-0174         <span class="keyword">if</span> strcmp(equ{i}(end-1:end),<span class="string">'=&gt;'</span>) || strcmp(equ{i}(end-2:end),<span class="string">'&lt;=&gt;'</span>)
-0175             equ{i}=[equ{i} <span class="string">' '</span>];
-0176         <span class="keyword">end</span>
-0177     <span class="keyword">end</span>
-0178 <span class="keyword">end</span>
-0179 <span class="keyword">end</span></pre></div>
+0155         missingMet = strcat(metsToS(missingMet),<span class="string">' (reaction:'</span>,rxns(rxnsToS(missingMet)),<span class="string">')\n'</span>);
+0156         missingMet = strjoin(missingMet,<span class="string">''</span>);
+0157         error([<span class="string">'Could not find the following metabolites (reaction indicated) in the metabolite list: \n'</span> <span class="keyword">...</span>
+0158             missingMet <span class="string">'%s'</span>],<span class="string">''</span>);
+0159     <span class="keyword">end</span>
+0160 <span class="keyword">end</span>
+0161 linearIndices=sub2ind(size(S),metsLoc,rxnsToS);
+0162 S(linearIndices)=coefToS;
+0163 S=sparse(S);
+0164 <span class="keyword">end</span>
+0165 
+0166 <a name="_sub1" href="#_subfunctions" class="code">function equ=fixEquations(equ)</a>
+0167 <span class="comment">%If the equation starts with &quot;=&gt;&quot; or &quot;&lt;=&gt;&quot; then add a space again. This is</span>
+0168 <span class="comment">%an alternative way to represent uptake reactions. The opposite way for</span>
+0169 <span class="comment">%producing reactions</span>
+0170 equ=equ(:);
+0171 <span class="keyword">for</span> i=1:numel(equ)
+0172     <span class="keyword">if</span> strcmp(equ{i}(1:2),<span class="string">'=&gt;'</span>) || strcmp(equ{i}(1:3),<span class="string">'&lt;=&gt;'</span>)
+0173         equ{i}=[<span class="string">' '</span> equ{i}];
+0174     <span class="keyword">else</span>
+0175         <span class="keyword">if</span> strcmp(equ{i}(end-1:end),<span class="string">'=&gt;'</span>) || strcmp(equ{i}(end-2:end),<span class="string">'&lt;=&gt;'</span>)
+0176             equ{i}=[equ{i} <span class="string">' '</span>];
+0177         <span class="keyword">end</span>
+0178     <span class="keyword">end</span>
+0179 <span class="keyword">end</span>
+0180 <span class="keyword">end</span></pre></div>
 <hr><address>Generated by <strong><a href="http://www.artefact.tk/software/matlab/m2html/" title="Matlab Documentation in HTML">m2html</a></strong> &copy; 2005</address>
 </body>
 </html>
\ No newline at end of file
diff --git a/doc/core/getExchangeRxns.html b/doc/core/getExchangeRxns.html
index 1baa037c..88e7f409 100644
--- a/doc/core/getExchangeRxns.html
+++ b/doc/core/getExchangeRxns.html
@@ -28,19 +28,43 @@ <h2><a name="_synopsis"></a>SYNOPSIS <a href="#_top"><img alt="^" border="0" src
 
 <h2><a name="_description"></a>DESCRIPTION <a href="#_top"><img alt="^" border="0" src="../up.png"></a></h2>
 <div class="fragment"><pre class="comment"> getExchangeRxns
-   Retrieves the exchange reactions from a model
+   Retrieves the exchange reactions from a model. Exchange reactions are
+   identified by having either no substrates or no products.
 
+ Input:
    model               a model structure
-   reactionType        retrieve all reactions ('both'), only production
-                       ('out'), or only consumption ('in') (optional, default
-                       'both')
+   reactionType        which exchange reactions should be returned
+                       'all'     all reactions, irrespective of reaction
+                                 bounds
+                       'uptake'  reactions with bounds that imply that
+                                 only uptake is allowed. Reaction
+                                 direction, upper and lower bounds are
+                                 all considered
+                       'excrete' reactions with bounds that imply that
+                                 only excretion is allowed. Reaction
+                                 direction, upper and lower bounds are
+                                 all considered
+                       'reverse' reactions with non-zero upper and lower
+                                 bounds that imply that both uptake and
+                                 excretion are allowed
+                       'blocked' reactions that have zero upper and lower
+                                 bounds, not allowing any flux
+                       'in'      reactions where the boundary metabolite
+                                 is the substrate of the reaction, a
+                                 positive flux value would imply uptake,
+                                 but reaction bounds are not considered
+                       'out'     reactions where the boundary metabolite
+                                 is the product of the reaction, a
+                                 positive flux value would imply excretion,
+                                 but reaction bounds are not considered.
 
+ Output:
    exchangeRxns        cell array with the IDs of the exchange reactions
    exchangeRxnsIndexes vector with the indexes of the exchange reactions
 
-   Exchange reactions are defined as reactions which involve only products
-   or only reactants. If the unconstrained field is present, then that is
-   used instead.
+ Note:
+   The union of 'in' and 'out' equals 'all'. Also, the union of 'uptake',
+   'excrete', 'reverse' and 'blocked' equals 'all'.
 
  Usage: [exchangeRxns,exchangeRxnsIndexes]=getExchangeRxns(model,reactionType)</pre></div>
 
@@ -59,51 +83,86 @@ <h2><a name="_cross"></a>CROSS-REFERENCE INFORMATION <a href="#_top"><img alt="^
 <h2><a name="_source"></a>SOURCE CODE <a href="#_top"><img alt="^" border="0" src="../up.png"></a></h2>
 <div class="fragment"><pre>0001 <a name="_sub0" href="#_subfunctions" class="code">function [exchangeRxns, exchangeRxnsIndexes]=getExchangeRxns(model,reactionType)</a>
 0002 <span class="comment">% getExchangeRxns</span>
-0003 <span class="comment">%   Retrieves the exchange reactions from a model</span>
-0004 <span class="comment">%</span>
-0005 <span class="comment">%   model               a model structure</span>
-0006 <span class="comment">%   reactionType        retrieve all reactions ('both'), only production</span>
-0007 <span class="comment">%                       ('out'), or only consumption ('in') (optional, default</span>
-0008 <span class="comment">%                       'both')</span>
-0009 <span class="comment">%</span>
-0010 <span class="comment">%   exchangeRxns        cell array with the IDs of the exchange reactions</span>
-0011 <span class="comment">%   exchangeRxnsIndexes vector with the indexes of the exchange reactions</span>
-0012 <span class="comment">%</span>
-0013 <span class="comment">%   Exchange reactions are defined as reactions which involve only products</span>
-0014 <span class="comment">%   or only reactants. If the unconstrained field is present, then that is</span>
-0015 <span class="comment">%   used instead.</span>
-0016 <span class="comment">%</span>
-0017 <span class="comment">% Usage: [exchangeRxns,exchangeRxnsIndexes]=getExchangeRxns(model,reactionType)</span>
-0018 
-0019 <span class="keyword">if</span> nargin&lt;2
-0020     reactionType=<span class="string">'both'</span>;
-0021 <span class="keyword">else</span>
-0022     reactionType=char(reactionType);
-0023 <span class="keyword">end</span>
-0024 
-0025 hasNoProducts=sparse(numel(model.rxns),1);
-0026 hasNoReactants=sparse(numel(model.rxns),1);
-0027 
-0028 <span class="keyword">if</span> isfield(model,<span class="string">'unconstrained'</span>)
-0029     <span class="keyword">if</span> strcmpi(reactionType,<span class="string">'both'</span>) || strcmpi(reactionType,<span class="string">'out'</span>)
-0030         [~, I]=find(model.S(model.unconstrained~=0,:)&gt;0);
-0031         hasNoProducts(I)=true;
-0032     <span class="keyword">end</span>
-0033     <span class="keyword">if</span> strcmpi(reactionType,<span class="string">'both'</span>) || strcmpi(reactionType,<span class="string">'in'</span>)
-0034         [~, I]=find(model.S(model.unconstrained~=0,:)&lt;0);
-0035         hasNoReactants(I)=true;
-0036     <span class="keyword">end</span>
-0037 <span class="keyword">else</span>
-0038     <span class="keyword">if</span> strcmpi(reactionType,<span class="string">'both'</span>) || strcmpi(reactionType,<span class="string">'out'</span>)
-0039         hasNoProducts=sum((model.S&gt;0))==0;
-0040     <span class="keyword">end</span>
-0041     <span class="keyword">if</span> strcmpi(reactionType,<span class="string">'both'</span>) || strcmpi(reactionType,<span class="string">'in'</span>)
-0042         hasNoReactants=sum((model.S&lt;0))==0;
-0043     <span class="keyword">end</span>
-0044 <span class="keyword">end</span>
-0045 exchangeRxnsIndexes=find(hasNoProducts(:) | hasNoReactants(:));
-0046 exchangeRxns=model.rxns(exchangeRxnsIndexes);
-0047 <span class="keyword">end</span></pre></div>
+0003 <span class="comment">%   Retrieves the exchange reactions from a model. Exchange reactions are</span>
+0004 <span class="comment">%   identified by having either no substrates or products.</span>
+0005 <span class="comment">%</span>
+0006 <span class="comment">% Input:</span>
+0007 <span class="comment">%   model               a model structure</span>
+0008 <span class="comment">%   reactionType        which exchange reactions should be returned</span>
+0009 <span class="comment">%                       'all'     all reactions, irrespective of reaction</span>
+0010 <span class="comment">%                                 bounds</span>
+0011 <span class="comment">%                       'uptake'  reactions with bounds that imply that</span>
+0012 <span class="comment">%                                 only uptake is allowed. Reaction</span>
+0013 <span class="comment">%                                 direction, upper and lower bounds are</span>
+0014 <span class="comment">%                                 all considered</span>
+0015 <span class="comment">%                       'excrete' reactions with bounds that imply that</span>
+0016 <span class="comment">%                                 only excretion is allowed. Reaction</span>
+0017 <span class="comment">%                                 direction, upper and lower bounds are</span>
+0018 <span class="comment">%                                 all considered</span>
+0019 <span class="comment">%                       'reverse' reactions with non-zero upper and lower</span>
+0020 <span class="comment">%                                 bounds that imply that both uptake and</span>
+0021 <span class="comment">%                                 excretion are allowed</span>
+0022 <span class="comment">%                       'blocked' reactions that have zero upper and lower</span>
+0023 <span class="comment">%                                 bounds, not allowing any flux</span>
+0024 <span class="comment">%                       'in'      reactions where the boundary metabolite</span>
+0025 <span class="comment">%                                 is the substrate of the reaction, a</span>
+0026 <span class="comment">%                                 positive flux value would imply uptake,</span>
+0027 <span class="comment">%                                 but reaction bounds are not considered</span>
+0028 <span class="comment">%                       'out'     reactions where the boundary metabolite</span>
+0029 <span class="comment">%                                 is the product of the reaction, a</span>
+0030 <span class="comment">%                                 positive flux value would imply excretion,</span>
+0031 <span class="comment">%                                 but reaction bounds are not considered.</span>
+0032 <span class="comment">%</span>
+0033 <span class="comment">% Output:</span>
+0034 <span class="comment">%   exchangeRxns        cell array with the IDs of the exchange reactions</span>
+0035 <span class="comment">%   exchangeRxnsIndexes vector with the indexes of the exchange reactions</span>
+0036 <span class="comment">%</span>
+0037 <span class="comment">% Note:</span>
+0038 <span class="comment">%   The union of 'in' and 'out' equals 'all'. Also, the union of 'uptake',</span>
+0039 <span class="comment">%   'excrete', 'reverse' and 'blocked' equals 'all'.</span>
+0040 <span class="comment">%</span>
+0041 <span class="comment">% Usage: [exchangeRxns,exchangeRxnsIndexes]=getExchangeRxns(model,reactionType)</span>
+0042 
+0043 <span class="keyword">if</span> nargin&lt;2
+0044     reactionType=<span class="string">'all'</span>;
+0045 <span class="keyword">else</span>
+0046     reactionType=char(reactionType);
+0047 <span class="keyword">end</span>
+0048 
+0049 <span class="comment">% Find exchange reactions</span>
+0050 <span class="keyword">if</span> isfield(model, <span class="string">'unconstrained'</span>)
+0051     [~, I]=find(model.S(model.unconstrained~=0,:)&gt;0);
+0052     hasNoProd(I)=true;
+0053     [~, I]=find(model.S(model.unconstrained~=0,:)&lt;0);
+0054     hasNoSubs(I)=true;
+0055 <span class="keyword">else</span>
+0056     hasNoProd = transpose(find(sum(model.S&gt;0)==0));
+0057     hasNoSubs = transpose(find(sum(model.S&lt;0)==0));
+0058 <span class="keyword">end</span>
+0059 allExch   = [hasNoProd; hasNoSubs];
+0060 
+0061 <span class="keyword">switch</span> reactionType
+0062     <span class="keyword">case</span> {<span class="string">'both'</span>,<span class="string">'all'</span>} <span class="comment">% For legacy reasons, 'both' is also allowed</span>
+0063         exchangeRxnsIndexes = allExch;
+0064     <span class="keyword">case</span> <span class="string">'in'</span>
+0065         exchangeRxnsIndexes = hasNoSubs;
+0066     <span class="keyword">case</span> <span class="string">'out'</span>
+0067         exchangeRxnsIndexes = hasNoProd;
+0068     <span class="keyword">case</span> <span class="string">'blocked'</span>
+0069         exchangeRxnsIndexes = allExch(model.lb(allExch) == 0 &amp; model.ub(allExch) == 0);
+0070     <span class="keyword">case</span> <span class="string">'reverse'</span>
+0071         exchangeRxnsIndexes = allExch(model.lb(allExch) &lt; 0 &amp; model.ub(allExch) &gt; 0);
+0072     <span class="keyword">case</span> <span class="string">'uptake'</span>
+0073         exchangeRxnsIndexes = allExch([(model.lb(hasNoSubs) &gt;= 0 &amp; model.ub(hasNoSubs) &gt; 0); <span class="keyword">...</span>
+0074                               (model.lb(hasNoProd) &lt; 0 &amp; model.ub(hasNoProd) &lt;= 0)]);
+0075     <span class="keyword">case</span> <span class="string">'excrete'</span>
+0076         exchangeRxnsIndexes = allExch([(model.lb(hasNoSubs) &lt; 0 &amp; model.ub(hasNoSubs) &lt;= 0); <span class="keyword">...</span>
+0077                               (model.lb(hasNoProd) &gt;= 0 &amp; model.ub(hasNoProd) &gt; 0)]);
+0078     <span class="keyword">otherwise</span>
+0079         error(<span class="string">'Invalid reactionType specified'</span>)
+0080 <span class="keyword">end</span>
+0081 exchangeRxns = model.rxns(exchangeRxnsIndexes);
+0082 <span class="keyword">end</span></pre></div>
 <hr><address>Generated by <strong><a href="http://www.artefact.tk/software/matlab/m2html/" title="Matlab Documentation in HTML">m2html</a></strong> &copy; 2005</address>
 </body>
 </html>
\ No newline at end of file
diff --git a/doc/external/kegg/getKEGGModelForOrganism.html b/doc/external/kegg/getKEGGModelForOrganism.html
index 7010b5eb..e5ec6a91 100644
--- a/doc/external/kegg/getKEGGModelForOrganism.html
+++ b/doc/external/kegg/getKEGGModelForOrganism.html
@@ -63,15 +63,12 @@ <h2><a name="_description"></a>DESCRIPTION <a href="#_top"><img alt="^" border="
                            The hidden Markov models as generated in 2b or
                            downloaded from BioMet Toolbox (see below)
                        The final directory in dataDir should be styled as
-                       proXXX_keggYY or eukXXX_keggYY, indicating whether
+                       prok90_kegg105 or euk90_kegg105, indicating whether
                        the HMMs were trained on pro- or eukaryotic
-                       sequences, using a sequence similarity threshold of
-                       XXX %, fitting the KEGG version YY. E.g.
-                       euk90_kegg105. (optional, see note about fastaFile. Note
-                       that in order to rebuild the KEGG model from a
-                       database dump, as opposed to using the version
-                       supplied with RAVEN, you would still need to supply
-                       this)
+                       sequences; using which sequence similarity threshold
+                       (first set of digits); using which KEGG version
+                       (second set of digits). (this parameter should
+                       ALWAYS be provided)
    outDir              directory to save the results from the quering of
                        the hidden Markov models. The output is specific
                        for the input sequences and the settings used. It
@@ -325,1013 +322,1010 @@ <h2><a name="_source"></a>SOURCE CODE <a href="#_top"><img alt="^" border="0" sr
 0038 <span class="comment">%                           The hidden Markov models as generated in 2b or</span>
 0039 <span class="comment">%                           downloaded from BioMet Toolbox (see below)</span>
 0040 <span class="comment">%                       The final directory in dataDir should be styled as</span>
-0041 <span class="comment">%                       proXXX_keggYY or eukXXX_keggYY, indicating whether</span>
+0041 <span class="comment">%                       prok90_kegg105 or euk90_kegg105, indicating whether</span>
 0042 <span class="comment">%                       the HMMs were trained on pro- or eukaryotic</span>
-0043 <span class="comment">%                       sequences, using a sequence similarity threshold of</span>
-0044 <span class="comment">%                       XXX %, fitting the KEGG version YY. E.g.</span>
-0045 <span class="comment">%                       euk90_kegg105. (optional, see note about fastaFile. Note</span>
-0046 <span class="comment">%                       that in order to rebuild the KEGG model from a</span>
-0047 <span class="comment">%                       database dump, as opposed to using the version</span>
-0048 <span class="comment">%                       supplied with RAVEN, you would still need to supply</span>
-0049 <span class="comment">%                       this)</span>
-0050 <span class="comment">%   outDir              directory to save the results from the quering of</span>
-0051 <span class="comment">%                       the hidden Markov models. The output is specific</span>
-0052 <span class="comment">%                       for the input sequences and the settings used. It</span>
-0053 <span class="comment">%                       is stored in this manner so that the function can</span>
-0054 <span class="comment">%                       continue if interrupted or if it should run in</span>
-0055 <span class="comment">%                       parallel. Be careful not to leave output files from</span>
-0056 <span class="comment">%                       different organisms or runs with different settings</span>
-0057 <span class="comment">%                       in the same folder. They will not be overwritten</span>
-0058 <span class="comment">%                       (optional, default is a temporary dir where all *.out</span>
-0059 <span class="comment">%                       files are deleted before and after doing the</span>
-0060 <span class="comment">%                       reconstruction)</span>
-0061 <span class="comment">%   keepSpontaneous     include reactions labeled as &quot;spontaneous&quot;. (optional,</span>
-0062 <span class="comment">%                       default true)</span>
-0063 <span class="comment">%   keepUndefinedStoich    include reactions in the form n A &lt;=&gt; n+1 A. These</span>
-0064 <span class="comment">%                       will be dealt with as two separate metabolites</span>
-0065 <span class="comment">%                       (optional, default true)</span>
-0066 <span class="comment">%   keepIncomplete      include reactions which have been labelled as</span>
-0067 <span class="comment">%                       &quot;incomplete&quot;, &quot;erroneous&quot; or &quot;unclear&quot; (optional,</span>
-0068 <span class="comment">%                       default true)</span>
-0069 <span class="comment">%   keepGeneral         include reactions which have been labelled as</span>
-0070 <span class="comment">%                       &quot;general reaction&quot;. These are reactions on the form</span>
-0071 <span class="comment">%                       &quot;an aldehyde &lt;=&gt; an alcohol&quot;, and are therefore</span>
-0072 <span class="comment">%                       unsuited for modelling purposes. Note that not all</span>
-0073 <span class="comment">%                       reactions have this type of annotation, and the</span>
-0074 <span class="comment">%                       script will therefore not be able to remove all</span>
-0075 <span class="comment">%                       such reactions (optional, default false)</span>
-0076 <span class="comment">%   cutOff              significance score from HMMer needed to assign</span>
-0077 <span class="comment">%                       genes to a KO (optional, default 10^-50)</span>
-0078 <span class="comment">%   minScoreRatioG      a gene is only assigned to KOs for which the score</span>
-0079 <span class="comment">%                       is &gt;=log(score)/log(best score) for that gene. This</span>
-0080 <span class="comment">%                       is to prevent that a gene which clearly belongs to</span>
-0081 <span class="comment">%                       one KO is assigned also to KOs with much lower</span>
-0082 <span class="comment">%                       scores (optional, default 0.8 (lower is less strict))</span>
-0083 <span class="comment">%   minScoreRatioKO     ignore genes in a KO if their score is</span>
-0084 <span class="comment">%                       &lt;log(score)/log(best score in KO). This is to</span>
-0085 <span class="comment">%                       &quot;prune&quot; KOs which have many genes and where some are</span>
-0086 <span class="comment">%                       clearly a better fit (optional, default 0.3 (lower is</span>
-0087 <span class="comment">%                       less strict))</span>
-0088 <span class="comment">%   maxPhylDist         -1: only use sequences from the same domain</span>
-0089 <span class="comment">%                       (Prokaryota, Eukaryota)</span>
-0090 <span class="comment">%                       other (positive) value: only use sequences for</span>
-0091 <span class="comment">%                       organisms where the phylogenetic distance is at the</span>
-0092 <span class="comment">%                       most this large (as calculated in getPhylDist)</span>
-0093 <span class="comment">%                       (optional, default Inf, which means that all sequences</span>
-0094 <span class="comment">%                       will be used)</span>
-0095 <span class="comment">%   nSequences          for each KO, use up to this many sequences from the</span>
-0096 <span class="comment">%                       most closely related species. This is mainly to</span>
-0097 <span class="comment">%                       speed up the alignment process for KOs with very</span>
-0098 <span class="comment">%                       many genes. This subsampling is performed before</span>
-0099 <span class="comment">%                       running CD-HIT (optional, default inf)</span>
-0100 <span class="comment">%   seqIdentity         sequence identity threshold in CD-HIT, referred as</span>
-0101 <span class="comment">%                       &quot;global sequence identity&quot; in CD-HIT User's Guide.</span>
-0102 <span class="comment">%                       If -1 is provided, CD-HIT is skipped (optional, default 0.9)</span>
-0103 <span class="comment">%   globalModel         structure containing both model and KOModel</span>
-0104 <span class="comment">%                       structures as generated by getModelFromKEGG. These</span>
-0105 <span class="comment">%                       will otherwise be loaded by via getModelFromKEGG.</span>
-0106 <span class="comment">%                       Providing globalKEGGmodel can speed up model</span>
-0107 <span class="comment">%                       generation if getKEGGModelForOrganism is run</span>
-0108 <span class="comment">%                       multiple times for different strains. Example:</span>
-0109 <span class="comment">%                       [globalModel.model,globalModel.KOModel] = getModelFromKEGG;</span>
-0110 <span class="comment">%                       (optional, default empty, global model is loaded by</span>
-0111 <span class="comment">%                       getModelFromKEGG)</span>
+0043 <span class="comment">%                       sequences; using which sequence similarity threshold</span>
+0044 <span class="comment">%                       (first set of digits); using which KEGG version</span>
+0045 <span class="comment">%                       (second set of digits). (this parameter should</span>
+0046 <span class="comment">%                       ALWAYS be provided)</span>
+0047 <span class="comment">%   outDir              directory to save the results from the quering of</span>
+0048 <span class="comment">%                       the hidden Markov models. The output is specific</span>
+0049 <span class="comment">%                       for the input sequences and the settings used. It</span>
+0050 <span class="comment">%                       is stored in this manner so that the function can</span>
+0051 <span class="comment">%                       continue if interrupted or if it should run in</span>
+0052 <span class="comment">%                       parallel. Be careful not to leave output files from</span>
+0053 <span class="comment">%                       different organisms or runs with different settings</span>
+0054 <span class="comment">%                       in the same folder. They will not be overwritten</span>
+0055 <span class="comment">%                       (optional, default is a temporary dir where all *.out</span>
+0056 <span class="comment">%                       files are deleted before and after doing the</span>
+0057 <span class="comment">%                       reconstruction)</span>
+0058 <span class="comment">%   keepSpontaneous     include reactions labeled as &quot;spontaneous&quot;. (optional,</span>
+0059 <span class="comment">%                       default true)</span>
+0060 <span class="comment">%   keepUndefinedStoich    include reactions in the form n A &lt;=&gt; n+1 A. These</span>
+0061 <span class="comment">%                       will be dealt with as two separate metabolites</span>
+0062 <span class="comment">%                       (optional, default true)</span>
+0063 <span class="comment">%   keepIncomplete      include reactions which have been labelled as</span>
+0064 <span class="comment">%                       &quot;incomplete&quot;, &quot;erroneous&quot; or &quot;unclear&quot; (optional,</span>
+0065 <span class="comment">%                       default true)</span>
+0066 <span class="comment">%   keepGeneral         include reactions which have been labelled as</span>
+0067 <span class="comment">%                       &quot;general reaction&quot;. These are reactions on the form</span>
+0068 <span class="comment">%                       &quot;an aldehyde &lt;=&gt; an alcohol&quot;, and are therefore</span>
+0069 <span class="comment">%                       unsuited for modelling purposes. Note that not all</span>
+0070 <span class="comment">%                       reactions have this type of annotation, and the</span>
+0071 <span class="comment">%                       script will therefore not be able to remove all</span>
+0072 <span class="comment">%                       such reactions (optional, default false)</span>
+0073 <span class="comment">%   cutOff              significance score from HMMer needed to assign</span>
+0074 <span class="comment">%                       genes to a KO (optional, default 10^-50)</span>
+0075 <span class="comment">%   minScoreRatioG      a gene is only assigned to KOs for which the score</span>
+0076 <span class="comment">%                       is &gt;=log(score)/log(best score) for that gene. This</span>
+0077 <span class="comment">%                       is to prevent that a gene which clearly belongs to</span>
+0078 <span class="comment">%                       one KO is assigned also to KOs with much lower</span>
+0079 <span class="comment">%                       scores (optional, default 0.8 (lower is less strict))</span>
+0080 <span class="comment">%   minScoreRatioKO     ignore genes in a KO if their score is</span>
+0081 <span class="comment">%                       &lt;log(score)/log(best score in KO). This is to</span>
+0082 <span class="comment">%                       &quot;prune&quot; KOs which have many genes and where some are</span>
+0083 <span class="comment">%                       clearly a better fit (optional, default 0.3 (lower is</span>
+0084 <span class="comment">%                       less strict))</span>
+0085 <span class="comment">%   maxPhylDist         -1: only use sequences from the same domain</span>
+0086 <span class="comment">%                       (Prokaryota, Eukaryota)</span>
+0087 <span class="comment">%                       other (positive) value: only use sequences for</span>
+0088 <span class="comment">%                       organisms where the phylogenetic distance is at the</span>
+0089 <span class="comment">%                       most this large (as calculated in getPhylDist)</span>
+0090 <span class="comment">%                       (optional, default Inf, which means that all sequences</span>
+0091 <span class="comment">%                       will be used)</span>
+0092 <span class="comment">%   nSequences          for each KO, use up to this many sequences from the</span>
+0093 <span class="comment">%                       most closely related species. This is mainly to</span>
+0094 <span class="comment">%                       speed up the alignment process for KOs with very</span>
+0095 <span class="comment">%                       many genes. This subsampling is performed before</span>
+0096 <span class="comment">%                       running CD-HIT (optional, default inf)</span>
+0097 <span class="comment">%   seqIdentity         sequence identity threshold in CD-HIT, referred as</span>
+0098 <span class="comment">%                       &quot;global sequence identity&quot; in CD-HIT User's Guide.</span>
+0099 <span class="comment">%                       If -1 is provided, CD-HIT is skipped (optional, default 0.9)</span>
+0100 <span class="comment">%   globalModel         structure containing both model and KOModel</span>
+0101 <span class="comment">%                       structures as generated by getModelFromKEGG. These</span>
+0102 <span class="comment">%                       will otherwise be loaded by via getModelFromKEGG.</span>
+0103 <span class="comment">%                       Providing globalKEGGmodel can speed up model</span>
+0104 <span class="comment">%                       generation if getKEGGModelForOrganism is run</span>
+0105 <span class="comment">%                       multiple times for different strains. Example:</span>
+0106 <span class="comment">%                       [globalModel.model,globalModel.KOModel] = getModelFromKEGG;</span>
+0107 <span class="comment">%                       (optional, default empty, global model is loaded by</span>
+0108 <span class="comment">%                       getModelFromKEGG)</span>
+0109 <span class="comment">%</span>
+0110 <span class="comment">%   Output:</span>
+0111 <span class="comment">%   model               the reconstructed model</span>
 0112 <span class="comment">%</span>
-0113 <span class="comment">%   Output:</span>
-0114 <span class="comment">%   model               the reconstructed model</span>
-0115 <span class="comment">%</span>
-0116 <span class="comment">%   PLEASE READ THIS: The input to this function can be confusing, because</span>
-0117 <span class="comment">%   it is intended to be run in parallel on a cluster or in multiple</span>
-0118 <span class="comment">%   sessions. It therefore saves a lot of intermediate results to storage.</span>
-0119 <span class="comment">%   This also serves the purpose of not having to do redundant</span>
-0120 <span class="comment">%   calculations. This, however, comes with the disadvantage of somewhat</span>
-0121 <span class="comment">%   trickier handling. This is what this function does:</span>
-0122 <span class="comment">%</span>
-0123 <span class="comment">%   1a. Loads files from a local KEGG FTP dump and constructs a general</span>
-0124 <span class="comment">%       RAVEN model representing the metabolic network. The functions</span>
-0125 <span class="comment">%       getRxnsFromKEGG, getGenesFromKEGG, getMetsFromKEGG summarise the</span>
-0126 <span class="comment">%       data into 'keggRxns.mat', 'keggGenes.mat' and 'keggMets.mat' files,</span>
-0127 <span class="comment">%       which are later merged into 'keggModel.mat' by getModelFromKEGG</span>
-0128 <span class="comment">%       function. The function getPhylDist generates 'keggPhylDist.mat'</span>
-0129 <span class="comment">%       file. KEGG FTP access requires a &lt;a href=&quot;matlab:</span>
-0130 <span class="comment">%       web('http://www.bioinformatics.jp/en/keggftp.html')&quot;&gt;license&lt;/a&gt;.</span>
-0131 <span class="comment">%   1b. Generates protein FASTA files from the KEGG FTP dump (see 1a). One</span>
-0132 <span class="comment">%       multi-FASTA file for each KO in KEGG is generated.</span>
-0133 <span class="comment">%</span>
-0134 <span class="comment">%   The Step 1 has to be re-done every time KEGG updates their database (or</span>
-0135 <span class="comment">%   rather when the updates are large enough to warrant re-running this</span>
-0136 <span class="comment">%   part). Many users would probably never use this feature.</span>
-0137 <span class="comment">%</span>
-0138 <span class="comment">%   2a. Filters KO-specific protein sets. This is done by using the</span>
-0139 <span class="comment">%       settings &quot;maxPhylDist&quot; and &quot;nSequences&quot; to control which sequences</span>
-0140 <span class="comment">%       should be used for constructing Hidden Markov models (HMMs), and</span>
-0141 <span class="comment">%       later for matching your sequences to.</span>
-0142 <span class="comment">%       The most common alternatives here would be to use sequences from</span>
-0143 <span class="comment">%       only eukaryotes, only prokaryotes or all sequences in KEGG, but you</span>
-0144 <span class="comment">%       could also play around with the parameters to use e.g. only fungal</span>
-0145 <span class="comment">%       sequences.</span>
-0146 <span class="comment">%   2b. KO-specific protein FASTA files are re-organised into</span>
-0147 <span class="comment">%       non-redundant protein sets with CD-HIT. The user can only set</span>
-0148 <span class="comment">%       seqIdentity parameter, which corresponds to '-c' parameter in</span>
-0149 <span class="comment">%       CD-HIT, described as &quot;sequence identity threshold&quot;. CD-HIT suggsted</span>
-0150 <span class="comment">%       sequence identity specific word_length (-n) parameters are used.</span>
-0151 <span class="comment">%   2c. Does a multi sequence alignment for multi-FASTA files obtained in</span>
-0152 <span class="comment">%       Step 2b for future use. MAFFT software with automatic selection of</span>
-0153 <span class="comment">%       alignment algorithm is used in this step ('--auto').</span>
-0154 <span class="comment">%   2d. Trains hidden Markov models using HMMer for each of the aligned</span>
-0155 <span class="comment">%       KO-specific FASTA files obtained in Step 2c. This is performed with</span>
-0156 <span class="comment">%       'hmmbuild' using the default settings.</span>
-0157 <span class="comment">%</span>
-0158 <span class="comment">%   Step 2 may be reasonable to be re-done if the user wants to tweak the</span>
-0159 <span class="comment">%   settings in proteins filtering, clustering, multi sequence alignment or</span>
-0160 <span class="comment">%   HMMs training steps. However, it requires to have KO-specific protein</span>
-0161 <span class="comment">%   FASTA files obtained in Step 1a. As such files are not provided in</span>
-0162 <span class="comment">%   RAVEN and BioMet ToolBox, the user can only generate these files from</span>
-0163 <span class="comment">%   KEGG FTP dump files, so KEGG FTP license is needed.</span>
-0164 <span class="comment">%</span>
-0165 <span class="comment">%   3a. Queries the HMMs with sequences for the organism you are making a</span>
-0166 <span class="comment">%       model for. This step uses both the output from step 1a and from 2d.</span>
-0167 <span class="comment">%       This is done with 'hmmsearch' function under default settings. The</span>
-0168 <span class="comment">%       significance threshold value set in 'cutOff' parameter is used</span>
-0169 <span class="comment">%       later when parsing '*.out' files to filter out KO hits with higher</span>
-0170 <span class="comment">%       value than 'cutOff' value. The results with passable E values are</span>
-0171 <span class="comment">%       summarised into KO-gene occurence matrix with E values in</span>
-0172 <span class="comment">%       intersections as 'koGeneMat'. The parameters 'minScoreRatioG' and</span>
-0173 <span class="comment">%       'minScoreRatioKO' are then applied to 'prune' KO-gene associations</span>
-0174 <span class="comment">%       (see the function descriptions above for more details). The</span>
-0175 <span class="comment">%       intersection values for these 'prunable' associations are converted</span>
-0176 <span class="comment">%       to zeroes.</span>
-0177 <span class="comment">%   3b. Constructs a model based on the pre-processed KO-gene association</span>
-0178 <span class="comment">%       matrix (koGeneMat). As the full KEGG model already has reaction-KO</span>
-0179 <span class="comment">%       relationships, KOs are converted into the query genes. The final</span>
-0180 <span class="comment">%       draft model contains only these reactions, which are associated</span>
-0181 <span class="comment">%       with KOs from koGeneMat. The reactions without the genes may also</span>
-0182 <span class="comment">%       be included, if the user set keepSpontaneous as 'true'.</span>
+0113 <span class="comment">%   PLEASE READ THIS: The input to this function can be confusing, because</span>
+0114 <span class="comment">%   it is intended to be run in parallel on a cluster or in multiple</span>
+0115 <span class="comment">%   sessions. It therefore saves a lot of intermediate results to storage.</span>
+0116 <span class="comment">%   This also serves the purpose of not having to do redundant</span>
+0117 <span class="comment">%   calculations. This, however, comes with the disadvantage of somewhat</span>
+0118 <span class="comment">%   trickier handling. This is what this function does:</span>
+0119 <span class="comment">%</span>
+0120 <span class="comment">%   1a. Loads files from a local KEGG FTP dump and constructs a general</span>
+0121 <span class="comment">%       RAVEN model representing the metabolic network. The functions</span>
+0122 <span class="comment">%       getRxnsFromKEGG, getGenesFromKEGG, getMetsFromKEGG summarise the</span>
+0123 <span class="comment">%       data into 'keggRxns.mat', 'keggGenes.mat' and 'keggMets.mat' files,</span>
+0124 <span class="comment">%       which are later merged into 'keggModel.mat' by getModelFromKEGG</span>
+0125 <span class="comment">%       function. The function getPhylDist generates 'keggPhylDist.mat'</span>
+0126 <span class="comment">%       file. KEGG FTP access requires a &lt;a href=&quot;matlab:</span>
+0127 <span class="comment">%       web('http://www.bioinformatics.jp/en/keggftp.html')&quot;&gt;license&lt;/a&gt;.</span>
+0128 <span class="comment">%   1b. Generates protein FASTA files from the KEGG FTP dump (see 1a). One</span>
+0129 <span class="comment">%       multi-FASTA file for each KO in KEGG is generated.</span>
+0130 <span class="comment">%</span>
+0131 <span class="comment">%   The Step 1 has to be re-done every time KEGG updates their database (or</span>
+0132 <span class="comment">%   rather when the updates are large enough to warrant re-running this</span>
+0133 <span class="comment">%   part). Many users would probably never use this feature.</span>
+0134 <span class="comment">%</span>
+0135 <span class="comment">%   2a. Filters KO-specific protein sets. This is done by using the</span>
+0136 <span class="comment">%       settings &quot;maxPhylDist&quot; and &quot;nSequences&quot; to control which sequences</span>
+0137 <span class="comment">%       should be used for constructing Hidden Markov models (HMMs), and</span>
+0138 <span class="comment">%       later for matching your sequences to.</span>
+0139 <span class="comment">%       The most common alternatives here would be to use sequences from</span>
+0140 <span class="comment">%       only eukaryotes, only prokaryotes or all sequences in KEGG, but you</span>
+0141 <span class="comment">%       could also play around with the parameters to use e.g. only fungal</span>
+0142 <span class="comment">%       sequences.</span>
+0143 <span class="comment">%   2b. KO-specific protein FASTA files are re-organised into</span>
+0144 <span class="comment">%       non-redundant protein sets with CD-HIT. The user can only set</span>
+0145 <span class="comment">%       seqIdentity parameter, which corresponds to '-c' parameter in</span>
+0146 <span class="comment">%       CD-HIT, described as &quot;sequence identity threshold&quot;. CD-HIT suggested</span>
+0147 <span class="comment">%       sequence identity specific word_length (-n) parameters are used.</span>
+0148 <span class="comment">%   2c. Does a multi sequence alignment for multi-FASTA files obtained in</span>
+0149 <span class="comment">%       Step 2b for future use. MAFFT software with automatic selection of</span>
+0150 <span class="comment">%       alignment algorithm is used in this step ('--auto').</span>
+0151 <span class="comment">%   2d. Trains hidden Markov models using HMMer for each of the aligned</span>
+0152 <span class="comment">%       KO-specific FASTA files obtained in Step 2c. This is performed with</span>
+0153 <span class="comment">%       'hmmbuild' using the default settings.</span>
+0154 <span class="comment">%</span>
+0155 <span class="comment">%   Step 2 may be reasonable to be re-done if the user wants to tweak the</span>
+0156 <span class="comment">%   settings in proteins filtering, clustering, multi sequence alignment or</span>
+0157 <span class="comment">%   HMMs training steps. However, it requires to have KO-specific protein</span>
+0158 <span class="comment">%   FASTA files obtained in Step 1b. As such files are not provided in</span>
+0159 <span class="comment">%   RAVEN and BioMet ToolBox, the user can only generate these files from</span>
+0160 <span class="comment">%   KEGG FTP dump files, so KEGG FTP license is needed.</span>
+0161 <span class="comment">%</span>
+0162 <span class="comment">%   3a. Queries the HMMs with sequences for the organism you are making a</span>
+0163 <span class="comment">%       model for. This step uses both the output from step 1a and from 2d.</span>
+0164 <span class="comment">%       This is done with 'hmmsearch' function under default settings. The</span>
+0165 <span class="comment">%       significance threshold value set in 'cutOff' parameter is used</span>
+0166 <span class="comment">%       later when parsing '*.out' files to filter out KO hits with higher</span>
+0167 <span class="comment">%       value than 'cutOff' value. The results with passable E values are</span>
+0168 <span class="comment">%       summarised into KO-gene occurrence matrix with E values in</span>
+0169 <span class="comment">%       intersections as 'koGeneMat'. The parameters 'minScoreRatioG' and</span>
+0170 <span class="comment">%       'minScoreRatioKO' are then applied to 'prune' KO-gene associations</span>
+0171 <span class="comment">%       (see the function descriptions above for more details). The</span>
+0172 <span class="comment">%       intersection values for these 'prunable' associations are converted</span>
+0173 <span class="comment">%       to zeroes.</span>
+0174 <span class="comment">%   3b. Constructs a model based on the pre-processed KO-gene association</span>
+0175 <span class="comment">%       matrix (koGeneMat). As the full KEGG model already has reaction-KO</span>
+0176 <span class="comment">%       relationships, KOs are converted into the query genes. The final</span>
+0177 <span class="comment">%       draft model contains only these reactions, which are associated</span>
+0178 <span class="comment">%       with KOs from koGeneMat. The reactions without the genes may also</span>
+0179 <span class="comment">%       be included, if the user set keepSpontaneous as 'true'.</span>
+0180 <span class="comment">%</span>
+0181 <span class="comment">%   The Step 3 is specific to the organism for which the model is</span>
+0182 <span class="comment">%   reconstructed.</span>
 0183 <span class="comment">%</span>
-0184 <span class="comment">%   The Step 3 is specific to the organism for which the model is</span>
-0185 <span class="comment">%   reconstructed.</span>
-0186 <span class="comment">%</span>
-0187 <span class="comment">%   In principle the function looks at which output that is already available</span>
-0188 <span class="comment">%   and runs only the parts that are required for step 3. This means</span>
-0189 <span class="comment">%   that (see the definition of the parameters for details):</span>
-0190 <span class="comment">%   -1a is only performed if there are no KEGG model files in the</span>
-0191 <span class="comment">%   RAVEN\external\kegg directory</span>
-0192 <span class="comment">%   -1b is only performed if not all required HMMs OR aligned FASTA files</span>
-0193 <span class="comment">%   OR multi-FASTA files exist in the defined dataDir. This means that this</span>
-0194 <span class="comment">%   step is skipped if the HMMs are downloaded from BioMet Toolbox instead</span>
-0195 <span class="comment">%   (see above). If not all files exist it will try to find</span>
-0196 <span class="comment">%   the KEGG database files in dataDir.</span>
-0197 <span class="comment">%   -2a is only performed if not all required HMMs OR aligned FASTA files</span>
-0198 <span class="comment">%   files exist in the defined dataDir. This means that this step is skipped</span>
-0199 <span class="comment">%   if the HMMs are downloaded from BioMet Toolbox instead (see above).</span>
-0200 <span class="comment">%   -2b is only performed if not all required HMMs exist in the defined</span>
-0201 <span class="comment">%   dataDir. This means that this step is skipped if the FASTA files or</span>
-0202 <span class="comment">%   HMMs are downloaded from BioMet Toolbox instead (see above).</span>
-0203 <span class="comment">%   -3a is performed for the required HMMs for which no corresponding .out</span>
-0204 <span class="comment">%   file exists in outDir. This is just a way to enable the function to be</span>
-0205 <span class="comment">%   run in parallel or to resume if interrupted.</span>
-0206 <span class="comment">%   -3b is always performed.</span>
+0184 <span class="comment">%   In principle the function looks at which output is already available</span>
+0185 <span class="comment">%   and runs only the parts that are required for step 3. This means</span>
+0186 <span class="comment">%   that (see the definition of the parameters for details):</span>
+0187 <span class="comment">%   -1a is only performed if there are no KEGG model files in the</span>
+0188 <span class="comment">%   RAVEN\external\kegg directory</span>
+0189 <span class="comment">%   -1b is only performed if not all required HMMs OR aligned FASTA files</span>
+0190 <span class="comment">%   OR multi-FASTA files exist in the defined dataDir. This means that this</span>
+0191 <span class="comment">%   step is skipped if the HMMs are downloaded from BioMet Toolbox instead</span>
+0192 <span class="comment">%   (see above). If not all files exist it will try to find</span>
+0193 <span class="comment">%   the KEGG database files in dataDir.</span>
+0194 <span class="comment">%   -2a is only performed if not all required HMMs OR aligned FASTA files</span>
+0195 <span class="comment">%   exist in the defined dataDir. This means that this step is skipped</span>
+0196 <span class="comment">%   if the HMMs are downloaded from BioMet Toolbox instead (see above).</span>
+0197 <span class="comment">%   -2b is only performed if not all required HMMs exist in the defined</span>
+0198 <span class="comment">%   dataDir. This means that this step is skipped if the FASTA files or</span>
+0199 <span class="comment">%   HMMs are downloaded from BioMet Toolbox instead (see above).</span>
+0200 <span class="comment">%   -3a is performed for the required HMMs for which no corresponding .out</span>
+0201 <span class="comment">%   file exists in outDir. This is just a way to enable the function to be</span>
+0202 <span class="comment">%   run in parallel or to resume if interrupted.</span>
+0203 <span class="comment">%   -3b is always performed.</span>
+0204 <span class="comment">%</span>
+0205 <span class="comment">%   These steps are specific to the organism for which you are</span>
+0206 <span class="comment">%   reconstructing the model.</span>
 0207 <span class="comment">%</span>
-0208 <span class="comment">%   These steps are specific to the organism for which you are</span>
-0209 <span class="comment">%   reconstructing the model.</span>
-0210 <span class="comment">%</span>
-0211 <span class="comment">%   Regarding the whole pipeline, the function checks the output that is</span>
-0212 <span class="comment">%   already available and runs only the parts that are required for step 3.</span>
-0213 <span class="comment">%   This means that (see the definition of the parameters for details):</span>
-0214 <span class="comment">%   -1a is only performed if there are no KEGG model files in the</span>
-0215 <span class="comment">%   RAVEN\external\kegg directory.</span>
-0216 <span class="comment">%   -1b is only performed if any of required KOs do not have HMMs, aligned</span>
-0217 <span class="comment">%   FASTA files, clustered FASTA files and raw FASTA files in the defined</span>
-0218 <span class="comment">%   dataDir. This means that this step is skipped if the HMMs are</span>
-0219 <span class="comment">%   downloaded from BioMet Toolbox instead (see above). If not all files</span>
-0220 <span class="comment">%   exist it will try to find the KEGG database files in dataDir.</span>
-0221 <span class="comment">%   -2ab are only performed if any of required KOs do not have HMMs,</span>
-0222 <span class="comment">%   aligned FASTA files and clustered FASTA files in the defined dataDir.</span>
-0223 <span class="comment">%   This means that this step is skipped if the HMMs are downloaded from</span>
-0224 <span class="comment">%   BioMet Toolbox instead (see above).</span>
-0225 <span class="comment">%   -2c is only performed if any of required KOs do not have HMMs and</span>
-0226 <span class="comment">%   aligned FASTA files in the defined dataDir. This means that this step</span>
-0227 <span class="comment">%   is skipped if the HMMs are downloaded from BioMet Toolbox instead (see</span>
-0228 <span class="comment">%   above).</span>
-0229 <span class="comment">%   -2d is only performed if any of required KOs do not have HMMs exist in</span>
-0230 <span class="comment">%   the defined dataDir. This means that this step is skipped if the FASTA</span>
-0231 <span class="comment">%   files or HMMs are downloaded from BioMet Toolbox instead (see above).</span>
-0232 <span class="comment">%   -3a is performed for the required HMMs for which no corresponding .out</span>
-0233 <span class="comment">%   file exists in outDir. This is just a way to enable the function to be</span>
-0234 <span class="comment">%   run in parallel or to resume if interrupted.</span>
-0235 <span class="comment">%   -3b is always performed.</span>
-0236 <span class="comment">%</span>
-0237 <span class="comment">%   NOTE: it is also possible to obtain draft model from KEGG without</span>
-0238 <span class="comment">%   providing protein FASTA file for the target organism. In such case the</span>
-0239 <span class="comment">%   organism three-four letter abbreviation set as 'organismID' must exist</span>
-0240 <span class="comment">%   in the local KEGG database. In such case, the program just fetches all</span>
-0241 <span class="comment">%   the reactions, which are associated with given 'organismID'.</span>
-0242 <span class="comment">%</span>
-0243 <span class="comment">% Usage: model=getKEGGModelForOrganism(organismID,fastaFile,dataDir,...</span>
-0244 <span class="comment">%    outDir,keepSpontaneous,keepUndefinedStoich,keepIncomplete,...</span>
-0245 <span class="comment">%    keepGeneral,cutOff,minScoreRatioKO,minScoreRatioG,maxPhylDist,...</span>
-0246 <span class="comment">%    nSequences,seqIdentity)</span>
-0247 
-0248 <span class="keyword">if</span> nargin&lt;2 || isempty(fastaFile)
-0249     fastaFile=[];
-0250 <span class="keyword">else</span>
-0251     fastaFile=char(fastaFile);
-0252 <span class="keyword">end</span>
-0253 <span class="keyword">if</span> nargin&lt;3
-0254     dataDir=[];
-0255 <span class="keyword">else</span>
-0256     dataDir=char(dataDir);
-0257 <span class="keyword">end</span>
-0258 <span class="keyword">if</span> nargin&lt;4 || isempty(outDir)
-0259     outDir=tempdir;
-0260     <span class="comment">%Delete all *.out files if any exist</span>
-0261     delete(fullfile(outDir,<span class="string">'*.out'</span>));
-0262 <span class="keyword">else</span>
-0263     outDir=char(outDir);
+0208 <span class="comment">%   Regarding the whole pipeline, the function checks the output that is</span>
+0209 <span class="comment">%   already available and runs only the parts that are required for step 3.</span>
+0210 <span class="comment">%   This means that (see the definition of the parameters for details):</span>
+0211 <span class="comment">%   -1a is only performed if there are no KEGG model files in the</span>
+0212 <span class="comment">%   RAVEN\external\kegg directory.</span>
+0213 <span class="comment">%   -1b is only performed if any of required KOs do not have HMMs, aligned</span>
+0214 <span class="comment">%   FASTA files, clustered FASTA files and raw FASTA files in the defined</span>
+0215 <span class="comment">%   dataDir. This means that this step is skipped if the HMMs are</span>
+0216 <span class="comment">%   downloaded from BioMet Toolbox instead (see above). If not all files</span>
+0217 <span class="comment">%   exist it will try to find the KEGG database files in dataDir.</span>
+0218 <span class="comment">%   -2ab are only performed if any of required KOs do not have HMMs,</span>
+0219 <span class="comment">%   aligned FASTA files and clustered FASTA files in the defined dataDir.</span>
+0220 <span class="comment">%   This means that this step is skipped if the HMMs are downloaded from</span>
+0221 <span class="comment">%   BioMet Toolbox instead (see above).</span>
+0222 <span class="comment">%   -2c is only performed if any of required KOs do not have HMMs and</span>
+0223 <span class="comment">%   aligned FASTA files in the defined dataDir. This means that this step</span>
+0224 <span class="comment">%   is skipped if the HMMs are downloaded from BioMet Toolbox instead (see</span>
+0225 <span class="comment">%   above).</span>
+0226 <span class="comment">%   -2d is only performed if any of required KOs do not have HMMs in</span>
+0227 <span class="comment">%   the defined dataDir. This means that this step is skipped if the FASTA</span>
+0228 <span class="comment">%   files or HMMs are downloaded from BioMet Toolbox instead (see above).</span>
+0229 <span class="comment">%   -3a is performed for the required HMMs for which no corresponding .out</span>
+0230 <span class="comment">%   file exists in outDir. This is just a way to enable the function to be</span>
+0231 <span class="comment">%   run in parallel or to resume if interrupted.</span>
+0232 <span class="comment">%   -3b is always performed.</span>
+0233 <span class="comment">%</span>
+0234 <span class="comment">%   NOTE: it is also possible to obtain draft model from KEGG without</span>
+0235 <span class="comment">%   providing protein FASTA file for the target organism. In such case the</span>
+0236 <span class="comment">%   organism three-four letter abbreviation set as 'organismID' must exist</span>
+0237 <span class="comment">%   in the local KEGG database. In such case, the program just fetches all</span>
+0238 <span class="comment">%   the reactions, which are associated with given 'organismID'.</span>
+0239 <span class="comment">%</span>
+0240 <span class="comment">% Usage: model=getKEGGModelForOrganism(organismID,fastaFile,dataDir,...</span>
+0241 <span class="comment">%    outDir,keepSpontaneous,keepUndefinedStoich,keepIncomplete,...</span>
+0242 <span class="comment">%    keepGeneral,cutOff,minScoreRatioKO,minScoreRatioG,maxPhylDist,...</span>
+0243 <span class="comment">%    nSequences,seqIdentity)</span>
+0244 
+0245 <span class="keyword">if</span> nargin&lt;2 || isempty(fastaFile)
+0246     fastaFile=[];
+0247 <span class="keyword">else</span>
+0248     fastaFile=char(fastaFile);
+0249 <span class="keyword">end</span>
+0250 <span class="keyword">if</span> nargin&lt;3
+0251     dataDir=[];
+0252 <span class="keyword">else</span>
+0253     dataDir=char(dataDir);
+0254 <span class="keyword">end</span>
+0255 <span class="keyword">if</span> nargin&lt;4 || isempty(outDir)
+0256     outDir=tempdir;
+0257     <span class="comment">%Delete all *.out files if any exist</span>
+0258     delete(fullfile(outDir,<span class="string">'*.out'</span>));
+0259 <span class="keyword">else</span>
+0260     outDir=char(outDir);
+0261 <span class="keyword">end</span>
+0262 <span class="keyword">if</span> nargin&lt;5
+0263     keepSpontaneous=true;
 0264 <span class="keyword">end</span>
-0265 <span class="keyword">if</span> nargin&lt;5
-0266     keepSpontaneous=true;
+0265 <span class="keyword">if</span> nargin&lt;6
+0266     keepUndefinedStoich=true;
 0267 <span class="keyword">end</span>
-0268 <span class="keyword">if</span> nargin&lt;6
-0269     keepUndefinedStoich=true;
+0268 <span class="keyword">if</span> nargin&lt;7
+0269     keepIncomplete=true;
 0270 <span class="keyword">end</span>
-0271 <span class="keyword">if</span> nargin&lt;7
-0272     keepIncomplete=true;
+0271 <span class="keyword">if</span> nargin&lt;8
+0272     keepGeneral=false;
 0273 <span class="keyword">end</span>
-0274 <span class="keyword">if</span> nargin&lt;8
-0275     keepGeneral=false;
+0274 <span class="keyword">if</span> nargin&lt;9
+0275     cutOff=10^-50;
 0276 <span class="keyword">end</span>
-0277 <span class="keyword">if</span> nargin&lt;9
-0278     cutOff=10^-50;
+0277 <span class="keyword">if</span> nargin&lt;10
+0278     minScoreRatioKO=0.3;
 0279 <span class="keyword">end</span>
-0280 <span class="keyword">if</span> nargin&lt;10
-0281     minScoreRatioKO=0.3;
+0280 <span class="keyword">if</span> nargin&lt;11
+0281     minScoreRatioG=0.8;
 0282 <span class="keyword">end</span>
-0283 <span class="keyword">if</span> nargin&lt;11
-0284     minScoreRatioG=0.8;
-0285 <span class="keyword">end</span>
-0286 <span class="keyword">if</span> nargin&lt;12
-0287     maxPhylDist=inf;
-0288     <span class="comment">%Include all sequences for each reaction</span>
-0289 <span class="keyword">end</span>
-0290 <span class="keyword">if</span> nargin&lt;13
-0291     nSequences=inf;
-0292     <span class="comment">%Include all sequences for each reaction</span>
+0283 <span class="keyword">if</span> nargin&lt;12
+0284     maxPhylDist=inf;
+0285     <span class="comment">%Include all sequences for each reaction</span>
+0286 <span class="keyword">end</span>
+0287 <span class="keyword">if</span> nargin&lt;13
+0288     nSequences=inf;
+0289     <span class="comment">%Include all sequences for each reaction</span>
+0290 <span class="keyword">end</span>
+0291 <span class="keyword">if</span> nargin&lt;14
+0292     seqIdentity=0.9;
 0293 <span class="keyword">end</span>
-0294 <span class="keyword">if</span> nargin&lt;14
-0295     seqIdentity=0.9;
-0296 <span class="keyword">end</span>
-0297 
-0298 <span class="keyword">if</span> isempty(fastaFile)
-0299     fprintf([<span class="string">'\n*** The model reconstruction from KEGG based on the annotation available for KEGG Species &lt;strong&gt;'</span> organismID <span class="string">'&lt;/strong&gt; ***\n\n'</span>]);
-0300 <span class="keyword">else</span>
-0301     fprintf(<span class="string">'\n*** The model reconstruction from KEGG based on the protein homology search against KEGG Orthology specific HMMs ***\n\n'</span>);
-0302     <span class="comment">%Check if query fasta exists</span>
-0303     fastaFile=checkFileExistence(fastaFile,2); <span class="comment">%Copy file to temp dir</span>
-0304 <span class="keyword">end</span>
-0305 
-0306 <span class="comment">%Run the external binaries multi-threaded to use all logical cores assigned</span>
-0307 <span class="comment">%to MATLAB</span>
-0308 cores = evalc(<span class="string">'feature(''numcores'')'</span>);
-0309 cores = strsplit(cores, <span class="string">'MATLAB was assigned: '</span>);
-0310 cores = regexp(cores{2},<span class="string">'^\d*'</span>,<span class="string">'match'</span>);
-0311 cores = cores{1};
+0294 
+0295 <span class="keyword">if</span> isempty(fastaFile)
+0296     fprintf([<span class="string">'\n*** The model reconstruction from KEGG based on the annotation available for KEGG Species &lt;strong&gt;'</span> organismID <span class="string">'&lt;/strong&gt; ***\n\n'</span>]);
+0297 <span class="keyword">else</span>
+0298     fprintf(<span class="string">'\n*** The model reconstruction from KEGG based on the protein homology search against KEGG Orthology specific HMMs ***\n\n'</span>);
+0299     <span class="comment">%Check if query fasta exists</span>
+0300     fastaFile=checkFileExistence(fastaFile,2); <span class="comment">%Copy file to temp dir</span>
+0301 <span class="keyword">end</span>
+0302 
+0303 <span class="comment">%Run the external binaries multi-threaded to use all logical cores assigned</span>
+0304 <span class="comment">%to MATLAB</span>
+0305 cores = evalc(<span class="string">'feature(''numcores'')'</span>);
+0306 cores = strsplit(cores, <span class="string">'MATLAB was assigned: '</span>);
+0307 cores = regexp(cores{2},<span class="string">'^\d*'</span>,<span class="string">'match'</span>);
+0308 cores = cores{1};
+0309 
+0310 <span class="comment">%Get the directory for RAVEN Toolbox.</span>
+0311 ravenPath=findRAVENroot();
 0312 
-0313 <span class="comment">%Get the directory for RAVEN Toolbox.</span>
-0314 ravenPath=findRAVENroot();
-0315 
-0316 <span class="comment">%Checking if dataDir is consistent. It must point to pre-trained HMMs set,</span>
-0317 <span class="comment">%compatible with the the current RAVEN version. The user may have the</span>
-0318 <span class="comment">%required zip file already in working directory or have it extracted. If</span>
-0319 <span class="comment">%the zip file and directory is not here, it is downloaded from the cloud</span>
-0320 <span class="keyword">if</span> ~isempty(dataDir)
-0321     hmmOptions={<span class="string">'euk90_kegg105'</span>,<span class="string">'prok90_kegg105'</span>};
-0322     <span class="keyword">if</span> ~endsWith(dataDir,hmmOptions) <span class="comment">%Check if dataDir ends with any of the hmmOptions.</span>
-0323                                      <span class="comment">%If not, then check whether the required folders exist anyway.</span>
-0324         <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'keggdb'</span>,<span class="string">'genes.pep'</span>)) &amp;&amp; <span class="keyword">...</span>
-0325                 ~isfolder(fullfile(dataDir,<span class="string">'fasta'</span>)) &amp;&amp; <span class="keyword">...</span>
-0326                 ~isfolder(fullfile(dataDir,<span class="string">'aligned'</span>)) &amp;&amp; <span class="keyword">...</span>
-0327                 ~isfolder(fullfile(dataDir,<span class="string">'hmms'</span>))
-0328             error([<span class="string">'Pre-trained HMMs set is not recognised. If you want download RAVEN provided sets, it should match any of the following: '</span> strjoin(hmmOptions,<span class="string">' or '</span>)])
-0329         <span class="keyword">end</span>
-0330     <span class="keyword">else</span>
-0331         <span class="keyword">if</span> isfolder(dataDir) &amp;&amp; isfile(fullfile(dataDir,<span class="string">'hmms'</span>,<span class="string">'K00844.hmm'</span>))
-0332             fprintf([<span class="string">'NOTE: Found &lt;strong&gt;'</span> dataDir <span class="string">'&lt;/strong&gt; directory with pre-trained HMMs, it will therefore be used during reconstruction\n'</span>]);
-0333         <span class="keyword">elseif</span> ~isfolder(dataDir) &amp;&amp; isfile([dataDir,<span class="string">'.zip'</span>])
-0334             fprintf(<span class="string">'Extracting the HMMs archive file... '</span>);
-0335             unzip([dataDir,<span class="string">'.zip'</span>]);
-0336             fprintf(<span class="string">'COMPLETE\n'</span>);
-0337         <span class="keyword">else</span>
-0338             hmmIndex=strcmp(dataDir,hmmOptions);
-0339             <span class="keyword">if</span> ~any(hmmIndex)
-0340                 error([<span class="string">'Pre-trained HMMs are only provided with proteins clustered at 90% sequence identity (i.e. prok90_kegg105 and euk90_kegg105). '</span> <span class="keyword">...</span>
-0341                     <span class="string">'Use either of these datasets, or otherwise download the relevant sequence data from KEGG to train HMMs with your desired sequence identity'</span>])
-0342             <span class="keyword">else</span>
-0343                 fprintf(<span class="string">'Downloading the HMMs archive file... '</span>);
-0344                 <span class="keyword">try</span>
-0345                     websave([dataDir,<span class="string">'.zip'</span>],[<span class="string">'https://github.com/SysBioChalmers/RAVEN/releases/download/v2.8.0/'</span>,hmmOptions{hmmIndex},<span class="string">'.zip'</span>]);
-0346                 <span class="keyword">catch</span> ME
-0347                     <span class="keyword">if</span> strcmp(ME.identifier,<span class="string">'MATLAB:webservices:HTTP404StatusCodeError'</span>)
-0348                         error(<span class="string">'Failed to download the HMMs archive file, the server returned a 404 error, try again later. If the problem persists please report it on the RAVEN GitHub Issues page: https://github.com/SysBioChalmers/RAVEN/issues'</span>)
-0349                     <span class="keyword">end</span>
-0350                 <span class="keyword">end</span>
-0351             <span class="keyword">end</span>
-0352             
+0313 <span class="comment">%Checking if dataDir is consistent. It must point to pre-trained HMMs set,</span>
+0314 <span class="comment">%compatible with the current RAVEN version. The user may have the</span>
+0315 <span class="comment">%required zip file already in working directory or have it extracted. If</span>
+0316 <span class="comment">%the zip file and directory is not here, it is downloaded from the cloud</span>
+0317 <span class="keyword">if</span> ~isempty(dataDir)
+0318     hmmOptions={<span class="string">'euk90_kegg105'</span>,<span class="string">'prok90_kegg105'</span>};
+0319     <span class="keyword">if</span> ~endsWith(dataDir,hmmOptions) <span class="comment">%Check if dataDir ends with any of the hmmOptions.</span>
+0320                                      <span class="comment">%If not, then check whether the required folders exist anyway.</span>
+0321         <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'keggdb'</span>,<span class="string">'genes.pep'</span>)) &amp;&amp; <span class="keyword">...</span>
+0322                 ~isfolder(fullfile(dataDir,<span class="string">'fasta'</span>)) &amp;&amp; <span class="keyword">...</span>
+0323                 ~isfolder(fullfile(dataDir,<span class="string">'aligned'</span>)) &amp;&amp; <span class="keyword">...</span>
+0324                 ~isfolder(fullfile(dataDir,<span class="string">'hmms'</span>))
+0325             error([<span class="string">'Pre-trained HMMs set is not recognised. If you want download RAVEN provided sets, it should match any of the following: '</span> strjoin(hmmOptions,<span class="string">' or '</span>)])
+0326         <span class="keyword">end</span>
+0327     <span class="keyword">else</span>
+0328         <span class="keyword">if</span> isfolder(dataDir) &amp;&amp; isfile(fullfile(dataDir,<span class="string">'hmms'</span>,<span class="string">'K00844.hmm'</span>))
+0329             fprintf([<span class="string">'NOTE: Found &lt;strong&gt;'</span> dataDir <span class="string">'&lt;/strong&gt; directory with pre-trained HMMs, it will therefore be used during reconstruction\n'</span>]);
+0330         <span class="keyword">elseif</span> ~isfolder(dataDir) &amp;&amp; isfile([dataDir,<span class="string">'.zip'</span>])
+0331             fprintf(<span class="string">'Extracting the HMMs archive file... '</span>);
+0332             unzip([dataDir,<span class="string">'.zip'</span>]);
+0333             fprintf(<span class="string">'COMPLETE\n'</span>);
+0334         <span class="keyword">else</span>
+0335             hmmIndex=strcmp(dataDir,hmmOptions);
+0336             <span class="keyword">if</span> ~any(hmmIndex)
+0337                 error([<span class="string">'Pre-trained HMMs are only provided with proteins clustered at 90% sequence identity (i.e. prok90_kegg105 and euk90_kegg105). '</span> <span class="keyword">...</span>
+0338                     <span class="string">'Use either of these datasets, or otherwise download the relevant sequence data from KEGG to train HMMs with your desired sequence identity'</span>])
+0339             <span class="keyword">else</span>
+0340                 fprintf(<span class="string">'Downloading the HMMs archive file... '</span>);
+0341                 <span class="keyword">try</span>
+0342                     websave([dataDir,<span class="string">'.zip'</span>],[<span class="string">'https://github.com/SysBioChalmers/RAVEN/releases/download/v2.8.0/'</span>,hmmOptions{hmmIndex},<span class="string">'.zip'</span>]);
+0343                 <span class="keyword">catch</span> ME
+0344                     <span class="keyword">if</span> strcmp(ME.identifier,<span class="string">'MATLAB:webservices:HTTP404StatusCodeError'</span>)
+0345                         error(<span class="string">'Failed to download the HMMs archive file, the server returned a 404 error, try again later. If the problem persists please report it on the RAVEN GitHub Issues page: https://github.com/SysBioChalmers/RAVEN/issues'</span>)
+0346                     <span class="keyword">end</span>
+0347                 <span class="keyword">end</span>
+0348             <span class="keyword">end</span>
+0349             
+0350             fprintf(<span class="string">'COMPLETE\n'</span>);
+0351             fprintf(<span class="string">'Extracting the HMMs archive file... '</span>);
+0352             unzip([dataDir,<span class="string">'.zip'</span>]);
 0353             fprintf(<span class="string">'COMPLETE\n'</span>);
-0354             fprintf(<span class="string">'Extracting the HMMs archive file... '</span>);
-0355             unzip([dataDir,<span class="string">'.zip'</span>]);
-0356             fprintf(<span class="string">'COMPLETE\n'</span>);
-0357         <span class="keyword">end</span>
-0358         <span class="comment">%Check if HMMs are extracted</span>
-0359         <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'hmms'</span>,<span class="string">'K00844.hmm'</span>))
-0360             error([<span class="string">'The HMM files seem improperly extracted and not found in '</span>,dataDir,<span class="string">'/hmms. Please remove '</span>,dataDir,<span class="string">' folder and rerun getKEGGModelForOrganism'</span>]);
-0361         <span class="keyword">end</span>
-0362     <span class="keyword">end</span>
-0363 <span class="keyword">end</span>
-0364 
-0365 <span class="comment">%Check if the fasta-file contains '/' or'\'. If not then it's probably just</span>
-0366 <span class="comment">%a file name. Expand to full path.</span>
-0367 <span class="keyword">if</span> any(fastaFile)
-0368     <span class="keyword">if</span> ~any(strfind(fastaFile,<span class="string">'\'</span>)) &amp;&amp; ~any(strfind(fastaFile,<span class="string">'/'</span>))
-0369         fastaFile=which(fastaFile);
-0370     <span class="keyword">end</span>
-0371     <span class="comment">%Create the required sub-folders in dataDir if they dont exist</span>
-0372     <span class="keyword">if</span> ~isfolder(fullfile(dataDir,<span class="string">'keggdb'</span>))
-0373         mkdir(dataDir,<span class="string">'keggdb'</span>);
+0354         <span class="keyword">end</span>
+0355         <span class="comment">%Check if HMMs are extracted</span>
+0356         <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'hmms'</span>,<span class="string">'K00844.hmm'</span>))
+0357             error([<span class="string">'The HMM files seem improperly extracted and not found in '</span>,dataDir,<span class="string">'/hmms. Please remove '</span>,dataDir,<span class="string">' folder and rerun getKEGGModelForOrganism'</span>]);
+0358         <span class="keyword">end</span>
+0359     <span class="keyword">end</span>
+0360 <span class="keyword">end</span>
+0361 
+0362 <span class="comment">%Check if the fasta-file contains '/' or '\'. If not then it's probably just</span>
+0363 <span class="comment">%a file name. Expand to full path.</span>
+0364 <span class="keyword">if</span> any(fastaFile)
+0365     <span class="keyword">if</span> ~any(strfind(fastaFile,<span class="string">'\'</span>)) &amp;&amp; ~any(strfind(fastaFile,<span class="string">'/'</span>))
+0366         fastaFile=which(fastaFile);
+0367     <span class="keyword">end</span>
+0368     <span class="comment">%Create the required sub-folders in dataDir if they don't exist</span>
+0369     <span class="keyword">if</span> ~isfolder(fullfile(dataDir,<span class="string">'keggdb'</span>))
+0370         mkdir(dataDir,<span class="string">'keggdb'</span>);
+0371     <span class="keyword">end</span>
+0372     <span class="keyword">if</span> ~isfolder(fullfile(dataDir,<span class="string">'fasta'</span>))
+0373         mkdir(dataDir,<span class="string">'fasta'</span>);
 0374     <span class="keyword">end</span>
-0375     <span class="keyword">if</span> ~isfolder(fullfile(dataDir,<span class="string">'fasta'</span>))
-0376         mkdir(dataDir,<span class="string">'fasta'</span>);
+0375     <span class="keyword">if</span> ~isfolder(fullfile(dataDir,<span class="string">'aligned'</span>))
+0376         mkdir(dataDir,<span class="string">'aligned'</span>);
 0377     <span class="keyword">end</span>
-0378     <span class="keyword">if</span> ~isfolder(fullfile(dataDir,<span class="string">'aligned'</span>))
-0379         mkdir(dataDir,<span class="string">'aligned'</span>);
+0378     <span class="keyword">if</span> ~isfolder(fullfile(dataDir,<span class="string">'hmms'</span>))
+0379         mkdir(dataDir,<span class="string">'hmms'</span>);
 0380     <span class="keyword">end</span>
-0381     <span class="keyword">if</span> ~isfolder(fullfile(dataDir,<span class="string">'hmms'</span>))
-0382         mkdir(dataDir,<span class="string">'hmms'</span>);
+0381     <span class="keyword">if</span> ~isfolder(outDir)
+0382         mkdir(outDir);
 0383     <span class="keyword">end</span>
-0384     <span class="keyword">if</span> ~isfolder(outDir)
-0385         mkdir(outDir);
-0386     <span class="keyword">end</span>
-0387 <span class="keyword">end</span>
-0388 
-0389 <span class="comment">%First generate the full global KEGG model. Can be provided as input.</span>
-0390 <span class="comment">%Otherwise, getModelFromKEGG is run. The dataDir must not be supplied as</span>
-0391 <span class="comment">%there is also an internal RAVEN version available</span>
-0392 <span class="keyword">if</span> nargin==15
-0393     model=globalModel.model;
-0394     KOModel=globalModel.KOModel;
-0395 <span class="keyword">elseif</span> any(dataDir)
-0396     [model, KOModel]=<a href="getModelFromKEGG.html" class="code" title="function [model,KOModel]=getModelFromKEGG(keggPath,keepSpontaneous,keepUndefinedStoich,keepIncomplete,keepGeneral)">getModelFromKEGG</a>(fullfile(dataDir,<span class="string">'keggdb'</span>),keepSpontaneous,keepUndefinedStoich,keepIncomplete,keepGeneral);
-0397 <span class="keyword">else</span>
-0398     [model, KOModel]=<a href="getModelFromKEGG.html" class="code" title="function [model,KOModel]=getModelFromKEGG(keggPath,keepSpontaneous,keepUndefinedStoich,keepIncomplete,keepGeneral)">getModelFromKEGG</a>([],keepSpontaneous,keepUndefinedStoich,keepIncomplete,keepGeneral);
-0399 <span class="keyword">end</span>
-0400 model.id=organismID;
-0401 model.c=zeros(numel(model.rxns),1);
-0402 
-0403 <span class="comment">%If no FASTA file is supplied, then just remove all genes which are not for</span>
-0404 <span class="comment">%the given organism ID</span>
-0405 <span class="keyword">if</span> isempty(fastaFile)
-0406     <span class="comment">%Check if organismID can be found in KEGG species list or is</span>
-0407     <span class="comment">%set to &quot;eukaryotes&quot; or &quot;prokaryotes&quot;</span>
-0408     phylDistsFull=<a href="getPhylDist.html" class="code" title="function phylDistStruct=getPhylDist(keggPath,onlyInKingdom)">getPhylDist</a>(fullfile(dataDir,<span class="string">'keggdb'</span>),true);
-0409     <span class="keyword">if</span> ~ismember(organismID,[phylDistsFull.ids <span class="string">'eukaryotes'</span> <span class="string">'prokaryotes'</span>])
-0410         error(<span class="string">'Provided organismID is incorrect. Only species abbreviations from KEGG Species List or &quot;eukaryotes&quot;/&quot;prokaryotes&quot; are allowed.'</span>);
-0411     <span class="keyword">end</span>
-0412     
-0413     fprintf([<span class="string">'Pruning the model from &lt;strong&gt;non-'</span> organismID <span class="string">'&lt;/strong&gt; genes... '</span>]);
-0414     <span class="keyword">if</span> ismember(organismID,{<span class="string">'eukaryotes'</span>,<span class="string">'prokaryotes'</span>})
-0415         phylDists=<a href="getPhylDist.html" class="code" title="function phylDistStruct=getPhylDist(keggPath,onlyInKingdom)">getPhylDist</a>(fullfile(dataDir,<span class="string">'keggdb'</span>),maxPhylDist==-1);
-0416         <span class="keyword">if</span> strcmp(organismID,<span class="string">'eukaryotes'</span>)
-0417             proxyid=<span class="string">'hsa'</span>;
-0418             <span class="comment">%Use H. sapiens here</span>
-0419         <span class="keyword">else</span>
-0420             proxyid=<span class="string">'eco'</span>;
-0421             <span class="comment">%Use E. coli here</span>
-0422         <span class="keyword">end</span>
-0423         [~, phylDistId]=ismember(proxyid,phylDists.ids);
-0424         idsToKeep=phylDists.ids(~isinf(phylDists.distMat(phylDistId,:)));
-0425         taxIDs=cellfun(@(x) x{1},cellfun(@(x) strsplit(x,<span class="string">':'</span>),model.genes,<span class="string">'UniformOutput'</span>,false),<span class="string">'UniformOutput'</span>,false);
-0426         I=ismember(upper(taxIDs),upper(idsToKeep));
-0427     <span class="keyword">else</span>
-0428         <span class="comment">%KEGG organism IDs may have three or four letters</span>
-0429         organismID=strcat(organismID,<span class="string">':'</span>);
-0430         <span class="comment">%Add colon for accurate matching</span>
-0431         <span class="keyword">if</span> length(organismID)==4
-0432             I=cellfun(@(x) strcmpi(x(1:4),organismID),model.genes);
-0433         <span class="keyword">elseif</span> length(organismID)==5
-0434             I=cellfun(@(x) strcmpi(x(1:5),organismID),model.genes);
-0435         <span class="keyword">end</span>
-0436     <span class="keyword">end</span>
-0437     <span class="comment">%Remove those genes</span>
-0438     model.genes=model.genes(I);
-0439     model.rxnGeneMat=model.rxnGeneMat(:,I);
-0440     fprintf(<span class="string">'COMPLETE\n'</span>);
-0441 <span class="keyword">end</span>
-0442 
-0443 <span class="comment">%First remove all reactions without genes</span>
-0444 <span class="keyword">if</span> keepSpontaneous==true
-0445     fprintf(<span class="string">'Removing non-spontaneous reactions without GPR rules... '</span>);
-0446     load(fullfile(ravenPath,<span class="string">'external'</span>,<span class="string">'kegg'</span>,<span class="string">'keggRxns.mat'</span>),<span class="string">'isSpontaneous'</span>);
-0447     I=~any(model.rxnGeneMat,2)&amp;~ismember(model.rxns,isSpontaneous);
-0448     spontRxnsWithGenes=model.rxns(any(model.rxnGeneMat,2)&amp;~ismember(model.rxns,isSpontaneous));
-0449 <span class="keyword">else</span>
-0450     fprintf(<span class="string">'Removing reactions without GPR rules... '</span>);
-0451     I=~any(model.rxnGeneMat,2);
-0452 <span class="keyword">end</span>
-0453 model=removeReactions(model,I,true);
-0454 fprintf(<span class="string">'COMPLETE\n'</span>);
-0455 
-0456 <span class="comment">%Clean gene names</span>
-0457 fprintf(<span class="string">'Fixing gene names in the model... '</span>);
-0458 <span class="comment">%Get rid of the prefix organism id</span>
-0459 model.genes=regexprep(model.genes,<span class="string">'^\w+?:'</span>,<span class="string">''</span>);
-0460 fprintf(<span class="string">'COMPLETE\n'</span>);
-0461 
-0462 <span class="comment">%If no FASTA file is supplied, then we are done here</span>
-0463 <span class="keyword">if</span> isempty(fastaFile)
-0464     <span class="comment">%Create grRules</span>
-0465     fprintf(<span class="string">'Constructing GPR associations and annotations for the model... '</span>);
-0466     model.grRules=cell(numel(model.rxns),1);
-0467     model.grRules(:)={<span class="string">''</span>};
-0468     <span class="comment">%Add the gene associations as 'or'</span>
-0469     <span class="keyword">for</span> i=1:numel(model.rxns)
-0470         <span class="comment">%Find the involved genes</span>
-0471         I=find(model.rxnGeneMat(i,:));
-0472         <span class="keyword">if</span> any(I)
-0473             model.grRules{i}=[<span class="string">'('</span> model.genes{I(1)}];
-0474             <span class="keyword">for</span> j=2:numel(I)
-0475                 model.grRules{i}=[model.grRules{i} <span class="string">' or '</span> model.genes{I(j)}];
-0476             <span class="keyword">end</span>
-0477             model.grRules{i}=[model.grRules{i} <span class="string">')'</span>];
-0478         <span class="keyword">end</span>
-0479     <span class="keyword">end</span>
-0480     <span class="comment">%Fix grRules and reconstruct rxnGeneMat</span>
-0481     [grRules,rxnGeneMat] = standardizeGrRules(model); <span class="comment">%Give detailed output</span>
-0482     model.grRules = grRules;
-0483     model.rxnGeneMat = rxnGeneMat;
-0484     <span class="comment">%Add geneMiriams, assuming that it follows the syntax</span>
-0485     <span class="comment">%kegg.genes/organismID:geneName</span>
-0486     model.geneMiriams=<span class="string">''</span>;
-0487     <span class="keyword">for</span> i=1:numel(model.genes)
-0488         model.geneMiriams{i,1}.name{1,1}=<span class="string">'kegg.genes'</span>;
-0489         model.geneMiriams{i,1}.value{1,1}=strcat(lower(organismID),model.genes{i,1});
-0490     <span class="keyword">end</span>
-0491     <span class="comment">%Add the description to the reactions</span>
-0492     <span class="keyword">for</span> i=1:numel(model.rxns)
-0493         <span class="keyword">if</span> ~isempty(model.rxnNotes{i})
-0494             model.rxnNotes(i)=strcat(<span class="string">'Included by getKEGGModelForOrganism (without HMMs).'</span>,model.rxnNotes(i));
-0495             model.rxnNotes(i)=strrep(model.rxnNotes(i),<span class="string">'.'</span>,<span class="string">'. '</span>);
-0496         <span class="keyword">else</span>
-0497             model.rxnNotes(i)={<span class="string">'Included by getKEGGModelForOrganism (without HMMs)'</span>};
-0498         <span class="keyword">end</span>
-0499     <span class="keyword">end</span>
-0500     fprintf(<span class="string">'COMPLETE\n\n'</span>);
-0501     fprintf(<span class="string">'*** Model reconstruction complete ***\n'</span>);
-0502     <span class="keyword">return</span>;
-0503 <span class="keyword">end</span>
-0504 
-0505 <span class="comment">%Create a phylogenetic distance structure</span>
-0506 phylDistStruct=<a href="getPhylDist.html" class="code" title="function phylDistStruct=getPhylDist(keggPath,onlyInKingdom)">getPhylDist</a>(fullfile(dataDir,<span class="string">'keggdb'</span>),maxPhylDist==-1);
-0507 [~, phylDistId]=ismember(model.id,phylDistStruct.ids);
-0508 
-0509 <span class="comment">%Calculate the real maximal distance now. An abitary large number of 1000</span>
-0510 <span class="comment">%is used for the &quot;all in kingdom&quot; or &quot;all sequences&quot; options. This is a bit</span>
-0511 <span class="comment">%inconvenient way to do it, but it is to make it fit with some older code</span>
-0512 <span class="keyword">if</span> isinf(maxPhylDist) || maxPhylDist==-1
-0513     maxPhylDist=1000;
-0514 <span class="keyword">end</span>
-0515 
-0516 <span class="comment">%Get the KO ids for which files have been generated. Maybe not the neatest</span>
-0517 <span class="comment">%way..</span>
-0518 fastaFiles=<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'fasta'</span>,<span class="string">'*.fa'</span>));
-0519 alignedFiles=<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'aligned'</span>,<span class="string">'*.fa'</span>));
-0520 alignedWorking=<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'aligned'</span>,<span class="string">'*.faw'</span>));
-0521 hmmFiles=<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'hmms'</span>,<span class="string">'*.hmm'</span>));
-0522 outFiles=<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(outDir,<span class="string">'*.out'</span>));
-0523 
-0524 <span class="comment">%Check if multi-FASTA files should be generated. This should only be</span>
-0525 <span class="comment">%performed if there are IDs in the KOModel structure that haven't been</span>
-0526 <span class="comment">%parsed yet</span>
-0527 missingFASTA=setdiff(KOModel.rxns,[fastaFiles;alignedFiles;hmmFiles;outFiles]);
-0528 
-0529 <span class="keyword">if</span> ~isempty(missingFASTA)
-0530     <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'keggdb'</span>,<span class="string">'genes.pep'</span>))
-0531         EM=[<span class="string">'The file ''genes.pep'' cannot be located at '</span> strrep(dataDir,<span class="string">'\'</span>,<span class="string">'/'</span>) <span class="string">'/ and should be downloaded from the KEGG FTP.\n'</span>];
-0532         dispEM(EM);
-0533     <span class="keyword">end</span>
-0534     <span class="comment">%Only construct models for KOs which don't have files already</span>
-0535     fastaModel=removeReactions(KOModel,setdiff(KOModel.rxns,missingFASTA),true,true);
-0536     <span class="comment">%Permute the order of the KOs in the model so that constructMultiFasta</span>
-0537     <span class="comment">%can be run on several processors at once</span>
-0538     fastaModel=permuteModel(fastaModel,randperm(RandStream.create(<span class="string">'mrg32k3a'</span>,<span class="string">'Seed'</span>,cputime()),numel(fastaModel.rxns)),<span class="string">'rxns'</span>);
-0539     <a href="constructMultiFasta.html" class="code" title="function constructMultiFasta(model,sourceFile,outputDir)">constructMultiFasta</a>(fastaModel,fullfile(dataDir,<span class="string">'keggdb'</span>,<span class="string">'genes.pep'</span>),fullfile(dataDir,<span class="string">'fasta'</span>));
-0540 <span class="keyword">else</span>
-0541     fprintf(<span class="string">'Generating the KEGG Orthology specific multi-FASTA files... COMPLETE\n'</span>);
-0542 <span class="keyword">end</span>
-0543 
-0544 <span class="keyword">if</span> isunix
-0545     <span class="keyword">if</span> ismac
-0546         binEnd=<span class="string">'.mac'</span>;
-0547     <span class="keyword">else</span>
-0548         binEnd=<span class="string">''</span>;
-0549     <span class="keyword">end</span>
-0550 <span class="keyword">elseif</span> ispc
-0551     binEnd=<span class="string">''</span>;
-0552 <span class="keyword">else</span>
-0553     EM=<span class="string">'Unknown OS, exiting.'</span>;
-0554     disp(EM);
-0555     <span class="keyword">return</span>
-0556 <span class="keyword">end</span>
-0557 
-0558 <span class="comment">%Check if alignment of FASTA files should be performed</span>
-0559 missingAligned=setdiff(KOModel.rxns,[alignedFiles;hmmFiles;alignedWorking;outFiles]);
-0560 <span class="keyword">if</span> ~isempty(missingAligned)
-0561     <span class="keyword">if</span> seqIdentity==-1
-0562         fprintf(<span class="string">'Performing the multiple alignment for KEGG Orthology specific protein sets...   0%% complete'</span>);
-0563     <span class="keyword">else</span>
-0564         fprintf(<span class="string">'Performing clustering and multiple alignment for KEGG Orthology specific protein sets...   0%% complete'</span>);
-0565     <span class="keyword">end</span>
-0566     missingAligned=missingAligned(randperm(RandStream.create(<span class="string">'mrg32k3a'</span>,<span class="string">'Seed'</span>,cputime()),numel(missingAligned)));
-0567     tmpFile=tempname;
-0568     <span class="comment">%On Windows, paths need to be translated to Unix before parsing it to WSL</span>
-0569     <span class="keyword">if</span> ispc
-0570         wslPath.tmpFile=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(tmpFile);
-0571         <span class="comment">%mafft has problems writing to terminal (/dev/stderr) when running</span>
-0572         <span class="comment">%on WSL via MATLAB, instead write and read progress file</span>
-0573         mafftOutput = tempname;
-0574         wslPath.mafftOutput=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(mafftOutput);
-0575         wslPath.mafft=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'mafft'</span>,<span class="string">'mafft-linux64'</span>,<span class="string">'mafft.bat'</span>));
-0576         wslPath.cdhit=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'cd-hit'</span>,<span class="string">'cd-hit'</span>));
-0577     <span class="keyword">end</span>
-0578     
-0579     <span class="keyword">for</span> i=1:numel(missingAligned)
-0580         <span class="comment">%This is checked here because it could be that it is created by a</span>
-0581         <span class="comment">%parallel process. The faw-files are saved as temporary files to</span>
-0582         <span class="comment">%kept track of which files are being worked on</span>
-0583         <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>])) &amp;&amp;<span class="keyword">...</span>
-0584                 ~isfile(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.fa'</span>]))
-0585             <span class="comment">%Check that the multi-FASTA file exists. It should do so since</span>
-0586             <span class="comment">%we are saving empty files as well. Print a warning and</span>
-0587             <span class="comment">%continue if not</span>
-0588             <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'fasta'</span>,[missingAligned{i} <span class="string">'.fa'</span>]))
-0589                 EM=[<span class="string">'WARNING: The multi-FASTA file for '</span> missingAligned{i} <span class="string">' does not exist'</span>];
-0590                 dispEM(EM,false);
-0591                 <span class="keyword">continue</span>;
-0592             <span class="keyword">end</span>
-0593             
-0594             <span class="comment">%If the multi-FASTA file is empty then save an empty aligned</span>
-0595             <span class="comment">%file and continue</span>
-0596             s=dir(fullfile(dataDir,<span class="string">'fasta'</span>,[missingAligned{i} <span class="string">'.fa'</span>]));
-0597             <span class="keyword">if</span> s.bytes&lt;=0
-0598                 fid=fopen(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.fa'</span>]),<span class="string">'w'</span>);
-0599                 fclose(fid);
-0600                 <span class="keyword">continue</span>;
-0601             <span class="keyword">end</span>
-0602             
-0603             <span class="comment">%Create an empty file to prevent other threads to start to work</span>
-0604             <span class="comment">%on the same alignment</span>
-0605             fid=fopen(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]),<span class="string">'w'</span>);
-0606             fclose(fid);
-0607             
-0608             <span class="comment">%First load the FASTA file, then select up to nSequences</span>
-0609             <span class="comment">%sequences of the most closely related species, apply any</span>
-0610             <span class="comment">%constraints from maxPhylDist, and save it as a temporary file,</span>
-0611             <span class="comment">%and create the model from that</span>
-0612             
-0613             fastaStruct=fastaread(fullfile(dataDir,<span class="string">'fasta'</span>,[missingAligned{i} <span class="string">'.fa'</span>]));
-0614             phylDist=inf(numel(fastaStruct),1);
-0615             <span class="keyword">for</span> j=1:numel(fastaStruct)
-0616                 <span class="comment">%Get the organism abbreviation</span>
-0617                 index=strfind(fastaStruct(j).Header,<span class="string">':'</span>);
-0618                 <span class="keyword">if</span> any(index)
-0619                     abbrev=fastaStruct(j).Header(1:index(1)-1);
-0620                     [~, index]=ismember(abbrev,phylDistStruct.ids);
-0621                     <span class="keyword">if</span> any(index)
-0622                         phylDist(j)=phylDistStruct.distMat(index(1),phylDistId);
-0623                     <span class="keyword">end</span>
-0624                 <span class="keyword">end</span>
-0625             <span class="keyword">end</span>
+0384 <span class="keyword">end</span>
+0385 
+0386 <span class="comment">%First generate the full global KEGG model. Can be provided as input.</span>
+0387 <span class="comment">%Otherwise, getModelFromKEGG is run. The dataDir need not be supplied as</span>
+0388 <span class="comment">%there is also an internal RAVEN version available</span>
+0389 <span class="keyword">if</span> nargin==15
+0390     model=globalModel.model;
+0391     KOModel=globalModel.KOModel;
+0392 <span class="keyword">elseif</span> any(dataDir)
+0393     [model, KOModel]=<a href="getModelFromKEGG.html" class="code" title="function [model,KOModel]=getModelFromKEGG(keggPath,keepSpontaneous,keepUndefinedStoich,keepIncomplete,keepGeneral)">getModelFromKEGG</a>(fullfile(dataDir,<span class="string">'keggdb'</span>),keepSpontaneous,keepUndefinedStoich,keepIncomplete,keepGeneral);
+0394 <span class="keyword">else</span>
+0395     [model, KOModel]=<a href="getModelFromKEGG.html" class="code" title="function [model,KOModel]=getModelFromKEGG(keggPath,keepSpontaneous,keepUndefinedStoich,keepIncomplete,keepGeneral)">getModelFromKEGG</a>([],keepSpontaneous,keepUndefinedStoich,keepIncomplete,keepGeneral);
+0396 <span class="keyword">end</span>
+0397 model.id=organismID;
+0398 model.c=zeros(numel(model.rxns),1);
+0399 
+0400 <span class="comment">%If no FASTA file is supplied, then just remove all genes which are not for</span>
+0401 <span class="comment">%the given organism ID</span>
+0402 <span class="keyword">if</span> isempty(fastaFile)
+0403     <span class="comment">%Check if organismID can be found in KEGG species list or is</span>
+0404     <span class="comment">%set to &quot;eukaryotes&quot; or &quot;prokaryotes&quot;</span>
+0405     phylDistsFull=<a href="getPhylDist.html" class="code" title="function phylDistStruct=getPhylDist(keggPath,onlyInKingdom)">getPhylDist</a>(fullfile(dataDir,<span class="string">'keggdb'</span>),true);
+0406     <span class="keyword">if</span> ~ismember(organismID,[phylDistsFull.ids <span class="string">'eukaryotes'</span> <span class="string">'prokaryotes'</span>])
+0407         error(<span class="string">'Provided organismID is incorrect. Only species abbreviations from KEGG Species List or &quot;eukaryotes&quot;/&quot;prokaryotes&quot; are allowed.'</span>);
+0408     <span class="keyword">end</span>
+0409     
+0410     fprintf([<span class="string">'Pruning the model from &lt;strong&gt;non-'</span> organismID <span class="string">'&lt;/strong&gt; genes... '</span>]);
+0411     <span class="keyword">if</span> ismember(organismID,{<span class="string">'eukaryotes'</span>,<span class="string">'prokaryotes'</span>})
+0412         phylDists=<a href="getPhylDist.html" class="code" title="function phylDistStruct=getPhylDist(keggPath,onlyInKingdom)">getPhylDist</a>(fullfile(dataDir,<span class="string">'keggdb'</span>),maxPhylDist==-1);
+0413         <span class="keyword">if</span> strcmp(organismID,<span class="string">'eukaryotes'</span>)
+0414             proxyid=<span class="string">'hsa'</span>;
+0415             <span class="comment">%Use H. sapiens here</span>
+0416         <span class="keyword">else</span>
+0417             proxyid=<span class="string">'eco'</span>;
+0418             <span class="comment">%Use E. coli here</span>
+0419         <span class="keyword">end</span>
+0420         [~, phylDistId]=ismember(proxyid,phylDists.ids);
+0421         idsToKeep=phylDists.ids(~isinf(phylDists.distMat(phylDistId,:)));
+0422         taxIDs=cellfun(@(x) x{1},cellfun(@(x) strsplit(x,<span class="string">':'</span>),model.genes,<span class="string">'UniformOutput'</span>,false),<span class="string">'UniformOutput'</span>,false);
+0423         I=ismember(upper(taxIDs),upper(idsToKeep));
+0424     <span class="keyword">else</span>
+0425         <span class="comment">%KEGG organism IDs may have three or four letters</span>
+0426         organismID=strcat(organismID,<span class="string">':'</span>);
+0427         <span class="comment">%Add colon for accurate matching</span>
+0428         <span class="keyword">if</span> length(organismID)==4
+0429             I=cellfun(@(x) strcmpi(x(1:4),organismID),model.genes);
+0430         <span class="keyword">elseif</span> length(organismID)==5
+0431             I=cellfun(@(x) strcmpi(x(1:5),organismID),model.genes);
+0432         <span class="keyword">end</span>
+0433     <span class="keyword">end</span>
+0434     <span class="comment">%Remove those genes</span>
+0435     model.genes=model.genes(I);
+0436     model.rxnGeneMat=model.rxnGeneMat(:,I);
+0437     fprintf(<span class="string">'COMPLETE\n'</span>);
+0438 <span class="keyword">end</span>
+0439 
+0440 <span class="comment">%First remove all reactions without genes</span>
+0441 <span class="keyword">if</span> keepSpontaneous==true
+0442     fprintf(<span class="string">'Removing non-spontaneous reactions without GPR rules... '</span>);
+0443     load(fullfile(ravenPath,<span class="string">'external'</span>,<span class="string">'kegg'</span>,<span class="string">'keggRxns.mat'</span>),<span class="string">'isSpontaneous'</span>);
+0444     I=~any(model.rxnGeneMat,2)&amp;~ismember(model.rxns,isSpontaneous);
+0445     spontRxnsWithGenes=model.rxns(any(model.rxnGeneMat,2)&amp;~ismember(model.rxns,isSpontaneous));
+0446 <span class="keyword">else</span>
+0447     fprintf(<span class="string">'Removing reactions without GPR rules... '</span>);
+0448     I=~any(model.rxnGeneMat,2);
+0449 <span class="keyword">end</span>
+0450 model=removeReactions(model,I,true);
+0451 fprintf(<span class="string">'COMPLETE\n'</span>);
+0452 
+0453 <span class="comment">%Clean gene names</span>
+0454 fprintf(<span class="string">'Fixing gene names in the model... '</span>);
+0455 <span class="comment">%Get rid of the prefix organism id</span>
+0456 model.genes=regexprep(model.genes,<span class="string">'^\w+?:'</span>,<span class="string">''</span>);
+0457 fprintf(<span class="string">'COMPLETE\n'</span>);
+0458 
+0459 <span class="comment">%If no FASTA file is supplied, then we are done here</span>
+0460 <span class="keyword">if</span> isempty(fastaFile)
+0461     <span class="comment">%Create grRules</span>
+0462     fprintf(<span class="string">'Constructing GPR associations and annotations for the model... '</span>);
+0463     model.grRules=cell(numel(model.rxns),1);
+0464     model.grRules(:)={<span class="string">''</span>};
+0465     <span class="comment">%Add the gene associations as 'or'</span>
+0466     <span class="keyword">for</span> i=1:numel(model.rxns)
+0467         <span class="comment">%Find the involved genes</span>
+0468         I=find(model.rxnGeneMat(i,:));
+0469         <span class="keyword">if</span> any(I)
+0470             model.grRules{i}=[<span class="string">'('</span> model.genes{I(1)}];
+0471             <span class="keyword">for</span> j=2:numel(I)
+0472                 model.grRules{i}=[model.grRules{i} <span class="string">' or '</span> model.genes{I(j)}];
+0473             <span class="keyword">end</span>
+0474             model.grRules{i}=[model.grRules{i} <span class="string">')'</span>];
+0475         <span class="keyword">end</span>
+0476     <span class="keyword">end</span>
+0477     <span class="comment">%Fix grRules and reconstruct rxnGeneMat</span>
+0478     [grRules,rxnGeneMat] = standardizeGrRules(model); <span class="comment">%Give detailed output</span>
+0479     model.grRules = grRules;
+0480     model.rxnGeneMat = rxnGeneMat;
+0481     <span class="comment">%Add geneMiriams, assuming that it follows the syntax</span>
+0482     <span class="comment">%kegg.genes/organismID:geneName</span>
+0483     model.geneMiriams=<span class="string">''</span>;
+0484     <span class="keyword">for</span> i=1:numel(model.genes)
+0485         model.geneMiriams{i,1}.name{1,1}=<span class="string">'kegg.genes'</span>;
+0486         model.geneMiriams{i,1}.value{1,1}=strcat(lower(organismID),model.genes{i,1});
+0487     <span class="keyword">end</span>
+0488     <span class="comment">%Add the description to the reactions</span>
+0489     <span class="keyword">for</span> i=1:numel(model.rxns)
+0490         <span class="keyword">if</span> ~isempty(model.rxnNotes{i})
+0491             model.rxnNotes(i)=strcat(<span class="string">'Included by getKEGGModelForOrganism (without HMMs).'</span>,model.rxnNotes(i));
+0492             model.rxnNotes(i)=strrep(model.rxnNotes(i),<span class="string">'.'</span>,<span class="string">'. '</span>);
+0493         <span class="keyword">else</span>
+0494             model.rxnNotes(i)={<span class="string">'Included by getKEGGModelForOrganism (without HMMs)'</span>};
+0495         <span class="keyword">end</span>
+0496     <span class="keyword">end</span>
+0497     fprintf(<span class="string">'COMPLETE\n\n'</span>);
+0498     fprintf(<span class="string">'*** Model reconstruction complete ***\n'</span>);
+0499     <span class="keyword">return</span>;
+0500 <span class="keyword">end</span>
+0501 
+0502 <span class="comment">%Create a phylogenetic distance structure</span>
+0503 phylDistStruct=<a href="getPhylDist.html" class="code" title="function phylDistStruct=getPhylDist(keggPath,onlyInKingdom)">getPhylDist</a>(fullfile(dataDir,<span class="string">'keggdb'</span>),maxPhylDist==-1);
+0504 [~, phylDistId]=ismember(model.id,phylDistStruct.ids);
+0505 
+0506 <span class="comment">%Calculate the real maximal distance now. An arbitrarily large number of 1000</span>
+0507 <span class="comment">%is used for the &quot;all in kingdom&quot; or &quot;all sequences&quot; options. This is a bit</span>
+0508 <span class="comment">%inconvenient way to do it, but it is to make it fit with some older code</span>
+0509 <span class="keyword">if</span> isinf(maxPhylDist) || maxPhylDist==-1
+0510     maxPhylDist=1000;
+0511 <span class="keyword">end</span>
+0512 
+0513 <span class="comment">%Get the KO ids for which files have been generated. Maybe not the neatest</span>
+0514 <span class="comment">%way..</span>
+0515 fastaFiles=<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'fasta'</span>,<span class="string">'*.fa'</span>));
+0516 alignedFiles=<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'aligned'</span>,<span class="string">'*.fa'</span>));
+0517 alignedWorking=<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'aligned'</span>,<span class="string">'*.faw'</span>));
+0518 hmmFiles=<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'hmms'</span>,<span class="string">'*.hmm'</span>));
+0519 outFiles=<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(outDir,<span class="string">'*.out'</span>));
+0520 
+0521 <span class="comment">%Check if multi-FASTA files should be generated. This should only be</span>
+0522 <span class="comment">%performed if there are IDs in the KOModel structure that haven't been</span>
+0523 <span class="comment">%parsed yet</span>
+0524 missingFASTA=setdiff(KOModel.rxns,[fastaFiles;alignedFiles;hmmFiles;outFiles]);
+0525 
+0526 <span class="keyword">if</span> ~isempty(missingFASTA)
+0527     <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'keggdb'</span>,<span class="string">'genes.pep'</span>))
+0528         EM=[<span class="string">'The file ''genes.pep'' cannot be located at '</span> strrep(dataDir,<span class="string">'\'</span>,<span class="string">'/'</span>) <span class="string">'/ and should be downloaded from the KEGG FTP.\n'</span>];
+0529         dispEM(EM);
+0530     <span class="keyword">end</span>
+0531     <span class="comment">%Only construct models for KOs which don't have files already</span>
+0532     fastaModel=removeReactions(KOModel,setdiff(KOModel.rxns,missingFASTA),true,true);
+0533     <span class="comment">%Permute the order of the KOs in the model so that constructMultiFasta</span>
+0534     <span class="comment">%can be run on several processors at once</span>
+0535     fastaModel=permuteModel(fastaModel,randperm(RandStream.create(<span class="string">'mrg32k3a'</span>,<span class="string">'Seed'</span>,cputime()),numel(fastaModel.rxns)),<span class="string">'rxns'</span>);
+0536     <a href="constructMultiFasta.html" class="code" title="function constructMultiFasta(model,sourceFile,outputDir)">constructMultiFasta</a>(fastaModel,fullfile(dataDir,<span class="string">'keggdb'</span>,<span class="string">'genes.pep'</span>),fullfile(dataDir,<span class="string">'fasta'</span>));
+0537 <span class="keyword">else</span>
+0538     fprintf(<span class="string">'Generating the KEGG Orthology specific multi-FASTA files... COMPLETE\n'</span>);
+0539 <span class="keyword">end</span>
+0540 
+0541 <span class="keyword">if</span> isunix
+0542     <span class="keyword">if</span> ismac
+0543         binEnd=<span class="string">'.mac'</span>;
+0544     <span class="keyword">else</span>
+0545         binEnd=<span class="string">''</span>;
+0546     <span class="keyword">end</span>
+0547 <span class="keyword">elseif</span> ispc
+0548     binEnd=<span class="string">''</span>;
+0549 <span class="keyword">else</span>
+0550     EM=<span class="string">'Unknown OS, exiting.'</span>;
+0551     disp(EM);
+0552     <span class="keyword">return</span>
+0553 <span class="keyword">end</span>
+0554 
+0555 <span class="comment">%Check if alignment of FASTA files should be performed</span>
+0556 missingAligned=setdiff(KOModel.rxns,[alignedFiles;hmmFiles;alignedWorking;outFiles]);
+0557 <span class="keyword">if</span> ~isempty(missingAligned)
+0558     <span class="keyword">if</span> seqIdentity==-1
+0559         fprintf(<span class="string">'Performing the multiple alignment for KEGG Orthology specific protein sets...   0%% complete'</span>);
+0560     <span class="keyword">else</span>
+0561         fprintf(<span class="string">'Performing clustering and multiple alignment for KEGG Orthology specific protein sets...   0%% complete'</span>);
+0562     <span class="keyword">end</span>
+0563     missingAligned=missingAligned(randperm(RandStream.create(<span class="string">'mrg32k3a'</span>,<span class="string">'Seed'</span>,cputime()),numel(missingAligned)));
+0564     tmpFile=tempname;
+0565     <span class="comment">%On Windows, paths need to be translated to Unix before parsing it to WSL</span>
+0566     <span class="keyword">if</span> ispc
+0567         wslPath.tmpFile=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(tmpFile);
+0568         <span class="comment">%mafft has problems writing to terminal (/dev/stderr) when running</span>
+0569         <span class="comment">%on WSL via MATLAB, instead write and read progress file</span>
+0570         mafftOutput = tempname;
+0571         wslPath.mafftOutput=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(mafftOutput);
+0572         wslPath.mafft=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'mafft'</span>,<span class="string">'mafft-linux64'</span>,<span class="string">'mafft.bat'</span>));
+0573         wslPath.cdhit=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'cd-hit'</span>,<span class="string">'cd-hit'</span>));
+0574     <span class="keyword">end</span>
+0575     
+0576     <span class="keyword">for</span> i=1:numel(missingAligned)
+0577         <span class="comment">%This is checked here because it could be that it is created by a</span>
+0578         <span class="comment">%parallel process. The faw-files are saved as temporary files to</span>
+0579         <span class="comment">%keep track of which files are being worked on</span>
+0580         <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>])) &amp;&amp;<span class="keyword">...</span>
+0581                 ~isfile(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.fa'</span>]))
+0582             <span class="comment">%Check that the multi-FASTA file exists. It should do so since</span>
+0583             <span class="comment">%we are saving empty files as well. Print a warning and</span>
+0584             <span class="comment">%continue if not</span>
+0585             <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'fasta'</span>,[missingAligned{i} <span class="string">'.fa'</span>]))
+0586                 EM=[<span class="string">'WARNING: The multi-FASTA file for '</span> missingAligned{i} <span class="string">' does not exist'</span>];
+0587                 dispEM(EM,false);
+0588                 <span class="keyword">continue</span>;
+0589             <span class="keyword">end</span>
+0590             
+0591             <span class="comment">%If the multi-FASTA file is empty then save an empty aligned</span>
+0592             <span class="comment">%file and continue</span>
+0593             s=dir(fullfile(dataDir,<span class="string">'fasta'</span>,[missingAligned{i} <span class="string">'.fa'</span>]));
+0594             <span class="keyword">if</span> s.bytes&lt;=0
+0595                 fid=fopen(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.fa'</span>]),<span class="string">'w'</span>);
+0596                 fclose(fid);
+0597                 <span class="keyword">continue</span>;
+0598             <span class="keyword">end</span>
+0599             
+0600             <span class="comment">%Create an empty file to prevent other threads from starting to work</span>
+0601             <span class="comment">%on the same alignment</span>
+0602             fid=fopen(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]),<span class="string">'w'</span>);
+0603             fclose(fid);
+0604             
+0605             <span class="comment">%First load the FASTA file, then select up to nSequences</span>
+0606             <span class="comment">%sequences of the most closely related species, apply any</span>
+0607             <span class="comment">%constraints from maxPhylDist, and save it as a temporary file,</span>
+0608             <span class="comment">%and create the model from that</span>
+0609             
+0610             fastaStruct=fastaread(fullfile(dataDir,<span class="string">'fasta'</span>,[missingAligned{i} <span class="string">'.fa'</span>]));
+0611             phylDist=inf(numel(fastaStruct),1);
+0612             <span class="keyword">for</span> j=1:numel(fastaStruct)
+0613                 <span class="comment">%Get the organism abbreviation</span>
+0614                 index=strfind(fastaStruct(j).Header,<span class="string">':'</span>);
+0615                 <span class="keyword">if</span> any(index)
+0616                     abbrev=fastaStruct(j).Header(1:index(1)-1);
+0617                     [~, index]=ismember(abbrev,phylDistStruct.ids);
+0618                     <span class="keyword">if</span> any(index)
+0619                         phylDist(j)=phylDistStruct.distMat(index(1),phylDistId);
+0620                     <span class="keyword">end</span>
+0621                 <span class="keyword">end</span>
+0622             <span class="keyword">end</span>
+0623             
+0624             <span class="comment">%Inf means that it should not be included</span>
+0625             phylDist(phylDist&gt;maxPhylDist)=[];
 0626             
-0627             <span class="comment">%Inf means that it should not be included</span>
-0628             phylDist(phylDist&gt;maxPhylDist)=[];
+0627             <span class="comment">%Sort based on phylDist</span>
+0628             [~, order]=sort(phylDist);
 0629             
-0630             <span class="comment">%Sort based on phylDist</span>
-0631             [~, order]=sort(phylDist);
-0632             
-0633             <span class="comment">%Save the first nSequences hits to a temporary FASTA file</span>
-0634             <span class="keyword">if</span> nSequences&lt;=numel(fastaStruct)
-0635                 fastaStruct=fastaStruct(order(1:nSequences));
-0636             <span class="keyword">else</span>
-0637                 fastaStruct=fastaStruct(order);
-0638             <span class="keyword">end</span>
-0639             
-0640             <span class="comment">%Do the clustering and alignment if there are more than one</span>
-0641             <span class="comment">%sequences, otherwise just save the sequence (or an empty file)</span>
-0642             <span class="keyword">if</span> numel(fastaStruct)&gt;1
-0643                  <span class="keyword">if</span> seqIdentity~=-1
-0644                     cdhitInpCustom=tempname;
-0645                     fastawrite(cdhitInpCustom,fastaStruct);
-0646                     <span class="keyword">if</span> seqIdentity&lt;=1 &amp;&amp; seqIdentity&gt;0.7
-0647                         nparam=<span class="string">'5'</span>;
-0648                     <span class="keyword">elseif</span> seqIdentity&gt;0.6
-0649                         nparam=<span class="string">'4'</span>;
-0650                     <span class="keyword">elseif</span> seqIdentity&gt;0.5
-0651                         nparam=<span class="string">'3'</span>;
-0652                     <span class="keyword">elseif</span> seqIdentity&gt;0.4
-0653                         nparam=<span class="string">'2'</span>;
-0654                     <span class="keyword">else</span>
-0655                         EM=<span class="string">'The provided seqIdentity must be between 0 and 1\n'</span>;
-0656                         dispEM(EM);
-0657                     <span class="keyword">end</span>
-0658                     <span class="keyword">if</span> ispc
-0659                         wslPath.cdhitInpCustom=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(cdhitInpCustom);
-0660                         [status, output]=system([<span class="string">'wsl &quot;'</span> wslPath.cdhit <span class="string">'&quot; -T &quot;'</span> num2str(cores) <span class="string">'&quot; -i &quot;'</span> wslPath.cdhitInpCustom <span class="string">'&quot; -o &quot;'</span> wslPath.tmpFile <span class="string">'&quot; -c &quot;'</span> num2str(seqIdentity) <span class="string">'&quot; -n '</span> nparam <span class="string">' -M 2000'</span>]);
-0661                     <span class="keyword">elseif</span> ismac || isunix
-0662                         [status, output]=system([<span class="string">'&quot;'</span> fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'cd-hit'</span>,[<span class="string">'cd-hit'</span> binEnd]) <span class="string">'&quot; -T &quot;'</span> num2str(cores) <span class="string">'&quot; -i &quot;'</span> cdhitInpCustom <span class="string">'&quot; -o &quot;'</span> tmpFile <span class="string">'&quot; -c &quot;'</span> num2str(seqIdentity) <span class="string">'&quot; -n '</span> nparam <span class="string">' -M 2000'</span>]);
-0663                     <span class="keyword">end</span>
-0664                     <span class="keyword">if</span> status~=0
-0665                         EM=[<span class="string">'Error when performing clustering of '</span> missingAligned{i} <span class="string">':\n'</span> output];
-0666                         dispEM(EM);
-0667                     <span class="keyword">end</span>
-0668                     <span class="comment">%Remove the old tempfile</span>
-0669                     <span class="keyword">if</span> exist(cdhitInpCustom, <span class="string">'file'</span>)
-0670                         delete([cdhitInpCustom <span class="string">'*'</span>]);
-0671                     <span class="keyword">end</span>
-0672                 <span class="keyword">else</span>
-0673                     <span class="comment">%This means that CD-HIT should be skipped since</span>
-0674                     <span class="comment">%seqIdentity is equal to -1</span>
-0675                     fastawrite(tmpFile,fastaStruct);
-0676                 <span class="keyword">end</span>
-0677                 <span class="comment">%Do the alignment for this file</span>
-0678                 <span class="keyword">if</span> ismac
-0679                     [status, output]=system([<span class="string">'&quot;'</span> fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'mafft'</span>,<span class="string">'mafft-mac'</span>,<span class="string">'mafft.bat'</span>) <span class="string">'&quot; --auto --anysymbol --thread &quot;'</span> num2str(cores) <span class="string">'&quot; &quot;'</span> tmpFile <span class="string">'&quot; &gt; &quot;'</span> fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]) <span class="string">'&quot;'</span>]);
-0680                 <span class="keyword">elseif</span> isunix
-0681                     [status, output]=system([<span class="string">'&quot;'</span> fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'mafft'</span>,<span class="string">'mafft-linux64'</span>,<span class="string">'mafft.bat'</span>) <span class="string">'&quot; --auto --anysymbol --thread &quot;'</span> num2str(cores) <span class="string">'&quot; &quot;'</span> tmpFile <span class="string">'&quot; &gt; &quot;'</span> fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]) <span class="string">'&quot;'</span>]);
-0682                 <span class="keyword">elseif</span> ispc
-0683                     wslPath.fawFile=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]));
-0684                     [status, ~]=system([<span class="string">'wsl &quot;'</span> wslPath.mafft <span class="string">'&quot; --auto --anysymbol --progress &quot;'</span> wslPath.mafftOutput <span class="string">'&quot; --thread &quot;'</span> num2str(cores) <span class="string">'&quot; --out &quot;'</span> wslPath.fawFile <span class="string">'&quot; &quot;'</span> wslPath.tmpFile <span class="string">'&quot;'</span>]);
-0685                     output=fileread(mafftOutput);
-0686                     delete(mafftOutput);
-0687                 <span class="keyword">end</span>
-0688                 <span class="keyword">if</span> status~=0
-0689                     <span class="comment">%It could be that alignment failed because only one</span>
-0690                     <span class="comment">%sequence was left after clustering. If that is the</span>
-0691                     <span class="comment">%case, then the clustered file is just copied as 'faw'</span>
-0692                     <span class="comment">%file</span>
-0693                     <span class="keyword">if</span> any(regexp(output,<span class="string">'Only 1 sequence found'</span>))
-0694                         movefile(tmpFile,fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]),<span class="string">'f'</span>);
-0695                     <span class="keyword">else</span>
-0696                         EM=[<span class="string">'Error when performing alignment of '</span> missingAligned{i} <span class="string">':\n'</span> output];
-0697                         dispEM(EM);
-0698                     <span class="keyword">end</span>
-0699                 <span class="keyword">end</span>
-0700                 <span class="comment">%Remove the old tempfile</span>
-0701                 <span class="keyword">if</span> exist(tmpFile, <span class="string">'file'</span>)
-0702                     delete([tmpFile <span class="string">'*'</span>]);
-0703                 <span class="keyword">end</span>
-0704             <span class="keyword">else</span>
-0705                 <span class="comment">%If there is only one sequence then it's not possible to do</span>
-0706                 <span class="comment">%a multiple alignment. Just print the sequence instead. An</span>
-0707                 <span class="comment">%empty file was written previously so that doesn't have to</span>
-0708                 <span class="comment">%be dealt with</span>
-0709                 <span class="keyword">if</span> numel(fastaStruct)==1
-0710                     warnState = warning; <span class="comment">%Save the current warning state</span>
-0711                     warning(<span class="string">'off'</span>,<span class="string">'Bioinfo:fastawrite:AppendToFile'</span>);
-0712                     fastawrite(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]),fastaStruct);
-0713                     warning(warnState) <span class="comment">%Reset warning state to previous settings</span>
-0714                 <span class="keyword">end</span>
-0715             <span class="keyword">end</span>
-0716             <span class="comment">%Move the temporary file to the real one</span>
-0717             movefile(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]),fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.fa'</span>]),<span class="string">'f'</span>);
-0718             
-0719             <span class="comment">%Print the progress every 25 files</span>
-0720             <span class="keyword">if</span> rem(i-1,25) == 0
-0721                 progress=num2str(floor(100*numel(<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'aligned'</span>,<span class="string">'*.fa'</span>)))/numel(KOModel.rxns)));
-0722                 progress=pad(progress,3,<span class="string">'left'</span>);
-0723                 fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\b%s%% complete'</span>,progress);
-0724             <span class="keyword">end</span>
-0725         <span class="keyword">end</span>
-0726     <span class="keyword">end</span>
-0727     fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\bCOMPLETE\n'</span>);
-0728 <span class="keyword">else</span>
-0729     <span class="keyword">if</span> seqIdentity==-1
-0730         fprintf(<span class="string">'Performing the multiple alignment for KEGG Orthology specific protein sets... COMPLETE\n'</span>);
-0731     <span class="keyword">else</span>
-0732         fprintf(<span class="string">'Performing clustering and multiple alignment for KEGG Orthology specific protein sets... COMPLETE\n'</span>);
-0733     <span class="keyword">end</span>
-0734 <span class="keyword">end</span>
-0735 
-0736 <span class="comment">%Check if training of Hidden Markov models should be performed</span>
-0737 missingHMMs=setdiff(KOModel.rxns,[hmmFiles;outFiles]);
-0738 <span class="keyword">if</span> ~isempty(missingHMMs)
-0739     fprintf(<span class="string">'Training the KEGG Orthology specific HMMs...   0%% complete'</span>);
-0740     missingHMMs=missingHMMs(randperm(RandStream.create(<span class="string">'mrg32k3a'</span>,<span class="string">'Seed'</span>,cputime()),numel(missingHMMs)));
-0741     <span class="comment">%Train models for all missing KOs</span>
-0742     <span class="keyword">for</span> i=1:numel(missingHMMs)
-0743         <span class="comment">%This is checked here because it could be that it is created by a</span>
-0744         <span class="comment">%parallel process</span>
-0745         <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmm'</span>])) &amp;&amp; ~isfile(fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmw'</span>]))
-0746             <span class="comment">%Check that the aligned FASTA file exists. It could be that it</span>
-0747             <span class="comment">%is still being worked on by some other instance of the program</span>
-0748             <span class="comment">%(the .faw file should then exist). This should not happen on a</span>
-0749             <span class="comment">%single computer. It doesn't throw an error, because it should</span>
-0750             <span class="comment">%finalize the ones it can</span>
-0751             <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'aligned'</span>,[missingHMMs{i} <span class="string">'.fa'</span>]))
-0752                 EM=[<span class="string">'The aligned FASTA file for '</span> missingHMMs{i} <span class="string">' does not exist'</span>];
-0753                 dispEM(EM,false);
-0754                 <span class="keyword">continue</span>;
-0755             <span class="keyword">end</span>
-0756             
-0757             <span class="comment">%If the multi-FASTA file is empty then save an empty aligned</span>
-0758             <span class="comment">%file and continue</span>
-0759             s=dir(fullfile(dataDir,<span class="string">'aligned'</span>,[missingHMMs{i} <span class="string">'.fa'</span>]));
-0760             <span class="keyword">if</span> s.bytes&lt;=0
-0761                 fid=fopen(fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmm'</span>]),<span class="string">'w'</span>);
-0762                 fclose(fid);
-0763                 <span class="keyword">continue</span>;
-0764             <span class="keyword">end</span>
-0765             <span class="comment">%Create a temporary file to indicate that it is working on the</span>
-0766             <span class="comment">%KO. This is because hmmbuild cannot overwrite existing files</span>
-0767             fid=fopen(fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmw'</span>]),<span class="string">'w'</span>);
-0768             fclose(fid);
-0769             
-0770             <span class="comment">%Create HMM</span>
-0771             [status, output]=system([<span class="string">'&quot;'</span> fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'hmmer'</span>,[<span class="string">'hmmbuild'</span> binEnd]) <span class="string">'&quot; --cpu &quot;'</span> num2str(cores) <span class="string">'&quot; &quot;'</span> fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmm'</span>]) <span class="string">'&quot; &quot;'</span> fullfile(dataDir,<span class="string">'aligned'</span>,[missingHMMs{i} <span class="string">'.fa'</span>]) <span class="string">'&quot;'</span>]);
-0772             <span class="keyword">if</span> status~=0
-0773                 EM=[<span class="string">'Error when training HMM for '</span> missingHMMs{i} <span class="string">':\n'</span> output];
-0774                 dispEM(EM);
-0775             <span class="keyword">end</span>
-0776             
-0777             <span class="comment">%Delete the temporary file</span>
-0778             delete(fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmw'</span>]));
-0779 
-0780             <span class="comment">%Print the progress every 25 files</span>
-0781             <span class="keyword">if</span> rem(i-1,25) == 0
-0782                 progress=num2str(floor(100*numel(<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'hmms'</span>,<span class="string">'*.hmm'</span>)))/numel(KOModel.rxns)));
-0783                 progress=pad(progress,3,<span class="string">'left'</span>);
-0784                 fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\b%s%% complete'</span>,progress);
-0785             <span class="keyword">end</span>
-0786         <span class="keyword">end</span>
-0787     <span class="keyword">end</span>
-0788     fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\bCOMPLETE\n'</span>);
-0789 <span class="keyword">else</span>
-0790     fprintf(<span class="string">'Training the KEGG Orthology specific HMMs... COMPLETE\n'</span>);
-0791 <span class="keyword">end</span>
-0792 
-0793 <span class="comment">%Check which new .out files that should be generated. Check if training of</span>
-0794 <span class="comment">%Hidden Markov models should be performed</span>
-0795 missingOUT=setdiff(KOModel.rxns,outFiles);
-0796 <span class="keyword">if</span> ~isempty(missingOUT)
-0797     fprintf(<span class="string">'Querying the user-specified FASTA file against the KEGG Orthology specific HMMs...   0%% complete'</span>);
-0798     missingOUT=missingOUT(randperm(RandStream.create(<span class="string">'mrg32k3a'</span>,<span class="string">'Seed'</span>,cputime()),numel(missingOUT)));
-0799     <span class="keyword">for</span> i=1:numel(missingOUT)
-0800         <span class="comment">%This is checked here because it could be that it is created by a</span>
-0801         <span class="comment">%parallel process</span>
-0802         <span class="keyword">if</span> ~isfile(fullfile(outDir,[missingOUT{i} <span class="string">'.out'</span>]))
-0803             <span class="comment">%Check that the HMM file exists. It should do so since %we are</span>
-0804             <span class="comment">%saving empty files as well. Print a warning and continue if</span>
-0805             <span class="comment">%not</span>
-0806             <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'hmms'</span>,[missingOUT{i} <span class="string">'.hmm'</span>]))
-0807                 EM=[<span class="string">'The HMM file for '</span> missingOUT{i} <span class="string">' does not exist'</span>];
-0808                 dispEM(EM,false);
-0809                 <span class="keyword">continue</span>;
-0810             <span class="keyword">end</span>
-0811             
-0812             <span class="comment">%Save an empty file to prevent several threads working on the</span>
-0813             <span class="comment">%same file</span>
-0814             fid=fopen(fullfile(outDir,[missingOUT{i} <span class="string">'.out'</span>]),<span class="string">'w'</span>);
-0815             fclose(fid);
-0816             
-0817             <span class="comment">%If the HMM file is empty then save an out file and continue</span>
-0818             s=dir(fullfile(dataDir,<span class="string">'hmms'</span>,[missingOUT{i} <span class="string">'.hmm'</span>]));
-0819             <span class="keyword">if</span> s.bytes&lt;=0
-0820                 <span class="keyword">continue</span>;
-0821             <span class="keyword">end</span>
-0822             
-0823             <span class="comment">%Check each gene in the input file against this model</span>
-0824             [status, output]=system([<span class="string">'&quot;'</span> fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'hmmer'</span>,[<span class="string">'hmmsearch'</span> binEnd]) <span class="string">'&quot; --cpu &quot;'</span> num2str(cores) <span class="string">'&quot; &quot;'</span> fullfile(dataDir,<span class="string">'hmms'</span>,[missingOUT{i} <span class="string">'.hmm'</span>]) <span class="string">'&quot; &quot;'</span> fastaFile <span class="string">'&quot;'</span>]);
-0825             <span class="keyword">if</span> status~=0
-0826                 EM=[<span class="string">'Error when querying HMM for '</span> missingOUT{i} <span class="string">':\n'</span> output];
-0827                 dispEM(EM);
-0828             <span class="keyword">end</span>
-0829             
-0830             <span class="comment">%Save the output to a file</span>
-0831             fid=fopen(fullfile(outDir,[missingOUT{i} <span class="string">'.out'</span>]),<span class="string">'w'</span>);
-0832             fwrite(fid,output);
-0833             fclose(fid);
-0834             
-0835             <span class="comment">%Print the progress every 25 files</span>
-0836             <span class="keyword">if</span> rem(i-1,25) == 0
-0837                 progress=num2str(floor(100*numel(<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(outDir,<span class="string">'*.out'</span>)))/numel(KOModel.rxns)));
-0838                 progress=pad(progress,3,<span class="string">'left'</span>);
-0839                 fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\b%s%% complete'</span>,progress);
-0840             <span class="keyword">end</span>
-0841         <span class="keyword">end</span>
-0842     <span class="keyword">end</span>
-0843     fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\bCOMPLETE\n'</span>);
-0844 <span class="keyword">else</span>
-0845     fprintf(<span class="string">'Querying the user-specified FASTA file against the KEGG Orthology specific HMMs... COMPLETE\n'</span>);
-0846 <span class="keyword">end</span>
+0630             <span class="comment">%Save the first nSequences hits to a temporary FASTA file</span>
+0631             <span class="keyword">if</span> nSequences&lt;=numel(fastaStruct)
+0632                 fastaStruct=fastaStruct(order(1:nSequences));
+0633             <span class="keyword">else</span>
+0634                 fastaStruct=fastaStruct(order);
+0635             <span class="keyword">end</span>
+0636             
+0637             <span class="comment">%Do the clustering and alignment if there is more than one</span>
+0638             <span class="comment">%sequence, otherwise just save the sequence (or an empty file)</span>
+0639             <span class="keyword">if</span> numel(fastaStruct)&gt;1
+0640                  <span class="keyword">if</span> seqIdentity~=-1
+0641                     cdhitInpCustom=tempname;
+0642                     fastawrite(cdhitInpCustom,fastaStruct);
+0643                     <span class="keyword">if</span> seqIdentity&lt;=1 &amp;&amp; seqIdentity&gt;0.7
+0644                         nparam=<span class="string">'5'</span>;
+0645                     <span class="keyword">elseif</span> seqIdentity&gt;0.6
+0646                         nparam=<span class="string">'4'</span>;
+0647                     <span class="keyword">elseif</span> seqIdentity&gt;0.5
+0648                         nparam=<span class="string">'3'</span>;
+0649                     <span class="keyword">elseif</span> seqIdentity&gt;0.4
+0650                         nparam=<span class="string">'2'</span>;
+0651                     <span class="keyword">else</span>
+0652                         EM=<span class="string">'The provided seqIdentity must be between 0 and 1\n'</span>;
+0653                         dispEM(EM);
+0654                     <span class="keyword">end</span>
+0655                     <span class="keyword">if</span> ispc
+0656                         wslPath.cdhitInpCustom=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(cdhitInpCustom);
+0657                         [status, output]=system([<span class="string">'wsl &quot;'</span> wslPath.cdhit <span class="string">'&quot; -T &quot;'</span> num2str(cores) <span class="string">'&quot; -i &quot;'</span> wslPath.cdhitInpCustom <span class="string">'&quot; -o &quot;'</span> wslPath.tmpFile <span class="string">'&quot; -c &quot;'</span> num2str(seqIdentity) <span class="string">'&quot; -n '</span> nparam <span class="string">' -M 2000'</span>]);
+0658                     <span class="keyword">elseif</span> ismac || isunix
+0659                         [status, output]=system([<span class="string">'&quot;'</span> fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'cd-hit'</span>,[<span class="string">'cd-hit'</span> binEnd]) <span class="string">'&quot; -T &quot;'</span> num2str(cores) <span class="string">'&quot; -i &quot;'</span> cdhitInpCustom <span class="string">'&quot; -o &quot;'</span> tmpFile <span class="string">'&quot; -c &quot;'</span> num2str(seqIdentity) <span class="string">'&quot; -n '</span> nparam <span class="string">' -M 2000'</span>]);
+0660                     <span class="keyword">end</span>
+0661                     <span class="keyword">if</span> status~=0
+0662                         EM=[<span class="string">'Error when performing clustering of '</span> missingAligned{i} <span class="string">':\n'</span> output];
+0663                         dispEM(EM);
+0664                     <span class="keyword">end</span>
+0665                     <span class="comment">%Remove the old tempfile</span>
+0666                     <span class="keyword">if</span> exist(cdhitInpCustom, <span class="string">'file'</span>)
+0667                         delete([cdhitInpCustom <span class="string">'*'</span>]);
+0668                     <span class="keyword">end</span>
+0669                 <span class="keyword">else</span>
+0670                     <span class="comment">%This means that CD-HIT should be skipped since</span>
+0671                     <span class="comment">%seqIdentity is equal to -1</span>
+0672                     fastawrite(tmpFile,fastaStruct);
+0673                 <span class="keyword">end</span>
+0674                 <span class="comment">%Do the alignment for this file</span>
+0675                 <span class="keyword">if</span> ismac
+0676                     [status, output]=system([<span class="string">'&quot;'</span> fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'mafft'</span>,<span class="string">'mafft-mac'</span>,<span class="string">'mafft.bat'</span>) <span class="string">'&quot; --auto --anysymbol --thread &quot;'</span> num2str(cores) <span class="string">'&quot; &quot;'</span> tmpFile <span class="string">'&quot; &gt; &quot;'</span> fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]) <span class="string">'&quot;'</span>]);
+0677                 <span class="keyword">elseif</span> isunix
+0678                     [status, output]=system([<span class="string">'&quot;'</span> fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'mafft'</span>,<span class="string">'mafft-linux64'</span>,<span class="string">'mafft.bat'</span>) <span class="string">'&quot; --auto --anysymbol --thread &quot;'</span> num2str(cores) <span class="string">'&quot; &quot;'</span> tmpFile <span class="string">'&quot; &gt; &quot;'</span> fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]) <span class="string">'&quot;'</span>]);
+0679                 <span class="keyword">elseif</span> ispc
+0680                     wslPath.fawFile=<a href="getWSLpath.html" class="code" title="function path=getWSLpath(path)">getWSLpath</a>(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]));
+0681                     [status, ~]=system([<span class="string">'wsl &quot;'</span> wslPath.mafft <span class="string">'&quot; --auto --anysymbol --progress &quot;'</span> wslPath.mafftOutput <span class="string">'&quot; --thread &quot;'</span> num2str(cores) <span class="string">'&quot; --out &quot;'</span> wslPath.fawFile <span class="string">'&quot; &quot;'</span> wslPath.tmpFile <span class="string">'&quot;'</span>]);
+0682                     output=fileread(mafftOutput);
+0683                     delete(mafftOutput);
+0684                 <span class="keyword">end</span>
+0685                 <span class="keyword">if</span> status~=0
+0686                     <span class="comment">%It could be that alignment failed because only one</span>
+0687                     <span class="comment">%sequence was left after clustering. If that is the</span>
+0688                     <span class="comment">%case, then the clustered file is just copied as 'faw'</span>
+0689                     <span class="comment">%file</span>
+0690                     <span class="keyword">if</span> any(regexp(output,<span class="string">'Only 1 sequence found'</span>))
+0691                         movefile(tmpFile,fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]),<span class="string">'f'</span>);
+0692                     <span class="keyword">else</span>
+0693                         EM=[<span class="string">'Error when performing alignment of '</span> missingAligned{i} <span class="string">':\n'</span> output];
+0694                         dispEM(EM);
+0695                     <span class="keyword">end</span>
+0696                 <span class="keyword">end</span>
+0697                 <span class="comment">%Remove the old tempfile</span>
+0698                 <span class="keyword">if</span> exist(tmpFile, <span class="string">'file'</span>)
+0699                     delete([tmpFile <span class="string">'*'</span>]);
+0700                 <span class="keyword">end</span>
+0701             <span class="keyword">else</span>
+0702                 <span class="comment">%If there is only one sequence then it's not possible to do</span>
+0703                 <span class="comment">%a multiple alignment. Just print the sequence instead. An</span>
+0704                 <span class="comment">%empty file was written previously so that doesn't have to</span>
+0705                 <span class="comment">%be dealt with</span>
+0706                 <span class="keyword">if</span> numel(fastaStruct)==1
+0707                     warnState = warning; <span class="comment">%Save the current warning state</span>
+0708                     warning(<span class="string">'off'</span>,<span class="string">'Bioinfo:fastawrite:AppendToFile'</span>);
+0709                     fastawrite(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]),fastaStruct);
+0710                     warning(warnState) <span class="comment">%Reset warning state to previous settings</span>
+0711                 <span class="keyword">end</span>
+0712             <span class="keyword">end</span>
+0713             <span class="comment">%Move the temporary file to the real one</span>
+0714             movefile(fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.faw'</span>]),fullfile(dataDir,<span class="string">'aligned'</span>,[missingAligned{i} <span class="string">'.fa'</span>]),<span class="string">'f'</span>);
+0715             
+0716             <span class="comment">%Print the progress every 25 files</span>
+0717             <span class="keyword">if</span> rem(i-1,25) == 0
+0718                 progress=num2str(floor(100*numel(<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'aligned'</span>,<span class="string">'*.fa'</span>)))/numel(KOModel.rxns)));
+0719                 progress=pad(progress,3,<span class="string">'left'</span>);
+0720                 fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\b%s%% complete'</span>,progress);
+0721             <span class="keyword">end</span>
+0722         <span class="keyword">end</span>
+0723     <span class="keyword">end</span>
+0724     fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\bCOMPLETE\n'</span>);
+0725 <span class="keyword">else</span>
+0726     <span class="keyword">if</span> seqIdentity==-1
+0727         fprintf(<span class="string">'Performing the multiple alignment for KEGG Orthology specific protein sets... COMPLETE\n'</span>);
+0728     <span class="keyword">else</span>
+0729         fprintf(<span class="string">'Performing clustering and multiple alignment for KEGG Orthology specific protein sets... COMPLETE\n'</span>);
+0730     <span class="keyword">end</span>
+0731 <span class="keyword">end</span>
+0732 
+0733 <span class="comment">%Check if training of Hidden Markov models should be performed</span>
+0734 missingHMMs=setdiff(KOModel.rxns,[hmmFiles;outFiles]);
+0735 <span class="keyword">if</span> ~isempty(missingHMMs)
+0736     fprintf(<span class="string">'Training the KEGG Orthology specific HMMs...   0%% complete'</span>);
+0737     missingHMMs=missingHMMs(randperm(RandStream.create(<span class="string">'mrg32k3a'</span>,<span class="string">'Seed'</span>,cputime()),numel(missingHMMs)));
+0738     <span class="comment">%Train models for all missing KOs</span>
+0739     <span class="keyword">for</span> i=1:numel(missingHMMs)
+0740         <span class="comment">%This is checked here because it could be that it is created by a</span>
+0741         <span class="comment">%parallel process</span>
+0742         <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmm'</span>])) &amp;&amp; ~isfile(fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmw'</span>]))
+0743             <span class="comment">%Check that the aligned FASTA file exists. It could be that it</span>
+0744             <span class="comment">%is still being worked on by some other instance of the program</span>
+0745             <span class="comment">%(the .faw file should then exist). This should not happen on a</span>
+0746             <span class="comment">%single computer. It doesn't throw an error, because it should</span>
+0747             <span class="comment">%finalize the ones it can</span>
+0748             <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'aligned'</span>,[missingHMMs{i} <span class="string">'.fa'</span>]))
+0749                 EM=[<span class="string">'The aligned FASTA file for '</span> missingHMMs{i} <span class="string">' does not exist'</span>];
+0750                 dispEM(EM,false);
+0751                 <span class="keyword">continue</span>;
+0752             <span class="keyword">end</span>
+0753             
+0754             <span class="comment">%If the aligned FASTA file is empty then save an empty HMM file</span>
+0755             <span class="comment">%and continue</span>
+0756             s=dir(fullfile(dataDir,<span class="string">'aligned'</span>,[missingHMMs{i} <span class="string">'.fa'</span>]));
+0757             <span class="keyword">if</span> s.bytes&lt;=0
+0758                 fid=fopen(fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmm'</span>]),<span class="string">'w'</span>);
+0759                 fclose(fid);
+0760                 <span class="keyword">continue</span>;
+0761             <span class="keyword">end</span>
+0762             <span class="comment">%Create a temporary file to indicate that it is working on the</span>
+0763             <span class="comment">%KO. This is because hmmbuild cannot overwrite existing files</span>
+0764             fid=fopen(fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmw'</span>]),<span class="string">'w'</span>);
+0765             fclose(fid);
+0766             
+0767             <span class="comment">%Create HMM</span>
+0768             [status, output]=system([<span class="string">'&quot;'</span> fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'hmmer'</span>,[<span class="string">'hmmbuild'</span> binEnd]) <span class="string">'&quot; --cpu &quot;'</span> num2str(cores) <span class="string">'&quot; &quot;'</span> fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmm'</span>]) <span class="string">'&quot; &quot;'</span> fullfile(dataDir,<span class="string">'aligned'</span>,[missingHMMs{i} <span class="string">'.fa'</span>]) <span class="string">'&quot;'</span>]);
+0769             <span class="keyword">if</span> status~=0
+0770                 EM=[<span class="string">'Error when training HMM for '</span> missingHMMs{i} <span class="string">':\n'</span> output];
+0771                 dispEM(EM);
+0772             <span class="keyword">end</span>
+0773             
+0774             <span class="comment">%Delete the temporary file</span>
+0775             delete(fullfile(dataDir,<span class="string">'hmms'</span>,[missingHMMs{i} <span class="string">'.hmw'</span>]));
+0776 
+0777             <span class="comment">%Print the progress every 25 files</span>
+0778             <span class="keyword">if</span> rem(i-1,25) == 0
+0779                 progress=num2str(floor(100*numel(<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(dataDir,<span class="string">'hmms'</span>,<span class="string">'*.hmm'</span>)))/numel(KOModel.rxns)));
+0780                 progress=pad(progress,3,<span class="string">'left'</span>);
+0781                 fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\b%s%% complete'</span>,progress);
+0782             <span class="keyword">end</span>
+0783         <span class="keyword">end</span>
+0784     <span class="keyword">end</span>
+0785     fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\bCOMPLETE\n'</span>);
+0786 <span class="keyword">else</span>
+0787     fprintf(<span class="string">'Training the KEGG Orthology specific HMMs... COMPLETE\n'</span>);
+0788 <span class="keyword">end</span>
+0789 
+0790 <span class="comment">%Check which new .out files should be generated, i.e. which of the KEGG</span>
+0791 <span class="comment">%Orthology specific HMMs still have to be queried against the FASTA file</span>
+0792 missingOUT=setdiff(KOModel.rxns,outFiles);
+0793 <span class="keyword">if</span> ~isempty(missingOUT)
+0794     fprintf(<span class="string">'Querying the user-specified FASTA file against the KEGG Orthology specific HMMs...   0%% complete'</span>);
+0795     missingOUT=missingOUT(randperm(RandStream.create(<span class="string">'mrg32k3a'</span>,<span class="string">'Seed'</span>,cputime()),numel(missingOUT)));
+0796     <span class="keyword">for</span> i=1:numel(missingOUT)
+0797         <span class="comment">%This is checked here because it could be that it is created by a</span>
+0798         <span class="comment">%parallel process</span>
+0799         <span class="keyword">if</span> ~isfile(fullfile(outDir,[missingOUT{i} <span class="string">'.out'</span>]))
+0800             <span class="comment">%Check that the HMM file exists. It should do so since we are</span>
+0801             <span class="comment">%saving empty files as well. Print a warning and continue if</span>
+0802             <span class="comment">%not</span>
+0803             <span class="keyword">if</span> ~isfile(fullfile(dataDir,<span class="string">'hmms'</span>,[missingOUT{i} <span class="string">'.hmm'</span>]))
+0804                 EM=[<span class="string">'The HMM file for '</span> missingOUT{i} <span class="string">' does not exist'</span>];
+0805                 dispEM(EM,false);
+0806                 <span class="keyword">continue</span>;
+0807             <span class="keyword">end</span>
+0808             
+0809             <span class="comment">%Save an empty file to prevent several threads working on the</span>
+0810             <span class="comment">%same file</span>
+0811             fid=fopen(fullfile(outDir,[missingOUT{i} <span class="string">'.out'</span>]),<span class="string">'w'</span>);
+0812             fclose(fid);
+0813             
+0814             <span class="comment">%If the HMM file is empty then save an out file and continue</span>
+0815             s=dir(fullfile(dataDir,<span class="string">'hmms'</span>,[missingOUT{i} <span class="string">'.hmm'</span>]));
+0816             <span class="keyword">if</span> s.bytes&lt;=0
+0817                 <span class="keyword">continue</span>;
+0818             <span class="keyword">end</span>
+0819             
+0820             <span class="comment">%Check each gene in the input file against this model</span>
+0821             [status, output]=system([<span class="string">'&quot;'</span> fullfile(ravenPath,<span class="string">'software'</span>,<span class="string">'hmmer'</span>,[<span class="string">'hmmsearch'</span> binEnd]) <span class="string">'&quot; --cpu &quot;'</span> num2str(cores) <span class="string">'&quot; &quot;'</span> fullfile(dataDir,<span class="string">'hmms'</span>,[missingOUT{i} <span class="string">'.hmm'</span>]) <span class="string">'&quot; &quot;'</span> fastaFile <span class="string">'&quot;'</span>]);
+0822             <span class="keyword">if</span> status~=0
+0823                 EM=[<span class="string">'Error when querying HMM for '</span> missingOUT{i} <span class="string">':\n'</span> output];
+0824                 dispEM(EM);
+0825             <span class="keyword">end</span>
+0826             
+0827             <span class="comment">%Save the output to a file</span>
+0828             fid=fopen(fullfile(outDir,[missingOUT{i} <span class="string">'.out'</span>]),<span class="string">'w'</span>);
+0829             fwrite(fid,output);
+0830             fclose(fid);
+0831             
+0832             <span class="comment">%Print the progress every 25 files</span>
+0833             <span class="keyword">if</span> rem(i-1,25) == 0
+0834                 progress=num2str(floor(100*numel(<a href="#_sub1" class="code" title="subfunction files=listFiles(directory)">listFiles</a>(fullfile(outDir,<span class="string">'*.out'</span>)))/numel(KOModel.rxns)));
+0835                 progress=pad(progress,3,<span class="string">'left'</span>);
+0836                 fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\b%s%% complete'</span>,progress);
+0837             <span class="keyword">end</span>
+0838         <span class="keyword">end</span>
+0839     <span class="keyword">end</span>
+0840     fprintf(<span class="string">'\b\b\b\b\b\b\b\b\b\b\b\b\bCOMPLETE\n'</span>);
+0841 <span class="keyword">else</span>
+0842     fprintf(<span class="string">'Querying the user-specified FASTA file against the KEGG Orthology specific HMMs... COMPLETE\n'</span>);
+0843 <span class="keyword">end</span>
+0844 
+0845 
+0846 <span class="comment">%***Begin retrieving the output and putting together the resulting model</span>
 0847 
-0848 
-0849 <span class="comment">%***Begin retrieving the output and putting together the resulting model</span>
-0850 
-0851 fprintf(<span class="string">'Parsing the HMM search results... '</span>);
-0852 <span class="comment">%Retrieve matched genes from the HMMs</span>
-0853 koGeneMat=zeros(numel(KOModel.rxns),3000); <span class="comment">%Make room for 3000 genes</span>
-0854 genes=cell(3000,1);
-0855 <span class="comment">%Store the best score for a gene in a hash list (since it will be searching</span>
-0856 <span class="comment">%many times)</span>
-0857 hTable = java.util.Hashtable;
-0858 
-0859 geneCounter=0;
-0860 <span class="keyword">for</span> i=1:numel(KOModel.rxns)
-0861     <span class="keyword">if</span> exist(fullfile(outDir,[KOModel.rxns{i} <span class="string">'.out'</span>]), <span class="string">'file'</span>)
-0862         fid=fopen(fullfile(outDir,[KOModel.rxns{i} <span class="string">'.out'</span>]),<span class="string">'r'</span>);
-0863         beginMatches=false;
-0864         <span class="keyword">while</span> 1
-0865             <span class="comment">%Get the next line</span>
-0866             tline = fgetl(fid);
-0867             
-0868             <span class="comment">%Abort at end of file</span>
-0869             <span class="keyword">if</span> ~ischar(tline)
-0870                 <span class="keyword">break</span>;
-0871             <span class="keyword">end</span>
-0872             
-0873             <span class="keyword">if</span> and(beginMatches,strcmp(tline,<span class="string">'  ------ inclusion threshold ------'</span>))
-0874                 <span class="keyword">break</span>;
-0875             <span class="keyword">end</span>
-0876             
-0877             <span class="keyword">if</span> beginMatches==false
-0878                 <span class="comment">%This is how the listing of matches begins</span>
-0879                 <span class="keyword">if</span> any(strfind(tline,<span class="string">'E-value '</span>))
-0880                     <span class="comment">%Read one more line that is only padding</span>
-0881                     tline = fgetl(fid);
-0882                     beginMatches=true;
-0883                 <span class="keyword">end</span>
-0884             <span class="keyword">else</span>
-0885                 <span class="comment">%If matches should be read</span>
-0886                 <span class="keyword">if</span> ~strcmp(tline,<span class="string">'   [No hits detected that satisfy reporting thresholds]'</span>) &amp;&amp; ~isempty(tline)
-0887                     elements=regexp(tline,<span class="string">' '</span>,<span class="string">'split'</span>);
-0888                     elements=elements(cellfun(@any,elements));
-0889                     
-0890                     <span class="comment">%Check if the match is below the treshhold</span>
-0891                     score=str2double(elements{1});
-0892                     gene=elements{9};
-0893                     <span class="keyword">if</span> score&lt;=cutOff
-0894                         <span class="comment">%If the score is exactly 0, change it to a very</span>
-0895                         <span class="comment">%small value to avoid NaN</span>
-0896                         <span class="keyword">if</span> score==0
-0897                             score=10^-250;
-0898                         <span class="keyword">end</span>
-0899                         <span class="comment">%Check if the gene is added already and, is so, get</span>
-0900                         <span class="comment">%the best score for it</span>
-0901                         I=hTable.get(gene);
-0902                         <span class="keyword">if</span> any(I)
-0903                             koGeneMat(i,I)=score;
-0904                         <span class="keyword">else</span>
-0905                             geneCounter=geneCounter+1;
-0906                             <span class="comment">%The gene was not present yet so add it</span>
-0907                             hTable.put(gene,geneCounter);
-0908                             genes{geneCounter}=gene;
-0909                             koGeneMat(i,geneCounter)=score;
-0910                         <span class="keyword">end</span>
-0911                     <span class="keyword">end</span>
-0912                 <span class="keyword">else</span>
-0913                     <span class="keyword">break</span>;
-0914                 <span class="keyword">end</span>
-0915             <span class="keyword">end</span>
-0916         <span class="keyword">end</span>
-0917         fclose(fid);
-0918     <span class="keyword">end</span>
-0919 <span class="keyword">end</span>
-0920 fprintf(<span class="string">'COMPLETE\n'</span>);
+0848 fprintf(<span class="string">'Parsing the HMM search results... '</span>);
+0849 <span class="comment">%Retrieve matched genes from the HMMs</span>
+0850 koGeneMat=zeros(numel(KOModel.rxns),3000); <span class="comment">%Make room for 3000 genes</span>
+0851 genes=cell(3000,1);
+0852 <span class="comment">%Store the best score for a gene in a hash list (since it will be searching</span>
+0853 <span class="comment">%many times)</span>
+0854 hTable = java.util.Hashtable;
+0855 
+0856 geneCounter=0;
+0857 <span class="keyword">for</span> i=1:numel(KOModel.rxns)
+0858     <span class="keyword">if</span> exist(fullfile(outDir,[KOModel.rxns{i} <span class="string">'.out'</span>]), <span class="string">'file'</span>)
+0859         fid=fopen(fullfile(outDir,[KOModel.rxns{i} <span class="string">'.out'</span>]),<span class="string">'r'</span>);
+0860         beginMatches=false;
+0861         <span class="keyword">while</span> 1
+0862             <span class="comment">%Get the next line</span>
+0863             tline = fgetl(fid);
+0864             
+0865             <span class="comment">%Abort at end of file</span>
+0866             <span class="keyword">if</span> ~ischar(tline)
+0867                 <span class="keyword">break</span>;
+0868             <span class="keyword">end</span>
+0869             
+0870             <span class="keyword">if</span> and(beginMatches,strcmp(tline,<span class="string">'  ------ inclusion threshold ------'</span>))
+0871                 <span class="keyword">break</span>;
+0872             <span class="keyword">end</span>
+0873             
+0874             <span class="keyword">if</span> beginMatches==false
+0875                 <span class="comment">%This is how the listing of matches begins</span>
+0876                 <span class="keyword">if</span> any(strfind(tline,<span class="string">'E-value '</span>))
+0877                     <span class="comment">%Read one more line that is only padding</span>
+0878                     tline = fgetl(fid);
+0879                     beginMatches=true;
+0880                 <span class="keyword">end</span>
+0881             <span class="keyword">else</span>
+0882                 <span class="comment">%If matches should be read</span>
+0883                 <span class="keyword">if</span> ~strcmp(tline,<span class="string">'   [No hits detected that satisfy reporting thresholds]'</span>) &amp;&amp; ~isempty(tline)
+0884                     elements=regexp(tline,<span class="string">' '</span>,<span class="string">'split'</span>);
+0885                     elements=elements(cellfun(@any,elements));
+0886                     
+0887                     <span class="comment">%Check if the match is below the treshhold</span>
+0888                     score=str2double(elements{1});
+0889                     gene=elements{9};
+0890                     <span class="keyword">if</span> score&lt;=cutOff
+0891                         <span class="comment">%If the score is exactly 0, change it to a very</span>
+0892                         <span class="comment">%small value to avoid NaN</span>
+0893                         <span class="keyword">if</span> score==0
+0894                             score=10^-250;
+0895                         <span class="keyword">end</span>
+0896                         <span class="comment">%Check if the gene is added already and, is so, get</span>
+0897                         <span class="comment">%the best score for it</span>
+0898                         I=hTable.get(gene);
+0899                         <span class="keyword">if</span> any(I)
+0900                             koGeneMat(i,I)=score;
+0901                         <span class="keyword">else</span>
+0902                             geneCounter=geneCounter+1;
+0903                             <span class="comment">%The gene was not present yet so add it</span>
+0904                             hTable.put(gene,geneCounter);
+0905                             genes{geneCounter}=gene;
+0906                             koGeneMat(i,geneCounter)=score;
+0907                         <span class="keyword">end</span>
+0908                     <span class="keyword">end</span>
+0909                 <span class="keyword">else</span>
+0910                     <span class="keyword">break</span>;
+0911                 <span class="keyword">end</span>
+0912             <span class="keyword">end</span>
+0913         <span class="keyword">end</span>
+0914         fclose(fid);
+0915     <span class="keyword">end</span>
+0916 <span class="keyword">end</span>
+0917 fprintf(<span class="string">'COMPLETE\n'</span>);
+0918 
+0919 fprintf(<span class="string">'Removing gene, KEGG Orthology associations below minScoreRatioKO, minScoreRatioG... '</span>);
+0920 koGeneMat=koGeneMat(:,1:geneCounter);
 0921 
-0922 fprintf(<span class="string">'Removing gene, KEGG Orthology associations below minScoreRatioKO, minScoreRatioG... '</span>);
-0923 koGeneMat=koGeneMat(:,1:geneCounter);
-0924 
-0925 <span class="comment">%Remove the genes for each KO that are below minScoreRatioKO.</span>
-0926 <span class="keyword">for</span> i=1:size(koGeneMat,1)
-0927     J=find(koGeneMat(i,:));
-0928     <span class="keyword">if</span> any(J)
-0929         koGeneMat(i,J(log(koGeneMat(i,J))/log(min(koGeneMat(i,J)))&lt;minScoreRatioKO))=0;
-0930     <span class="keyword">end</span>
-0931 <span class="keyword">end</span>
-0932 
-0933 <span class="comment">%Remove the KOs for each gene that are below minScoreRatioG</span>
-0934 <span class="keyword">for</span> i=1:size(koGeneMat,2)
-0935     J=find(koGeneMat(:,i));
-0936     <span class="keyword">if</span> any(J)
-0937         koGeneMat(J(log(koGeneMat(J,i))/log(min(koGeneMat(J,i)))&lt;minScoreRatioG),i)=0;
-0938     <span class="keyword">end</span>
-0939 <span class="keyword">end</span>
-0940 fprintf(<span class="string">'COMPLETE\n'</span>);
-0941 
-0942 fprintf(<span class="string">'Adding gene annotations to the model... '</span>);
-0943 <span class="comment">%Create the new model</span>
-0944 model.genes=genes(1:geneCounter);
-0945 model.grRules=cell(numel(model.rxns),1);
-0946 model.grRules(:)={<span class="string">''</span>};
-0947 model.rxnGeneMat=sparse(numel(model.rxns),numel(model.genes));
-0948 
-0949 <span class="comment">%Loop through the reactions and add the corresponding genes</span>
-0950 <span class="keyword">for</span> i=1:numel(model.rxns)
-0951     <span class="keyword">if</span> isstruct(model.rxnMiriams{i})
-0952         <span class="comment">%Get all KOs</span>
-0953         I=find(strcmpi(model.rxnMiriams{i}.name,<span class="string">'kegg.orthology'</span>));
-0954         KOs=model.rxnMiriams{i}.value(I);
-0955         <span class="comment">%Find the KOs and the corresponding genes</span>
-0956         J=ismember(KOModel.rxns,KOs);
-0957         [~, K]=find(koGeneMat(J,:));
-0958         
-0959         <span class="keyword">if</span> any(K)
-0960             model.rxnGeneMat(i,K)=1;
-0961             <span class="comment">%Also delete KOs for which no genes were found. If no genes at</span>
-0962             <span class="comment">%all were matched to the reaction it will be deleted later</span>
-0963             L=sum(koGeneMat(J,:),2)==0;
-0964             model.rxnMiriams{i}.value(I(L))=[];
-0965             model.rxnMiriams{i}.name(I(L))=[];
-0966         <span class="keyword">end</span>
-0967     <span class="keyword">end</span>
-0968 <span class="keyword">end</span>
-0969 fprintf(<span class="string">'COMPLETE\n'</span>);
-0970 
-0971 <span class="comment">%Find and delete all reactions without genes. This also removes genes that</span>
-0972 <span class="comment">%are not used (which could happen because minScoreRatioG and</span>
-0973 <span class="comment">%minScoreRatioKO). If keepSpontaneous==true, the spontaneous reactions</span>
-0974 <span class="comment">%without genes are kept in the model. Spontaneous reactions with original</span>
-0975 <span class="comment">%gene associations are treated in the same way, like the rest of the</span>
-0976 <span class="comment">%reactions - if gene associations were removed during HMM search, such</span>
-0977 <span class="comment">%reactions are deleted from the model</span>
-0978 <span class="keyword">if</span> keepSpontaneous==true
-0979     <span class="comment">%Not the most comprise way to delete reactions without genes, but this</span>
-0980     <span class="comment">%makes the code easier to understand. Firstly the non-spontaneous</span>
-0981     <span class="comment">%reactions without genes are removed. After that, the second deletion</span>
-0982     <span class="comment">%step removes spontaneous reactions, which had gene associations before</span>
-0983     <span class="comment">%HMM search, but no longer have after it</span>
-0984     fprintf(<span class="string">'Removing non-spontaneous reactions which after HMM search no longer have GPR rules... '</span>);
-0985     I=~any(model.rxnGeneMat,2)&amp;~ismember(model.rxns,isSpontaneous);
-0986     model=removeReactions(model,I,true,true);
-0987     I=~any(model.rxnGeneMat,2)&amp;ismember(model.rxns,spontRxnsWithGenes);
-0988     model=removeReactions(model,I,true,true);
-0989 <span class="keyword">else</span>
-0990     <span class="comment">%Just simply check for any new reactions without genes and remove</span>
-0991     <span class="comment">%it</span>
-0992     fprintf(<span class="string">'Removing reactions which after HMM search no longer have GPR rules... '</span>);
-0993     I=~any(model.rxnGeneMat,2);
-0994     model=removeReactions(model,I,true,true);
-0995 <span class="keyword">end</span>
-0996 fprintf(<span class="string">'COMPLETE\n'</span>);
-0997 
-0998 fprintf(<span class="string">'Constructing GPR rules and finalizing the model... '</span>);
-0999 <span class="comment">%Add the gene associations as 'or'</span>
-1000 <span class="keyword">for</span> i=1:numel(model.rxns)
-1001     <span class="comment">%Find the involved genes</span>
-1002     I=find(model.rxnGeneMat(i,:));
-1003     <span class="keyword">if</span> any(I)
-1004         model.grRules{i}=[<span class="string">'('</span> model.genes{I(1)}];
-1005         <span class="keyword">for</span> j=2:numel(I)
-1006             model.grRules{i}=[model.grRules{i} <span class="string">' or '</span> model.genes{I(j)}];
-1007         <span class="keyword">end</span>
-1008         model.grRules{i}=[model.grRules{i} <span class="string">')'</span>];
-1009     <span class="keyword">end</span>
-1010 <span class="keyword">end</span>
-1011 
-1012 <span class="comment">%Fix grRules and reconstruct rxnGeneMat</span>
-1013 [grRules,rxnGeneMat] = standardizeGrRules(model,false); <span class="comment">%Give detailed output</span>
-1014 model.grRules = grRules;
-1015 model.rxnGeneMat = rxnGeneMat;
-1016 
-1017 <span class="comment">%Fix subsystems</span>
-1018 emptySubSystems=cellfun(@isempty, model.subSystems);
-1019 model.subSystems(emptySubSystems)={{<span class="string">''</span>}};
-1020 
-1021 <span class="comment">%Add the description to the reactions</span>
-1022 <span class="keyword">for</span> i=1:numel(model.rxns)
-1023     <span class="keyword">if</span> ~isempty(model.rxnNotes{i})
-1024         model.rxnNotes(i)=strcat(<span class="string">'Included by getKEGGModelForOrganism (using HMMs).'</span>,model.rxnNotes(i));
-1025         model.rxnNotes(i)=strrep(model.rxnNotes(i),<span class="string">'.'</span>,<span class="string">'. '</span>);
-1026     <span class="keyword">else</span>
-1027         model.rxnNotes(i)={<span class="string">'Included by getKEGGModelForOrganism (using HMMs)'</span>};
-1028     <span class="keyword">end</span>
-1029 <span class="keyword">end</span>
-1030 <span class="comment">%Remove the temp fasta file</span>
-1031 delete(fastaFile)
-1032 fprintf(<span class="string">'COMPLETE\n\n*** Model reconstruction complete ***\n'</span>);
-1033 <span class="keyword">end</span>
-1034 
-1035 <a name="_sub1" href="#_subfunctions" class="code">function files=listFiles(directory)</a>
-1036 <span class="comment">%Supporter function to list the files in a directory and return them as a</span>
-1037 <span class="comment">%cell array</span>
-1038 temp=dir(directory);
-1039 files=cell(numel(temp),1);
-1040 <span class="keyword">for</span> i=1:numel(temp)
-1041     files{i}=temp(i,1).name;
-1042 <span class="keyword">end</span>
-1043 files=strrep(files,<span class="string">'.fa'</span>,<span class="string">''</span>);
-1044 files=strrep(files,<span class="string">'.hmm'</span>,<span class="string">''</span>);
-1045 files=strrep(files,<span class="string">'.out'</span>,<span class="string">''</span>);
-1046 files=strrep(files,<span class="string">'.faw'</span>,<span class="string">''</span>);
-1047 <span class="keyword">end</span></pre></div>
+0922 <span class="comment">%Remove the genes for each KO that are below minScoreRatioKO.</span>
+0923 <span class="keyword">for</span> i=1:size(koGeneMat,1)
+0924     J=find(koGeneMat(i,:));
+0925     <span class="keyword">if</span> any(J)
+0926         koGeneMat(i,J(log(koGeneMat(i,J))/log(min(koGeneMat(i,J)))&lt;minScoreRatioKO))=0;
+0927     <span class="keyword">end</span>
+0928 <span class="keyword">end</span>
+0929 
+0930 <span class="comment">%Remove the KOs for each gene that are below minScoreRatioG</span>
+0931 <span class="keyword">for</span> i=1:size(koGeneMat,2)
+0932     J=find(koGeneMat(:,i));
+0933     <span class="keyword">if</span> any(J)
+0934         koGeneMat(J(log(koGeneMat(J,i))/log(min(koGeneMat(J,i)))&lt;minScoreRatioG),i)=0;
+0935     <span class="keyword">end</span>
+0936 <span class="keyword">end</span>
+0937 fprintf(<span class="string">'COMPLETE\n'</span>);
+0938 
+0939 fprintf(<span class="string">'Adding gene annotations to the model... '</span>);
+0940 <span class="comment">%Create the new model</span>
+0941 model.genes=genes(1:geneCounter);
+0942 model.grRules=cell(numel(model.rxns),1);
+0943 model.grRules(:)={<span class="string">''</span>};
+0944 model.rxnGeneMat=sparse(numel(model.rxns),numel(model.genes));
+0945 
+0946 <span class="comment">%Loop through the reactions and add the corresponding genes</span>
+0947 <span class="keyword">for</span> i=1:numel(model.rxns)
+0948     <span class="keyword">if</span> isstruct(model.rxnMiriams{i})
+0949         <span class="comment">%Get all KOs</span>
+0950         I=find(strcmpi(model.rxnMiriams{i}.name,<span class="string">'kegg.orthology'</span>));
+0951         KOs=model.rxnMiriams{i}.value(I);
+0952         <span class="comment">%Find the KOs and the corresponding genes</span>
+0953         J=ismember(KOModel.rxns,KOs);
+0954         [~, K]=find(koGeneMat(J,:));
+0955         
+0956         <span class="keyword">if</span> any(K)
+0957             model.rxnGeneMat(i,K)=1;
+0958             <span class="comment">%Also delete KOs for which no genes were found. If no genes at</span>
+0959             <span class="comment">%all were matched to the reaction it will be deleted later</span>
+0960             L=sum(koGeneMat(J,:),2)==0;
+0961             model.rxnMiriams{i}.value(I(L))=[];
+0962             model.rxnMiriams{i}.name(I(L))=[];
+0963         <span class="keyword">end</span>
+0964     <span class="keyword">end</span>
+0965 <span class="keyword">end</span>
+0966 fprintf(<span class="string">'COMPLETE\n'</span>);
+0967 
+0968 <span class="comment">%Find and delete all reactions without genes. This also removes genes that</span>
+0969 <span class="comment">%are not used (which could happen because minScoreRatioG and</span>
+0970 <span class="comment">%minScoreRatioKO). If keepSpontaneous==true, the spontaneous reactions</span>
+0971 <span class="comment">%without genes are kept in the model. Spontaneous reactions with original</span>
+0972 <span class="comment">%gene associations are treated in the same way, like the rest of the</span>
+0973 <span class="comment">%reactions - if gene associations were removed during HMM search, such</span>
+0974 <span class="comment">%reactions are deleted from the model</span>
+0975 <span class="keyword">if</span> keepSpontaneous==true
+0976     <span class="comment">%Not the most comprise way to delete reactions without genes, but this</span>
+0977     <span class="comment">%makes the code easier to understand. Firstly the non-spontaneous</span>
+0978     <span class="comment">%reactions without genes are removed. After that, the second deletion</span>
+0979     <span class="comment">%step removes spontaneous reactions, which had gene associations before</span>
+0980     <span class="comment">%HMM search, but no longer have after it</span>
+0981     fprintf(<span class="string">'Removing non-spontaneous reactions which after HMM search no longer have GPR rules... '</span>);
+0982     I=~any(model.rxnGeneMat,2)&amp;~ismember(model.rxns,isSpontaneous);
+0983     model=removeReactions(model,I,true,true);
+0984     I=~any(model.rxnGeneMat,2)&amp;ismember(model.rxns,spontRxnsWithGenes);
+0985     model=removeReactions(model,I,true,true);
+0986 <span class="keyword">else</span>
+0987     <span class="comment">%Just simply check for any new reactions without genes and remove</span>
+0988     <span class="comment">%it</span>
+0989     fprintf(<span class="string">'Removing reactions which after HMM search no longer have GPR rules... '</span>);
+0990     I=~any(model.rxnGeneMat,2);
+0991     model=removeReactions(model,I,true,true);
+0992 <span class="keyword">end</span>
+0993 fprintf(<span class="string">'COMPLETE\n'</span>);
+0994 
+0995 fprintf(<span class="string">'Constructing GPR rules and finalizing the model... '</span>);
+0996 <span class="comment">%Add the gene associations as 'or'</span>
+0997 <span class="keyword">for</span> i=1:numel(model.rxns)
+0998     <span class="comment">%Find the involved genes</span>
+0999     I=find(model.rxnGeneMat(i,:));
+1000     <span class="keyword">if</span> any(I)
+1001         model.grRules{i}=[<span class="string">'('</span> model.genes{I(1)}];
+1002         <span class="keyword">for</span> j=2:numel(I)
+1003             model.grRules{i}=[model.grRules{i} <span class="string">' or '</span> model.genes{I(j)}];
+1004         <span class="keyword">end</span>
+1005         model.grRules{i}=[model.grRules{i} <span class="string">')'</span>];
+1006     <span class="keyword">end</span>
+1007 <span class="keyword">end</span>
+1008 
+1009 <span class="comment">%Fix grRules and reconstruct rxnGeneMat</span>
+1010 [grRules,rxnGeneMat] = standardizeGrRules(model,false); <span class="comment">%Give detailed output</span>
+1011 model.grRules = grRules;
+1012 model.rxnGeneMat = rxnGeneMat;
+1013 
+1014 <span class="comment">%Fix subsystems</span>
+1015 emptySubSystems=cellfun(@isempty, model.subSystems);
+1016 model.subSystems(emptySubSystems)={{<span class="string">''</span>}};
+1017 
+1018 <span class="comment">%Add the description to the reactions</span>
+1019 <span class="keyword">for</span> i=1:numel(model.rxns)
+1020     <span class="keyword">if</span> ~isempty(model.rxnNotes{i})
+1021         model.rxnNotes(i)=strcat(<span class="string">'Included by getKEGGModelForOrganism (using HMMs).'</span>,model.rxnNotes(i));
+1022         model.rxnNotes(i)=strrep(model.rxnNotes(i),<span class="string">'.'</span>,<span class="string">'. '</span>);
+1023     <span class="keyword">else</span>
+1024         model.rxnNotes(i)={<span class="string">'Included by getKEGGModelForOrganism (using HMMs)'</span>};
+1025     <span class="keyword">end</span>
+1026 <span class="keyword">end</span>
+1027 <span class="comment">%Remove the temp fasta file</span>
+1028 delete(fastaFile)
+1029 fprintf(<span class="string">'COMPLETE\n\n*** Model reconstruction complete ***\n'</span>);
+1030 <span class="keyword">end</span>
+1031 
+1032 <a name="_sub1" href="#_subfunctions" class="code">function files=listFiles(directory)</a>
+1033 <span class="comment">%Supporter function to list the files in a directory and return them as a</span>
+1034 <span class="comment">%cell array</span>
+1035 temp=dir(directory);
+1036 files=cell(numel(temp),1);
+1037 <span class="keyword">for</span> i=1:numel(temp)
+1038     files{i}=temp(i,1).name;
+1039 <span class="keyword">end</span>
+1040 files=strrep(files,<span class="string">'.fa'</span>,<span class="string">''</span>);
+1041 files=strrep(files,<span class="string">'.hmm'</span>,<span class="string">''</span>);
+1042 files=strrep(files,<span class="string">'.out'</span>,<span class="string">''</span>);
+1043 files=strrep(files,<span class="string">'.faw'</span>,<span class="string">''</span>);
+1044 <span class="keyword">end</span></pre></div>
 <hr><address>Generated by <strong><a href="http://www.artefact.tk/software/matlab/m2html/" title="Matlab Documentation in HTML">m2html</a></strong> &copy; 2005</address>
 </body>
 </html>
\ No newline at end of file
diff --git a/doc/io/importExcelModel.html b/doc/io/importExcelModel.html
index 192c63cc..0366309c 100644
--- a/doc/io/importExcelModel.html
+++ b/doc/io/importExcelModel.html
@@ -967,7 +967,7 @@ <h2><a name="_source"></a>SOURCE CODE <a href="#_top"><img alt="^" border="0" sr
 0847             <span class="keyword">elseif</span> any(strfind(I{j},<span class="string">':'</span>))
 0848                 index=max(strfind(I{j},<span class="string">':'</span>));
 0849             <span class="keyword">end</span>
-0850             <span class="keyword">if</span> any(index)
+0850             <span class="keyword">if</span> exist(<span class="string">'index'</span>,<span class="string">'var'</span>) &amp; any(index)
 0851                 miriamStruct{i}.name{startIndex+j}=I{j}(1:index-1);
 0852                 miriamStruct{i}.value{startIndex+j}=I{j}(index+1:end);
 0853             <span class="keyword">else</span>
diff --git a/doc/io/importModel.html b/doc/io/importModel.html
index 9048c59e..7773dd1a 100644
--- a/doc/io/importModel.html
+++ b/doc/io/importModel.html
@@ -176,11 +176,11 @@ <h2><a name="_source"></a>SOURCE CODE <a href="#_top"><img alt="^" border="0" sr
 0070     <span class="keyword">end</span>
 0071 <span class="keyword">end</span>
 0072 fileName=char(fileName);
-0073 <span class="keyword">if</span> nargin&lt;2
+0073 <span class="keyword">if</span> nargin&lt;2 || isempty(removeExcMets)
 0074     removeExcMets=true;
 0075 <span class="keyword">end</span>
 0076 
-0077 <span class="keyword">if</span> nargin&lt;3
+0077 <span class="keyword">if</span> nargin&lt;3 || isempty(isSBML2COBRA)
 0078     isSBML2COBRA=false;
 0079 <span class="keyword">end</span>
 0080 
diff --git a/external/kegg/getKEGGModelForOrganism.m b/external/kegg/getKEGGModelForOrganism.m
index e3abc2d2..24355620 100755
--- a/external/kegg/getKEGGModelForOrganism.m
+++ b/external/kegg/getKEGGModelForOrganism.m
@@ -38,15 +38,12 @@
 %                           The hidden Markov models as generated in 2b or
 %                           downloaded from BioMet Toolbox (see below)
 %                       The final directory in dataDir should be styled as
-%                       proXXX_keggYY or eukXXX_keggYY, indicating whether
+%                       prok90_kegg105 or euk90_kegg105, indicating whether
 %                       the HMMs were trained on pro- or eukaryotic
-%                       sequences, using a sequence similarity threshold of
-%                       XXX %, fitting the KEGG version YY. E.g.
-%                       euk90_kegg105. (optional, see note about fastaFile. Note
-%                       that in order to rebuild the KEGG model from a
-%                       database dump, as opposed to using the version
-%                       supplied with RAVEN, you would still need to supply
-%                       this)
+%                       sequences; using which sequence similarity threshold
+%                       (first set of digits); using which KEGG version
+%                       (second set of digits). (this parameter should
+%                       ALWAYS be provided)
 %   outDir              directory to save the results from the quering of
 %                       the hidden Markov models. The output is specific
 %                       for the input sequences and the settings used. It
diff --git a/io/importExcelModel.m b/io/importExcelModel.m
index a703b5bb..0c4c0784 100755
--- a/io/importExcelModel.m
+++ b/io/importExcelModel.m
@@ -847,7 +847,7 @@
             elseif any(strfind(I{j},':'))
                 index=max(strfind(I{j},':'));
             end
-            if any(index)
+            if exist('index','var') & any(index)
                 miriamStruct{i}.name{startIndex+j}=I{j}(1:index-1);
                 miriamStruct{i}.value{startIndex+j}=I{j}(index+1:end);
             else
diff --git a/io/importModel.m b/io/importModel.m
index df9b10f2..5b422873 100755
--- a/io/importModel.m
+++ b/io/importModel.m
@@ -70,11 +70,11 @@
     end
 end
 fileName=char(fileName);
-if nargin<2
+if nargin<2 || isempty(removeExcMets)
     removeExcMets=true;
 end
 
-if nargin<3
+if nargin<3 || isempty(isSBML2COBRA)
     isSBML2COBRA=false;
 end