diff --git a/inst/stepwisefit.m b/inst/stepwisefit.m
index 34f44f63..1e84b71e 100644
--- a/inst/stepwisefit.m
+++ b/inst/stepwisefit.m
@@ -1,5 +1,6 @@
 ## Copyright (C) 2013-2021 Nir Krakauer
 ## Copyright (C) 2014 Mikael Kurula
+## Copyright (C) 2025 Jayant Chauhan <0001jayant@gmail.com>
 ##
 ## This file is part of the statistics package for GNU Octave.
 ##
@@ -15,154 +16,673 @@
 ##
 ## You should have received a copy of the GNU General Public License along with
 ## this program; if not, see <https://www.gnu.org/licenses/>.
-
 ## -*- texinfo -*-
-## @deftypefn {statistics} {[@var{X_use}, @var{b}, @var{bint}, @var{r}, @var{rint}, @var{stats}] =} stepwisefit (@var{y}, @var{X}, @var{penter} = 0.05, @var{premove} = 0.1, @var{method} = "corr")
+## @deftypefn {statistics} {} stepwisefit (@var{X}, @var{y})
+## @deftypefnx {statistics} {@var{b} =} stepwisefit (@var{X}, @var{y})
+## @deftypefnx {statistics} {[@var{b}, @var{se}, @var{pval}, @var{finalmodel}, @var{stats}, @var{nextstep}, @var{history}] =} stepwisefit (@var{X}, @var{y}, @var{varargin})
+##
+## Perform stepwise linear regression using conditional p-value criteria.
+##
+## @code{stepwisefit} fits a linear regression model to response vector
+## @var{y} using predictor matrix @var{X} and performs stepwise variable
+## selection based on hypothesis tests for individual regression coefficients.
+##
+## At each iteration, predictors not currently in the model are tested for
+## inclusion using partial F- or t-tests. The predictor with the smallest
+## p-value below the entry threshold is added. Predictors currently in the
+## model (excluding forced predictors) are then tested for removal, and the
+## predictor with the largest p-value exceeding the removal threshold is
+## removed. The procedure repeats until the model stabilizes or the maximum
+## number of iterations is reached.
 ##
-## Linear regression with stepwise variable selection.
+## After variable selection, the final regression model is refit using
+## @code{regress} to compute coefficient estimates and inferential statistics
+## for both included and excluded predictors.
 ##
 ## @subheading Arguments
 ##
 ## @itemize @bullet
 ## @item
-## @var{y} is an @var{n} by 1 vector of data to fit.
-## @item
-## @var{X} is an @var{n} by @var{k} matrix containing the values of @var{k} potential predictors. No constant term should be included (one will always be added to the regression automatically).
-## @item
-## @var{penter} is the maximum p-value to enter a new variable into the regression (default: 0.05).
+## @var{X} is an @var{n}-by-@var{p} numeric matrix of predictor variables.
+##
 ## @item
-## @var{premove} is the minimum p-value to remove a variable from the regression (default: 0.1).
+## @var{y} is an @var{n}-by-1 numeric response vector.
+##
 ## @item
-## @var{method} sets how predictors are selected at each step, either based on their correlation with the residuals ("corr", default)
-## or on the p values of their regression coefficients when they are successively added ("p").
+## Optional Name-Value pairs may be supplied to control the stepwise
+## selection procedure.
 ## @end itemize
 ##
-## @subheading Return values
+## @subheading Name-Value Arguments
+##
+## @table @asis
+## @item @qcode{"InModel"}
+## Logical row vector of length @var{p} specifying predictors that are initially
+## included in the model.
+##
+## @item @qcode{"Keep"}
+## Logical row vector of length @var{p} specifying predictors that must remain
+## in the model and are never removed during stepwise selection.
+##
+## @item @qcode{"PEnter"}
+## Scalar significance level in the open interval (0,1) specifying the maximum
+## p-value required for a predictor to enter the model. Default is @code{0.05}.
+##
+## @item @qcode{"PRemove"}
+## Scalar significance level in the open interval (0,1) specifying the minimum
+## p-value required for a predictor to be removed from the model. If not
+## specified, @code{max (PEnter, 0.1)} is used, which is always greater than
+## or equal to @qcode{"PEnter"}.
+##
+## @item @qcode{"MaxIter"}
+## Positive integer specifying the maximum number of stepwise iterations.
+## Default is @code{Inf}.
+##
+## @item @qcode{"Scale"}
+## Either @qcode{"on"} or @qcode{"off"}. When enabled, predictors are
+## standardized prior to stepwise selection only. Final regression
+## coefficients are always reported on the original data scale.
+##
+## @item @qcode{"Display"}
+## Either @qcode{"on"} or @qcode{"off"}. Accepted for compatibility but
+## currently does not affect output.
+## @end table
+##
+## @subheading Return Values
 ##
 ## @itemize @bullet
 ## @item
-## @var{X_use} contains the indices of the predictors included in the final regression model. The predictors are listed in the order they were added, so typically the first ones listed are the most significant.
+## @var{b} is a @var{p}-by-1 vector of regression coefficients. Coefficients
+## for excluded predictors are computed conditionally.
+##
 ## @item
-## @var{b}, @var{bint}, @var{r}, @var{rint}, @var{stats} are the results of @code{[b, bint, r, rint, stats] = regress(y, [ones(size(y)) X(:, X_use)], penter);}
-## @end itemize
-## @subheading References
+## @var{se} is a @var{p}-by-1 vector of standard errors.
+##
+## @item
+## @var{pval} is a @var{p}-by-1 vector of two-sided p-values.
+##
+## @item
+## @var{finalmodel} is a logical row vector indicating which predictors are
+## included in the final model.
+##
+## @item
+## @var{stats} is a structure containing regression diagnostics, including
+## sums of squares, degrees of freedom, residuals, covariance estimates,
+## F-statistic, and related quantities.
 ##
-## @enumerate
 ## @item
-## N. R. Draper and H. Smith (1966). @cite{Applied Regression Analysis}. Wiley. Chapter 6.
+## @var{nextstep} is a scalar indicating whether an additional stepwise
+## iteration is recommended. Currently always zero.
+##
+## @item
+## @var{history} is a structure summarizing the final model state, including
+## selected predictors and coefficient history.
+## @end itemize
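+##
+## @subheading Example
+##
+## A minimal usage sketch (the data here are illustrative only):
+##
+## @example
+## X = randn (50, 4);
+## y = 2 * X(:,1) - X(:,3) + randn (50, 1);
+## [b, se, pval, finalmodel] = stepwisefit (X, y, "PEnter", 0.05);
+## @end example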
 ##
-## @end enumerate
 ## @seealso{regress}
 ## @end deftypefn
-function [X_use, b, bint, r, rint, stats] = stepwisefit(y, X, penter = 0.05, premove = 0.1, method = "corr")
-if nargin >= 3 && isempty(penter)
-  penter = 0.05;
-endif
-if nargin >= 4 && isempty(premove)
-  premove = 0.1;
-endif
-
-#remove any rows with missing entries
-notnans = !any (isnan ([y X]) , 2);
-y = y(notnans);
-X = X(notnans,:);
-
-n = numel(y); #number of data points
-k = size(X, 2); #number of predictors
-
-X_use = [];
-v = 0; #number of predictor variables in regression model
-
-iter = 0;
-max_iters = 100; #maximum number of iterations to do
-
-r = y;
-while 1
-
-  iter++;
-  #decide which variable to add to regression, if any
-  added = false;
-  if numel(X_use) < k
-    X_inds = zeros(k, 1, "logical"); X_inds(X_use) = 1;
-
-    switch lower (method)
-      case {"corr"}
-        [~, i_to_add] = max(abs(corr(X(:, ~X_inds), r))); #try adding the variable with the highest correlation to the residual from current regression
-        i_to_add = (1:k)(~X_inds)(i_to_add); #index within the original predictor set
-        [b_new, bint_new, r_new, rint_new, stats_new] = regress(y, [ones(n, 1) X(:, [X_use i_to_add])], penter);
-      case {"p"}
-        z_vals = zeros(k,1);
-        for j = 1:k
-          if ~X_inds(j)
-            [b_j, bint_j, ~, ~, ~] = regress(y, [ones(n, 1) X(:, [X_use j])], penter);
-            z_vals(j) = abs(b_j(end)) / (bint_j(end, 2) - b_j(end));
-          endif
-        endfor
-        [~, i_to_add] = max(z_vals); #try adding the variable with the largest z-value (smallest partial p-value)
-        [b_new, bint_new, r_new, rint_new, stats_new] = regress(y, [ones(n, 1) X(:, [X_use i_to_add])], penter);
-      otherwise
-        error("stepwisefit: invalid value for method")
-    endswitch
-
-    z_new = abs(b_new(end)) / (bint_new(end, 2) - b_new(end));
-    if z_new > 1 #accept new variable
-      added = true;
-      X_use = [X_use i_to_add];
-      b = b_new;
-      bint = bint_new;
-      r = r_new;
-      rint = rint_new;
-      stats = stats_new;
-      v = v + 1;
-    endif
-  endif
-
-  #decide which variable to drop from regression, if any
-  dropped = false;
-  if v > 0
-    t_ratio = tinv(1 - premove/2, n - v - 1) / tinv(1 - penter/2, n - v - 1); #estimate the ratio between the z score corresponding to premove to that corresponding to penter
-    [z_min, i_min] = min(abs(b(2:end)) ./ (bint(2:end, 2) - b(2:end)));
-    if z_min < t_ratio #drop a variable
-      dropped = true;
-      X_use(i_min) = [];
-      [b, bint, r, rint, stats] = regress(y, [ones(n, 1) X(:, X_use)], penter);
-      v = v - 1;
-    endif
-  endif
-
-  #terminate if no change in the list of regression variables
-  if ~added && ~dropped
-    break
-  endif
-  if iter >= max_iters
-    warning('stepwisefit: maximum iteration count exceeded before convergence')
-    break
-  endif
-endwhile
-
+function [b, se, pval, finalmodel, stats, nextstep, history] = ...
+          stepwisefit (X, y, varargin)
+
+  b = [];
+  se = [];
+  pval = [];
+  finalmodel = [];
+  stats = struct ();
+  nextstep = 0;
+  history = struct ();
+
+  ## Input validation (positional)
+
+  if (nargin < 2)
+    error ("stepwisefit: at least two input arguments required");
+  endif
+
+  if (! ismatrix (X) || ! isvector (y))
+    error ("stepwisefit: X must be a matrix and y a vector");
+  endif
+
+  y = y(:);
+
+  ## Validate row compatibility before any concatenation
+  if (rows (X) != rows (y))
+    error ("stepwisefit: X and y must have the same number of rows");
+  endif
+
+  ## Parse Name-Value paired arguments using pairedArgs
+  ## (defaults are MATLAB-compatible)
+  optNames = {"InModel", "Display", "PEnter", "PRemove", ...
+              "Scale", "MaxIter", "Keep"};
+  dfValues = {[], "on", 0.05, [], "off", Inf, []};
+
+  [InModel, Display, PEnter, PRemove, Scale, MaxIter, Keep, args] = ...
+    pairedArgs (optNames, dfValues, varargin(:));
+
+  ## Semantic validation for Name-Value options
+
+  ## Validate Display
+  if (! any (strcmpi (Display, {"on", "off"})))
+    error ("stepwisefit: Display must be 'on' or 'off'");
+  endif
+  Display = lower (Display);
+
+  ## Validate Scale
+  if (! any (strcmpi (Scale, {"on", "off"})))
+    error ("stepwisefit: Scale must be 'on' or 'off'");
+  endif
+  Scale = lower (Scale);
+
+  ## Validate PEnter
+  if (! (isscalar (PEnter) && isnumeric (PEnter) && PEnter > 0 && PEnter < 1))
+    error ("stepwisefit: PEnter must be a scalar strictly between 0 and 1");
+  endif
+
+  ## Validate PRemove (if provided)
+  if (! isempty (PRemove))
+    if (! (isscalar (PRemove) && isnumeric (PRemove) ...
+           && PRemove > 0 && PRemove < 1))
+      error ("stepwisefit: PRemove must be a scalar strictly between 0 and 1");
+    endif
+    if (PRemove < PEnter)
+      error ("stepwisefit: PRemove must be greater than or equal to PEnter");
+    endif
+  endif
+
+  ## Validate MaxIter
+  if (! (isscalar (MaxIter) && isnumeric (MaxIter) ...
+         && MaxIter > 0 && fix (MaxIter) == MaxIter))
+    error ("stepwisefit: MaxIter must be a positive integer");
+  endif
+
+  ## Handle missing values
+  wasnan = any (isnan ([X y]), 2);
+  Xc = X(!wasnan, :);
+  yc = y(!wasnan);
+
+  n = rows (Xc);
+  p = columns (Xc);
+
+  ## Validate Keep and InModel type (if provided)
+  if (! isempty (Keep) && ! islogical (Keep))
+    error ("stepwisefit: Keep must be a logical vector");
+  endif
+  if (! isempty (InModel) && ! islogical (InModel))
+    error ("stepwisefit: InModel must be a logical vector");
+  endif
+
+  ## Validate lengths of Keep and InModel
+  if (! isempty (Keep) && numel (Keep) != p)
+    error ("stepwisefit: Keep length must match number of predictors");
+  endif
+  if (! isempty (InModel) && numel (InModel) != p)
+    error ("stepwisefit: InModel length must match number of predictors");
+  endif
+
+  if (! isempty (args))
+    error ("stepwisefit: unrecognized input arguments");
+  endif
+
+  if (isempty (Keep))
+    Keep = false(1, p);
+  endif
+
+  ## Default PRemove if unset; the default always satisfies PRemove >= PEnter
+  if (isempty (PRemove))
+    PRemove = max (PEnter, 0.1);
+  endif
+
+  if (strcmp (Scale, "on"))
+    muX = mean (Xc, 1);
+    sigX = std (Xc, 0, 1);
+    sigX(sigX == 0) = 1;      ## prevent division by zero
+    Xs = (Xc - muX) ./ sigX;
+  else
+    Xs = Xc;
+  endif
+
+  ## Initialize the current model state from InModel
+  if (! isempty (InModel))
+    cur = logical (InModel(:).');
+  else
+    cur = false (1, p);
+  endif
+
+  ## Force Keep predictors into the model
+  cur(Keep) = true;
+  prev = cur;
+  iter = 0;
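+
+  ## Note: regress returns 95% confidence intervals by default, so a
+  ## coefficient's standard error can be recovered from the interval
+  ## half-width as (bint(:,2) - b) / tinv (0.975, df). The selection loop
+  ## below relies on this identity to form t-statistics and conditional
+  ## p-values from the outputs of regress.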
+
+  ## Iterative selection: each iteration attempts ADD then REMOVE.
+  while (iter < MaxIter)
+    iter = iter + 1;
+
+    ## ADD phase: evaluate candidates by conditional p-value
+    candidates = find (~cur);
+    if (! isempty (candidates))
+      best_p = Inf;
+      best_j = -1;
+      cols = find (cur);      ## current included predictors (may be empty)
+
+      for idx = 1:numel (candidates)
+        j = candidates(idx);
+
+        ## Build trial design: intercept, current included (if any), candidate j
+        if (isempty (cols))
+          Xtry = [ones(n,1), Xs(:, j)];
+        else
+          Xtry = [ones(n,1), Xs(:, cols), Xs(:, j)];
+        endif
+
+        ## Regress and compute candidate p-value; skip singular/failed fits
+        try
+          [btry, binttry] = regress (yc, Xtry);
+        catch
+          continue;
+        end_try_catch
+
+        df_try = n - columns (Xtry);
+        if (df_try <= 0)
+          continue;
+        endif
+
+        se_try = (binttry(end,2) - btry(end)) / tinv (0.975, df_try);
+        if (se_try <= 0 || ! isfinite (se_try))
+          continue;
+        endif
+
+        tstat = btry(end) / se_try;
+        p_candidate = 2 * (1 - tcdf (abs (tstat), df_try));
+
+        ## Deterministic tie-break: keep the first candidate when p-values
+        ## are nearly equal
+        if (p_candidate < best_p - eps)
+          best_p = p_candidate;
+          best_j = j;
+        endif
+      endfor
+
+      ## Add best candidate only if it meets the PEnter threshold
+      if (best_j > 0 && best_p < PEnter)
+        cur(best_j) = true;
+      endif
+    endif
+
+    ## REMOVE phase: compute conditional p-values for included predictors,
+    ## remove worst (largest p) among removable predictors
+    included = find (cur);
+    removable = setdiff (included, find (Keep));    ## never remove Keep
+
+    if (! isempty (removable))
+      Xfull = [ones(n,1), Xs(:, included)];
+
+      ## Regress current full model; guard against singular / failed fits
+      try
+        [bfull, bintfull] = regress (yc, Xfull);
+      catch
+        bfull = NaN (columns (Xfull), 1);
+        bintfull = NaN (columns (Xfull), 2);
+      end_try_catch
+
+      df_full = n - columns (Xfull);
+      pvals_included = Inf (1, numel (included));
+
+      for ii = 1:numel (included)
+        if (df_full <= 0)
+          pvals_included(ii) = Inf;
+        else
+          se_i = (bintfull(ii+1,2) - bfull(ii+1)) / tinv (0.975, df_full);
+          if (se_i > 0 && isfinite (se_i))
+            t_i = bfull(ii+1) / se_i;
+            pvals_included(ii) = 2 * (1 - tcdf (abs (t_i), df_full));
+          else
+            pvals_included(ii) = Inf;
+          endif
+        endif
+      endfor
+
+      ## Map removable predictors to positions within 'included'
+      removable_positions = arrayfun (@(x) find (included == x, 1), removable);
+      [maxp, pos] = max (pvals_included(removable_positions));
+
+      if (maxp > PRemove)
+        cur(removable(pos)) = false;
+      endif
+    endif
+
+    ## Convergence: stop when the model is structurally unchanged
+    if (isequal (cur, prev))
+      break;
+    endif
+
+    prev = cur;
+  endwhile
+
+  ## Final set of selected predictors
+  X_use = find (cur);
+
+  ## Final regression on selected predictors
+  Xfinal = [ones(n,1), Xc(:, X_use)];
+  ## the fifth output (regstats) is intentionally unused
+  [B, BINT, R, RINT, regstats] = regress (yc, Xfinal);
+
+  Rresid = R(:);      ## residuals of the final fit, as a column vector
+
+  ## Allocate outputs
+  b = zeros (p,1);
+  se = zeros (p,1);
+  pval = zeros (p,1);
+
+  df = n - columns (Xfinal);
+
+  if (df <= 0)
+    ## Not enough residual degrees of freedom to estimate SE reliably.
+    se(:) = NaN;
+    pval(:) = NaN;
+  endif
+
+  ## Included predictors
+  b(X_use) = B(2:end);
+  se(X_use) = (BINT(2:end,2) - B(2:end)) ./ tinv (0.975, df);
+  pval(X_use) = 2 * (1 - tcdf (abs (B(2:end) ./ se(X_use)), df));
+
+  ## Excluded predictors: conditional refit
+  excluded = setdiff (1:p, X_use);
+
+  for j = excluded
+    Xj = [ones(n,1), Xc(:, [X_use j])];
+    [Bj, BjINT] = regress (yc, Xj);
+
+    bj = Bj(end);
+    sej = (BjINT(end,2) - bj) ./ tinv (0.975, n - columns (Xj));
+
+    b(j) = bj;
+    se(j) = sej;
+    pval(j) = 2 * (1 - tcdf (abs (bj / sej), n - columns (Xj)));
+  endfor
+
+  ## Final model indicator
+  finalmodel = false (1,p);
+  finalmodel(X_use) = true;
+
+  ## Stats structure
+  stats = struct ();
+  stats.source = "stepwisefit";
+  stats.df0 = numel (X_use);
+  stats.dfe = n - stats.df0 - 1;
+  stats.SStotal = sum ((yc - mean (yc)).^2);
+  stats.SSresid = sum (Rresid.^2);
+  stats.rmse = sqrt (stats.SSresid / stats.dfe);
+  stats.intercept = B(1);
+  stats.wasnan = wasnan;
+
+  stats.yr = Rresid;
+  stats.B = b;
+  stats.SE = se;
+  stats.TSTAT = b ./ se;
+  stats.PVAL = pval;
+  stats.TSTAT(!isfinite (stats.TSTAT)) = NaN;
+
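+  ## stats.xr holds, for each excluded predictor, the component orthogonal
+  ## to the final design: column k is the residual from projecting that
+  ## predictor onto the intercept and the included predictors.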
+  xr = zeros (n, numel (excluded));
+
+  if (! isempty (X_use))
+    Z = [ones(n,1), Xc(:, X_use)];
+    P = Z / (Z' * Z) * Z';      ## projection (hat) matrix of the final design
+    for k = 1:numel (excluded)
+      j = excluded(k);
+      xr(:,k) = Xc(:,j) - P * Xc(:,j);
+    endfor
+  else
+    ## intercept-only case
+    for k = 1:numel (excluded)
+      j = excluded(k);
+      xr(:,k) = Xc(:,j) - mean (Xc(:,j));
+    endfor
+  endif
+
+  stats.xr = xr;
+
+  covb = NaN (p+1, p+1);
+  covB = (stats.rmse^2) * pinv (Xfinal' * Xfinal);
+
+  idx = [1, X_use + 1];
+  covb(idx, idx) = covB;
+
+  stats.covb = covb;
+
+  if (stats.df0 > 0)
+    stats.fstat = ((stats.SStotal - stats.SSresid) / stats.df0) ...
+                  / (stats.SSresid / stats.dfe);
+    stats.pval = 1 - fcdf (stats.fstat, stats.df0, stats.dfe);
+  else
+    stats.fstat = NaN;
+    stats.pval = NaN;
+  endif
+
+  history = struct ();
+  history.in = finalmodel;
+  history.df0 = stats.df0;
+  history.rmse = stats.rmse;
+
+  ## Coefficient history (excluding intercept)
+  ## MATLAB stores this as p-by-k; here k = 1
+  Bhist = zeros (p, 1);
+  Bhist(finalmodel) = b(finalmodel);
+  history.B = Bhist;
+
+  ## nextstep is a placeholder for future phases and is currently always zero
+  nextstep = 0;
+
 endfunction
 
 %!test
-%! % Sample data from Draper and Smith (n = 13, k = 4)
-%! X = [7 1 11 11 7 11 3 1 2 21 1 11 10; ...
-%!      26 29 56 31 52 55 71 31 54 47 40 66 68; ...
-%!      6 15 8 8 6 9 17 22 18 4 23 9 8; ...
-%!      60 52 20 47 33 22 6 44 22 26 34 12 12]';
-%! y = [78.5 74.3 104.3 87.6 95.9 109.2 102.7 72.5 93.1 115.9 83.8 113.3 109.4]';
-%! [X_use, b, bint, r, rint, stats] = stepwisefit(y, X);
-%! assert(X_use, [4 1])
-%! assert(b, regress(y, [ones(size(y)) X(:, X_use)], 0.05))
-%! [X_use, b, bint, r, rint, stats] = stepwisefit(y, X, 0.05, 0.1, "corr");
-%! assert(X_use, [4 1])
-%! assert(b, regress(y, [ones(size(y)) X(:, X_use)], 0.05))
-%! [X_use, b, bint, r, rint, stats] = stepwisefit(y, X, [], [], "p");
-%! assert(X_use, [4 1])
-%! assert(b, regress(y, [ones(size(y)) X(:, X_use)], 0.05))
-
+%! X = [7 26 6 60;
+%!      1 29 15 52;
+%!      11 56 8 20;
+%!      11 31 8 47;
+%!      7 52 6 33;
+%!      11 55 9 22;
+%!      3 71 17 6;
+%!      1 31 22 44;
+%!      2 54 18 22;
+%!      21 47 4 26;
+%!      1 40 23 34;
+%!      11 66 9 12;
+%!      10 68 8 12];
+%! y = [78.5; 74.3; 104.3; 87.6; 95.9; 109.2;
+%!      102.7; 72.5; 93.1; 115.9; 83.8; 113.3; 109.4];
+%! [b,se,pval,finalmodel,stats] = stepwisefit (X,y);
+%! assert (finalmodel, [true false false true]);
+%! assert (b, [1.4400; 0.4161; -0.4100; -0.6140], 1e-4);
+%! assert (se, [0.1384; 0.1856; 0.1992; 0.0486], 1e-4);
+%! assert (pval, [0; 0.0517; 0.0697; 0], 1e-4);
+%! assert (stats.rmse, 2.7343, 1e-4);
+%! assert (stats.SStotal, 2715.7631, 1e-3);
+%! assert (stats.SSresid, 74.7621, 1e-4);
+%! assert (stats.df0, 2);
+%! assert (stats.dfe, 10);
+%! assert (stats.intercept, 103.0974, 1e-4);
+%!test
+%! X = [
+%!   12.0 4 120 95 2600;
+%!   11.5 6 200 110 3000;
+%!   10.5 8 300 150 3600;
+%!   13.0 4 140 100 2800;
+%!   12.5 6 180 120 3200;
+%!   11.0 8 250 140 3500;
+%!   14.0 4 130 98 2700;
+%!   13.5 6 210 115 3100;
+%!   12.2 8 320 160 3800;
+%!   11.8 4 150 105 2900
+%! ];
+%! y = [28; 22; 18; 27; 23; 19; 29; 21; 17; 26];
+%!
+%! [b,se,pval,finalmodel,stats] = stepwisefit (X,y);
+%!
+%! assert (islogical (finalmodel));
+%! assert (numel (finalmodel) == 5);
+%! assert (sum (finalmodel) >= 1);
+%! assert (isnumeric (b));
+%! assert (isnumeric (se));
+%! assert (isnumeric (pval));
+%! assert (stats.rmse > 0);
+%! assert (isfinite (stats.intercept));
+%!test
+%! X = randn (30, 4);
+%! y = randn (30, 1);
+%! [~,~,~,~,stats] = stepwisefit (X, y);
+%!
+%! required_fields = {
+%!   "source", "df0", "dfe", "SStotal", "SSresid", "fstat", "pval", ...
"rmse", "xr", "yr", "B", "SE", "TSTAT", "PVAL", "covb", ... +%! "intercept", "wasnan" +%! }; +%! +%! for k = 1:numel (required_fields) +%! assert (isfield (stats, required_fields{k})); +%! endfor +%!test +%! X = randn (40, 5); +%! y = randn (40, 1); +%! [b,se,pval,finalmodel,stats] = stepwisefit (X, y); +%! +%! p = columns (X); +%! n = rows (X(~stats.wasnan, :)); +%! +%! assert (size (stats.yr), [n, 1]); +%! assert (rows (stats.B) == p); +%! assert (rows (stats.SE) == p); +%! assert (rows (stats.TSTAT) == p); +%! assert (rows (stats.PVAL) == p); +%! assert (size (stats.covb), [p+1, p+1]); +%!test +%! X = randn (25, 3); +%! y = randn (25, 1); +%! [~,~,~,~,stats] = stepwisefit (X, y); +%! +%! SSresid_calc = sum (stats.yr .^ 2); +%! assert (SSresid_calc, stats.SSresid, 1e-10); +%! +%! rmse_calc = sqrt (stats.SSresid / stats.dfe); +%! assert (rmse_calc, stats.rmse, 1e-10); +%!test +%! X = randn (50, 6); +%! y = randn (50, 1); +%! [~,~,~,~,stats] = stepwisefit (X, y); +%! +%! if (stats.df0 > 0) +%! F_calc = ((stats.SStotal - stats.SSresid) / stats.df0) ... +%! / (stats.SSresid / stats.dfe); +%! +%! assert (F_calc, stats.fstat, 1e-10); +%! assert (stats.pval >= 0 && stats.pval <= 1); +%! else +%! assert (isnan (stats.fstat)); +%! assert (isnan (stats.pval)); +%! endif +%!test +%! X = randn (35, 4); +%! y = randn (35, 1); +%! [~,~,~,finalmodel,stats] = stepwisefit (X, y); +%! p = columns (X); +%! k = sum (finalmodel); +%! assert (size (stats.xr, 2) == p - k); +%! assert (all (isfinite (stats.xr(:)))); +%!test +%! X = randn (35, 4); +%! y = randn (35, 1); +%! [~,~,~,finalmodel,stats] = stepwisefit (X, y); +%! +%! Xc = X(~stats.wasnan, :); +%! Xfinal = [ones(rows (Xc),1), Xc(:, finalmodel)]; +%! +%! for j = 1:columns (stats.xr) +%! ortho = Xfinal' * stats.xr(:,j); +%! assert (max (abs (ortho(:))) < 1e-6); +%! endfor +%!test +%! X = randn (40, 5); +%! y = randn (40, 1); +%! [~,~,~,finalmodel,stats,nextstep,history] = stepwisefit (X, y); +%! +%! assert (nextstep == 0); +%! assert (isstruct (history)); +%! assert (isfield (history, "in")); +%! assert (isfield (history, "df0")); +%! assert (isfield (history, "rmse")); +%! assert (isfield (history, "B")); +%! assert (isequal (history.in, finalmodel)); +%! assert (history.df0 == stats.df0); +%! assert (history.rmse == stats.rmse); +%! assert (rows (history.B) == columns (X)); +%!test +%! X = randn (20,4); +%! y = randn (20,1); +%! stepwisefit (X,y,'Keep',[true false true false]); +%!test +%! X = randn (30, 4); +%! y = randn (30, 1); +%! keep = [true false false false]; +%! [~,~,~,finalmodel] = stepwisefit (X, y, "Keep", keep); +%! assert (finalmodel(1) == true); +%!test +%! X = randn (40, 6); +%! y = randn (40, 1); +%! [~,~,~,finalmodel] = stepwisefit (X, y, "MaxIter", 1); +%! assert (islogical (finalmodel)); +%!test +%! X = randn (50, 5); +%! y = randn (50, 1); +%! [b1] = stepwisefit (X, y); +%! [b2] = stepwisefit (X, y, "Scale", "on"); +%! assert (rows (b1) == rows (b2)); +%!test +%! X = randn (20,4); +%! y = randn (20,1); +%! fail ("stepwisefit (X,y,'Keep',[true false])"); +## Test input validation +%!error ... +%! stepwisefit () +%!error ... +%! stepwisefit (ones (2,2,2), [1;2]) +%!error ... +%! stepwisefit (ones (3,2), ones (2,1)) +%!error ... +%! stepwisefit (randn (10,2), randn (10,1), "UnknownOpt", 5) +%!error ... +%! stepwisefit (randn (10,2), randn (10,1), "Display", "maybe") +%!error ... +%! stepwisefit (randn (10,2), randn (10,1), "Scale", 123) +%!error ... +%! stepwisefit (randn (10,2), randn (10,1), "PEnter", -0.1) +%!error ... +%! 
+%! stepwisefit (randn (10,2), randn (10,1), "PRemove", 1.5)
+%!error ...
+%! stepwisefit (randn (10,2), randn (10,1), ...
+%!              "PEnter", 0.05, "PRemove", 0.01)
+%!error ...
+%! stepwisefit (randn (10,2), randn (10,1), "MaxIter", -2)
+%!error ...
+%! stepwisefit (randn (10,2), randn (10,1), "MaxIter", 2.5)
+%!error ...
+%! stepwisefit (randn (10,2), randn (10,1), "Keep", [1 0])
+%!error ...
+%! stepwisefit (randn (10,2), randn (10,1), "InModel", [1 0])
+%!error ...
+%! stepwisefit (randn (10,4), randn (10,1), "Keep", [true false])
+%!error ...
+%! stepwisefit (randn (10,4), randn (10,1), "InModel", true)
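+
+## Demo: stepwise selection on the Hald cement data (Draper and Smith, 1966),
+## the same data used in the first test above; with the default thresholds,
+## predictors 1 and 4 enter the model.
+%!demo
+%! X = [7 26 6 60; 1 29 15 52; 11 56 8 20; 11 31 8 47; 7 52 6 33;
+%!      11 55 9 22; 3 71 17 6; 1 31 22 44; 2 54 18 22; 21 47 4 26;
+%!      1 40 23 34; 11 66 9 12; 10 68 8 12];
+%! y = [78.5; 74.3; 104.3; 87.6; 95.9; 109.2; 102.7; 72.5; 93.1; ...
+%!      115.9; 83.8; 113.3; 109.4];
+%! [b, se, pval, finalmodel] = stepwisefit (X, y);
+%! disp (finalmodel);
+%! disp ([b, se, pval]);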