diff --git a/NEWS.md b/NEWS.md
index 8d7633a..2920411 100644
--- a/NEWS.md
+++ b/NEWS.md
@@ -1,5 +1,6 @@
 # libr 1.3.5
 * Added 'parquet' file format to `libname()` function.
+* Added 'subset' parameter to `datastep()` function to filter the data on input.
 
 # libr 1.3.4
 * Fixed issue where `libname()` was failing on empty dataset.
diff --git a/R/datastep.R b/R/datastep.R
index 2a6d6f6..e01e4d8 100644
--- a/R/datastep.R
+++ b/R/datastep.R
@@ -100,6 +100,10 @@ e$output <- list()
 #' 
 #' \code{calculate} and \code{retain} are both input parameters.
 #' 
+#' The \code{subset} and \code{where} parameters can both be used to filter
+#' the datastep data.  The difference is that \code{subset} is an input
+#' parameter, and \code{where} is an output parameter.  
+#' 
 #' @section Set and Merge Operations:
 #' The \code{datastep} function allows you to join one or more input datasets 
 #' into a single output dataset.  There are two operations in this regard:
@@ -267,6 +271,11 @@ e$output <- list()
 #' \code{delete} function, or \code{output} function to filter desired results.
 #' @param log Whether or not to log the datastep.  Default is TRUE.  This 
 #' parameter is used internally.
+#' @param subset The \code{subset} parameter accepts an \code{expression} object
+#' that will be used to subset the data.  The \code{subset} expression will be 
+#' executed \strong{before} the datastep executes.  In this regard, the 
+#' \code{subset} parameter on the R datastep is similar to the \code{where} clause
+#' on the SAS datastep.
 #' @return The processed data frame, tibble, or data table.  
 #' @family datastep
 #' @seealso \code{\link{libname}} function to create a data library, and
@@ -536,7 +545,8 @@ datastep <- function(data, steps, keep = NULL,
                      merge = NULL,
                      merge_by = NULL,
                      merge_in = NULL, 
-                     log = TRUE) {
+                     log = TRUE, 
+                     subset = NULL) {
   
   if (!"data.frame" %in% class(data))
     stop("input data must be inherited from data.frame")
@@ -703,6 +713,24 @@ datastep <- function(data, steps, keep = NULL,
                           check.names = FALSE) 
   }
   
+  # Subset Before: filter the input rows prior to running the datastep
+  if (!is.null(subset)) {
+    
+    # If the subset expression fails, fall back to the unfiltered input
+    data <- tryCatch({base::subset(data, eval(subset))},
+                     error = function(cond){data})
+    
+    # Give warning if there are no rows and no output()
+    if (!hout && nrow(data) == 0) {
+      warning("After subset, input dataset has no rows.")
+    }
+    
+    rowcount <- nrow(data)
+    
+    # Restore attributes from original data
+    data <- copy_attributes(data_attributes, data)
+  }
+  
   # Add automatic variables
   data <- add_autos(data, by, sort_check)
   
diff --git a/docs/news/index.html b/docs/news/index.html
index 8a8490b..73206fe 100644
--- a/docs/news/index.html
+++ b/docs/news/index.html
@@ -84,6 +84,7 @@ <h1 data-toc-skip>Changelog <small></small></h1>
     <div class="section level2">
 <h2 class="page-header" data-toc-text="1.3.5" id="libr-135">libr 1.3.5<a class="anchor" aria-label="anchor" href="#libr-135"></a></h2>
 <ul><li>Added ‘parquet’ file format to <code><a href="../reference/libname.html">libname()</a></code> function.</li>
+<li>Added ‘subset’ parameter to <code><a href="../reference/datastep.html">datastep()</a></code> function to filter the data on input.</li>
 </ul></div>
     <div class="section level2">
 <h2 class="page-header" data-toc-text="1.3.4" id="libr-134">libr 1.3.4<small>2024-07-19</small><a class="anchor" aria-label="anchor" href="#libr-134"></a></h2>
diff --git a/docs/pkgdown.yml b/docs/pkgdown.yml
index 5ce5a55..df2ff35 100644
--- a/docs/pkgdown.yml
+++ b/docs/pkgdown.yml
@@ -10,7 +10,7 @@ articles:
   libr-faq: libr-faq.html
   libr-management: libr-management.html
   libr: libr.html
-last_built: 2024-11-02T03:46Z
+last_built: 2024-11-05T01:57Z
 urls:
   reference: https://libr.r-sassy.org/reference
   article: https://libr.r-sassy.org/articles
diff --git a/docs/reference/datastep.html b/docs/reference/datastep.html
index fc95152..5674fab 100644
--- a/docs/reference/datastep.html
+++ b/docs/reference/datastep.html
@@ -114,7 +114,8 @@ <h1>Step through data row-by-row</h1>
 <span>  merge <span class="op">=</span> <span class="cn">NULL</span>,</span>
 <span>  merge_by <span class="op">=</span> <span class="cn">NULL</span>,</span>
 <span>  merge_in <span class="op">=</span> <span class="cn">NULL</span>,</span>
-<span>  log <span class="op">=</span> <span class="cn">TRUE</span></span>
+<span>  log <span class="op">=</span> <span class="cn">TRUE</span>,</span>
+<span>  subset <span class="op">=</span> <span class="cn">NULL</span></span>
 <span><span class="op">)</span></span></code></pre></div>
     </div>
 
@@ -269,6 +270,14 @@ <h2>Arguments</h2>
 <dd><p>Whether or not to log the datastep.  Default is TRUE.  This
 parameter is used internally.</p></dd>
 
+
+<dt id="arg-subset">subset<a class="anchor" aria-label="anchor" href="#arg-subset"></a></dt>
+<dd><p>The <code>subset</code> parameter accepts an <code>expression</code> object
+that will be used to subset the data.  The <code>subset</code> expression will be
+executed <strong>before</strong> the datastep executes.  In this regard, the
+<code>subset</code> parameter on the R datastep is similar to the <code>where</code> clause
+on the SAS datastep.</p></dd>
+
 </dl></div>
     <div id="value">
     <h2>Value</h2>
@@ -360,6 +369,9 @@ <h2>Optional Parameters</h2>
 value of the prior step/row.  This functionality allows you to increment
 values or perform cumulative operations.</p>
 <p><code>calculate</code> and <code>retain</code> are both input parameters.</p>
+<p>The <code>subset</code> and <code>where</code> parameters can both be used to filter
+the datastep data.  The difference is that <code>subset</code> is an input
+parameter, and <code>where</code> is an output parameter.</p>
     </div>
     <div id="set-and-merge-operations">
     <h2>Set and Merge Operations</h2>
diff --git a/man/datastep.Rd b/man/datastep.Rd
index 2796b1a..f95ec79 100644
--- a/man/datastep.Rd
+++ b/man/datastep.Rd
@@ -23,7 +23,8 @@ datastep(
   merge = NULL,
   merge_by = NULL,
   merge_in = NULL,
-  log = TRUE
+  log = TRUE,
+  subset = NULL
 )
 }
 \arguments{
@@ -136,6 +137,12 @@ came from the corresponding table. Use the \code{where} parameter,
 
 \item{log}{Whether or not to log the datastep.  Default is TRUE.  This 
 parameter is used internally.}
+
+\item{subset}{The \code{subset} parameter accepts an \code{expression} object
+that will be used to subset the data.  The \code{subset} expression will be 
+executed \strong{before} the datastep executes.  In this regard, the 
+\code{subset} parameter on the R datastep is similar to the \code{where} clause
+on the SAS datastep.}
 }
 \value{
 The processed data frame, tibble, or data table.
@@ -240,6 +247,10 @@ value of the prior step/row.  This functionality allows you to increment
 values or perform cumulative operations.
 
 \code{calculate} and \code{retain} are both input parameters.
+
+The \code{subset} and \code{where} parameters can both be used to filter
+the datastep data.  The difference is that \code{subset} is an input
+parameter, and \code{where} is an output parameter.
 }
 
 \section{Set and Merge Operations}{
diff --git a/tests/testthat/test-datastep.R b/tests/testthat/test-datastep.R
index 733204e..ed5c0e6 100644
--- a/tests/testthat/test-datastep.R
+++ b/tests/testthat/test-datastep.R
@@ -1807,3 +1807,29 @@ test_that("ds51: delete() works with NA in data frame.", {
 
 })
 
+
+test_that("ds52: subset clause works.", {
+  
+  # Subset is applied on input, so only 8-cylinder rows reach the steps
+  df <- datastep(mtcars,
+                 subset = expression(cyl == 8),
+                 {
+                   
+                   if (mpg >= 20)
+                     mpgcat <- "High"
+                   else
+                     mpgcat <- "Low"
+                   
+                   recdt <- as.Date("1974-06-10")
+                   
+                   if (cyl == 8)
+                     is8cyl <- TRUE
+                   else
+                     is8cyl <- FALSE
+                   
+                 })
+  
+  expect_equal(nrow(df), sum(mtcars$cyl == 8))
+  expect_true(all(df$cyl == 8))
+  expect_true(all(df$is8cyl))
+})