mathworks · krisfed · Jun 19, 2025 · Jun 19, 2025 · Jun 19, 2025 · Jun 19, 2025
diff --git a/PythonModule/ZarrPy.py b/PythonModule/ZarrPy.py
@@ -81,12 +81,16 @@ def writeZarr (kvstore_schema, data):
     zarr_file[...] = data
 
 
-def readZarr (kvstore_schema):
+def readZarr (kvstore_schema, starts, ends, strides):
     """
     Reads a subset of data from a Zarr file.
 
     Parameters:
     - kvstore_schema (dictionary): Schema for the file store (local or remote)
+    - starts (numpy.ndarray): Array of start indices for each dimension (0-based)
+    - ends (numpy.ndarray): Array of end indices for each dimension (elements 
+                   at the end index will not be read)
+    - strides (numpy.ndarray): Array of strides for each dimension
 
     Returns:
     - numpy.ndarray: The subset of the data read from the Zarr file.
@@ -96,6 +100,10 @@ def readZarr (kvstore_schema):
         'kvstore': kvstore_schema,
     }).result()
 
+    # Construct the indexing slices
+    slices = tuple(slice(start, end, stride) for start, end, stride in zip(starts, ends, strides))
+
     # Read a subset of the data
-    data = zarr_file[...].read().result()
+    data = zarr_file[slices].read().result()
+
     return data
diff --git a/Zarr.m b/Zarr.m
@@ -53,6 +53,46 @@
             isZgroup = isfile(fullfile(path, '.zgroup'));
         end
 
+        function newParams = processPartialReadParams(params, dims,...
+                defaultValues, paramName)
+            % Normalize one partial-read parameter (Start, Stride, or
+            % Count) so that it has one value per Zarr array dimension
+            arguments (Input)
+                params % Start/Stride/Count parameter to be validated
+                dims (1,:) double  % Zarr array dimensions
+                defaultValues (1,:) % fallback values, used when params is empty
+                paramName (1,1) string % parameter name shown in the error message
+            end
+
+            arguments (Output)
+                newParams (1,:) int64 % must be integers for tensorstore
+            end
+
+            if isempty(params) % nothing was specified: use the defaults
+                newParams = defaultValues;
+                return
+            end
+
+            % Allow a scalar value when the array is 2-D with a singleton
+            % dimension (row or column datasets)
+            if isscalar(params) && any(dims==1) && numel(dims)==2
+                newParams = defaultValues;
+                % use the provided value for the non-singleton dimension
+                newParams(dims~=1) = params;
+                return
+            end
+
+            if numel(params) ~= numel(dims)
+                error("MATLAB:Zarr:badPartialReadDimensions",...
+                    "Number of elements in " +...
+                    "%s must be the same "+...
+                    "as the number of Zarr array dimensions.",...
+                    paramName)
+            end
+
+            newParams = params; % already has one value per dimension
+        end
+
         function resolvedPath = getFullPath(path)
             % Given a path, resolves it to a full path. The trailing
             % directories do not have to exist.
@@ -200,7 +240,7 @@ function makeZarrGroups(existingParentPath, newGroupsPath)
         end
 
 
-        function data = read(obj)
+        function data = read(obj, start, count, stride)
             % Function to read the Zarr array
 
             % If the Zarr array is local, verify that it is a valid folder
@@ -214,7 +254,27 @@ function makeZarrGroups(existingParentPath, newGroupsPath)
                 end
             end
 
-            ndArrayData = py.ZarrPy.readZarr(obj.KVStoreSchema);
+            % Validate partial read parameters
+            info = zarrinfo(obj.Path);
+            numDims = numel(info.shape);
+            start = Zarr.processPartialReadParams(start, info.shape,...
+                ones([1,numDims]), "Start");
+            stride = Zarr.processPartialReadParams(stride, info.shape,...
+                ones([1,numDims]), "Stride"); 
+            maxCount = (int64(info.shape') - start + 1)./stride; % has to be a row vector
+            count = Zarr.processPartialReadParams(count, info.shape,...
+                maxCount, "Count"); 
+
+            % Convert partial read parameters to tensorstore-style
+            % indexing
+            start = start - 1; % tensorstore is 0-based
+            % Tensorstore uses end index instead of count
+            % (it does NOT include element at the end index)
+            endInds = start + stride.*count;
+
+            % Read the data
+            ndArrayData = py.ZarrPy.readZarr(obj.KVStoreSchema,...
+                start, endInds, stride);
 
             % Store the datatype
             obj.Datatype = ZarrDatatype.fromTensorstoreType(ndArrayData.dtype.name);

diff --git a/doc/documentation.md b/doc/documentation.md
@@ -68,11 +68,32 @@ do not already exist. If `FILEPATH` exists already, the contents are overwritten
 Write the MATLAB variable data (specified by DATA) to the path specified by `FILEPATH`.
 The size of `DATA` must match the size of the Zarr array specified during creation.
 
-## `DATA = zarrread(FILEPATH)`
-Retrieve all the data from the Zarr array located at `FILEPATH`.
+## `DATA = zarrread(FILEPATH, Name=Value)`
+Retrieve data from the Zarr array located at `FILEPATH`.
 The datatype of DATA is the MATLAB equivalent of the Zarr datatype of the array
 located at `FILEPATH`.
 
+### Name-Value Pairs
+```
+Start    - a row vector of one-based indices of the first 
+           element to be read in each dimension. If you 
+           do not specify Start, then the function starts 
+           reading the dataset from the first index along 
+           each dimension.
+
+Count    - a row vector of the number of elements to
+           be read in each dimension. If you do not specify 
+           Count, then the function reads data until the end 
+           of each dimension.
+
+Stride   - a row vector of differences between indices along 
+           each dimension. A value of 1 accesses adjacent elements
+           in the corresponding dimension, a value of 2 accesses 
+           every other element in the corresponding dimension, and 
+           so on. If you do not specify Stride, then the function 
+           reads data without skipping indices along each dimension.
+```
+
 ## `INFO = zarrinfo(FILEPATH)`
 Read the metadata associated with a Zarr array or group located at `FILEPATH` and return the information in a structure INFO, whose fields are the names of the metadata keys. 
 If `FILEPATH` is a Zarr array (has a valid `.zarray` file), the value of `node_type` is "array"; if `FILEPATH` is a Zarr group (has a valid `.zgroup` file), the value of the field `node_type` is "group".

diff --git a/doc/examples.md b/doc/examples.md
@@ -6,6 +6,18 @@ filepath = "group1\dset1";
 data = zarrread(filepath)
 ```
 
+### Read a subset of Zarr array
+Read a 2x2 subset of a 3x4 array, starting with the second element in the second dimension, and only reading every other element in the second dimension.
+``` MATLAB
+filepath = "grp_v2/smallArr";
+d = zarrread(filepath, Start=[1,2], Stride=[1,2], Count=[2,2])
+
+d =
+
+     4    10
+     5    11
+```
+
 ### Create and write to a Zarr array
 ``` MATLAB
 filepath   = "myZarrfiles\singleDset";

diff --git a/test/dataFiles/grp_v2/smallArr/.zarray b/test/dataFiles/grp_v2/smallArr/.zarray
@@ -0,0 +1 @@
+{"chunks":[3,4],"compressor":null,"dimension_separator":".","dtype":"<f8","fill_value":null,"filters":null,"order":"C","shape":[3,4],"zarr_format":2}
diff --git a/test/dataFiles/grp_v2/smallArr/0.0 b/test/dataFiles/grp_v2/smallArr/0.0
diff --git a/test/dataFiles/grp_v2/vectorData/.zarray b/test/dataFiles/grp_v2/vectorData/.zarray
@@ -0,0 +1 @@
+{"chunks":[1,10],"compressor":null,"dimension_separator":".","dtype":"<f8","fill_value":null,"filters":null,"order":"C","shape":[1,10],"zarr_format":2}
diff --git a/test/dataFiles/grp_v2/vectorData/0.0 b/test/dataFiles/grp_v2/vectorData/0.0
diff --git a/test/tZarrRead.m b/test/tZarrRead.m
@@ -7,6 +7,8 @@
         % Path for read functions
         GrpPathRead = "dataFiles/grp_v2"
         ArrPathRead = "dataFiles/grp_v2/arr_v2"
+        ArrPathReadSmall = "dataFiles/grp_v2/smallArr"
+        ArrPathReadVector = "dataFiles/grp_v2/vectorData"
         ArrPathReadV3 = "dataFiles/grp_v3/arr_v3"
 
         ExpData = load(fullfile(pwd,"dataFiles","expZarrArrData.mat"))
@@ -28,6 +30,54 @@ function verifyArrayData(testcase)
             testcase.verifyEqual(actArrData,expArrData,'Failed to verify array data.');
         end
 
+        function verifyPartialArrayData(testcase)
+            % Verify partial reads of a 3x4 array with zarrread using Start/Stride/Count.
+
+            % The full data in the small array is
+            % 
+            % 1    4    7   10
+            % 2    5    8   11
+            % 3    6    9   12
+            zpath = testcase.ArrPathReadSmall;
+
+            % Start only: rows 2-3 and columns 3-4 (reads to the end)
+            actData = zarrread(zpath, Start=[2, 3]);
+            expData = [8, 11; 9, 12];
+            testcase.verifyEqual(actData,expData,...
+                'Failed to verify reading with Start.');
+
+            % Count only: first 2 rows of the first column
+            actData = zarrread(zpath, Count=[2, 1]);
+            expData = [1;2];
+            testcase.verifyEqual(actData,expData,...
+                'Failed to verify reading with Count.');
+
+            % Stride only: every 3rd row and every 2nd column
+            actData = zarrread(zpath, Stride=[3, 2]);
+            expData = [1, 7];
+            testcase.verifyEqual(actData,expData,...
+                'Failed to verify reading with Stride.');
+
+            % Start, Stride, and Count combined: row 2, columns 1 and 3
+            actData = zarrread(zpath,...
+                Start=[2, 1], Stride=[1, 2], Count=[1, 2]);
+            expData = [2, 8];
+            testcase.verifyEqual(actData,expData,...
+                'Failed to verify reading with Start, Stride, and Count.');
+        end
+
+        function verifyPartialVectorData(testcase)
+            % Verify that specifying a scalar value for Start/Stride/Count
+            % for vector datasets works as expected
+
+            zpath = testcase.ArrPathReadVector; % data is 1:10
+
+            expData = [2,5]; % two elements, starting at element 2, step 3
+            actData = zarrread(zpath, Start=2, Stride=3, Count=2);
+            testcase.verifyEqual(actData,expData,...
+                'Failed to verify using scalar Start, Stride, and Count.');
+        end
+
         function verifyArrayDataRelativePath(testcase)
             % Verify array data if the input is using relative path to the
             % array.
@@ -83,5 +133,27 @@ function invalidFilePath(testcase)
             errID = 'MATLAB:Zarr:invalidZarrObject';
             testcase.verifyError(@()zarrread(inpPath),errID);
         end
+
+        function invalidPartialReadParams(testcase)
+            % Verify zarrread errors when invalid partial read
+            % Start/Stride/Count are used
+
+            zpath = testcase.ArrPathReadSmall; % a 2D array, 3x4
+
+            errID = 'MATLAB:Zarr:badPartialReadDimensions';
+            wrongNumberOfDimensions = [1,1,1]; % three values for a 2D array
+            testcase.verifyError(...
+                @()zarrread(zpath,Start=wrongNumberOfDimensions),...
+                errID);
+            testcase.verifyError(...
+                @()zarrread(zpath,Stride=wrongNumberOfDimensions),...
+                errID);
+            testcase.verifyError(...
+                @()zarrread(zpath,Count=wrongNumberOfDimensions),...
+                errID);
+
+            %TODO: negative values, wrong datatypes, out of bounds
+
+        end
     end
 end
diff --git a/zarrread.m b/zarrread.m
@@ -1,16 +1,37 @@
-function data = zarrread(filepath)
+function data = zarrread(filepath, options)
 %ZARRREAD Read data from Zarr array
 %   DATA = ZARRREAD(FILEPATH) retrieves all the data from the Zarr array
-%   located at FILEPATH.
-% The datatype of DATA is the MATLAB equivalent of the Zarr datatype of the
-% array located at FILEPATH.
+%   located at FILEPATH. The datatype of DATA is the MATLAB equivalent of 
+%   the Zarr datatype of the array located at FILEPATH.
+%
+%   DATA = ZARRREAD(..., Start=start) retrieves a subset of the data from
+%   the Zarr array. Specify start as a row vector of one-based indices of
+%   the first elements to be read in each dimension. If you do not specify
+%   start, then the function starts reading the dataset from the first
+%   index along each dimension.
+%
+%   DATA = ZARRREAD(..., Count=count) retrieves a subset of the data from
+%   the Zarr array. Specify count as a row vector of numbers of elements to
+%   be read in each dimension. If you do not specify count, then the
+%   function reads data until the end of each dimension.
+%
+%   DATA = ZARRREAD(..., Stride=stride) retrieves a subset of the data from
+%   the Zarr array. Specify stride as a row vector of differences between
+%   indices along each dimension. A value of 1 accesses adjacent elements
+%   in the corresponding dimension, a value of 2 accesses every other
+%   element in the corresponding dimension, and so on. If you do not
+%   specify stride, then the function reads data without skipping indices
+%   along each dimension.
 
 %   Copyright 2025 The MathWorks, Inc.
 
 arguments
     filepath {mustBeTextScalar, mustBeNonzeroLengthText}
+    options.Start (1,:) {mustBeInteger, mustBePositive} = []; % one-based first index per dimension
+    options.Count (1,:) {mustBeInteger, mustBePositive} = []; % number of elements per dimension
+    options.Stride (1,:) {mustBeInteger, mustBePositive} = []; % step between indices per dimension
 end
 
 zarrObj = Zarr(filepath);
-data = zarrObj.read;
+data = zarrObj.read(options.Start, options.Count, options.Stride); % note the order: start, count, stride
 end
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1 @@
		{"chunks":[3,4],"compressor":null,"dimension_separator":".","dtype":"<f8","fill_value":null,"filters":null,"order":"C","shape":[3,4],"zarr_format":2}
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1 @@
		{"chunks":[1,10],"compressor":null,"dimension_separator":".","dtype":"<f8","fill_value":null,"filters":null,"order":"C","shape":[1,10],"zarr_format":2}