rymuelle · rymuelle · Jan 14, 2026 · Dec 16, 2025 · Dec 16, 2025 · Dec 16, 2025
diff --git a/examples/simple_demosaicing_RawHandlerRawpy.ipynb b/examples/simple_demosaicing_RawHandlerRawpy.ipynb
diff --git a/pyproject.toml b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "RawHandler" 
-version = "0.0.3"
+version = "0.1.0"
 description = "A basic library to handle camera raw files for use in machine learning. Built on rawpy and cv2."
 authors = [
     { name = "Ryan Mueller"},
@@ -19,6 +19,8 @@ dependencies = [
     "rawpy>=0.24.0",
     "colour_demosaicing>=0.2.6",
     "exifread>=3.3.1",
+    "exiv2",
+    "tifffile>=2024.0.0",
     ]
 
 [project.optional-dependencies]

diff --git a/src/RawHandler/MetaDataHandler.py b/src/RawHandler/MetaDataHandler.py
@@ -0,0 +1,35 @@
+import exiv2
+
+
+class MetaDataHandler:
+    def __init__(self, path: str):
+        self.metadata = exiv2.ImageFactory.open(path)
+        self.metadata.readMetadata()
+
+    def get_ISO(self):
+        return get_ISO(self.metadata)
+
+
+def get_ISO(metadata):
+    search_tags = [
+        "Exif.Photo.RecommendedExposureIndex",
+        "Exif.Photo.StandardOutputSensitivity",
+        "Exif.NikonIi.ISO",
+        "Exif.Nikon3.ISOSpeed",
+        "Exif.Nikon3.ISOSettings",
+        "Exif.Photo.ISOSpeedRatings",
+        "Exif.Image.ISOSpeedRatings",
+    ]
+
+    exif = metadata.exifData()
+
+    for tag in search_tags:
+        if tag in exif:
+            try:
+                val = exif[tag].print()
+                if val and val != 65535:
+                    return float(val)
+            except Exception as e:
+                print(e)
+                val = -1
+    return val
diff --git a/src/RawHandler/RawHandlerRawpy.py b/src/RawHandler/RawHandlerRawpy.py
@@ -0,0 +1,266 @@
+import numpy as np
+import rawpy
+from typing import NamedTuple, Optional
+from RawHandler.utils import sparse_representation_three_channel
+from RawHandler.MetaDataHandler import MetaDataHandler
+from RawHandler.dng_utils import to_dng
+from typing import Literal, Tuple
+
+from RawHandler.utils import (
+    make_colorspace_matrix,
+    pixel_unshuffle,
+    sparse_representation_and_mask,
+)
+
+
+# Define a NamedTuple for the core metadata required by BaseRawHandler for processing
+class CoreRawMetadata(NamedTuple):
+    black_level_per_channel: np.ndarray
+    white_level: int
+    rgb_xyz_matrix: np.ndarray
+    raw_pattern: np.ndarray
+    camera_white_balance: np.ndarray
+    iheight: int
+    iwidth: int
+
+
+class BaseRawHandlerRawpy:
+    """
+    Base class for handling raw image pixel data.
+
+    Args:
+        pixel_array (np.array): A 2D NumPy array representing the raw pixel data.
+        core_metadata (CoreRawMetadata): A NamedTuple containing essential metadata for processing.
+        full_metadata (Optional[FullRawMetadata]): A class wrapping exiv2 to handle metadata information.
+    """
+
+    def __init__(
+        self,
+        rawpy_object: rawpy.RawPy,
+        core_metadata: CoreRawMetadata,
+        full_metadata: Optional[dict] = None,
+        colorspace: Literal[
+            "camera", "XYZ", "sRGB", "AdobeRGB", "lin_rec2020"
+        ] = "lin_rec2020",
+    ):
+        if not isinstance(core_metadata, CoreRawMetadata):
+            raise TypeError("core_metadata must be an instance of CoreRawMetadata.")
+
+        self.rawpy_object = rawpy_object
+        self.core_metadata = core_metadata
+        self.full_metadata = full_metadata if full_metadata is not None else None
+        self.colorspace = colorspace
+        self.camera_linear = None
+
+    def compute_linear(self):
+        self.camera_linear = (
+            self.rawpy_object.postprocess(
+                user_wb=[1, 1, 1, 1],
+                output_color=rawpy.ColorSpace.raw,
+                no_auto_bright=True,
+                use_camera_wb=False,
+                use_auto_wb=False,
+                gamma=(1, 1),
+                user_flip=0,
+                output_bps=16,
+                user_black=0,
+                no_auto_scale=True,
+            )
+            / self.core_metadata.white_level
+        ).transpose(2, 0, 1)
+
+    # orig_dims = camera_linear.shape
+    # rgb_to_xyz = self.core_metadata.rgb_xyz_matrix[:3]
+    # camera_linear = (rgb_to_xyz @ camera_linear.reshape(3, -1)).reshape(orig_dims)
+    # self.camera_linear = camera_linear
+
+    def _input_handler(self, dims=None, safe_crop=0) -> np.ndarray:
+        """
+        Crops linear array.
+        """
+        if self.camera_linear is None:
+            self.compute_linear()
+        if dims is not None:
+            h1, h2, w1, w2 = dims
+            if safe_crop:
+                h1, h2, w1, w2 = list(
+                    map(lambda x: x - x % safe_crop, [h1, h2, w1, w2])
+                )
+            return self.camera_linear[:, h1:h2, w1:w2]
+        else:
+            return self.camera_linear
+
+    def rgb_colorspace_transform(self, colorspace=None, **kwargs) -> np.ndarray:
+        """
+        Generates a color space transformation matrix for this image.
+        """
+        colorspace = colorspace or self.colorspace
+        if colorspace == "camera":
+            return np.array(
+                [
+                    [1.0, 0.0, 0.0],
+                    [0.0, 1.0, 0.0],
+                    [0.0, 0.0, 1.0],
+                ]
+            )
+        rgb_to_xyz = np.linalg.inv(self.core_metadata.rgb_xyz_matrix[:3])
+        if colorspace == "XYZ":
+            return rgb_to_xyz
+
+        transform = make_colorspace_matrix(rgb_to_xyz, colorspace=colorspace, **kwargs)
+        return transform
+
+    def apply_colorspace_transform(
+        self,
+        dims=None,
+        safe_crop=0,
+        xyz_to_colorspace: np.ndarray = None,
+        colorspace=None,
+        clip=False,
+    ) -> np.ndarray:
+        """
+        Converts or returns linear data converted into specified colorspace.
+        """
+        camera_linear = self._input_handler(dims=dims, safe_crop=safe_crop)
+        rgb_transform = self.rgb_colorspace_transform(
+            colorspace=colorspace, xyz_to_colorspace=xyz_to_colorspace
+        )
+        orig_dims = camera_linear.shape
+        transformed = (rgb_transform @ camera_linear.reshape(3, -1)).reshape(orig_dims)
+        if clip:
+            transformed = np.clip(transformed, 0, 1)
+        return transformed
+
+    def compute_mask_and_sparse(
+        self, dims=None, safe_crop=0, divide_by_wl=True
+    ) -> Tuple[np.ndarray, np.ndarray]:
+        sparse, mask = sparse_representation_and_mask(
+            self.rawpy_object.raw_image_visible, self.core_metadata.raw_pattern
+        )
+        if divide_by_wl:
+            sparse = sparse / self.core_metadata.white_level
+        if dims is not None:
+            h1, h2, w1, w2 = dims
+            if safe_crop:
+                h1, h2, w1, w2 = list(
+                    map(lambda x: x - x % safe_crop, [h1, h2, w1, w2])
+                )
+            return sparse[:, h1:h2, w1:w2], mask[:, h1:h2, w1:w2]
+        else:
+            return sparse, mask
+
+    def downsize(
+        self, min_preview_size=256, colorspace=None, clip=False, safe_crop=0
+    ) -> np.ndarray:
+        _, H, W = self.camera_linear.shape
+        W_steps, H_steps = H // min_preview_size - 1, W // min_preview_size - 1
+        steps = min(W_steps, H_steps)
+        c_first_linear = self.apply_colorspace_transform(
+            colorspace=colorspace, clip=clip, safe_crop=safe_crop
+        )[0]
+        c_first_linear = c_first_linear[:, ::steps, ::steps]
+        return c_first_linear
+
+    def generate_thumbnail(
+        self,
+        min_preview_size=256,
+        colorspace=None,
+        clip=False,
+        safe_crop=0,
+    ) -> np.ndarray:
+        c_first_linear = self.downsize(
+            min_preview_size=min_preview_size,
+            colorspace=colorspace,
+            clip=clip,
+            safe_crop=safe_crop,
+        )
+        return c_first_linear
+
+    def as_rgb(
+        self,
+        colorspace=None,
+        dims=None,
+        clip=False,
+        safe_crop=0,
+    ) -> np.ndarray:
+        c_first_linear = self.apply_colorspace_transform(
+            colorspace=colorspace, dims=dims, safe_crop=safe_crop
+        )
+        if clip:
+            c_first_linear = np.clip(c_first_linear, 0, 1)
+        return c_first_linear
+
+    def as_sparse(
+        self,
+        colorspace=None,
+        dims=None,
+        clip=False,
+        safe_crop=0,
+        pattern="RGGB",
+        cfa_type="bayer",
+    ) -> np.ndarray:
+        c_first_linear = self.apply_colorspace_transform(
+            colorspace=colorspace, dims=dims, safe_crop=safe_crop
+        )
+        sparse = sparse_representation_three_channel(
+            c_first_linear, pattern=pattern, cfa_type=cfa_type
+        )
+        if clip:
+            sparse = np.clip(sparse, 0, 1)
+        return sparse
+
+    def as_cfa(self, **kwargs) -> np.ndarray:
+        sparse = self.as_sparse(**kwargs)
+        return sparse.sum(axis=0, keepdims=True)
+
+    def as_rggb(self, cfa_type="bayer", **kwargs) -> np.ndarray:
+        cfa = self.as_CFA(**kwargs)
+        if cfa_type == "bayer":
+            rggb = pixel_unshuffle(cfa, 2)
+        else:
+            rggb = pixel_unshuffle(cfa, 6)
+        return rggb
+
+    def to_dng(self, filepath, uint_img=None):
+        try:
+            to_dng(self, filepath, uint_img=uint_img)
+            return True
+        except Exception as e:
+            print(e)
+            return False
+
+
+class RawHandlerRawpy:
+    """
+    Factory class to create BaseRawHandlerRawpy instances from raw image files.
+    This class handles rawpy specific parsing for pixel data and core metadata,
+    and uses exifread for extracting general EXIF metadata.
+
+    Args:
+        path (string): Path to raw file.
+    """
+
+    def __new__(cls, path: str, **kwargs):
+        # Use rawpy for raw pixel data and core processing metadata
+        rawpy_object = rawpy.imread(path)
+
+        # Extract Core Metadata for BaseRawHandler's processing logic
+        core_metadata = CoreRawMetadata(
+            black_level_per_channel=rawpy_object.black_level_per_channel,
+            white_level=rawpy_object.white_level,
+            rgb_xyz_matrix=rawpy_object.rgb_xyz_matrix,
+            raw_pattern=rawpy_object.raw_pattern,
+            camera_white_balance=np.array(rawpy_object.camera_whitebalance),
+            iheight=rawpy_object.sizes.iheight,
+            iwidth=rawpy_object.sizes.iwidth,
+        )
+
+        # Extract Metadata using exiv2
+        metadata = MetaDataHandler(path)
+
+        return BaseRawHandlerRawpy(
+            rawpy_object=rawpy_object,
+            core_metadata=core_metadata,
+            full_metadata=metadata,
+            **kwargs,
+        )