# Source code for wibench.algorithms.watermark_anything.wrapper

from wibench.algorithms.base import BaseAlgorithmWrapper
from wibench.watermark_data import TorchBitWatermarkData
from wibench.typing import TorchImg
from wibench.module_importer import ModuleImporter
import torch
import torch.nn.functional as F
from dataclasses import dataclass
import os
from wibench.download import requires_download


# Download source, algorithm identifier and required-file list; all three are
# passed to the ``requires_download`` decorator applied to the wrapper class.
URL = "https://nextcloud.ispras.ru/index.php/s/mkAqMgy4PY6yaMK"
# Also exposed as the wrapper's ``name`` class attribute.
NAME = "watermark_anything"
# NOTE(review): presumably the model checkpoint fetched from URL -- confirm
# against wibench.download.requires_download.
REQUIRED_FILES = ["wam_mit.pth"]


@dataclass
class WAParams:
    """Configuration parameters for the WA (Watermark Anything) watermarking algorithm.

    Attributes
    ----------
        wm_length : int
            Length of the watermark message to be embedded (in bits).
        scaling_w : float
            Scaling factor for the watermark in the embedder model.

    """
    wm_length: int
    scaling_w: float


@requires_download(URL, NAME, REQUIRED_FILES)
class WatermarkAnythingWrapper(BaseAlgorithmWrapper):
    """Watermark Anything with Localized Messages - Image Watermarking Algorithm [`paper <https://arxiv.org/abs/2411.07231>`__].

    Provides an interface for embedding and extracting watermarks using the Watermark Anything watermarking algorithm.
    Based on the code from `here <https://github.com/facebookresearch/watermark-anything>`__.

    Parameters
    ----------
    module_path : str
        Location of the Watermark Anything sources; handed to ``ModuleImporter``
        so that they can be imported under the name ``WAM``.
    ckpt_path : str
        Path to the model checkpoint. Must exist.
    params_path : str
        Path to the model parameters file passed to ``load_model_from_checkpoint``.
        Must exist.
    wm_length : int
        Length of the watermark message (in bits).
    scaling_w : float
        Scaling factor for the watermark; assigned to the loaded model's ``scaling_w``.
    device : str
        Torch device the model and inputs are moved to. Defaults to ``"cuda"``
        when available at import time, otherwise ``"cpu"``.

    Raises
    ------
    FileNotFoundError
        If ``ckpt_path`` or ``params_path`` does not exist.

    """

    name = NAME

    def __init__(
        self,
        module_path: str,
        ckpt_path: str,
        params_path: str,
        wm_length: int,
        scaling_w: float,
        device: str = "cuda" if torch.cuda.is_available() else "cpu",
    ):
        super().__init__(WAParams(wm_length=wm_length, scaling_w=scaling_w))
        with ModuleImporter("WAM", module_path):
            from WAM.notebooks.inference_utils import (
                load_model_from_checkpoint,
                normalize_img,
                unnormalize_img,
            )
            from WAM.watermark_anything.data.metrics import msg_predict_inference

        self.ckpt_path = ckpt_path
        self.params_path = params_path
        self.device = device
        # Fail early with a clear message instead of relying on the loader's
        # own handling of missing files.
        if not os.path.exists(ckpt_path):
            raise FileNotFoundError(f"{ckpt_path} does not exist")
        if not os.path.exists(params_path):
            raise FileNotFoundError(f"{params_path} does not exist")
        self.wam = load_model_from_checkpoint(
            self.params_path, self.ckpt_path
        ).to(device)
        # This wrapper only runs inference, so make sure train-time layer
        # behaviour (dropout, batch-norm statistics updates, ...) is disabled.
        self.wam.eval()
        self.wam.scaling_w = scaling_w
        self.transform = normalize_img
        self.msg_predict_inference = msg_predict_inference
        self.unnormalize_img = unnormalize_img

    def embed(self, image: TorchImg, watermark_data: TorchBitWatermarkData):
        """Embed watermark into input image.

        Parameters
        ----------
        image : TorchImg
            Input image tensor in (C, H, W) format
        watermark_data: TorchBitWatermarkData
            Torch bit message with data type torch.int64

        Returns
        -------
        torch.Tensor
            Watermarked image on the CPU with the batch axis removed and
            values clamped to [0, 1].

        """
        img = self.transform(image).unsqueeze(0).to(self.device)
        wm = watermark_data.watermark.to(self.device)
        with torch.no_grad():
            outputs = self.wam.embed(img, wm)
        # Remove only the batch axis added above; a bare ``squeeze()`` would
        # also collapse any other axis that happens to have size 1.
        marked = outputs["imgs_w"].cpu().squeeze(0)
        return torch.clamp(self.unnormalize_img(marked), 0, 1)

    def extract(self, image: TorchImg, watermark_data: TorchBitWatermarkData):
        """Extract watermark from marked image.

        Parameters
        ----------
        image : TorchImg
            Input image tensor in (C, H, W) format
        watermark_data: TorchBitWatermarkData
            Torch bit message with data type torch.int64. Not used by the
            extraction itself.

        Returns
        -------
        numpy.ndarray
            Predicted message as a float array with size-1 axes removed.

        """
        img = self.transform(image).unsqueeze(0).to(self.device)
        with torch.no_grad():
            preds = self.wam.detect(img)["preds"].cpu()
        # Channel 0 carries the mask logits (e.g. [1, 256, 256]); sigmoid
        # turns them into per-pixel scores.
        mask_preds = torch.sigmoid(preds[:, 0, :, :])
        # Remaining channels carry the per-pixel bit predictions
        # (e.g. [1, 32, 256, 256] for a 32-bit message).
        bit_preds = preds[:, 1:, :, :]
        pred_message = self.msg_predict_inference(
            bit_preds, mask_preds
        ).float()
        return pred_message.squeeze().numpy()

    def watermark_data_gen(self) -> TorchBitWatermarkData:
        """Generate watermark payload data for Watermark Anything watermarking algorithm.

        Returns
        -------
        TorchBitWatermarkData
            Random bit message produced by ``TorchBitWatermarkData.get_random``
            for ``wm_length`` bits (see that method for the exact dtype and shape).

        Notes
        -----
        - Called automatically during embedding

        """
        return TorchBitWatermarkData.get_random(self.params.wm_length)