mirror of
https://github.com/wiltodelta/remove-ai-watermarks.git
synced 2026-07-05 07:57:50 +02:00
0f54c6b54d
Bright-background photos/renders and a tiny app icon were flagged as AI-generated by the visible detectors. Two failure modes: - Gemini sparkle on a bright background (snow+sky photo, white product render) scored ~0.51. The FP gate only demoted on a low core-ring brightness margin, which a bright background makes high. Add a gradient floor (_SPARKLE_FP_GRAD 0.55): a real sparkle is a crisp star (grad ~0.97-1.0), a smooth luminance blob that NCC-matches the diamond is not (the two FPs measured grad 0.105 / 0.463). The OR is a strict superset of the old margin-only demotion, so it cannot regress dark/mid (kept by margin) or white-bg (kept by confidence) real sparkles. - A 48x48 geometric icon matched the Doubao/Jimeng CJK silhouette at 0.41/0.47 NCC. Purely a small-size artifact (the same icon at >=256px collapses to ~0.06-0.10). Guard text-mark detection below a 200px short side (_MIN_DETECT_SHORT_SIDE); real marks ship on full-resolution renders (smallest captured sample 1086px). Corpus re-sweep flips only OpenAI content and already-cleaned outputs, all sub-0.5, so no provenance verdict changes. Add synthetic regression fixtures for both modes; docs/module-internals.md updated. Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
232 lines
10 KiB
Python
232 lines
10 KiB
Python
"""Tests for the Doubao visible-watermark engine (reverse-alpha only)."""
|
|
|
|
from __future__ import annotations
|
|
|
|
from pathlib import Path
|
|
|
|
import cv2
|
|
import numpy as np
|
|
import pytest
|
|
|
|
from remove_ai_watermarks.doubao_engine import (
|
|
_ALPHA_HEIGHT_FRAC,
|
|
_ALPHA_LOGO_BGR,
|
|
_ALPHA_MARGIN_BOTTOM_FRAC,
|
|
_ALPHA_MARGIN_RIGHT_FRAC,
|
|
_ALPHA_NATIVE_WIDTH,
|
|
_ALPHA_WIDTH_FRAC,
|
|
DETECT_NCC_THRESHOLD,
|
|
DoubaoEngine,
|
|
_alpha_template,
|
|
_glyph_silhouette,
|
|
_template_match_score,
|
|
load_image_bgr,
|
|
)
|
|
|
|
SAMPLE = Path(__file__).resolve().parents[1] / "data" / "samples" / "doubao-1.png"
|
|
|
|
|
|
class TestLocate:
|
|
def test_box_anchored_bottom_right(self):
|
|
eng = DoubaoEngine()
|
|
img = np.zeros((2048, 2048, 3), np.uint8)
|
|
loc = eng.locate(img)
|
|
assert 2048 - (loc.x + loc.w) < int(2048 * 0.03)
|
|
assert 2048 - (loc.y + loc.h) < int(2048 * 0.03)
|
|
|
|
def test_box_scales_with_width(self):
|
|
eng = DoubaoEngine()
|
|
small = eng.locate(np.zeros((1024, 1024, 3), np.uint8))
|
|
large = eng.locate(np.zeros((2048, 2048, 3), np.uint8))
|
|
assert large.w == pytest.approx(small.w * 2, rel=0.1)
|
|
|
|
|
|
# ── Detection: alpha-template NCC ───────────────────────────────────
|
|
|
|
|
|
class TestDetect:
|
|
def test_clean_gradient_not_detected(self):
|
|
eng = DoubaoEngine()
|
|
ramp = np.tile(np.linspace(0, 255, 1024, dtype=np.uint8), (1024, 1))
|
|
img = cv2.cvtColor(ramp, cv2.COLOR_GRAY2BGR)
|
|
assert not eng.detect(img).detected
|
|
|
|
def test_solid_blob_corner_not_detected(self):
|
|
"""A bright blob is not the glyph shape -> low correlation, not detected."""
|
|
eng = DoubaoEngine()
|
|
img = np.zeros((1024, 1024, 3), np.uint8)
|
|
x, y, bw, bh = eng.locate(img).bbox
|
|
img[y + bh // 4 : y + bh * 3 // 4, x : x + bw // 2] = 200
|
|
assert not eng.detect(img).detected
|
|
|
|
def test_silhouette_loads(self):
|
|
sil = _glyph_silhouette()
|
|
assert sil is not None
|
|
assert set(np.unique(sil)).issubset({0, 255})
|
|
|
|
def test_match_score_shape_sensitive(self):
|
|
"""The glyph silhouette correlates with itself, not with a filled block."""
|
|
sil = _glyph_silhouette()
|
|
h, w = sil.shape
|
|
# box that contains the silhouette -> high score
|
|
box = np.zeros((h + 8, int(w / _ALPHA_WIDTH_FRAC * 0.2) + w), np.uint8)
|
|
box[4 : 4 + h, 4 : 4 + w] = sil
|
|
assert _template_match_score(box, _ALPHA_NATIVE_WIDTH) >= DETECT_NCC_THRESHOLD
|
|
# a uniformly filled box has no glyph structure -> low score
|
|
solid = np.full_like(box, 255)
|
|
assert _template_match_score(solid, _ALPHA_NATIVE_WIDTH) < DETECT_NCC_THRESHOLD
|
|
|
|
def test_small_image_guarded_from_false_positive(self):
|
|
"""Below the minimum short side a tiny geometric shape spuriously NCC-matches
|
|
the CJK silhouette (2026-06-26 FP: a 48x48 app-icon chevron scored 0.41). The
|
|
size guard suppresses detection there. Bracket it: a real mark is detected at
|
|
native size, but the same content downscaled below the guard is not."""
|
|
w = h = _ALPHA_NATIVE_WIDTH
|
|
at = _alpha_template()
|
|
gw, gh = int(_ALPHA_WIDTH_FRAC * w), int(_ALPHA_HEIGHT_FRAC * w)
|
|
ax = w - int(_ALPHA_MARGIN_RIGHT_FRAC * w) - gw
|
|
ay = h - int(_ALPHA_MARGIN_BOTTOM_FRAC * w) - gh
|
|
amap = np.zeros((h, w), np.float32)
|
|
amap[ay : ay + gh, ax : ax + gw] = cv2.resize(at, (gw, gh))
|
|
a3 = amap[:, :, None]
|
|
wm = (a3 * np.array(_ALPHA_LOGO_BGR, np.float32) + (1 - a3) * 100.0).clip(0, 255).astype(np.uint8)
|
|
eng = DoubaoEngine()
|
|
assert eng.detect(wm).detected # native: real mark detected
|
|
assert not eng.detect(cv2.resize(wm, (150, 150))).detected # below guard: suppressed
|
|
|
|
|
|
@pytest.mark.skipif(not SAMPLE.exists(), reason="sample image not present")
|
|
class TestRealSample:
|
|
def test_detects_watermark(self):
|
|
det = DoubaoEngine().detect(load_image_bgr(SAMPLE))
|
|
assert det.detected
|
|
assert det.confidence >= DETECT_NCC_THRESHOLD
|
|
|
|
def test_reverse_alpha_removes_mark(self):
|
|
eng = DoubaoEngine()
|
|
img = load_image_bgr(SAMPLE)
|
|
assert eng.reverse_alpha_available(img) # sample is at the captured width
|
|
out = eng.remove_watermark_reverse_alpha(img)
|
|
assert not eng.detect(out).detected # mark gone after recovery
|
|
|
|
def test_far_region_untouched(self):
|
|
eng = DoubaoEngine()
|
|
img = load_image_bgr(SAMPLE)
|
|
out = eng.remove_watermark_reverse_alpha(img)
|
|
h, w = img.shape[:2]
|
|
assert np.array_equal(img[: h // 2, : w // 2], out[: h // 2, : w // 2])
|
|
|
|
|
|
# ── Reverse-alpha (exact recovery) ──────────────────────────────────
|
|
|
|
|
|
class TestReverseAlpha:
|
|
def test_alpha_asset_loads(self):
|
|
at = _alpha_template()
|
|
assert at is not None
|
|
assert at.dtype.kind == "f"
|
|
assert float(at.min()) >= 0.0
|
|
assert float(at.max()) <= 1.0
|
|
|
|
def test_available_whenever_asset_present(self):
|
|
# NCC alignment generalizes to any resolution, so availability is just
|
|
# "asset loadable" (any non-empty image); the caller gates on detect.
|
|
eng = DoubaoEngine()
|
|
assert eng.reverse_alpha_available(np.zeros((1024, 1024, 3), np.uint8))
|
|
assert eng.reverse_alpha_available(np.zeros((1773, 1535, 3), np.uint8))
|
|
assert not eng.reverse_alpha_available(np.zeros((0, 0, 3), np.uint8))
|
|
|
|
@staticmethod
|
|
def _compose(w: int, h: int, bg: float = 100.0):
|
|
"""Composite the real alpha (scaled to width ``w``) onto a flat bg.
|
|
Returns ``(watermarked_uint8, mark_bool_mask)``."""
|
|
img = np.full((h, w, 3), bg, np.float32)
|
|
at = _alpha_template()
|
|
gw, gh = int(_ALPHA_WIDTH_FRAC * w), int(_ALPHA_HEIGHT_FRAC * w)
|
|
ax = w - int(_ALPHA_MARGIN_RIGHT_FRAC * w) - gw
|
|
ay = h - int(_ALPHA_MARGIN_BOTTOM_FRAC * w) - gh
|
|
amap = np.zeros((h, w), np.float32)
|
|
amap[ay : ay + gh, ax : ax + gw] = cv2.resize(at, (gw, gh))
|
|
a3 = amap[:, :, None]
|
|
wm = (a3 * np.array(_ALPHA_LOGO_BGR, np.float32) + (1 - a3) * img).clip(0, 255).astype(np.uint8)
|
|
return wm, amap > 0.2
|
|
|
|
def test_removes_synthetic_mark(self):
|
|
"""Reverse-alpha + thin residual inpaint clears a mark composed from the
|
|
real alpha (re-detect no longer fires)."""
|
|
eng = DoubaoEngine()
|
|
wm, _mark = self._compose(_ALPHA_NATIVE_WIDTH, _ALPHA_NATIVE_WIDTH)
|
|
assert eng.detect(wm).detected
|
|
out = eng.remove_watermark_reverse_alpha(wm)
|
|
assert not eng.detect(out).detected
|
|
|
|
@pytest.mark.parametrize(
|
|
("w", "h", "max_err"),
|
|
[
|
|
(_ALPHA_NATIVE_WIDTH, _ALPHA_NATIVE_WIDTH, 5.0), # captured width
|
|
(1773, 2364, 8.0), # 3:4 portrait -> NCC alignment generalizes the single capture
|
|
],
|
|
)
|
|
def test_recovers_flat_background(self, w, h, max_err):
|
|
"""Recovers the flat background at the captured width AND a non-native
|
|
resolution (NCC alignment generalizes the single capture)."""
|
|
eng = DoubaoEngine()
|
|
wm, mark = self._compose(w, h)
|
|
assert float(np.abs(wm.astype(np.float32)[mark] - 100.0).mean()) > 15 # mark visible
|
|
out = eng.remove_watermark_reverse_alpha(wm).astype(np.float32)
|
|
assert float(np.abs(out[mark] - 100.0).mean()) < max_err
|
|
|
|
@staticmethod
|
|
def _textured_bg(w: int, h: int):
|
|
yy, xx = np.mgrid[0:h, 0:w].astype(np.float32)
|
|
base = 120 + 40 * np.sin(xx / 90.0) + 30 * np.cos(yy / 70.0)
|
|
return np.clip(np.stack([base, base * 0.95, base * 1.05], axis=-1), 0, 255)
|
|
|
|
def test_recovers_shifted_mark_on_texture(self):
|
|
"""A real mark is re-rasterized a few px off its fixed slot, so removal
|
|
must NCC-align to it. Regression guard for the issue-#13 follow-up defect:
|
|
a too-tight locate box let a corner-ward shift fall outside the alignment
|
|
search, leaving a readable outline that the detector did not flag. Composes
|
|
the real alpha SHIFTED on a known texture and asserts the texture is
|
|
recovered (a misaligned removal would leave the bright glyph outline)."""
|
|
eng = DoubaoEngine()
|
|
w = h = _ALPHA_NATIVE_WIDTH
|
|
at = _alpha_template()
|
|
gw, gh = int(_ALPHA_WIDTH_FRAC * w), int(_ALPHA_HEIGHT_FRAC * w)
|
|
ax = w - int(_ALPHA_MARGIN_RIGHT_FRAC * w) - gw + 12 # shift toward the corner
|
|
ay = h - int(_ALPHA_MARGIN_BOTTOM_FRAC * w) - gh + 8
|
|
amap = np.zeros((h, w), np.float32)
|
|
amap[ay : ay + gh, ax : ax + gw] = cv2.resize(at, (gw, gh))
|
|
a3 = amap[:, :, None]
|
|
bg = self._textured_bg(w, h)
|
|
wm = (a3 * np.array(_ALPHA_LOGO_BGR, np.float32) + (1 - a3) * bg).clip(0, 255).astype(np.uint8)
|
|
mark = amap > 0.15
|
|
assert float(np.abs(wm.astype(np.float32)[mark] - bg[mark]).mean()) > 30 # mark clearly visible
|
|
out = eng.remove_watermark_reverse_alpha(wm).astype(np.float32)
|
|
assert float(np.abs(out[mark] - bg[mark]).mean()) < 8.0 # texture recovered, no outline
|
|
|
|
|
|
class TestDegenerateAndChannelInputs:
|
|
"""Removal must not crash on degenerate sizes or non-3-channel inputs."""
|
|
|
|
@pytest.mark.parametrize(("w", "h"), [(2048, 1), (1, 2048), (2048, 8)])
|
|
def test_wide_short_does_not_raise(self, w, h):
|
|
"""A wide/short image at native width makes the width-derived glyph box
|
|
taller than the image; the slice assignment must not ValueError."""
|
|
eng = DoubaoEngine()
|
|
img = np.zeros((h, w, 3), np.uint8)
|
|
out = eng.remove_watermark_reverse_alpha(img)
|
|
assert out.shape == img.shape
|
|
|
|
def test_grayscale_2d_does_not_raise(self):
|
|
eng = DoubaoEngine()
|
|
gray = np.zeros((2048, 2048), np.uint8)
|
|
out = eng.remove_watermark_reverse_alpha(gray)
|
|
assert out.shape == (2048, 2048, 3)
|
|
|
|
def test_bgra_4channel_does_not_raise(self):
|
|
eng = DoubaoEngine()
|
|
bgra = np.zeros((2048, 2048, 4), np.uint8)
|
|
out = eng.remove_watermark_reverse_alpha(bgra)
|
|
assert out.shape == (2048, 2048, 3)
|