From acef9e21e19de4de9e14201e0e4431f54e9ec0b5 Mon Sep 17 00:00:00 2001 From: Christian Liebhardt Date: Thu, 13 Jun 2024 20:37:34 +0200 Subject: [PATCH] Denoised and contrast amplified variants --- homr/staff_parsing_tromr.py | 7 ++++++- homr/transformer/decoder.py | 2 +- 2 files changed, 7 insertions(+), 2 deletions(-) diff --git a/homr/staff_parsing_tromr.py b/homr/staff_parsing_tromr.py index 4174b29..c4d9fc8 100644 --- a/homr/staff_parsing_tromr.py +++ b/homr/staff_parsing_tromr.py @@ -30,7 +30,12 @@ def apply_clahe(staff_image: NDArray, clip_limit: float = 2.0, kernel_size: int def build_image_options(staff_image: NDArray) -> list[NDArray]: - return [staff_image] + denoised1 = cv2.fastNlMeansDenoisingColored(staff_image, None, 10, 10, 7, 21) + return [ + staff_image, + denoised1, + apply_clahe(denoised1), + ] def predict_best( diff --git a/homr/transformer/decoder.py b/homr/transformer/decoder.py index 9231e8b..1589379 100644 --- a/homr/transformer/decoder.py +++ b/homr/transformer/decoder.py @@ -242,7 +242,7 @@ def generate( # noqa: PLR0915 if is_eos == 0: break retry = merger.add_symbol(rhythm_token[0][0], pitch_token[0][0], lift_token[0][0]) - current_temperature *= 2 + current_temperature *= 3.5 attempt += 1 out_lift = torch.cat((out_lift, lift_sample), dim=-1)