From e598e34d45a6a651174fff9788a9c642aeb8f5e2 Mon Sep 17 00:00:00 2001 From: tretrauit Date: Wed, 31 Jan 2024 23:37:36 +0700 Subject: [PATCH] fix(tesseract): add [oc] to regex generation --- swordfish/src/tesseract/utils.rs | 2 ++ 1 file changed, 2 insertions(+) diff --git a/swordfish/src/tesseract/utils.rs b/swordfish/src/tesseract/utils.rs index 38fbb64..657e9e5 100644 --- a/swordfish/src/tesseract/utils.rs +++ b/swordfish/src/tesseract/utils.rs @@ -168,6 +168,8 @@ pub fn regexify_text(text: &String) -> String { ascii_text.push_str("[ti]"); } else if ['I', 'l', '!', '1'].contains(&c) { ascii_text.push_str("[Il!1i]"); + } else if ['o', 'c'].contains(&c) { + ascii_text.push_str("[oc]"); } else if ['.'].contains(&c) { if prev_chars.len() > 3 { let prev_char = prev_chars[prev_chars.len() - 1];