From 2cef408cf799e37fc63313000efbcda2233bd563 Mon Sep 17 00:00:00 2001
From: Leonard Slass
Date: Tue, 25 Apr 2023 11:24:43 +0200
Subject: [PATCH 1/3] remove support for Tesseract 2

The configure-time check that probed for the tesseract namespace only
existed to detect Tesseract 2. Drop it and define
CONFIG_TESSERACT_NAMESPACE unconditionally.

---
Reviewer note: the set(CMAKE_REQUIRED_INCLUDES ...) call is removed here,
but the matching list(REMOVE_ITEM CMAKE_REQUIRED_INCLUDES ...) is kept as
context. Confirm whether it is still needed.

 CMakeModules/FindTesseract.cmake | 14 ++------------
 1 file changed, 2 insertions(+), 12 deletions(-)

diff --git a/CMakeModules/FindTesseract.cmake b/CMakeModules/FindTesseract.cmake
index 4b15d74..36cf0fb 100644
--- a/CMakeModules/FindTesseract.cmake
+++ b/CMakeModules/FindTesseract.cmake
@@ -43,18 +43,8 @@ if(TESSERACT_DATA_PATH)
   add_definitions(-DTESSERACT_DATA_PATH="${TESSERACT_DATA_PATH}")
 endif()
 
-set(CMAKE_REQUIRED_INCLUDES ${Tesseract_INCLUDE_DIR})
-check_cxx_source_compiles(
-  "#include \"tesseract/baseapi.h\"
-   using namespace tesseract;
-   int main() {
-   }"
-  TESSERACT_NAMESPACE)
-if(TESSERACT_NAMESPACE)
-  add_definitions("-DCONFIG_TESSERACT_NAMESPACE")
-else()
-  message(WARNING "You are using an old Tesseract version. Support for Tesseract 2 is deprecated and will be removed in the future!")
-endif()
+add_definitions("-DCONFIG_TESSERACT_NAMESPACE")
+
 list(REMOVE_ITEM CMAKE_REQUIRED_INCLUDES ${Tesseract_INCLUDE_DIR})
 
 if(BUILD_STATIC)

From eb452398c0473e467bf14dd8c8308d5af279a4f1 Mon Sep 17 00:00:00 2001
From: Leonard Slass
Date: Tue, 25 Apr 2023 11:25:09 +0200
Subject: [PATCH 2/3] add support for C++ 11

Request C++11 for every target and make the standard mandatory.

---
Reviewer note: CMAKE_CXX_STANDARD is only honoured by CMake 3.1 and
newer, while this file still declares
cmake_minimum_required(VERSION 2.6.4).

 CMakeLists.txt | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index d1954cb..f734306 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -2,6 +2,9 @@ project(vobsub2srt)
 
 cmake_minimum_required(VERSION 2.6.4 FATAL_ERROR)
 
+set(CMAKE_CXX_STANDARD 11)
+set(CMAKE_CXX_STANDARD_REQUIRED True)
+
 set(CMAKE_MODULE_PATH ${CMAKE_SOURCE_DIR}/CMakeModules)
 
 if(NOT CMAKE_BUILD_TYPE)

From 149b34b969a2b287f4df4044e4a1cb5dc6b52c3d Mon Sep 17 00:00:00 2001
From: Leonard Slass
Date: Tue, 25 Apr 2023 11:33:38 +0200
Subject: [PATCH 3/3] invert image for better recognition

Hand Tesseract an inverted copy of the subtitle bitmap (dark text on a
light background). The copy uses the same row pitch (stride) that is
passed to TesseractRect(), and a single buffer is reused so that the
copies do not accumulate on the heap.

---
Reviewer note: the reused buffer assumes nothing keeps the image pointer
after the OCR call for the current subtitle; verify against the rest of
main().

 src/vobsub2srt.c++ | 23 +++++++++++++++++++++++
 1 file changed, 23 insertions(+)

diff --git a/src/vobsub2srt.c++ b/src/vobsub2srt.c++
index 2f9e1a0..1d49006 100644
--- a/src/vobsub2srt.c++
+++ b/src/vobsub2srt.c++
@@ -269,6 +269,29 @@ int main(int argc, char **argv) {
         dump_pgm(subname, sub_counter, width, height, stride, image, image_size);
       }
 
+      // Tesseract 4.x recognizes dark text on a light background better, so
+      // pass it an inverted copy of the subtitle bitmap.
+      bool inverting_images = true;
+
+      if (inverting_images) {
+        const int rows = height, cols = width, pitch = stride;
+        // One buffer is kept across subtitles and the previous copy is released
+        // first, so the inverted images do not pile up on the heap.
+        static unsigned char *image_rev = 0;
+        delete[] image_rev;
+        // TesseractRect() is given stride as the row pitch, so the copy must
+        // use the same layout: pitch * rows bytes, not width * height.
+        image_rev = new unsigned char[pitch * rows]();
+        for (int y = 0; y < rows; y++) {
+          for (int x = 0; x < cols; x++) {
+            const int i = y * pitch + x;
+            image_rev[i] = static_cast<unsigned char>(255 - image[i]);
+          }
+        }
+
+        image = image_rev;
+      }
+
 #ifdef CONFIG_TESSERACT_NAMESPACE
       char *text = tess_base_api.TesseractRect(image, 1, stride, 0, 0, width, height);
 #else