diff --git a/.github/workflows/wheels.yml b/.github/workflows/wheels.yml index 05e6aacd..75b2f9cc 100644 --- a/.github/workflows/wheels.yml +++ b/.github/workflows/wheels.yml @@ -103,7 +103,7 @@ jobs: CIBW_REPAIR_WHEEL_COMMAND_MACOS: "" # do not run delocate-wheel before the re-tag CIBW_ENVIRONMENT: "MACOSX_DEPLOYMENT_TARGET=${{ matrix.os.min_macos_version }}.0" ARCHFLAGS: -arch x86_64 - BUILD_THREADS: "1" + BUILD_THREADS: "4" PYTORCH_MPS_HIGH_WATERMARK_RATIO: "0.0" run: | PY_CACHE_TAG=$(uv run python -c 'import sys;print(sys.implementation.cache_tag)') diff --git a/app/analyse.cpp b/app/analyse.cpp index 146b376d..804da9b7 100644 --- a/app/analyse.cpp +++ b/app/analyse.cpp @@ -295,6 +295,15 @@ int main(int argc, char* argv[]) else if (lvl == "error") { loguru::g_stderr_verbosity = loguru::Verbosity_ERROR; } } + // --- Initialize fonts like app/render.cpp --- + { + nlohmann::json data; + std::string resource_dir = resource_utils::get_resources_dir(false).string(); + data[pdflib::pdf_resource::RESOURCE_DIR_KEY] = resource_dir; + std::unordered_map font_timings; + pdflib::pdf_resource::initialise(data, font_timings); + } + if (not result.count("input")) { LOG_S(ERROR) << "-i/--input is required"; diff --git a/tests/data_utils.py b/tests/data_utils.py index 0f04a865..69b45dd9 100644 --- a/tests/data_utils.py +++ b/tests/data_utils.py @@ -5,8 +5,7 @@ from huggingface_hub import snapshot_download HF_DATASET_REPO_ID = "docling-project/regression-dataset-for-docling-parse" -# HF_DATASET_REVISION = "5d7c3d7b575397ca5b2a943171b0da4fe08c5a5b" -HF_DATASET_REVISION = "9a3713bd2e7b5b55ad9dde9d85953a0f5eb5150e" +HF_DATASET_REVISION = "38d690fdbc01b9537f0cddff5b00dce179a768fd" TESTS_DIR = Path(__file__).resolve().parent TEST_DATA_DIR = TESTS_DIR / "data"