diff --git a/README.md b/README.md index d2358aa76b..cec8b6e711 100644 --- a/README.md +++ b/README.md @@ -18,7 +18,7 @@ to find, contextualize, and extract text, tables, charts and infographics that y > [!Note] > NeMo Retriever extraction is also known as NVIDIA Ingest and nv-ingest. -NeMo Retriever Library enables parallelization of splitting documents into pages where artifacts are classified (such as text, tables, charts, and infographics), extracted, and further contextualized through optical character recognition (OCR) into a well defined JSON schema. From there, NeMo Retriever Library manages computaiton of embeddings for the extracted content as well as storing them in a vector database [Milvus](https://milvus.io/). +NeMo Retriever Library enables parallelization of splitting documents into pages where artifacts are classified (such as text, tables, charts, and infographics), extracted, and further contextualized through optical character recognition (OCR) into a well-defined JSON schema. From there, NeMo Retriever Library manages computation of embeddings for the extracted content as well as storing them in a vector database [Milvus](https://milvus.io/). The following diagram shows the NeMo Retriever Library pipeline. diff --git a/tests/integration/conftest.py b/tests/integration/conftest.py index 993d189a0b..3c66601a78 100644 --- a/tests/integration/conftest.py +++ b/tests/integration/conftest.py @@ -18,6 +18,11 @@ def _wait_for_port(host: str, port: int, timeout: float = 120.0, interval: float Wait until a TCP port on a host is accepting connections or raise TimeoutError. This makes the tests robust against pipeline warm-up variability. """ + if timeout <= 0: + raise ValueError(f"timeout must be positive, got {timeout}") + if interval <= 0: + raise ValueError(f"interval must be positive, got {interval}") + deadline = time.time() + timeout last_err: Exception | None = None while time.time() < deadline: