CogStack · mart-r · Dec 2, 2025 · Dec 2, 2025 · Dec 2, 2025 · Dec 2, 2025
diff --git a/.github/workflows/medcat-v2_main.yml b/.github/workflows/medcat-v2_main.yml
@@ -11,7 +11,25 @@
   run:
     working-directory: ./medcat-v2
 jobs:
-  build:
+  base-install-imports:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v5
+      # NOTE: using oldest supported python version
+      - name: Install uv for Python 3.10
+        uses: astral-sh/setup-uv@v7
+        with:
+          # NOTE: must be quoted - an unquoted 3.10 is a YAML float, i.e. 3.1
+          python-version: "3.10"
+          enable-cache: true
+          cache-dependency-glob: "medcat-v2/uv.lock"
+      - name: Install the project
+        run: |
+          uv sync # NO extras
+      - name: Check that all packages / modules can be imported with default / no-extras install
+        run: |
+          uv run python tests/other/check_base_install_can_import_all.py medcat
+
+  types-lints-tests-regression:
@@ -1,4 +1,6 @@
 name: medcat-v2 - Test
+permissions:
+  contents: read
 on:
  push:
@@ -1,4 +1,6 @@
 name: medcat-v2 - Test
+permissions:
+  contents: read

 on:
  push:
     runs-on: ubuntu-latest
     strategy:
       matrix:

diff --git a/medcat-v2/medcat/utils/legacy/convert_meta_cat.py b/medcat-v2/medcat/utils/legacy/convert_meta_cat.py
@@ -3,8 +3,6 @@
 import json
 import logging
 
-import torch
-
 from medcat.components.addons.meta_cat import MetaCAT, MetaCATAddon
 from medcat.components.addons.meta_cat.mctokenizers.tokenizers import (
     TokenizerWrapperBase, load_tokenizer)
@@ -13,6 +11,13 @@
 
 from medcat.utils.legacy.helpers import fix_old_style_cnf
 
+# NOTE: this check must run before torch is imported, since the default
+#       (no-extras) install does not include torch
+from medcat.utils.import_utils import ensure_optional_extras_installed
+_EXTRA_NAME = "meta-cat"
+ensure_optional_extras_installed("medcat", _EXTRA_NAME)
+
+import torch  # noqa
+
 
 logger = logging.getLogger(__name__)
 

diff --git a/medcat-v2/medcat/utils/legacy/convert_rel_cat.py b/medcat-v2/medcat/utils/legacy/convert_rel_cat.py
@@ -2,8 +2,6 @@
 import json
 import logging
 
-import torch
-
 from medcat.cdb import CDB
 from medcat.components.addons.relation_extraction.rel_cat import (
     RelCAT, RelCATAddon)
@@ -13,6 +11,13 @@
 from medcat.tokenizing.tokenizers import BaseTokenizer, create_tokenizer
 from medcat.utils.legacy.helpers import fix_old_style_cnf
 
+# NOTE: this check must run before torch is imported, since the default
+#       (no-extras) install does not include torch
+from medcat.utils.import_utils import ensure_optional_extras_installed
+_EXTRA_NAME = "rel-cat"
+ensure_optional_extras_installed("medcat", _EXTRA_NAME)
+
+import torch  # noqa
+
 
 logger = logging.getLogger(__name__)
 

diff --git a/medcat-v2/pyproject.toml b/medcat-v2/pyproject.toml
@@ -65,6 +65,9 @@ dependencies = [ # Optional
   "xxhash>=3.5.0,<4.0",
   "pydantic>2.0",
   "typing-extensions",
+  "packaging",
+  "pyyaml",
+  "requests",
   # TODO - others
 ]
 

diff --git a/medcat-v2/tests/other/check_base_install_can_import_all.py b/medcat-v2/tests/other/check_base_install_can_import_all.py
@@ -0,0 +1,132 @@
+from typing import Iterable
+import os
+import subprocess
+import sys
+import re
+from collections import Counter
+
+# Captures the name of the optional dependency set (the text between the
+# single quotes) from a message of the form
+# "The optional dependency set '<name>' is missing"
+MISSING_DEP_PATTERN = re.compile(
+    r"The optional dependency set '([\w\-_]*)' is missing")
+
+
+def walk_packages(path: str,
+                  base_pkg_name: str,
+                  base_path: str = '') -> Iterable[str]:
+    """Yield the dotted name of every Python module found under ``path``.
+
+    Directories are walked recursively, except those whose name starts
+    or ends with a double underscore (e.g. ``__pycache__``). An
+    ``__init__.py`` file is yielded as the package it belongs to; every
+    other ``*.py`` file is yielded as ``<package>.<module>``.
+    Entries are visited in sorted order so that the result (and anything
+    printed based on it) is the same on every run.
+
+    Args:
+        path: Directory to scan.
+        base_pkg_name: Dotted name that corresponds to ``base_path``.
+        base_path: Root directory of the walk; defaults to ``path``.
+            Passed along by the recursion to build the dotted names.
+
+    Yields:
+        Dotted module / package names.
+    """
+    if not base_path:
+        base_path = path
+    # turn the path relative to the root into a dotted (sub)package name
+    pkg_path = path.removeprefix(base_path).replace(
+        os.path.sep, '.').strip(".")
+    pkg_to_here = f"{base_pkg_name}.{pkg_path}" if pkg_path else base_pkg_name
+    # NOTE: os.listdir returns entries in arbitrary order; sort so that
+    #       the order of the yielded modules is deterministic
+    for fn in sorted(os.listdir(path)):
+        cur_path = os.path.join(path, fn)
+        if os.path.isdir(cur_path) and (
+                not fn.startswith("__") and not fn.endswith("__")):
+            yield from walk_packages(cur_path, base_pkg_name=base_pkg_name,
+                                     base_path=base_path)
+            continue
+        if not fn.endswith(".py"):
+            continue
+        if fn == "__init__.py":
+            yield pkg_to_here
+            continue
+        yield f"{pkg_to_here}.{fn.removesuffix('.py')}"
+
+
+def find_all_modules(package_name, package_path=None):
+    """Find all importable modules in a package.
+
+    Args:
+        package_name: Dotted name of the package to inspect.
+        package_path: Optional list of directories for the package (same
+            shape as a package's ``__path__``); only its first entry is
+            walked. When ``None`` the package is imported to find it.
+
+    Returns:
+        A list of dotted module names, or an empty list if the package
+        could not be imported.
+    """
+    if package_path is None:
+        # NOTE: import_module returns the named (sub)package itself, whereas
+        #       __import__("a.b") returns the top-level package "a", which
+        #       would make the walk below start in the wrong directory
+        import importlib
+        try:
+            pkg = importlib.import_module(package_name)
+        except ImportError:
+            print(f"Could not import {package_name}")
+            return []
+        package_path = pkg.__path__
+
+    return list(walk_packages(package_path[0],
+                              base_pkg_name=package_name))
+
+
+def test_import(module_name):
+    """Test if a module can be imported in isolation.
+
+    The import is run in a separate interpreter process
+    (``sys.executable -c "import <module_name>"``).
+
+    Args:
+        module_name: Dotted name of the module to import.
+
+    Returns:
+        A ``(success, stderr)`` tuple; ``success`` is True when the child
+        process exits with code 0. If the import does not finish within
+        the timeout, ``success`` is False and the second item describes
+        the timeout.
+    """
+    code = f"import {module_name}"
+    try:
+        result = subprocess.run(
+            [sys.executable, "-c", code],
+            capture_output=True,
+            text=True,
+            timeout=30,
+        )
+    except subprocess.TimeoutExpired as exc:
+        # report a hanging import as a failure of this one module instead
+        # of aborting the whole run with an unhandled exception
+        return False, f"TimeoutExpired: import timed out after {exc.timeout}s"
+    return result.returncode == 0, result.stderr
+
+
+def get_missing_dep_set(error: str) -> str | None:
+    """Extract the name of a missing optional dependency set from an error.
+
+    Only the last line of ``error`` is inspected.
+
+    Args:
+        error: Error text, e.g. the stderr output of a failed import.
+
+    Returns:
+        The dependency-set name, or None if the last line does not
+        mention ``MissingDependenciesError``.
+
+    Raises:
+        ValueError: If the last line mentions ``MissingDependenciesError``
+            but does not contain exactly one match of MISSING_DEP_PATTERN.
+    """
+    # everything after the final newline, i.e. the last line of the output
+    last_line = error.strip().rpartition('\n')[2]
+    if "MissingDependenciesError" not in last_line:
+        return None
+    found = MISSING_DEP_PATTERN.findall(last_line)
+    if len(found) == 1:
+        return found[0]
+    raise ValueError(f"Unknown error:\n'{error}'\nLookin at:\n{last_line}"
+                     f"\ngot: {found}")
+
+
+def main():
+    """Try to import every module of the package named on the command line.
+
+    Each module is imported in its own subprocess and reported as
+    successful, missing an optional dependency set, or failed. A summary
+    is printed at the end.
+
+    Exits with status 1 if no package name was given, if no modules were
+    found, or if at least one import failed for a reason other than a
+    missing optional dependency set.
+    """
+    if len(sys.argv) < 2:
+        # NOTE: show the name this script was actually invoked with
+        script = (os.path.basename(sys.argv[0]) if sys.argv
+                  else "check_base_install_can_import_all.py")
+        print(f"Usage: python {script} <package_name>")
+        sys.exit(1)
+
+    package_name = sys.argv[1]
+
+    print(f"Finding all modules in {package_name}...")
+    modules = find_all_modules(package_name)
+
+    if not modules:
+        print(f"No modules found in {package_name}")
+        sys.exit(1)
+
+    print(f"Found {len(modules)} modules. Testing imports...\n")
+
+    successful = []
+    # (module, dependency set) pairs for explicitly declared missing extras
+    missing_opt_dep_expl = []
+    # (module, stderr) pairs for every other import failure
+    failed = []
+
+    for module in modules:
+        success, error = test_import(module)
+        if success:
+            successful.append(module)
+            print(f"✓ {module}")
+        elif (missing_dep := get_missing_dep_set(error)):
+            missing_opt_dep_expl.append((module, missing_dep))
+            print(f"M {module}: missing {missing_dep}")
+        else:
+            failed.append((module, error))
+            print(f"✗ {module}")
+            # Print the last line of the error output (where a traceback
+            # ends with the exception itself) for quick diagnosis
+            last_error_line = (
+                error.strip().split('\n')[-1] if error else "Unknown error")
+            print(f"  → {last_error_line}")
+
+    # Summary
+    print("\n" + "="*60)
+    # number of modules skipped per missing optional dependency set
+    per_opt_dep_missing = Counter(
+        missing_dep for _, missing_dep in missing_opt_dep_expl)
+    print(f"Results: {len(successful)} successful, "
+          f"{len(missing_opt_dep_expl)} missing optional deps "
+          f"({per_opt_dep_missing}), {len(failed)} failed")
+    print("="*60)
+
+    # only unexplained failures make the check fail
+    if failed:
+        print("\nFailed imports:")
+        for module, error in failed:
+            print(f"\n{module}:")
+            print(error)
+        sys.exit(1)
+
+
+if __name__ == "__main__":
+    main()