From 7b2125b200c713b7fa656decfb6caf53a03e5342 Mon Sep 17 00:00:00 2001
From: Matt Robinson
Date: Wed, 22 May 2024 13:49:01 -0400
Subject: [PATCH] BREAKING CHANGE: remove legacy `detectron2` model; remove layoutparser extras (#350)

### Summary

First step in resolving https://github.com/Unstructured-IO/unstructured/issues/3051. Per [this comment](https://github.com/Unstructured-IO/unstructured/issues/3051#issuecomment-2123176161), we were having trouble running `unstructured` in the Python 3.12 `wolfi-base` container due to issues related to `pycocotools`, which is only used by the legacy `detectron2` model from `layoutparser`. Since we've replaced that model with `detectron2onnx`, this PR removes the `layoutparser` extra dependencies that caused issues with Python 3.12. The `layoutparser` base dependency is still required because we use layout objects from that library; it's likely we could remove those objects (and the base dependency) in a future iteration. A short migration sketch for the ONNX replacement is included after the diff below.

Temporarily disabled the ingest tests because they appear to have been broken for the past six months. The last commit they passed on was [this one](https://github.com/Unstructured-IO/unstructured-inference/commit/0f0c2be07c673615217b214937f50a091676a8aa). Opened #352 to re-enable them.

### Testing

If CI passes, we should be good to go.

---
 .github/workflows/ci.yml                    |  86 ++++++++-------
 CHANGELOG.md                                |  15 ++-
 requirements/base.in                        |   5 +-
 requirements/base.txt                       |  62 ++++-------
 requirements/dev.txt                        |  41 ++++---
 requirements/test.txt                       |  24 ++--
 .../inference/test_layout.py                |   6 +-
 .../models/test_detectron2.py               |  50 ---------
 .../models/test_model.py                    |  10 +-
 unstructured_inference/__version__.py       |   2 +-
 unstructured_inference/models/base.py       |   4 -
 unstructured_inference/models/detectron2.py | 104 ------------------
 12 files changed, 121 insertions(+), 288 deletions(-)
 delete mode 100644 test_unstructured_inference/models/test_detectron2.py
 delete mode 100644 unstructured_inference/models/detectron2.py

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 5b81d852..57064918 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -104,48 +104,50 @@ jobs: CI=true make test make check-coverage - test_ingest: - strategy: - matrix: - python-version: ["3.9","3.10"] - runs-on: ubuntu-latest - env: - NLTK_DATA: ${{ github.workspace }}/nltk_data - needs: lint - steps: - - name: Checkout unstructured repo for integration testing - uses: actions/checkout@v4 - with: - repository: 'Unstructured-IO/unstructured' - - name: Checkout this repo - uses: actions/checkout@v4 - with: - path: inference - - name: Set up Python ${{ matrix.python-version }} - uses: actions/setup-python@v4 - with: - python-version: ${{ matrix.python-version }} - - name: Test - env: - GH_READ_ONLY_ACCESS_TOKEN: ${{ secrets.GH_READ_ONLY_ACCESS_TOKEN }} - SLACK_TOKEN: ${{ secrets.SLACK_TOKEN }} - DISCORD_TOKEN: ${{ secrets.DISCORD_TOKEN }} - run: | - python${{ matrix.python-version }} -m venv .venv - source .venv/bin/activate - [ ! -d "$NLTK_DATA" ] && mkdir "$NLTK_DATA" - make install-ci - pip install -e inference/ - sudo apt-get update - sudo apt-get install -y libmagic-dev poppler-utils libreoffice pandoc - sudo add-apt-repository -y ppa:alex-p/tesseract-ocr5 - sudo apt-get install -y tesseract-ocr - sudo apt-get install -y tesseract-ocr-kor - sudo apt-get install -y diffstat - tesseract --version - make install-all-ingest - # only run ingest tests that check expected output diffs.
- bash inference/scripts/test-unstructured-ingest-helper.sh + # NOTE(robinson) - disabling ingest tests for now, as of 5/22/2024 they seem to have been + # broken for the past six months + # test_ingest: + # strategy: + # matrix: + # python-version: ["3.9","3.10"] + # runs-on: ubuntu-latest + # env: + # NLTK_DATA: ${{ github.workspace }}/nltk_data + # needs: lint + # steps: + # - name: Checkout unstructured repo for integration testing + # uses: actions/checkout@v4 + # with: + # repository: 'Unstructured-IO/unstructured' + # - name: Checkout this repo + # uses: actions/checkout@v4 + # with: + # path: inference + # - name: Set up Python ${{ matrix.python-version }} + # uses: actions/setup-python@v4 + # with: + # python-version: ${{ matrix.python-version }} + # - name: Test + # env: + # GH_READ_ONLY_ACCESS_TOKEN: ${{ secrets.GH_READ_ONLY_ACCESS_TOKEN }} + # SLACK_TOKEN: ${{ secrets.SLACK_TOKEN }} + # DISCORD_TOKEN: ${{ secrets.DISCORD_TOKEN }} + # run: | + # python${{ matrix.python-version }} -m venv .venv + # source .venv/bin/activate + # [ ! -d "$NLTK_DATA" ] && mkdir "$NLTK_DATA" + # make install-ci + # pip install -e inference/ + # sudo apt-get update + # sudo apt-get install -y libmagic-dev poppler-utils libreoffice pandoc + # sudo add-apt-repository -y ppa:alex-p/tesseract-ocr5 + # sudo apt-get install -y tesseract-ocr + # sudo apt-get install -y tesseract-ocr-kor + # sudo apt-get install -y diffstat + # tesseract --version + # make install-all-ingest + # # only run ingest tests that check expected output diffs. + # bash inference/scripts/test-unstructured-ingest-helper.sh changelog: runs-on: ubuntu-latest diff --git a/CHANGELOG.md b/CHANGELOG.md index d193864e..6a9c2216 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,17 +1,22 @@ +## 0.7.33 + +* BREAKING CHANGE: removes legacy detectron2 model +* deps: remove layoutparser optional dependencies + ## 0.7.32 -* refactor: remove all code related to filling inferred elements text from embedded text (pdfminer). +* refactor: remove all code related to filling inferred elements text from embedded text (pdfminer). * bug: set the Chipper max_length variable ## 0.7.31 -* refactor: remove all `cid` related code that was originally added to filter out invalid `pdfminer` text +* refactor: remove all `cid` related code that was originally added to filter out invalid `pdfminer` text * enhancement: Wrapped hf_hub_download with a function that checks for local file before checking HF ## 0.7.30 -* fix: table transformer doesn't return multiple cells with same coordinates -* +* fix: table transformer doesn't return multiple cells with same coordinates +* ## 0.7.29 * fix: table transformer predictions are now removed if confidence is below threshold @@ -458,4 +463,4 @@ we have the mapping from standard language code to paddle language code. 
## 0.2.0 -* Initial release of unstructured-inference \ No newline at end of file +* Initial release of unstructured-inference diff --git a/requirements/base.in b/requirements/base.in index 9f321b26..fc60b9bc 100644 --- a/requirements/base.in +++ b/requirements/base.in @@ -1,10 +1,13 @@ -c constraints.in -layoutparser[layoutmodels,tesseract] +layoutparser python-multipart huggingface-hub opencv-python!=4.7.0.68 onnx onnxruntime>=1.17.0 +matplotlib +torch +timm # NOTE(alan): Pinned because this is when the most recent module we import appeared transformers>=4.25.1 rapidfuzz diff --git a/requirements/base.txt b/requirements/base.txt index e4512b00..536ea640 100644 --- a/requirements/base.txt +++ b/requirements/base.txt @@ -4,8 +4,6 @@ # # pip-compile requirements/base.in # -antlr4-python3-runtime==4.9.3 - # via omegaconf certifi==2024.2.2 # via requests cffi==1.16.0 @@ -18,13 +16,11 @@ coloredlogs==15.0.1 # via onnxruntime contourpy==1.2.1 # via matplotlib -cryptography==42.0.5 +cryptography==42.0.7 # via pdfminer-six cycler==0.12.1 # via matplotlib -effdet==0.4.1 - # via layoutparser -filelock==3.13.4 +filelock==3.14.0 # via # huggingface-hub # torch @@ -33,11 +29,11 @@ flatbuffers==24.3.25 # via onnxruntime fonttools==4.51.0 # via matplotlib -fsspec==2024.3.1 +fsspec==2024.5.0 # via # huggingface-hub # torch -huggingface-hub==0.22.2 +huggingface-hub==0.23.1 # via # -r requirements/base.in # timm @@ -51,16 +47,16 @@ importlib-resources==6.4.0 # via matplotlib iopath==0.1.10 # via layoutparser -jinja2==3.1.3 +jinja2==3.1.4 # via torch kiwisolver==1.4.5 # via matplotlib -layoutparser[layoutmodels,tesseract]==0.3.4 +layoutparser==0.3.4 # via -r requirements/base.in markupsafe==2.1.5 # via jinja2 -matplotlib==3.8.4 - # via pycocotools +matplotlib==3.9.0 + # via -r requirements/base.in mpmath==1.3.0 # via sympy networkx==3.2.1 @@ -74,15 +70,12 @@ numpy==1.26.4 # onnxruntime # opencv-python # pandas - # pycocotools # scipy # torchvision # transformers -omegaconf==2.3.0 - # via effdet onnx==1.16.0 # via -r requirements/base.in -onnxruntime==1.17.3 +onnxruntime==1.18.0 # via -r requirements/base.in opencv-python==4.9.0.80 # via @@ -93,7 +86,6 @@ packaging==24.0 # huggingface-hub # matplotlib # onnxruntime - # pytesseract # transformers pandas==2.2.2 # via layoutparser @@ -109,7 +101,6 @@ pillow==10.3.0 # matplotlib # pdf2image # pdfplumber - # pytesseract # torchvision portalocker==2.8.2 # via iopath @@ -117,16 +108,12 @@ protobuf==5.26.1 # via # onnx # onnxruntime -pycocotools==2.0.7 - # via effdet pycparser==2.22 # via cffi pyparsing==3.1.2 # via matplotlib -pypdfium2==4.29.0 +pypdfium2==4.30.0 # via pdfplumber -pytesseract==0.3.10 - # via layoutparser python-dateutil==2.9.0.post0 # via # matplotlib @@ -139,14 +126,13 @@ pyyaml==6.0.1 # via # huggingface-hub # layoutparser - # omegaconf # timm # transformers -rapidfuzz==3.8.1 +rapidfuzz==3.9.1 # via -r requirements/base.in -regex==2024.4.16 +regex==2024.5.15 # via transformers -requests==2.31.0 +requests==2.32.2 # via # huggingface-hub # transformers @@ -162,27 +148,23 @@ sympy==1.12 # via # onnxruntime # torch -timm==0.9.16 - # via effdet +timm==1.0.3 + # via -r requirements/base.in tokenizers==0.19.1 # via transformers -torch==2.2.2 +torch==2.3.0 # via - # effdet - # layoutparser + # -r requirements/base.in # timm # torchvision -torchvision==0.17.2 - # via - # effdet - # layoutparser - # timm -tqdm==4.66.2 +torchvision==0.18.0 + # via timm +tqdm==4.66.4 # via # huggingface-hub # iopath # transformers -transformers==4.40.0 +transformers==4.41.0 
# via -r requirements/base.in typing-extensions==4.11.0 # via @@ -193,5 +175,5 @@ tzdata==2024.1 # via pandas urllib3==2.2.1 # via requests -zipp==3.18.1 +zipp==3.18.2 # via importlib-resources diff --git a/requirements/dev.txt b/requirements/dev.txt index b065f8f4..1021b087 100644 --- a/requirements/dev.txt +++ b/requirements/dev.txt @@ -25,7 +25,7 @@ attrs==23.2.0 # via # jsonschema # referencing -babel==2.14.0 +babel==2.15.0 # via jupyterlab-server beautifulsoup4==4.12.3 # via nbconvert @@ -136,7 +136,7 @@ isoduration==20.11.0 # via jsonschema jedi==0.19.1 # via ipython -jinja2==3.1.3 +jinja2==3.1.4 # via # -c requirements/base.txt # jupyter-server @@ -147,7 +147,7 @@ json5==0.9.25 # via jupyterlab-server jsonpointer==2.4 # via jsonschema -jsonschema[format-nongpl]==4.21.1 +jsonschema[format-nongpl]==4.22.0 # via # jupyter-events # jupyterlab-server @@ -189,11 +189,11 @@ jupyter-server==2.14.0 # notebook-shim jupyter-server-terminals==0.5.3 # via jupyter-server -jupyterlab==4.1.6 +jupyterlab==4.2.0 # via notebook jupyterlab-pygments==0.3.0 # via nbconvert -jupyterlab-server==2.26.0 +jupyterlab-server==2.27.1 # via # jupyterlab # notebook @@ -208,7 +208,7 @@ markupsafe==2.1.5 # -c requirements/base.txt # jinja2 # nbconvert -matplotlib==3.8.4 +matplotlib==3.9.0 # via # -c requirements/base.txt # -r requirements/dev.in @@ -220,7 +220,7 @@ mistune==3.0.2 # via nbconvert nbclient==0.10.0 # via nbconvert -nbconvert==7.16.3 +nbconvert==7.16.4 # via # jupyter # jupyter-server @@ -231,7 +231,7 @@ nbformat==5.10.4 # nbconvert nest-asyncio==1.6.0 # via ipykernel -notebook==7.1.3 +notebook==7.2.0 # via jupyter notebook-shim==0.2.4 # via @@ -270,7 +270,7 @@ pillow==10.3.0 # matplotlib pip-tools==7.4.1 # via -r requirements/dev.in -platformdirs==4.2.0 +platformdirs==4.2.2 # via # -c requirements/test.txt # jupyter-core @@ -292,7 +292,7 @@ pycparser==2.22 # via # -c requirements/base.txt # cffi -pygments==2.17.2 +pygments==2.18.0 # via # ipython # jupyter-console @@ -302,7 +302,7 @@ pyparsing==3.1.2 # via # -c requirements/base.txt # matplotlib -pyproject-hooks==1.0.0 +pyproject-hooks==1.1.0 # via # build # pip-tools @@ -319,23 +319,23 @@ pyyaml==6.0.1 # -c requirements/base.txt # -c requirements/test.txt # jupyter-events -pyzmq==26.0.0 +pyzmq==26.0.3 # via # ipykernel # jupyter-client # jupyter-console # jupyter-server # qtconsole -qtconsole==5.5.1 +qtconsole==5.5.2 # via jupyter qtpy==2.4.1 # via qtconsole -referencing==0.34.0 +referencing==0.35.1 # via # jsonschema # jsonschema-specifications # jupyter-events -requests==2.31.0 +requests==2.32.2 # via # -c requirements/base.txt # -c requirements/test.txt @@ -348,7 +348,7 @@ rfc3986-validator==0.1.1 # via # jsonschema # jupyter-events -rpds-py==0.18.0 +rpds-py==0.18.1 # via # jsonschema # referencing @@ -374,7 +374,7 @@ terminado==0.18.1 # via # jupyter-server # jupyter-server-terminals -tinycss2==1.2.1 +tinycss2==1.3.0 # via nbconvert tomli==2.0.1 # via @@ -382,7 +382,6 @@ tomli==2.0.1 # build # jupyterlab # pip-tools - # pyproject-hooks tornado==6.4 # via # ipykernel @@ -391,7 +390,7 @@ tornado==6.4 # jupyterlab # notebook # terminado -traitlets==5.14.2 +traitlets==5.14.3 # via # comm # ipykernel @@ -432,13 +431,13 @@ webencodings==0.5.1 # via # bleach # tinycss2 -websocket-client==1.7.0 +websocket-client==1.8.0 # via jupyter-server wheel==0.43.0 # via pip-tools widgetsnbextension==4.0.10 # via ipywidgets -zipp==3.18.1 +zipp==3.18.2 # via # -c requirements/base.txt # importlib-metadata diff --git a/requirements/test.txt b/requirements/test.txt 
index 864b5fe3..5f738730 100644 --- a/requirements/test.txt +++ b/requirements/test.txt @@ -6,7 +6,7 @@ # anyio==4.3.0 # via httpx -black==24.4.0 +black==24.4.2 # via -r requirements/test.in certifi==2024.2.2 # via @@ -22,7 +22,7 @@ click==8.1.7 # via # -r requirements/test.in # black -coverage[toml]==7.4.4 +coverage[toml]==7.5.1 # via # -r requirements/test.in # pytest-cov @@ -30,7 +30,7 @@ exceptiongroup==1.2.1 # via # anyio # pytest -filelock==3.13.4 +filelock==3.14.0 # via # -c requirements/base.txt # huggingface-hub @@ -40,7 +40,7 @@ flake8==7.0.0 # flake8-docstrings flake8-docstrings==1.7.0 # via -r requirements/test.in -fsspec==2024.3.1 +fsspec==2024.5.0 # via # -c requirements/base.txt # huggingface-hub @@ -50,7 +50,7 @@ httpcore==1.0.5 # via httpx httpx==0.27.0 # via -r requirements/test.in -huggingface-hub==0.22.2 +huggingface-hub==0.23.1 # via # -c requirements/base.txt # -r requirements/test.in @@ -64,7 +64,7 @@ iniconfig==2.0.0 # via pytest mccabe==0.7.0 # via flake8 -mypy==1.9.0 +mypy==1.10.0 # via -r requirements/test.in mypy-extensions==1.0.0 # via @@ -86,9 +86,9 @@ pillow==10.3.0 # via # -c requirements/base.txt # pdf2image -platformdirs==4.2.0 +platformdirs==4.2.2 # via black -pluggy==1.4.0 +pluggy==1.5.0 # via pytest pycodestyle==2.11.1 # via flake8 @@ -96,7 +96,7 @@ pydocstyle==6.3.0 # via flake8-docstrings pyflakes==3.2.0 # via flake8 -pytest==8.1.1 +pytest==8.2.1 # via # pytest-cov # pytest-mock @@ -108,11 +108,11 @@ pyyaml==6.0.1 # via # -c requirements/base.txt # huggingface-hub -requests==2.31.0 +requests==2.32.2 # via # -c requirements/base.txt # huggingface-hub -ruff==0.4.0 +ruff==0.4.4 # via -r requirements/test.in sniffio==1.3.1 # via @@ -126,7 +126,7 @@ tomli==2.0.1 # coverage # mypy # pytest -tqdm==4.66.2 +tqdm==4.66.4 # via # -c requirements/base.txt # huggingface-hub diff --git a/test_unstructured_inference/inference/test_layout.py b/test_unstructured_inference/inference/test_layout.py index 0952e0fa..6cb618ce 100644 --- a/test_unstructured_inference/inference/test_layout.py +++ b/test_unstructured_inference/inference/test_layout.py @@ -159,7 +159,7 @@ def test_process_data_with_model_raises_on_invalid_model_name(): layout.process_data_with_model(fp, model_name="fake") -@pytest.mark.parametrize("model_name", [None, "checkbox"]) +@pytest.mark.parametrize("model_name", [None, "yolox"]) def test_process_file_with_model(monkeypatch, mock_final_layout, model_name): def mock_initialize(self, *args, **kwargs): self.model = MockLayoutModel(mock_final_layout) @@ -169,7 +169,7 @@ def mock_initialize(self, *args, **kwargs): "from_file", lambda *args, **kwargs: layout.DocumentLayout.from_pages([]), ) - monkeypatch.setattr(models.UnstructuredDetectronModel, "initialize", mock_initialize) + monkeypatch.setattr(models.UnstructuredDetectronONNXModel, "initialize", mock_initialize) filename = "" assert layout.process_file_with_model(filename, model_name=model_name) @@ -183,7 +183,7 @@ def mock_initialize(self, *args, **kwargs): "from_file", lambda *args, **kwargs: layout.DocumentLayout.from_pages([]), ) - monkeypatch.setattr(models.UnstructuredDetectronModel, "initialize", mock_initialize) + monkeypatch.setattr(models.UnstructuredDetectronONNXModel, "initialize", mock_initialize) filename = "" layout.process_file_with_model(filename, model_name=None) # There should be no UserWarning, but if there is one it should not have the following message diff --git a/test_unstructured_inference/models/test_detectron2.py b/test_unstructured_inference/models/test_detectron2.py deleted 
file mode 100644 index 987120e1..00000000 --- a/test_unstructured_inference/models/test_detectron2.py +++ /dev/null @@ -1,50 +0,0 @@ -from unittest.mock import patch - -import pytest - -import unstructured_inference.models.base as models -from unstructured_inference.models import detectron2 - - -class MockDetectron2LayoutModel: - def __init__(self, *args, **kwargs): - self.args = args - self.kwargs = kwargs - - def detect(self, x): - return [] - - -def test_load_default_model(monkeypatch): - monkeypatch.setattr(detectron2, "Detectron2LayoutModel", MockDetectron2LayoutModel) - monkeypatch.setattr(models, "models", {}) - - with patch.object(detectron2, "is_detectron2_available", return_value=True): - model = models.get_model("detectron2_lp") - - assert isinstance(model.model, MockDetectron2LayoutModel) - - -def test_load_default_model_raises_when_not_available(monkeypatch): - monkeypatch.setattr(models, "models", {}) - with patch.object(detectron2, "is_detectron2_available", return_value=False): - with pytest.raises(ImportError): - models.get_model("detectron2_lp") - - -@pytest.mark.parametrize(("config_path", "model_path"), [("asdf", "diufs"), ("dfaw", "hfhfhfh")]) -def test_load_model(monkeypatch, config_path, model_path): - monkeypatch.setattr(detectron2, "Detectron2LayoutModel", MockDetectron2LayoutModel) - with patch.object(detectron2, "is_detectron2_available", return_value=True): - model = detectron2.UnstructuredDetectronModel() - model.initialize(config_path=config_path, model_path=model_path) - assert config_path == model.model.args[0] - assert model_path == model.model.kwargs["model_path"] - - -def test_unstructured_detectron_model(): - model = detectron2.UnstructuredDetectronModel() - model.model = MockDetectron2LayoutModel() - result = model(None) - assert isinstance(result, list) - assert len(result) == 0 diff --git a/test_unstructured_inference/models/test_model.py b/test_unstructured_inference/models/test_model.py index d6f431aa..411ef3d4 100644 --- a/test_unstructured_inference/models/test_model.py +++ b/test_unstructured_inference/models/test_model.py @@ -35,8 +35,8 @@ def predict(self, x: Any) -> Any: def test_get_model(monkeypatch): monkeypatch.setattr(models, "models", {}) - with mock.patch.dict(models.model_class_map, {"checkbox": MockModel}): - assert isinstance(models.get_model("checkbox"), MockModel) + with mock.patch.dict(models.model_class_map, {"yolox": MockModel}): + assert isinstance(models.get_model("yolox"), MockModel) def test_register_new_model(): @@ -62,7 +62,7 @@ def test_raises_invalid_model(): def test_raises_uninitialized(): with pytest.raises(ModelNotInitializedError): - models.UnstructuredDetectronModel().predict(None) + models.UnstructuredDetectronONNXModel().predict(None) def test_model_initializes_once(): @@ -170,8 +170,8 @@ def test_env_variables_override_default_model(monkeypatch): monkeypatch.setattr(models, "models", {}) with mock.patch.dict( models.os.environ, - {"UNSTRUCTURED_DEFAULT_MODEL_NAME": "checkbox"}, - ), mock.patch.dict(models.model_class_map, {"checkbox": MockModel}): + {"UNSTRUCTURED_DEFAULT_MODEL_NAME": "yolox"}, + ), mock.patch.dict(models.model_class_map, {"yolox": MockModel}): model = models.get_model() assert isinstance(model, MockModel) diff --git a/unstructured_inference/__version__.py b/unstructured_inference/__version__.py index e19533c3..2ee5708c 100644 --- a/unstructured_inference/__version__.py +++ b/unstructured_inference/__version__.py @@ -1 +1 @@ -__version__ = "0.7.32" # pragma: no cover +__version__ = "0.7.33" # 
pragma: no cover diff --git a/unstructured_inference/models/base.py b/unstructured_inference/models/base.py index fd8eaded..7ebe6e42 100644 --- a/unstructured_inference/models/base.py +++ b/unstructured_inference/models/base.py @@ -6,8 +6,6 @@ from unstructured_inference.models.chipper import MODEL_TYPES as CHIPPER_MODEL_TYPES from unstructured_inference.models.chipper import UnstructuredChipperModel -from unstructured_inference.models.detectron2 import MODEL_TYPES as DETECTRON2_MODEL_TYPES -from unstructured_inference.models.detectron2 import UnstructuredDetectronModel from unstructured_inference.models.detectron2onnx import MODEL_TYPES as DETECTRON2_ONNX_MODEL_TYPES from unstructured_inference.models.detectron2onnx import UnstructuredDetectronONNXModel from unstructured_inference.models.unstructuredmodel import UnstructuredModel @@ -26,12 +24,10 @@ def get_default_model_mappings() -> Tuple[ ]: """default model mappings for models that are in `unstructured_inference` repo""" return { - **{name: UnstructuredDetectronModel for name in DETECTRON2_MODEL_TYPES}, **{name: UnstructuredDetectronONNXModel for name in DETECTRON2_ONNX_MODEL_TYPES}, **{name: UnstructuredYoloXModel for name in YOLOX_MODEL_TYPES}, **{name: UnstructuredChipperModel for name in CHIPPER_MODEL_TYPES}, }, { - **DETECTRON2_MODEL_TYPES, **DETECTRON2_ONNX_MODEL_TYPES, **YOLOX_MODEL_TYPES, **CHIPPER_MODEL_TYPES, diff --git a/unstructured_inference/models/detectron2.py b/unstructured_inference/models/detectron2.py deleted file mode 100644 index 520298ce..00000000 --- a/unstructured_inference/models/detectron2.py +++ /dev/null @@ -1,104 +0,0 @@ -from __future__ import annotations - -from pathlib import Path -from typing import Any, Dict, Final, List, Optional, Union - -from layoutparser.models.detectron2.layoutmodel import ( - Detectron2LayoutModel, - is_detectron2_available, -) -from layoutparser.models.model_config import LayoutModelConfig -from PIL import Image as PILImage - -from unstructured_inference.constants import ElementType -from unstructured_inference.inference.layoutelement import LayoutElement -from unstructured_inference.logger import logger -from unstructured_inference.models.unstructuredmodel import ( - UnstructuredObjectDetectionModel, -) -from unstructured_inference.utils import ( - LazyDict, - LazyEvaluateInfo, - download_if_needed_and_get_local_path, -) - -DETECTRON_CONFIG: Final = "lp://PubLayNet/faster_rcnn_R_50_FPN_3x/config" -DEFAULT_LABEL_MAP: Final[Dict[int, str]] = { - 0: ElementType.TEXT, - 1: ElementType.TITLE, - 2: ElementType.LIST, - 3: ElementType.TABLE, - 4: ElementType.FIGURE, -} -DEFAULT_EXTRA_CONFIG: Final[List[Any]] = ["MODEL.ROI_HEADS.SCORE_THRESH_TEST", 0.8] - - -# NOTE(alan): Entries are implemented as LazyDicts so that models aren't downloaded until they are -# needed. 
-MODEL_TYPES = { - "detectron2_lp": LazyDict( - model_path=LazyEvaluateInfo( - download_if_needed_and_get_local_path, - "layoutparser/detectron2", - "PubLayNet/faster_rcnn_R_50_FPN_3x/model_final.pth", - ), - config_path=LazyEvaluateInfo( - download_if_needed_and_get_local_path, - "layoutparser/detectron2", - "PubLayNet/faster_rcnn_R_50_FPN_3x/config.yml", - ), - label_map=DEFAULT_LABEL_MAP, - extra_config=DEFAULT_EXTRA_CONFIG, - ), - "checkbox": LazyDict( - model_path=LazyEvaluateInfo( - download_if_needed_and_get_local_path, - "unstructuredio/oer-checkbox", - "detectron2_finetuned_oer_checkbox.pth", - ), - config_path=LazyEvaluateInfo( - download_if_needed_and_get_local_path, - "unstructuredio/oer-checkbox", - "detectron2_oer_checkbox.json", - ), - label_map={0: "Unchecked", 1: "Checked"}, - extra_config=None, - ), -} - - -class UnstructuredDetectronModel(UnstructuredObjectDetectionModel): - """Unstructured model wrapper for Detectron2LayoutModel.""" - - def predict(self, x: PILImage.Image): - """Makes a prediction using detectron2 model.""" - super().predict(x) - prediction = self.model.detect(x) - return [LayoutElement.from_lp_textblock(block) for block in prediction] - - def initialize( - self, - config_path: Union[str, Path, LayoutModelConfig], - model_path: Optional[Union[str, Path]] = None, - label_map: Optional[Dict[int, str]] = None, - extra_config: Optional[list] = None, - device: Optional[str] = None, - ): - """Loads the detectron2 model using the specified parameters""" - - if not is_detectron2_available(): - raise ImportError( - "Failed to load the Detectron2 model. Ensure that the Detectron2 " - "module is correctly installed.", - ) - - config_path_str = str(config_path) - model_path_str: Optional[str] = None if model_path is None else str(model_path) - logger.info("Loading the Detectron2 layout model ...") - self.model = Detectron2LayoutModel( - config_path_str, - model_path=model_path_str, - label_map=label_map, - extra_config=extra_config, - device=device, - )
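
### Migration note

For anyone who was loading the removed `detectron2_lp` or `checkbox` models, the sketch below shows one way to run layout detection with the ONNX-backed replacement that this PR keeps. This is a minimal, hedged example and not part of the patch itself: the model key `"detectron2_onnx"` and the file name `example.pdf` are assumptions, so check `DETECTRON2_ONNX_MODEL_TYPES` in `unstructured_inference/models/detectron2onnx.py` for the exact keys registered in your version.

```python
# Minimal sketch: run hi-res layout detection with the ONNX Detectron2 model.
# Assumptions: "detectron2_onnx" is one of the keys in DETECTRON2_ONNX_MODEL_TYPES
# and "example.pdf" is a PDF available on the local filesystem.
from unstructured_inference.inference.layout import process_file_with_model

layout = process_file_with_model("example.pdf", model_name="detectron2_onnx")

for page in layout.pages:
    for element in page.elements:
        # Each detected element carries a bounding box and a predicted type.
        print(element)
```

The same model should also be reachable via `unstructured_inference.models.base.get_model(...)` for callers that construct a `DocumentLayout` themselves, as the updated tests in this PR do with `UnstructuredDetectronONNXModel`.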