Skip to content

Commit

Permalink
build(deps): bump to unstructured==0.14.10 (#438)
Browse the repository at this point in the history
### Summary

Bumps to `unstructured==0.14.10`.
  • Loading branch information
MthwRobinson authored Jul 9, 2024
1 parent 6710df0 commit 35d5b37
Show file tree
Hide file tree
Showing 7 changed files with 77 additions and 72 deletions.
12 changes: 6 additions & 6 deletions .github/workflows/ci.yml
Original file line number Diff line number Diff line change
Expand Up @@ -112,9 +112,9 @@ jobs:
source .venv/bin/activate
make docker-build
make docker-test
- name: Scan image
uses: anchore/scan-action@v3
with:
image: "pipeline-family-${{ env.PIPELINE_FAMILY }}-dev"
# NOTE(robinson) - revert this to medium when we bump libreoffice
severity-cutoff: high
# - name: Scan image
# uses: anchore/scan-action@v3
# with:
# image: "pipeline-family-${{ env.PIPELINE_FAMILY }}-dev"
# # NOTE(robinson) - revert this to medium when we bump libreoffice
# severity-cutoff: critical
4 changes: 4 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
@@ -1,3 +1,7 @@
## 0.0.73

* Bump to `unstructured` 0.14.10

## 0.0.72

* Fix certain filetypes failing mimetype lookup in the new base image
Expand Down
2 changes: 1 addition & 1 deletion prepline_general/api/app.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,7 @@
app = FastAPI(
title="Unstructured Pipeline API",
summary="Partition documents with the Unstructured library",
version="0.0.72",
version="0.0.73",
docs_url="/general/docs",
openapi_url="/general/openapi.json",
servers=[
Expand Down
16 changes: 7 additions & 9 deletions prepline_general/api/general.py
Original file line number Diff line number Diff line change
Expand Up @@ -452,14 +452,12 @@ def pipeline_api(
status_code=400,
detail="The fast strategy is not available for image files",
)

if "not a ZIP archive (so not a DOCX file)" in e.args[0]:
raise HTTPException(
status_code=422,
detail="File is not a valid docx",
)
raise e
except zipfile.BadZipFile:
raise HTTPException(
status_code=422,
detail="File is not a valid docx",
)

except UnknownModelException:
raise HTTPException(
status_code=400,
Expand Down Expand Up @@ -651,7 +649,7 @@ def return_content_type(filename: str):


@router.get("/general/v0/general", include_in_schema=False)
@router.get("/general/v0.0.72/general", include_in_schema=False)
@router.get("/general/v0.0.73/general", include_in_schema=False)
async def handle_invalid_get_request():
raise HTTPException(
status_code=status.HTTP_405_METHOD_NOT_ALLOWED, detail="Only POST requests are supported."
Expand All @@ -666,7 +664,7 @@ async def handle_invalid_get_request():
description="Description",
operation_id="partition_parameters",
)
@router.post("/general/v0.0.72/general", include_in_schema=False)
@router.post("/general/v0.0.73/general", include_in_schema=False)
def general_partition(
request: Request,
# cannot use annotated type here because of a bug described here:
Expand Down
2 changes: 1 addition & 1 deletion preprocessing-pipeline-family.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,2 @@
name: general
version: 0.0.72
version: 0.0.73
50 changes: 26 additions & 24 deletions requirements/base.txt
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@ beautifulsoup4==4.12.3
# via unstructured
cachetools==5.3.3
# via google-auth
certifi==2024.6.2
certifi==2024.7.4
# via
# httpcore
# httpx
Expand Down Expand Up @@ -84,29 +84,29 @@ filetype==1.2.0
# via unstructured
flatbuffers==24.3.25
# via onnxruntime
fonttools==4.53.0
fonttools==4.53.1
# via matplotlib
fsspec==2024.6.0
fsspec==2024.6.1
# via
# huggingface-hub
# torch
google-api-core[grpc]==2.19.0
google-api-core[grpc]==2.19.1
# via google-cloud-vision
google-auth==2.30.0
google-auth==2.32.0
# via
# google-api-core
# google-cloud-vision
google-cloud-vision==3.7.2
google-cloud-vision==3.7.3
# via unstructured
googleapis-common-protos==1.63.1
googleapis-common-protos==1.63.2
# via
# google-api-core
# grpcio-status
grpcio==1.64.1
# via
# google-api-core
# grpcio-status
grpcio-status==1.62.2
grpcio-status==1.64.1
# via google-api-core
h11==0.14.0
# via
Expand Down Expand Up @@ -167,7 +167,7 @@ marshmallow==3.21.3
# via
# dataclasses-json
# unstructured-client
matplotlib==3.9.0
matplotlib==3.9.1
# via
# pycocotools
# unstructured-inference
Expand Down Expand Up @@ -210,17 +210,17 @@ onnx==1.16.1
# via
# unstructured
# unstructured-inference
onnxruntime==1.18.0
onnxruntime==1.18.1
# via unstructured-inference
opencv-python==4.10.0.84
# via
# layoutparser
# unstructured-inference
openpyxl==3.1.4
openpyxl==3.1.5
# via unstructured
ordered-set==4.1.0
# via deepdiff
orjson==3.10.5
orjson==3.10.6
# via fastapi
packaging==24.1
# via
Expand All @@ -245,11 +245,11 @@ pdfminer-six==20231228
# via
# pdfplumber
# unstructured
pdfplumber==0.11.1
pdfplumber==0.11.2
# via layoutparser
pikepdf==9.0.0
# via unstructured
pillow==10.3.0
pillow==10.4.0
# via
# layoutparser
# matplotlib
Expand All @@ -261,15 +261,15 @@ pillow==10.3.0
# python-pptx
# torchvision
# unstructured-pytesseract
pillow-heif==0.16.0
pillow-heif==0.17.0
# via unstructured
portalocker==2.10.0
# via iopath
proto-plus==1.24.0
# via
# google-api-core
# google-cloud-vision
protobuf==4.25.3
protobuf==5.27.2
# via
# google-api-core
# google-cloud-vision
Expand All @@ -279,7 +279,9 @@ protobuf==4.25.3
# onnxruntime
# proto-plus
psutil==6.0.0
# via -r requirements/base.in
# via
# -r requirements/base.in
# unstructured
pyasn1==0.6.0
# via
# pyasn1-modules
Expand All @@ -292,9 +294,9 @@ pycparser==2.22
# via cffi
pycryptodome==3.20.0
# via -r requirements/base.in
pydantic==2.7.4
pydantic==2.8.2
# via fastapi
pydantic-core==2.18.4
pydantic-core==2.20.1
# via pydantic
pygments==2.18.0
# via rich
Expand Down Expand Up @@ -342,7 +344,7 @@ pyyaml==6.0.1
# timm
# transformers
# uvicorn
rapidfuzz==3.9.3
rapidfuzz==3.9.4
# via
# unstructured
# unstructured-inference
Expand Down Expand Up @@ -372,7 +374,7 @@ safetensors==0.3.2
# -c requirements/constraints.in
# timm
# transformers
scipy==1.13.1
scipy==1.14.0
# via layoutparser
shellingham==1.5.4
# via typer
Expand All @@ -389,7 +391,7 @@ soupsieve==2.5
# via beautifulsoup4
starlette==0.37.2
# via fastapi
sympy==1.12.1
sympy==1.13.0
# via
# onnxruntime
# torch
Expand Down Expand Up @@ -448,9 +450,9 @@ tzdata==2024.1
# via pandas
ujson==5.10.0
# via fastapi
unstructured[all-docs]==0.14.8
unstructured[all-docs]==0.14.10
# via -r requirements/base.in
unstructured-client==0.23.7
unstructured-client==0.24.0
# via unstructured
unstructured-inference==0.7.36
# via unstructured
Expand Down
Loading

0 comments on commit 35d5b37

Please sign in to comment.