支持 MinerU NPU 处理 (#174)

* feature: unstructured 支持简单 PDF 处理

* feature: update values.yaml to enhance ray-cluster configuration with security context, environment variables, and resource limits

* feature: update deploy.yaml and process.py for mineru server configuration and PDF processing enhancements

* feature: update deploy.yaml and process.py for mineru server configuration and PDF processing enhancements

* feature: improve PDF processing logic and update dependencies in process.py and pyproject.toml

* feature: improve PDF processing logic and update dependencies in process.py and pyproject.toml

* feature: update Dockerfile for improved package source mirrors and add mineru-npu to build targets
This commit is contained in:
hhhhsc701
2025-12-17 16:31:06 +08:00
committed by GitHub
parent 3b4f8488e8
commit 924d977d6f
8 changed files with 110 additions and 35 deletions

View File

@@ -22,26 +22,32 @@ spec:
image: datamate-mineru
imagePullPolicy: IfNotPresent
command:
- python
- /opt/runtime/datamate/mineru/mineru_api.py
- mineru-openai-server
args:
- --engine
- vllm
- --host
- 0.0.0.0
- --port
- "9001"
- "8000"
env:
- name: MINERU_MODEL_SOURCE
value: local
- name: MINERU_DEVICE_MODE
value: cpu
- name: MINERU_BACKEND_MODE
value: pipeline
value: npu
- name: VLLM_WORKER_MULTIPROC_METHOD
value: spawn
ports:
- containerPort: 9001
- containerPort: 8000
resources:
limits:
cpu: 16
cpu: 8
memory: 32Gi
huawei.com/Ascend910: 1
requests:
cpu: 100m
memory: 100Mi
huawei.com/Ascend910: 1
volumeMounts:
- name: dataset-volume
mountPath: /dataset
@@ -67,8 +73,8 @@ metadata:
spec:
type: ClusterIP
ports:
- port: 9001
targetPort: 9001
- port: 8000
targetPort: 8000
protocol: TCP
selector:
app: datamate