Skip to content

Commit a98cde9

Browse files
build: add new tokenizer.
1 parent 573ec2b commit a98cde9

File tree

2 files changed

+14
-3
lines changed

2 files changed

+14
-3
lines changed

.github/workflows/build-and-push-vector-model.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ on:
55
inputs:
66
dockerImageTag:
77
description: 'Docker Image Tag'
8-
default: 'v2.0.1'
8+
default: 'v2.0.2'
99
required: true
1010
architecture:
1111
description: 'Architecture'

installer/Dockerfile-vector-model

Lines changed: 13 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,12 +10,23 @@
1010

1111
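# Not sure why re-pulling the vector model with the script above produces a much larger result than before, so the script below still reuses the previously built vector model.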
1212

13+
# Stage tmp-stage1: throwaway Python stage that runs install_model_token.py and
# leaves its output under model/tokenizer for a later stage to copy.
# No WORKDIR is set in this stage, so the relative paths below resolve against
# the base image's default working directory.
FROM python:3.11-slim-bookworm AS tmp-stage1
14+
COPY installer/install_model_token.py install_model_token.py
15+
# One layer: upgrade pip/setuptools, install pycrawlers and transformers
# (both unpinned), run the script, then duplicate model/base/hub as model/tokenizer.
# NOTE(review): presumably the script downloads tokenizer files into
# model/base/hub; the script is not shown here, so confirm against it.
RUN pip3 install --upgrade pip setuptools && \
16+
pip install pycrawlers && \
17+
pip install transformers && \
18+
python3 install_model_token.py && \
19+
cp -r model/base/hub model/tokenizer
20+
1321
# Stage vector-model: previously published image, used only as a source of
# model files for the COPY --from=vector-model instructions below.
FROM ghcr.io/1panel-dev/maxkb-vector-model:v1.0.1 AS vector-model
1422

15-
# Removed side of the diff: the assembly stage used to be named tmp-stage.
FROM alpine AS tmp-stage
23+
# Stage tmp-stage2: assembles the final /opt/maxkb-app/model tree on alpine.
FROM alpine AS tmp-stage2
1624
# Bring over the whole model directory from the published image.
COPY --from=vector-model /opt/maxkb/app/model /opt/maxkb-app/model
1725
# Seed model/tokenizer with the published image's base/hub contents.
COPY --from=vector-model /opt/maxkb/app/model/base/hub /opt/maxkb-app/model/tokenizer
26+
# Then overlay the output of tmp-stage1 onto the same destination; this copy
# runs last, so files with the same name come from tmp-stage1.
COPY --from=tmp-stage1 model/tokenizer /opt/maxkb-app/model/tokenizer
1827
# Drop the onnx directory here, before the final stage copies the tree, so it
# never reaches the final image.
RUN rm -rf /opt/maxkb-app/model/embedding/shibing624_text2vec-base-chinese/onnx
1928

29+
30+
2031
# Final stage: an empty (scratch) image whose only content is the assembled
# /opt/maxkb-app/model directory.
FROM scratch
21-
# Removed side of the diff: copied from the old stage name tmp-stage.
COPY --from=tmp-stage /opt/maxkb-app/model /opt/maxkb-app/model
32+
# Added side of the diff: same copy, now sourced from tmp-stage2.
COPY --from=tmp-stage2 /opt/maxkb-app/model /opt/maxkb-app/model

0 commit comments

Comments
 (0)