Skip to content

Commit 47cea10

Browse files
shaohuzhang1 authored and liuruibin committed
fix: The image uploaded from the workflow knowledge base zip file cannot be parsed (#4505)
1 parent b18cd78 commit 47cea10

File tree

2 files changed

+5
-5
lines changed

2 files changed

+5
-5
lines changed

apps/common/handle/impl/text/text_split_handle.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -28,11 +28,13 @@
2828

2929
class TextSplitHandle(BaseSplitHandle):
3030
def support(self, file, get_buffer):
31-
buffer = get_buffer(file)
3231
file_name: str = file.name.lower()
3332
if file_name.endswith(".md") or file_name.endswith('.txt') or file_name.endswith('.TXT') or file_name.endswith(
3433
'.MD'):
3534
return True
35+
if file_name.index('.') > 0:
36+
return False
37+
buffer = get_buffer(file)
3638
result = detect(buffer)
3739
if result['encoding'] is not None and result['confidence'] is not None and result['encoding'] != 'ascii' and \
3840
result['confidence'] > 0.5:

apps/common/handle/impl/text/zip_split_handle.py

Lines changed: 2 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -216,20 +216,18 @@ def get_content(self, file, save_image):
216216
real_name = get_file_name(zf.name)
217217
except Exception:
218218
real_name = zf.name
219-
220219
# 为 split_handle 提供可重复读取的 file-like 对象
221220
zf.name = real_name
221+
get_buffer = FileBufferHandle().get_buffer
222222
for split_handle in split_handles:
223-
# 准备一个简单的 get_buffer 回调,返回当前 raw
224-
get_buffer = FileBufferHandle().get_buffer
225223
if split_handle.support(zf, get_buffer):
226224
row = get_buffer(zf)
227225
md_text = split_handle.get_content(io.BytesIO(row), save_image)
228226
file_content_list.append({'content': md_text, 'name': real_name})
229227
break
230228
for file_content in file_content_list:
231229
_image_list, content = get_image_list_by_content(file_content.get('name'), file_content.get("content"),
232-
files)
230+
files)
233231
content_parts.append(content)
234232
for image in _image_list:
235233
image_list.append(image)

0 commit comments

Comments (0)