mirror of
https://git.mirrors.martin98.com/https://github.com/langgenius/dify.git
synced 2025-08-11 19:49:02 +08:00
Fix SSRF in the docx file extractor when fetching external images (#10237)
This commit is contained in:
parent
8ab05d4c36
commit
1024fc623e
@ -14,6 +14,7 @@ import requests
|
|||||||
from docx import Document as DocxDocument
|
from docx import Document as DocxDocument
|
||||||
|
|
||||||
from configs import dify_config
|
from configs import dify_config
|
||||||
|
from core.helper import ssrf_proxy
|
||||||
from core.rag.extractor.extractor_base import BaseExtractor
|
from core.rag.extractor.extractor_base import BaseExtractor
|
||||||
from core.rag.models.document import Document
|
from core.rag.models.document import Document
|
||||||
from extensions.ext_database import db
|
from extensions.ext_database import db
|
||||||
@ -86,7 +87,7 @@ class WordExtractor(BaseExtractor):
|
|||||||
image_count += 1
|
image_count += 1
|
||||||
if rel.is_external:
|
if rel.is_external:
|
||||||
url = rel.reltype
|
url = rel.reltype
|
||||||
response = requests.get(url, stream=True)
|
response = ssrf_proxy.get(url, stream=True)
|
||||||
if response.status_code == 200:
|
if response.status_code == 200:
|
||||||
image_ext = mimetypes.guess_extension(response.headers["Content-Type"])
|
image_ext = mimetypes.guess_extension(response.headers["Content-Type"])
|
||||||
file_uuid = str(uuid.uuid4())
|
file_uuid = str(uuid.uuid4())
|
||||||
|
Loading…
x
Reference in New Issue
Block a user