mirror of
https://git.mirrors.martin98.com/https://github.com/infiniflow/ragflow.git
synced 2025-06-04 11:24:00 +08:00

* add field progress msg into docinfo; add file processing procedure * go through upload, create kb, add doc to kb
20 lines
513 B
Python
20 lines
513 B
Python
import re
|
|
|
|
def rmSpace(txt):
    """Remove runs of spaces that do not sit between two ASCII tokens.

    A run of one or more spaces is deleted when the character before it,
    or the character after it, is not an ASCII letter, digit, '.' or ','
    (for example, spaces between CJK characters). Spaces that separate
    two ASCII alphanumeric tokens are kept.

    Args:
        txt: The text to clean.

    Returns:
        The text with the qualifying spaces removed.
    """
    # Both character classes include A-Z as well as a-z: with a lowercase-only
    # class, capital letters were treated as "non-alphanumeric" and the space
    # between capitalised words was dropped ("Hello World" -> "HelloWorld").

    # Pass 1: drop spaces whose left neighbour is not an ASCII token character.
    txt = re.sub(r"([^a-zA-Z0-9.,]) +([^ ])", r"\1\2", txt)
    # Pass 2: drop spaces whose right neighbour is not an ASCII token character.
    return re.sub(r"([^ ]) +([^a-zA-Z0-9.,])", r"\1\2", txt)
|
|
|
|
def findMaxDt(fnm):
    """Return the lexicographically greatest line found in the file *fnm*.

    Each line is compared as a plain string after its newline is removed;
    lines equal to 'nan' are ignored. The result starts at
    "1970-01-01 00:00:00", so that value is returned when the file holds
    nothing greater or cannot be read at all.

    Args:
        fnm: Path of the text file to scan, one value per line.

    Returns:
        The greatest line seen, or "1970-01-01 00:00:00" as the floor.
    """
    latest = "1970-01-01 00:00:00"
    try:
        with open(fnm, "r") as handle:
            for raw in handle:
                stamp = raw.rstrip("\n")
                # 'nan' would compare greater than any digit-led value,
                # so it has to be excluded explicitly.
                if stamp != 'nan' and stamp > latest:
                    latest = stamp
    except Exception:
        # Best effort: any failure is reported and the value found so far
        # (possibly just the floor) is returned.
        print("WARNING: can't find "+ fnm)
    return latest
|