mirror of
https://git.mirrors.martin98.com/https://github.com/jina-ai/reader.git
synced 2025-08-20 10:19:07 +08:00
fix: pdf mode and google web cache
This commit is contained in:
parent
f6bbddcb48
commit
e9258af742
@@ -136,7 +136,8 @@ export class SnapshotFormatter extends AsyncService {
|
||||
}
|
||||
|
||||
let pdfMode = false;
|
||||
if (snapshot.pdfs?.length && !snapshot.title) {
|
||||
// in case of Google Web Cache content
|
||||
if (snapshot.pdfs?.length && (!snapshot.title || snapshot.title.startsWith('cache:'))) {
|
||||
const pdf = await this.pdfExtractor.cachedExtract(snapshot.pdfs[0],
|
||||
this.threadLocal.get('cacheTolerance')
|
||||
);
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user