Use pdf-worker to extract text for item.attachmentText if there is no cached text

2023-04-29 17:37:50 -04:00 · 2023-04-29 17:37:50 -04:00 · 4ec357bb26
commit 4ec357bb26
parent adf2d92471
1 changed file with 3 additions and 17 deletions
--- a/chrome/content/zotero/xpcom/data/item.js
+++ b/chrome/content/zotero/xpcom/data/item.js
@@ -3565,24 +3565,10 @@ Zotero.defineProperty(Zotero.Item.prototype, 'attachmentText', {
 					let data = JSON.parse(json);
 					str = data.text;
 				}
-				// Otherwise extract text to temporary file and read that
+				// Otherwise extract text
 				else if (contentType == 'application/pdf') {
-					let tmpCacheFile = OS.Path.join(
+					let { text } = await Zotero.PDFWorker.getFullText(this.id);
-						Zotero.getTempDirectory().path, Zotero.Utilities.randomString()
+					str = text;
-					);
-					let { exec, args } = Zotero.FullText.getPDFConverterExecAndArgs();
-					args.push(
-						'-nopgbrk',
-						path,
-						tmpCacheFile
-					);
-					await Zotero.Utilities.Internal.exec(exec, args);
-					if (!await OS.File.exists(tmpCacheFile)) {
-						Zotero.logError("Cache file not found after running PDF converter");
-						return '';
-					}
-					str = await Zotero.File.getContentsAsync(tmpCacheFile);
-					await OS.File.remove(tmpCacheFile);
 				}
 				else {
 					Zotero.logError("Unsupported cached file type in .attachmentText");