Use pdf-worker to extract text for item.attachmentContent if no cache

2023-04-29 17:37:50 -04:00 · 2023-04-29 17:37:50 -04:00 · 4ec357bb26
commit 4ec357bb26
parent adf2d92471
1 changed files with 3 additions and 17 deletions
--- a/chrome/content/zotero/xpcom/data/item.js
+++ b/chrome/content/zotero/xpcom/data/item.js
@ -3565,24 +3565,10 @@ Zotero.defineProperty(Zotero.Item.prototype, 'attachmentText', {
 					let data = JSON.parse(json);
 					str = data.text;
 				}
-				// Otherwise extract text to temporary file and read that
+				// Otherwise extract text
 				else if (contentType == 'application/pdf') {
-					let tmpCacheFile = OS.Path.join(
-						Zotero.getTempDirectory().path, Zotero.Utilities.randomString()
-					);
-					let { exec, args } = Zotero.FullText.getPDFConverterExecAndArgs();
-					args.push(
-						'-nopgbrk',
-						path,
-						tmpCacheFile
-					);
-					await Zotero.Utilities.Internal.exec(exec, args);
-					if (!await OS.File.exists(tmpCacheFile)) {
-						Zotero.logError("Cache file not found after running PDF converter");
-						return '';
-					}
-					str = await Zotero.File.getContentsAsync(tmpCacheFile);
-					await OS.File.remove(tmpCacheFile);
+					let { text } = await Zotero.PDFWorker.getFullText(this.id);
+					str = text;
 				}
 				else {
 					Zotero.logError("Unsupported cached file type in .attachmentText");