SylphxAI
diff --git a/‎dist/handlers/readPdf.js‎
Lines changed: 2 additions & 2 deletions b/‎dist/handlers/readPdf.js‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎dist/pdf/extractor.js‎
Lines changed: 153 additions & 29 deletions b/‎dist/pdf/extractor.js‎
Lines changed: 153 additions & 29 deletions
diff --git a/‎package.json‎
Lines changed: 2 additions & 0 deletions b/‎package.json‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎pnpm-lock.yaml‎
Lines changed: 19 additions & 0 deletions b/‎pnpm-lock.yaml‎
Lines changed: 19 additions & 0 deletions
diff --git a/‎src/handlers/readPdf.ts‎
Lines changed: 2 additions & 2 deletions b/‎src/handlers/readPdf.ts‎
Lines changed: 2 additions & 2 deletions
@@ -147,11 +147,11 @@ export const handleReadPdfFunc = async (args) => {
                     });
                 }
                 else if (item.type === 'image' && item.imageData) {
-                    // Add image content part
+                    // Add image content part (all images are now encoded as PNG)
                     content.push({
                         type: 'image',
                         data: item.imageData.data,
-                        mimeType: item.imageData.format === 'rgba' ? 'image/png' : 'image/jpeg',
+                        mimeType: 'image/png',
                     });
                 }
             }
 
@@ -1,5 +1,42 @@
 // PDF text and metadata extraction utilities
+import { PNG } from 'pngjs';
 import { OPS } from 'pdfjs-dist/legacy/build/pdf.mjs';
+/**
+ * Encode raw pixel data to PNG format
+ */
+const encodePixelsToPNG = (pixelData, width, height, channels) => {
+    const png = new PNG({ width, height });
+    // Convert pixel data to RGBA format expected by pngjs
+    if (channels === 4) {
+        // Already RGBA
+        png.data = Buffer.from(pixelData);
+    }
+    else if (channels === 3) {
+        // RGB -> RGBA (add alpha channel)
+        for (let i = 0; i < width * height; i++) {
+            const srcIdx = i * 3;
+            const dstIdx = i * 4;
+            png.data[dstIdx] = pixelData[srcIdx] ?? 0; // R
+            png.data[dstIdx + 1] = pixelData[srcIdx + 1] ?? 0; // G
+            png.data[dstIdx + 2] = pixelData[srcIdx + 2] ?? 0; // B
+            png.data[dstIdx + 3] = 255; // A (fully opaque)
+        }
+    }
+    else if (channels === 1) {
+        // Grayscale -> RGBA
+        for (let i = 0; i < width * height; i++) {
+            const gray = pixelData[i] ?? 0;
+            const dstIdx = i * 4;
+            png.data[dstIdx] = gray; // R
+            png.data[dstIdx + 1] = gray; // G
+            png.data[dstIdx + 2] = gray; // B
+            png.data[dstIdx + 3] = 255; // A
+        }
+    }
+    // Encode to PNG and convert to base64
+    const pngBuffer = PNG.sync.write(png);
+    return pngBuffer.toString('base64');
+};
 /**
  * Extract metadata and page count from a PDF document
  */
@@ -78,38 +115,83 @@ const extractImagesFromPage = async (page, pageNum) => {
                 imageIndices.push(i);
             }
         }
-        // Extract each image using Promise-based approach
+        // Extract each image - try sync first, then async if needed
         const imagePromises = imageIndices.map((imgIndex, arrayIndex) => new Promise((resolve) => {
             const argsArray = operatorList.argsArray[imgIndex];
             if (!argsArray || argsArray.length === 0) {
                 resolve(null);
                 return;
             }
             const imageName = argsArray[0];
-            // Use callback-based get() as images may not be resolved yet
-            page.objs.get(imageName, (imageData) => {
+            // Helper to process image data
+            const processImageData = (imageData) => {
                 if (!imageData || typeof imageData !== 'object') {
-                    resolve(null);
-                    return;
+                    return null;
                 }
                 const img = imageData;
                 if (!img.data || !img.width || !img.height) {
-                    resolve(null);
-                    return;
+                    return null;
                 }
-                // Determine image format based on kind
-                // kind === 1 = grayscale, 2 = RGB, 3 = RGBA
+                // Determine number of channels based on kind
+                // kind === 1 = grayscale (1 channel), 2 = RGB (3 channels), 3 = RGBA (4 channels)
+                const channels = img.kind === 1 ? 1 : img.kind === 3 ? 4 : 3;
                 const format = img.kind === 1 ? 'grayscale' : img.kind === 3 ? 'rgba' : 'rgb';
-                // Convert Uint8Array to base64
-                const base64 = Buffer.from(img.data).toString('base64');
-                resolve({
+                // Encode raw pixel data to PNG format
+                const pngBase64 = encodePixelsToPNG(img.data, img.width, img.height, channels);
+                return {
                     page: pageNum,
                     index: arrayIndex,
                     width: img.width,
                     height: img.height,
                     format,
-                    data: base64,
-                });
+                    data: pngBase64,
+                };
+            };
+            // Try to get from commonObjs first if it starts with 'g_'
+            if (imageName.startsWith('g_')) {
+                try {
+                    const imageData = page.commonObjs.get(imageName);
+                    if (imageData) {
+                        const result = processImageData(imageData);
+                        resolve(result);
+                        return;
+                    }
+                }
+                catch (error) {
+                    const message = error instanceof Error ? error.message : String(error);
+                    console.warn(`[PDF Reader MCP] Error getting image from commonObjs ${imageName}: ${message}`);
+                }
+            }
+            // Try synchronous get first - if image is already loaded
+            try {
+                const imageData = page.objs.get(imageName);
+                if (imageData !== undefined) {
+                    const result = processImageData(imageData);
+                    resolve(result);
+                    return;
+                }
+            }
+            catch (error) {
+                // Synchronous get failed or not supported, fall through to async
+                const message = error instanceof Error ? error.message : String(error);
+                console.warn(`[PDF Reader MCP] Sync image get failed for ${imageName}, trying async: ${message}`);
+            }
+            // Fallback to async callback-based get with timeout
+            let resolved = false;
+            const timeout = setTimeout(() => {
+                if (!resolved) {
+                    resolved = true;
+                    console.warn(`[PDF Reader MCP] Image extraction timeout for ${imageName} on page ${String(pageNum)}`);
+                    resolve(null);
+                }
+            }, 10000); // 10 second timeout as a safety net
+            page.objs.get(imageName, (imageData) => {
+                if (!resolved) {
+                    resolved = true;
+                    clearTimeout(timeout);
+                    const result = processImageData(imageData);
+                    resolve(result);
+                }
             });
         }));
         const resolvedImages = await Promise.all(imagePromises);
@@ -196,7 +278,7 @@ export const extractPageContent = async (pdfDocument, pageNum, includeImages, so
                     imageIndices.push(i);
                 }
             }
-            // Extract each image with its Y-coordinate
+            // Extract each image with its Y-coordinate - try sync first, then async if needed
             const imagePromises = imageIndices.map((imgIndex, arrayIndex) => new Promise((resolve) => {
                 const argsArray = operatorList.argsArray[imgIndex];
                 if (!argsArray || argsArray.length === 0) {
@@ -205,32 +287,29 @@ export const extractPageContent = async (pdfDocument, pageNum, includeImages, so
                 }
                 const imageName = argsArray[0];
                 // Get transform matrix from the args (if available)
-                // The transform is typically in argsArray[1] for some ops
                 let yPosition = 0;
                 if (argsArray.length > 1 && Array.isArray(argsArray[1])) {
                     const transform = argsArray[1];
-                    // transform[5] is the Y coordinate
                     const yCoord = transform[5];
                     if (yCoord !== undefined) {
                         yPosition = Math.round(yCoord);
                     }
                 }
-                // Use callback-based get() as images may not be resolved yet
-                page.objs.get(imageName, (imageData) => {
+                // Helper to process image data
+                const processImageData = (imageData) => {
                     if (!imageData || typeof imageData !== 'object') {
-                        resolve(null);
-                        return;
+                        return null;
                     }
                     const img = imageData;
                     if (!img.data || !img.width || !img.height) {
-                        resolve(null);
-                        return;
+                        return null;
                     }
-                    // Determine image format based on kind
+                    // Determine number of channels based on kind
+                    const channels = img.kind === 1 ? 1 : img.kind === 3 ? 4 : 3;
                     const format = img.kind === 1 ? 'grayscale' : img.kind === 3 ? 'rgba' : 'rgb';
-                    // Convert Uint8Array to base64
-                    const base64 = Buffer.from(img.data).toString('base64');
-                    resolve({
+                    // Encode raw pixel data to PNG format
+                    const pngBase64 = encodePixelsToPNG(img.data, img.width, img.height, channels);
+                    return {
                         type: 'image',
                         yPosition,
                         imageData: {
@@ -239,9 +318,54 @@ export const extractPageContent = async (pdfDocument, pageNum, includeImages, so
                             width: img.width,
                             height: img.height,
                             format,
-                            data: base64,
+                            data: pngBase64,
                         },
-                    });
+                    };
+                };
+                // Try to get from commonObjs first if it starts with 'g_'
+                if (imageName.startsWith('g_')) {
+                    try {
+                        const imageData = page.commonObjs.get(imageName);
+                        if (imageData) {
+                            const result = processImageData(imageData);
+                            resolve(result);
+                            return;
+                        }
+                    }
+                    catch (error) {
+                        const message = error instanceof Error ? error.message : String(error);
+                        console.warn(`[PDF Reader MCP] Error getting image from commonObjs ${imageName}: ${message}`);
+                    }
+                }
+                // Try synchronous get first - if image is already loaded
+                try {
+                    const imageData = page.objs.get(imageName);
+                    if (imageData !== undefined) {
+                        const result = processImageData(imageData);
+                        resolve(result);
+                        return;
+                    }
+                }
+                catch (error) {
+                    const message = error instanceof Error ? error.message : String(error);
+                    console.warn(`[PDF Reader MCP] Sync image get failed for ${imageName}, trying async: ${message}`);
+                }
+                // Fallback to async callback-based get with timeout
+                let resolved = false;
+                const timeout = setTimeout(() => {
+                    if (!resolved) {
+                        resolved = true;
+                        console.warn(`[PDF Reader MCP] Image extraction timeout for ${imageName} on page ${String(pageNum)}`);
+                        resolve(null);
+                    }
+                }, 10000); // 10 second timeout as a safety net
+                page.objs.get(imageName, (imageData) => {
+                    if (!resolved) {
+                        resolved = true;
+                        clearTimeout(timeout);
+                        const result = processImageData(imageData);
+                        resolve(result);
+                    }
                 });
             }));
             const resolvedImages = await Promise.all(imagePromises);
 
@@ -69,6 +69,7 @@
     "@modelcontextprotocol/sdk": "1.20.2",
     "glob": "^11.0.1",
     "pdfjs-dist": "^5.4.296",
+    "pngjs": "^7.0.0",
     "zod": "^3.24.2",
     "zod-to-json-schema": "^3.24.5"
   },
@@ -78,6 +79,7 @@
     "@commitlint/config-conventional": "^19.8.0",
     "@types/glob": "^8.1.0",
     "@types/node": "^24.0.7",
+    "@types/pngjs": "^6.0.5",
     "@vitest/coverage-v8": "^3.1.1",
     "husky": "^9.1.7",
     "lint-staged": "^16.2.6",
 
@@ -207,11 +207,11 @@ export const handleReadPdfFunc = async (
             text: item.textContent,
           });
         } else if (item.type === 'image' && item.imageData) {
-          // Add image content part
+          // Add image content part (all images are now encoded as PNG)
           content.push({
             type: 'image',
             data: item.imageData.data,
-            mimeType: item.imageData.format === 'rgba' ? 'image/png' : 'image/jpeg',
+            mimeType: 'image/png',
           });
         }
       }
Original file line number	Diff line number	Diff line change
`@@ -147,11 +147,11 @@ export const handleReadPdfFunc = async (args) => {`
`147`	`147`	`});`
`148`	`148`	`}`
`149`	`149`	`else if (item.type === 'image' && item.imageData) {`
`150`		`- // Add image content part`
	`150`	`+ // Add image content part (all images are now encoded as PNG)`
`151`	`151`	`content.push({`
`152`	`152`	`type: 'image',`
`153`	`153`	`data: item.imageData.data,`
`154`		`- mimeType: item.imageData.format === 'rgba' ? 'image/png' : 'image/jpeg',`
	`154`	`+ mimeType: 'image/png',`
`155`	`155`	`});`
`156`	`156`	`}`
`157`	`157`	`}`
Original file line number	Diff line number	Diff line change
`@@ -207,11 +207,11 @@ export const handleReadPdfFunc = async (`
`207`	`207`	`text: item.textContent,`
`208`	`208`	`});`
`209`	`209`	`} else if (item.type === 'image' && item.imageData) {`
`210`		`- // Add image content part`
	`210`	`+ // Add image content part (all images are now encoded as PNG)`
`211`	`211`	`content.push({`
`212`	`212`	`type: 'image',`
`213`	`213`	`data: item.imageData.data,`
`214`		`- mimeType: item.imageData.format === 'rgba' ? 'image/png' : 'image/jpeg',`
	`214`	`+ mimeType: 'image/png',`
`215`	`215`	`});`
`216`	`216`	`}`
`217`	`217`	`}`