diff --git a/apps/api/src/scraper/WebScraper/custom/handleCustomScraping.ts b/apps/api/src/scraper/WebScraper/custom/handleCustomScraping.ts index d78d815..f8b2503 100644 --- a/apps/api/src/scraper/WebScraper/custom/handleCustomScraping.ts +++ b/apps/api/src/scraper/WebScraper/custom/handleCustomScraping.ts @@ -29,22 +29,23 @@ export async function handleCustomScraping( }; } - // Check for Google Drive PDF links in the raw HTML - const googleDrivePdfPattern = - /https:\/\/drive\.google\.com\/file\/d\/([^\/]+)\/view/; - const googleDrivePdfLink = url.match(googleDrivePdfPattern); - if (googleDrivePdfLink) { - console.log( - `Google Drive PDF link detected for ${url}: ${googleDrivePdfLink[0]}` - ); + // Check for Google Drive PDF links in meta tags + const googleDriveMetaPattern = /