const axios = require('axios'); /** * Scrape a website using Firecrawl. * Returns { markdown, links } — raw output passed to OpenAI. */ async function scrape(url) { const apiKey = process.env.FIRECRAWL_API_KEY; if (!apiKey) throw new Error('FIRECRAWL_API_KEY not set'); try { const response = await axios.post( 'https://api.firecrawl.dev/v1/scrape', { url, formats: ['markdown', 'links'] }, { headers: { Authorization: `Bearer ${apiKey}`, 'Content-Type': 'application/json', }, timeout: 30000, } ); const data = response.data?.data || response.data; const markdownLen = typeof data?.markdown === 'string' ? data.markdown.length : 0; const linksCount = Array.isArray(data?.links) ? data.links.length : 0; console.log( `[Firecrawl] scrape success | status=${response.status} | markdownLen=${markdownLen} | links=${linksCount}` ); return { markdown: data.markdown || '', links: data.links || [], }; } catch (err) { throw err; } } module.exports = { scrape };