https://docs.firecrawl.dev/introduction
https://gitingest.com/mendableai/firecrawl
# Call the Firecrawl /v1/map endpoint for the course site, filtered by a search term.
# The Authorization header is double-quoted so the shell expands $FIRECRAWL_API_KEY;
# inside single quotes the literal text "$FIRECRAWL_API_KEY" would be sent as the token.
curl -X POST https://api.firecrawl.dev/v1/map \
  -H 'Content-Type: application/json' \
  -H "Authorization: Bearer $FIRECRAWL_API_KEY" \
  -d '{
    "url": "https://www.mfri.org/course/msfs/FIRE/101/",
    "search": "Firefighter I"
  }'
# Shell command (not Python): install the firecrawl-py package with pip.
# Presumably this provides the `firecrawl` module imported below — confirm.
pip install firecrawl-py
from firecrawl import FirecrawlApp
import os
# Build the Firecrawl client; the API key is read from the FIRECRAWL_API_KEY
# environment variable (None is passed through if it is unset).
app = FirecrawlApp(api_key=os.environ.get("FIRECRAWL_API_KEY"))

# Scrape one course-section page, requesting the markdown format.
scrape_result = app.scrape_url(
    "https://www.mfri.org/course/msfs/FIRE/101/S069/2025/",
    formats=["markdown"],
)
# Bare expression: its value is only shown in a REPL/notebook cell.
scrape_result.markdown

# Map the course listing URL, passing a search term and a limit of 1000.
map_result = app.map_url(
    "https://www.mfri.org/course/msfs/FIRE/101/",
    search="Firefighter I",
    limit=1000,
)
print(map_result)
import os
import requests
# Call the Firecrawl /v1/map endpoint directly over HTTP and count the links returned.
api_url = "https://api.firecrawl.dev/v1/map"
target_url = "https://www.mfri.org/course/msfs/FIRE/101/"

# Fail fast on a missing key; otherwise the f-string below would send the
# literal header value "Bearer None".
api_key = os.getenv("FIRECRAWL_API_KEY")
if not api_key:
    raise RuntimeError("FIRECRAWL_API_KEY environment variable is not set")

payload = {
    "url": target_url,
    "search": "Firefighter I",
    "ignoreSitemap": False,
    "sitemapOnly": False,
    "includeSubdomains": True,
    "limit": 1000,
    # Sent to the API in the request body — presumably a server-side timeout
    # in milliseconds; confirm against the Firecrawl map endpoint docs.
    "timeout": 10000,
}
headers = {
    "Authorization": f"Bearer {api_key}",
    "Content-Type": "application/json",
    "Referer": target_url,
}

# Client-side timeout (seconds): without it requests.post can block forever.
response = requests.post(api_url, json=payload, headers=headers, timeout=30)
# Surface HTTP errors (401, 429, 5xx, ...) directly instead of as a KeyError
# on the missing "links" key below.
response.raise_for_status()
# Bare expression: its value is only shown in a REPL/notebook cell.
len(response.json()["links"])