2026-05-10 09:41:59 +02:00

54 lines
2.4 KiB
JSON

{
"name": "@tip/scraper",
"version": "0.1.0",
"private": true,
"description": "TIP scraper engine — Crawlee + Playwright scrapers for competitor pricing, stock, datasheets, and FAQs",
"main": "dist/index.js",
"scripts": {
"build": "tsc",
"dev": "tsx src/index.ts",
"scrape:fs": "tsx src/scrapers/fs-com.ts",
"scrape:fs:db-detail": "FS_DB_DETAIL_ONLY=1 TIP_FORCE_REVALIDATE=1 tsx src/scrapers/fs-com.ts",
"scrape:fs:url-discovery": "FS_URL_DISCOVERY_ONLY=1 TIP_FORCE_REVALIDATE=1 tsx src/scrapers/fs-com.ts",
"scrape:atgbics:details": "tsx src/scrapers/atgbics-detail-pages.ts",
"scrape:vendors:details": "tsx src/scrapers/shopfiber24-fibermall-detail-pages.ts",
"scrape:gaotek:details": "tsx src/scrapers/gaotek-detail-pages.ts",
"scrape:10gtek": "tsx src/scrapers/tenGtek.ts",
"scrape:gbics": "tsx src/scrapers/gbics.ts",
"scrape:tscom": "tsx src/scrapers/tscom.ts",
"scrape:sfpcables": "tsx src/scrapers/sfpcables.ts",
"verify:catalog:details": "tsx src/utils/verify-catalog-details.ts",
"verify:quarantine:non-transceivers": "tsx src/utils/quarantine-non-transceivers.ts",
"verify:product-page-assets": "tsx src/utils/verify-product-page-assets.ts",
"verify:product-page-prices": "tsx src/utils/verify-product-page-prices.ts",
"verify:10gtek:datasheets": "tsx src/utils/verify-10gtek-datasheets.ts",
"verify:part-number-details": "tsx src/utils/verify-part-number-details.ts",
"verify:normalize:product-urls": "tsx src/utils/normalize-product-urls.ts",
"verify:fs:sku-aliases": "tsx src/utils/quarantine-fs-sku-aliases.ts",
"verify:price-availability": "tsx src/utils/resolve-price-availability.ts",
"verify:no-valid-competitor": "tsx src/utils/resolve-no-valid-competitor.ts",
"verify:open-competitor-status": "tsx src/utils/resolve-open-competitor-status.ts",
"scrape:cisco": "tsx src/scrapers/cisco-tmg.ts",
"scrape:optcore": "tsx src/scrapers/optcore.ts",
"scrape:news": "tsx src/scrapers/news.ts",
"scrape:all": "tsx src/index.ts --all",
"robots:verification": "tsx src/robots/verification-robots.ts"
},
"dependencies": {
"crawlee": "^3.12.0",
"playwright": "^1.50.0",
"pg": "^8.13.1",
"pg-boss": "^10.1.5",
"dotenv": "^16.4.7",
"cheerio": "^1.0.0",
"xml2js": "^0.6.2",
"socks-proxy-agent": "^8.0.5"
},
"devDependencies": {
"@types/pg": "^8.11.11",
"@types/xml2js": "^0.4.14",
"typescript": "^5.9.3",
"tsx": "^4.19.0"
}
}