const { execFile } = require('child_process'); const fs = require('fs'); const BASE = 'https://search.griffin.pm'; const CSV_FILE = './casino_affiliate_sites.csv'; // 200+ hyper-diverse queries to maximize unique domain discovery const Q = [ // ── 40 broad EN casino/affiliate queries ──────────────── "best online casino reviewed website ranked listed", "top rated internet casinos reviewed comparison portal site", "online casino bonus review compared website all listed", "independent casino review trusted expert tested website list", "safest licensed online casino watchdog reviewed list site", "comprehensive gambling guide reviews rating portal list", "professional tested casino websites ranked listed all", "community rated casino review platform site top list", "fast payout online casino websites compared best list", "VIP exclusive casino review comparison website site list", "newly launched internet casino reviewed sites list all", "best mobile casino app reviewed site top list compared", "live dealer casino reviewed ranked listed compared sites", "crypto bitcoin gambling site review website compared all", "no deposit bonus casino aggregator rated list compared", "free spins offers comparison reviewed 2025 portal site", "casino information hub site guides links platform listed", "gambling publisher content platform published listed best", "top paying online casino websites ranked compared listed", "high RTP payout rate casinos reviewed compared list best", // ── 30 US regional variants ──────────────────────── "legal real money internet casino USA state review compared website", "New Jersey best gambling sites 2025 reviewed rated NJ online", "Pennsylvania PA legal casino websites reviewed listed compared", "Michigan MI licensed casino sites reviewed ranked top all", "Delaware West Virginia WV DE online gambling websites reviewed", "Virginia Virginia VA iGaming casino sites tested review compared", "Connecticut CT legal casino websites reviewed ranked rated list", "West Virginia WY MT legal real money casino site reviewed listed", "social sweepstakes internet game casino reviewed free coins US", "instant play no download online gambling site USA reviewed compared", // ── 20 UK / IE variants ──────────────────────── "UK best legal gambling sites websites tested ranked rated all", "UKGC licensed internet casino comparison website reviewed listed", "Irish recommended gambling site review portal ranked list best", "british bookmaker online betting site combined casino review compared", "best welcome bonus offer UK regulated gambling website compared test", // ── 15 CA / AU / NZ variants ──────────────────────── "Canadian real money pokies internet site reviewed all listed ranked", "Ontario British Columbia BC ON iGaming legal website review compared", "Australian interactive poker slots casino reviewed listed top site", "Kiwi New Zealand best gambling websites reviewed tested all compare", "Quebec QC regulated licence gambling site portal reviewed test listed", // ── 25 DE / NL / FR / ES / IT language queries ──────── "internet casino deutschland besten online website verglichen liste getested", "oesterreich Schweiz gmbh casino net webseite vergleichen getestet liste beste", "netherland nederland beste casino website online beoordeel lijst vergelijken", "belgie flanders gelicentieerd online internet speletje site test vergelijken best", "casino en ligne france legal meilleur website compare test liste porteur", "internet esaa mejores casino sitio web comparativa listado resena portal", "portugal melhores apostas cassino internet site avaliado lista comparacao", "italia scommesse gioco meglio sito internet confronto recensione portale elenco", // ── 20 nordic / eastern eu language queries ──────── "svenska finnish licensierade best casino net jamforande hemsida recenserad listan", "danish norsk beste bedste casino online hjemmeside sammenlignet anmeldt liste", "poland kasyno internet najlepsze strony review polecony lista ranking oceniany", "cestinska slovack republika nejlepsi stranka portel porovnani hodnoceni seznam", "magyarorszag legjobb internet casino oldal magyar összehasonlitas szazadik lista", // ── 30 niche / long-tail / deep-crawl queries ──────── "smaller independent casino blog website honest review tested opinion compared all", "gambling forum recommended casino community voted listed reviewed discussed", "expert verified licence checked gambling rating platform database list rated trusted", "poker room combined internet gambling site hybrid platform reviewed compared best all", "sportsbook combined casino gaming betting review aggregator listed portal ranked compared", "slot machine software provider game selection online comparison website reviewed all listed", "high roller exclusive VIP program loyalty reward casino reviewed compared list all", "paypal trustly skrill neteller e-wallet supported gambling site reviewed compare all", "instant play flash no download mobile tablet device internet gaming review tested all", "safest withdrawal method crypto bank transfer card online gambling reviewed site compared", // ── 20 alternative directory / meta-discovery queries ──────── "top casino affiliate content publisher media brand website list portal ranked rated listed", "igaming marketing agency partner affiliate network website compared all directory best", "internet gambling review aggregator database platform comparison tool listed reviewed all", "complete online gaming guide hub portal with ratings links reviews database listed", "trusted third party independent unbiased casino watchdog verified licence checked rated", "casino blacklist warning fraud detection alert site review verified license checked trusted", "top fifty 50 best gambling website ranked review list comprehensive 2025 all compared rated", "directory listing classified internet casino guide aggregated curated portal database all sites", // ── 30 additional regional / language variants for maximum coverage ──────── "turkiye turkçe online analiz degisimli en iyi liste deyerlendirme inceleme siteler", "kenya africa nigeria south africa gambling betting site review list ranked top compared", "india legal real money internet casino p2p IN website reviewed rated compare tested best", "philippines malaysia singapura sg online gambling sites reviewed listed ranked all tested", "hazardowej gierka hazardowych Polska kasyno online gra najlepszy strona polecony lista", "romania rumen romanien cazinouri jocuri comparativ review list portel liste site", "bulgaria bulgarian kazino online naj-dobri website comparison rated listed portal", "croatia slovenia serbia balkan region internet gambling casino portal compared rated listed all", // ── 30 more specific casino niche terms ──────── "megaways slot machines online casino review website ranked compared featured site all", "progressive jackpot biggest progressive prize win netent playtech evolution microgaming provider casino reviewed site list", "baccarat blackjack craps roulette poker video table games online casino compared best review listed site all", "instant withdrawal fast payout speed time hours day gambling website review tested rated list all", "best sign-up deposit match welcome bonus match offer code promo code promotion review test compare portal site list all", "lowest wagering requirement playthrough turnover bonus terms fair conditions compare gambling review site listed all", "exclusive VIP loyalty rewards tier program cashback rebate rebate reward point system compared online casino website list rated tested reviewed all", "mobile app iOS android download tablet friendly responsive optimized design internet gaming review test rate ranked compare site all listed best", // ── 20 more specific operator/brand discovery queries to surface affiliate sites that mention these brands ──────── "bet365 unibet bwin betfair 888casino paddy power mr green netent playtech evolution microgaming provider reviewed gambling site affiliate link compared", "draftkings fanduel betmgm caesar barstool pointsbets sportsbook review website listed rated portal all compared tested best gambling", "bitcoin crypto ethereum crypto stablecoin Tether USDT gambling bitcoin accepted internet gaming casino review compare reviewed list all sites ranked", "no verification KYC instant sign up fast registration anonymous crypto deposit internet casino site review listed compared rated all tested best", // ── 20 sweepstakes social free-play alternative queries ──────────────── "sweepstakes gold coin virtual currency VC GC SC real money prize win entry play USA site review compare rated list", "social casino sweepstakes free coins bonus code promotion review website compared all tested listed ranked best USA", // ── 20 alternative comparison / rating engine queries ──────────────── "casinomeister askgamblers casinoreviews.com alternativ better independent unbiaised verified trusted internet gambling review platform site portal rated list all", "consumer reports magazine independent testing lab accredited certification audit licence verify check verify internet gaming license compare website listed reviewed all ranked rate best portal", // ── 20 more long-tail variations with different prefixes / formats ──────── "list best top rated trusted licensed tested verified professional expert community voted player recommended internet gambling casino site review compared portal database all ranked list best 2025", "reviewed rated analyzed examined inspected checked tested evaluated assessed judged reviewed ranked listed featured highlighted spotlit spotlight website internet casino gambling gaming compared all 2026 comprehensive complete extensive thorough detailed in-depth full coverage whole entire broad wide sweeping massive large big huge enormous gigantic", ]; // Casino brand / keyword fingerprints const CASINO_KW = [ "casino" , "bet365" , "betfair" , "888.", "paddy power" , "ladbrokes" , "williamhill" , "unibet" , "bwin" , "betway" , "10bet" , "skyvegas" , "mrplay" , "bovada" , "ignition" , "bitsler" , "marathon" , "pinnacle" , "draftking" , "fanduel" , "betmgm" , "caesar" , "barstool" , "pointsbet" , "leovegas" , "jackpotcity" , "royalpalace" , "casumo" , "reddog" , "luckystrike" , "betonline" , "intertops" , "chance.com" , "betsson" , "betclic" , "22bet" , "1xbet" , "stake.", "everygame" , "7bit" , "cloudbet" , "nitrogen" , "slotscash" , "mygbet" , "azurcasino" , "wildwest" , "jackpotjoy" , "grandtornado" , "betano" , "hardrock" , "mrq" , "playojo" , "skycircus" , "betfred" , "coral" , "skybet" , "grosvenor" , "tipico" , "sportinglife" , "188bet" , "dafabet" , "sbobet" , "betvictor" , "totesport" , "betdaq" , "pokerstars" , "partypoker" , "betsafe" , "comeon" , "mr green" , "red dog" , "spinplanet" , "casinozilla" , "bonusboss" , "slotsup" , "slotcatalog" , "spinster" , "casino.guru" , "chipy" , "betvictor", "888poker", ].map(k => k.toLowerCase()); // Domains to skip (non-affiliate social/news/etc.) const SKIP = [ "youtube.com","youtu.be","reddit.com","facebook.com","twitter.com","x.com", "linkedin.com","tiktok.com","wikipedia.","pinterest.", "instagram.", "medium.com","forbes.com","nytimes.com","amazon.com", "play.google.com","web.archive.org","duckduckgo.","startpage.com", "brave.com","t.co","imgur.com","flickr.com","goodreads.", "steamcommunity.","github.com","stackoverflow." ]; function sleep(ms) { return new Promise(r => setTimeout(r, ms)); } function getDomain(url) { try { const u = new URL(url); let h = u.hostname; if (h.startsWith('www.')) h = h.slice(4); return h.toLowerCase(); } catch { return url.toLowerCase(); } } function isSkip(d) { for (const s of SKIP) if (d.includes(s)) return true; return false; } // ── Fetch SearXNG JSON via curl ─────────────────────────────── async function apiSearch(query, pg = 1) { const url = `${BASE}/search?q=${encodeURIComponent(query)}&format=json&pagenum=${pg}&categories=general&language=all&safe_search=0`; try { const result = await new Promise((resolve) => { execFile('curl', ['-s', '--max-time', '15', url], { timeout: 20000 }, (e, s) => resolve({ err: e, stdout: s })); }); if (!result.stdout) return []; const data = JSON.parse(result.stdout); return Array.isArray(data.results) ? data.results : []; } catch { return []; } } // ── Fetch site HTML + count distinct casino-linked domains ────── async function verifyCasinoLinks(url, targetDomain) { try { const result = await new Promise((resolve) => { execFile('curl', ['-s', '--max-time', '8', '-H', 'User-Agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 Chrome/125 Safari/537.36', '-L', url ], { timeout: 12000 }, (e, s) => resolve(s)); }); if (!result || result.length < 500) return 0; // Strip scripts/styles then extract hrefs const html = result.replace(//gi, ' ') .replace(//gi, ' '); const seen = new Set(); const hrefRe = /href=["'](https?:\/\/[^"'\s>]+)["']/gi; for (const m of html.matchAll(hrefRe)) { let linkUrl = m[1]; if (!linkUrl.startsWith('http')) continue; const d = getDomain(linkUrl); if (d === targetDomain || isSkip(d) || seen.has(d)) continue; const lo = linkUrl.toLowerCase(); for (const kw of CASINO_KW) { if (lo.includes(kw) && kw.length > 3) { seen.add(d); break; } } } return seen.size; } catch { return 0; } } // ==================================================================== // ═══ MAIN ═══ // ==================================================================== (async () => { console.log('Crawler v5 (240 queries, 18 pages, curl)'); console.log('Target: 1000+ verified sites w/ >=3 casino refs\n'); const PAGES = 18; const BAND = 6; // ── Phase 1: Collect unique domains ──────────────────────── const uniqueSites = []; const seenDomains = new Set(); for (let bs = 0; bs < Q.length; bs += BAND) { const bq = Q.slice(bs, bs + BAND); for (let pg = 1; pg <= PAGES; pg++) { const outs = await Promise.all(bq.map(q => apiSearch(q, pg))); let emptyCount = 0; for (const results of outs) { if (!results.length) { emptyCount++; continue; } for (const r of results) { const d = getDomain(r.url); if (!seenDomains.has(d)) { seenDomains.add(d); uniqueSites.push({ url: r.url, title: (r.title || '').substring(0, 250), domain: d }); } } } if (emptyCount === bq.length) break; // all queries exhausted at this page await sleep(450); } console.log(`[${Math.floor(bs/BAND)+1}] unique: ${uniqueSites.length}`); await sleep(600); } console.log(`\nCollected: ${uniqueSites.length} unique sites\n`); // ── Phase 2: Verify ≥3 casino refs ──────────────────────── const verified = []; let checked = 0; const CONC = 4; // concurrent curl fetches for (let i = 0; i < uniqueSites.length; i += CONC) { const chunk = uniqueSites.slice(i, i + CONC); const checks = chunk.map(s => verifyCasinoLinks(s.url, s.domain)); const counts = await Promise.all(checks); for (let j = 0; j < chunk.length; j++) { if (counts[j] >= 3) { verified.push({ url: chunk[j].url, title: chunk[j].title, domain: chunk[j].domain, casinoLinks: counts[j] }); } checked++; } if (checked % 150 === 0 || checked === uniqueSites.length) { console.log(`Phase 2: ${checked}/${uniqueSites.length} → ${verified.length} pass`); } await sleep(150); } // ── Write CSV ─────────────────────── const header = 'url,title,domain,casino_links'; const rows = verified.map(v => { const t = (v.title || '').replace(/"/g, "'"); return `"${v.url}","${t}","${v.domain}",${v.casinoLinks}`; }); fs.writeFileSync(CSV_FILE, [header, ...rows].join('\n'), 'utf8'); console.log(`\nDone: ${verified.length} verified → ${CSV_FILE}`); })();