diff --git a/scraper/scrapers/ondebaixa/ondebaixa_api.js b/scraper/scrapers/ondebaixa/ondebaixa_api.js index d7268b1..5aff100 100644 --- a/scraper/scrapers/ondebaixa/ondebaixa_api.js +++ b/scraper/scrapers/ondebaixa/ondebaixa_api.js @@ -118,7 +118,7 @@ function parseTorrentPage(body) { magnetLink: magnetLink, category: parseCategory(category), uploadDate: new Date($('time').attr('datetime')), - languages: sanitizePtLanguages(details.find('span:contains(\'Idioma\')')[0].nextSibling.nodeValue) + languages: sanitizePtLanguages(details.find('span:contains(\'Idioma\')').next().text()) })); resolve(torrents.filter((x) => x)); }); diff --git a/scraper/scrapers/scraperHelper.js b/scraper/scrapers/scraperHelper.js index 2df9f78..d15378a 100644 --- a/scraper/scrapers/scraperHelper.js +++ b/scraper/scrapers/scraperHelper.js @@ -5,7 +5,7 @@ function isPtDubbed(name) { function sanitizePtName(name) { return name .replace(/(.*)\b(\d{3,4}P)\b(?!.*\d{3,4}[Pp])(.*)/, '$1$3 $2') // add resolution to the end if missing - .replace(/^[[{]?(?:ACESSE.*|WWW\.)?[A-Z]+\.(COM|NET|ORG|TO|TV|ME)\b\s*[-\]}]+[\s.]*/i, '') // replace watermarks + .replace(/^[\[{]?(?:ACESSE.*|WWW\.)?[A-Z]+\.(COM|NET|ORG|TO|TV|ME)\b\s*[-\]}]+[\s.]*/i, '') // replace watermarks .replace(/^(\d*(?:\.\d{1,2})?(?:[4A-Z-]{3,}|P)[-.]+)+/, '') // replace metadata prefixes .replace(/^(COM|NET|ORG|TO|TV|ME)\b\s*-+[\s.]*/, '') // replace dangling site endings .trim();