Skip to content

Commit

Permalink
Browse files Browse the repository at this point in the history
  • Loading branch information
nickscamara committed Jan 30, 2025
2 parents ec2c0f6 + 71878cf commit a585340
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 2 deletions.
1 change: 1 addition & 0 deletions apps/api/src/lib/concurrency-limit.ts
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@ const constructQueueKey = (team_id: string) =>
// Two minutes, expressed in milliseconds (2 * 60 s * 1000 ms).
// NOTE(review): by its name this is the timeout after which a job counts as stalled — usage is not visible in this hunk; confirm.
const stalledJobTimeoutMs = 2 * 60 * 1000;

/**
 * Resolves the maximum concurrency limit for a plan.
 *
 * The "growth" plan is pinned to 100; every other plan takes whatever
 * `getRateLimiterPoints` reports for `RateLimiterMode.Scrape`.
 *
 * @param plan - Plan identifier to look up.
 * @returns The concurrency ceiling for the given plan.
 */
export function getConcurrencyLimitMax(plan: string): number {
  return plan === "growth"
    ? 100
    : getRateLimiterPoints(RateLimiterMode.Scrape, undefined, plan);
}

Expand Down
4 changes: 2 additions & 2 deletions apps/api/src/scraper/WebScraper/crawler.ts
Original file line number Diff line number Diff line change
Expand Up @@ -401,13 +401,13 @@ export class WebCrawler {

public async extractLinksFromHTML(html: string, url: string) {
try {
return (await this.extractLinksFromHTMLRust(html, url)).map(x => {
return [...new Set((await this.extractLinksFromHTMLRust(html, url)).map(x => {
try {
return new URL(x, url).href
} catch (e) {
return null;
}
}).filter(x => x !== null) as string[];
}).filter(x => x !== null) as string[])];
} catch (error) {
this.logger.error("Failed to call html-transformer! Falling back to cheerio...", {
error,
Expand Down

0 comments on commit a585340

Please sign in to comment.