diff --git a/lib/MetaCPAN/Web/Role/Request.pm b/lib/MetaCPAN/Web/Role/Request.pm index ce431efc90..8612da6827 100644 --- a/lib/MetaCPAN/Web/Role/Request.pm +++ b/lib/MetaCPAN/Web/Role/Request.pm @@ -26,7 +26,9 @@ sub get_page_size { my $default_page_size = shift; my $page_size = $req->param('size'); - unless ( is_PositiveInt($page_size) && $page_size <= 500 ) { + + # We no longer support more than 100 results per page + unless ( is_PositiveInt($page_size) && $page_size <= 100 ) { $page_size = $default_page_size; } return $page_size; diff --git a/root/inc/pager.tx b/root/inc/pager.tx index 9d02f05e02..943f4ada0b 100644 --- a/root/inc/pager.tx +++ b/root/inc/pager.tx @@ -3,31 +3,23 @@
%% }
-
[% $pageset.total_entries | format_number %] [% pluralize("result", $pageset.total_entries) %] diff --git a/root/robots.txt b/root/robots.txt index 70fd28846b..740dc05883 100644 --- a/root/robots.txt +++ b/root/robots.txt @@ -14,69 +14,4 @@ Disallow: /*?*size=* Sitemap: https://metacpan.org/sitemap-authors.xml.gz Sitemap: https://metacpan.org/sitemap-releases.xml.gz -# Stop the bots, using list from: -# https://github.com/ai-robots-txt/ai.robots.txt/blob/main/robots.txt -User-agent: AI2Bot -User-agent: Ai2Bot-Dolma -User-agent: aiHitBot -User-agent: Amazonbot -User-agent: anthropic-ai -User-agent: Applebot -User-agent: Applebot-Extended -User-agent: Brightbot 1.0 -User-agent: Bytespider -User-agent: CCBot -User-agent: ChatGPT-User -User-agent: Claude-SearchBot -User-agent: Claude-User -User-agent: Claude-Web -User-agent: ClaudeBot -User-agent: cohere-ai -User-agent: cohere-training-data-crawler -User-agent: Cotoyogi -User-agent: Crawlspace -User-agent: Diffbot -User-agent: DuckAssistBot -User-agent: FacebookBot -User-agent: Factset_spyderbot -User-agent: FirecrawlAgent -User-agent: FriendlyCrawler -User-agent: Google-CloudVertexBot -User-agent: Google-Extended -User-agent: GoogleOther -User-agent: GoogleOther-Image -User-agent: GoogleOther-Video -User-agent: GPTBot -User-agent: iaskspider/2.0 -User-agent: ICC-Crawler -User-agent: ImagesiftBot -User-agent: img2dataset -User-agent: imgproxy -User-agent: ISSCyberRiskCrawler -User-agent: Kangaroo Bot -User-agent: meta-externalagent -User-agent: Meta-ExternalAgent -User-agent: meta-externalfetcher -User-agent: Meta-ExternalFetcher -User-agent: MistralAI-User/1.0 -User-agent: NovaAct -User-agent: OAI-SearchBot -User-agent: omgili -User-agent: omgilibot -User-agent: Operator -User-agent: PanguBot -User-agent: Perplexity-User -User-agent: PerplexityBot -User-agent: PetalBot -User-agent: QualifiedBot -User-agent: Scrapy -User-agent: SemrushBot-OCOB -User-agent: SemrushBot-SWA -User-agent: Sidetrade indexer bot -User-agent: TikTokSpider -User-agent: Timpibot -User-agent: VelenPublicWebCrawler -User-agent: Webzio-Extended -User-agent: wpbot -User-agent: YouBot -Disallow: / +# Stop the bots - using signalsciences to block \ No newline at end of file