Блокировка поисковых ботов в Битрикс24

Создайте файл с таблицей (map) блокируемых User-Agent и поместите в него следующее содержимое:
vi /etc/nginx/bx/site_enabled/block_bots.conf
# Classifies the request by its User-Agent header: $limit_bots becomes 1 when
# the header matches any pattern below and 0 otherwise.
#
# - `~*` makes each pattern a case-insensitive regular expression.
# - Patterns are unanchored, so every alternative matches as a substring
#   anywhere in the User-Agent string.
# - All groups are non-capturing (?:...) because no capture is used.
# - The `map` directive is only valid in the `http` context.
#   NOTE(review): confirm the file holding this block is included there.
#
# NOTE(review): several alternatives are short or generic words (`tool`,
# `control`, `library`, `email`, `java`, `seo`, `scan`, `rma`, `joc`, ...).
# Because matching is by substring they also hit unrelated agents, e.g. `tool`
# matches "Google-InspectionTool". Confirm this breadth is intended before
# deploying, especially for integrations that call this host with Java, curl,
# Python or OkHttp clients.
map $http_user_agent $limit_bots {
    default 0;

    # --- legacy and harmful scrapers (original list) ---
    ~*(?:amazonbot|adbeat_bot|ahrefsbot|ahrefssiteaudit|alexibot|appengine|aqua_products|archive\.org_bot|archive|asterias|attackbot|b2w|backdoorbot|becomebot|blackwidow|blekkobot) 1;
    ~*(?:blowfish|botalot|builtbottough|bullseye|bunnyslippers|ccbot|cheesebot|cherrypicker|chinaclaw|chroot|clshttp|collector) 1;
    ~*(?:control|copernic|copyrightcheck|copyscape|cosmos|craftbot|crescent|curl|custo|demon) 1;
    ~*(?:disco|dittospyder|dotbot|download|downloader|dumbot|ecatch|eirgrabber|email|emailcollector) 1;
    ~*(?:emailsiphon|emailwolf|enterprise_search|erocrawler|eventmachine|exabot|express|extractor|extractorpro|eyenetie) 1;
    ~*(?:fairad|flaming|flashget|foobot|foto|gaisbot|getright|getty|getweb!|gigabot) 1;
    ~*(?:github|go!zilla|go-ahead-got-it|go-http-client|grabnet|grafula|grub|hari|harvest|hatena|antenna|hloader) 1;
    ~*(?:hmview|htmlparser|httplib|httrack|humanlinks|ia_archiver|indy|infonavirobot|interget|intraformant) 1;
    ~*(?:iron33|jamesbot|jennybot|jetbot|jetcar|joc|jorgee|kenjin|keyword|larbin|leechftp) 1;
    ~*(?:lexibot|library|libweb|libwww|linkextractorpro|linkpadbot|linkscan|linkwalker|lnspiderguy|looksmart) 1;
    ~*(?:lwp-trivial|mass|mata|midown|miixpc|mister|mj12bot|moget|msiecrawler|naver) 1;
    ~*(?:navroad|nearsite|nerdybot|netants|netmechanic|netspider|netzip|nicerspro|ninja|nutch) 1;
    ~*(?:octopus|offline|openbot|openfind|openlink|pagegrabber|papa|pavuk|pcbrowser|perl) 1;
    ~*(?:perman|picscout|propowerbot|prowebwalker|psbot|pycurl|pyq|pyth|python) 1;
    ~*(?:python-urllib|queryn|quester|radiation|realdownload|reget|retriever|rma|rogerbot|scan|screaming|frog|seo) 1;
    ~*(?:scooter|searchengineworld|searchpreview|semrush|semrushbot|semrushbot-sa|seokicks-robot|sitesnagger|smartdownload|sootle) 1;
    ~*(?:spankbot|spanner|spbot|spider|stanford|stripper|sucker|superbot|superhttp|surfbot|surveybot) 1;
    ~*(?:suzuran|szukacz|takeout|teleport|telesoft|thenomad|tocrawl|tool|true_robot|turingos) 1;
    ~*(?:twengabot|typhoeus|url_spider_pro|urldispatcher|urllib|urly|vampire|vci|voideye|warning) 1;
    ~*(?:webauto|webbandit|webcollector|webcopier|webcopy|webcraw|webenhancer|webfetch|webgo|webleacher) 1;
    ~*(?:webmasterworld|webmasterworldforumbot|webpictures|webreaper|websauger|webspider|webster|webstripper|webvac|webviewer) 1;
    ~*(?:webwhacker|webzip|wesee|wget|widow|woobot|www-collector-e|wwwoffle|xenu) 1;

    # --- 2024-2025 additions: major SEO crawlers and marketing scanners ---
    # (`linkpadbot` is already listed in the legacy section above.)
    ~*(?:serpstatbot|megaindex|babbar\.tech|barkrowler|dataforseo|seokicks) 1;

    # --- social networks and messengers (blocked when link previews are not needed) ---
    ~*(?:facebookexternalhit|facebot|twitterbot|linkedinbot|pinterestbot|slackbot|telegrambot|whatsapp|vkshare|discordbot|skypeuripreview) 1;

    # --- popular HTTP frameworks/clients (common in grey-area scraping and scans) ---
    # (`go-http-client` is already listed in the legacy section above.)
    ~*(?:aiohttp|guzzlehttp|okhttp|okhttpclient|httpclient|jakarta|java|node-fetch|httpx|scrapy|cobweb) 1;

    # --- high-volume crawlers and search bots from Asia (often noisy) ---
    ~*(?:baiduspider|yisouspider|sogou|360spider|petalbot|bytespider|toutiao|shenma) 1;

    # --- additional utilities and downloaders ---
    # (`wget` and `curl` are already listed in the legacy section above.)
    ~*(?:python-requests|libwww-perl) 1;
}
Затем создайте файл с правилом, которое отдаёт 403 запросам, помеченным переменной $limit_bots:
vi /etc/nginx/bx/site_settings/default/block_bots.conf
# Reject requests flagged as bots with 403.
# $limit_bots comes from the User-Agent map and is either 0 or 1; nginx treats
# "0" and the empty string as false, so the bare variable test is equivalent
# to comparing against 1.
# NOTE(review): `if`/`return` must sit in a server or location context;
# confirm this file is included there.
# After saving, validate and reload: nginx -t && systemctl reload nginx
if ($limit_bots) { return 403; }

Оставьте комментарий

Ваш адрес email не будет опубликован. Обязательные поля помечены *

Прокрутить вверх