|
8 | 8 | /*jshint esversion: 6 */ |
9 | 9 |
|
10 | 10 | const { UAParser } = require('../main/ua-parser'); |
11 | | -const { CPUArch, OSName, EngineName } = require('../enums/ua-parser-enums'); |
| 11 | +const { CPUArch, OSName, EngineName, Extension } = require('../enums/ua-parser-enums'); |
12 | 12 | const { Bots } = require('../extensions/ua-parser-extensions'); |
13 | 13 | const { isFromEU } = require('detect-europe-js'); |
14 | 14 | const { isFrozenUA } = require('ua-is-frozen'); |
@@ -41,125 +41,124 @@ const isAppleSilicon = (resultOrUA) => { |
41 | 41 | return false; |
42 | 42 | } |
43 | 43 |
|
| 44 | +const Crawler = Extension.BrowserName.Crawlers; |
44 | 45 | const isAIBot = (resultOrUA) => [ |
45 | 46 |
|
46 | 47 | // AI2 |
47 | | - 'ai2bot', |
| 48 | + Crawler.AI2_BOT, |
48 | 49 |
|
49 | 50 | // Amazon |
50 | | - 'amazonbot', |
| 51 | + Crawler.AMAZON_BOT, |
51 | 52 |
|
52 | 53 | // Anthropic |
53 | | - 'anthropic-ai', |
54 | | - 'claude-web', |
55 | | - 'claude-searchbot', |
56 | | - 'claudebot', |
| 54 | + Crawler.ANTHROPIC_AI, |
| 55 | + Crawler.ANTHROPIC_CLAUDE_BOT, |
| 56 | + Crawler.ANTHROPIC_CLAUDE_SEARCHBOT, |
| 57 | + Crawler.ANTHROPIC_CLAUDE_WEB, |
57 | 58 |
|
58 | 59 | // Apple |
59 | | - 'applebot', |
60 | | - 'applebot-extended', |
| 60 | + Crawler.APPLE_BOT, |
| 61 | + Crawler.APPLE_BOT_EXTENDED, |
61 | 62 |
|
62 | 63 | // Brave |
63 | | - 'bravebot', |
| 64 | + Crawler.BRAVE_BOT, |
64 | 65 |
|
65 | 66 | // ByteDance |
66 | | - 'bytespider', |
67 | | - 'tiktokspider', |
| 67 | + Crawler.BYTEDANCE_BYTESPIDER, |
| 68 | + Crawler.BYTEDANCE_TIKTOKSPIDER, |
68 | 69 |
|
69 | 70 | // Cohere |
70 | | - 'cohere-training-data-crawler', |
| 71 | + Crawler.COHERE_TRAINING_DATA_CRAWLER, |
71 | 72 |
|
72 | 73 | // Common Crawl |
73 | | - 'ccbot', |
| 74 | + Crawler.COMMON_CRAWL_CCBOT, |
74 | 75 |
|
75 | 76 | // Coveo |
76 | | - 'coveobot', |
| 77 | + Crawler.COVEO_BOT, |
77 | 78 |
|
78 | 79 | // DataForSeo |
79 | | - 'dataforseobot', |
| 80 | + Crawler.DATAFORSEO_BOT, |
80 | 81 |
|
81 | 82 | // DeepSeek |
82 | | - 'deepseekbot', |
| 83 | + Crawler.DEEPSEEK_BOT, |
83 | 84 |
|
84 | 85 | // Diffbot |
85 | | - 'diffbot', |
| 86 | + Crawler.DIFFBOT, |
86 | 87 |
|
87 | 88 | // Google |
88 | | - 'googleother', |
89 | | - 'googleother-image', |
90 | | - 'googleother-video', |
91 | | - 'google-cloudvertexbot', |
92 | | - 'google-extended', |
| 89 | + Crawler.GOOGLE_EXTENDED, |
| 90 | + Crawler.GOOGLE_OTHER, |
| 91 | + Crawler.GOOGLE_OTHER_IMAGE, |
| 92 | + Crawler.GOOGLE_OTHER_VIDEO, |
| 93 | + Crawler.GOOGLE_CLOUDVERTEXBOT, |
93 | 94 |
|
94 | 95 | // Hive AI |
95 | | - 'imagesiftbot', |
| 96 | + Crawler.HIVE_IMAGESIFTBOT, |
96 | 97 |
|
97 | 98 | // Huawei |
98 | | - 'petalbot', |
99 | | - 'pangubot', |
| 99 | + Crawler.HUAWEI_PETALBOT, |
| 100 | + Crawler.HUAWEI_PANGUBOT, |
100 | 101 |
|
101 | 102 | // Hugging Face |
102 | | - 'huggingface-bot', |
| 103 | + Crawler.HUGGINGFACE_BOT, |
103 | 104 |
|
104 | 105 | // Kangaroo |
105 | | - 'kangaroo bot', |
| 106 | + Crawler.KANGAROO_BOT, |
106 | 107 |
|
107 | 108 | // Mendable.ai |
108 | | - 'firecrawlagent', |
| 109 | + Crawler.FIRECRAWL_AGENT, |
109 | 110 |
|
110 | 111 | // Meta |
111 | | - 'facebookbot', |
112 | | - 'meta-externalagent', |
| 112 | + Crawler.META_FACEBOOKBOT, |
| 113 | + Crawler.META_EXTERNALAGENT, |
113 | 114 |
|
114 | 115 | // OpenAI |
115 | | - 'gptbot', |
116 | | - 'oai-searchbot', |
| 116 | + Crawler.OPENAI_GPTBOT, |
| 117 | + Crawler.OPENAI_SEARCH_BOT, |
117 | 118 |
|
118 | 119 | // Perplexity |
119 | | - 'perplexitybot', |
| 120 | + Crawler.PERPLEXITY_BOT, |
120 | 121 |
|
121 | 122 | // Replicate |
122 | | - 'replicate-bot', |
| 123 | + Crawler.REPLICATE_BOT, |
123 | 124 |
|
124 | 125 | // Runpod |
125 | | - 'runpod-bot', |
| 126 | + Crawler.RUNPOD_BOT, |
126 | 127 |
|
127 | 128 | // SB Intuitions |
128 | | - 'sbintuitionsbot', |
| 129 | + Crawler.SB_INTUITIONS_BOT, |
129 | 130 |
|
130 | 131 | // Semrush |
131 | | - 'semrushbot-ocob', |
| 132 | + Crawler.SEMRUSH_BOT_CONTENTSHAKE, |
132 | 133 |
|
133 | 134 | // Timpi |
134 | | - 'timpibot', |
| 135 | + Crawler.TIMPI_BOT, |
135 | 136 |
|
136 | 137 | // Together AI |
137 | | - 'together-bot', |
| 138 | + Crawler.TOGETHER_BOT, |
138 | 139 |
|
139 | 140 | // Velen.io |
140 | | - 'velenpublicwebcrawler', |
| 141 | + Crawler.HUNTER_VELENPUBLICWEBCRAWLER, |
141 | 142 |
|
142 | 143 | // Vercel |
143 | | - 'v0bot', |
| 144 | + Crawler.VERCEL_V0BOT, |
144 | 145 |
|
145 | 146 | // Webz.io |
146 | | - 'omgili', |
147 | | - 'omgilibot', |
148 | | - 'webzio-extended', |
| 147 | + Crawler.WEBZIO_OMGILI, |
| 148 | + Crawler.WEBZIO_OMGILI_BOT, |
| 149 | + Crawler.WEBZIO_EXTENDED, |
149 | 150 |
|
150 | 151 | // X |
151 | | - 'xai-bot', |
| 152 | + Crawler.XAI_BOT, |
152 | 153 |
|
153 | 154 | // You.com |
154 | | - 'youbot', |
| 155 | + Crawler.YOU_BOT, |
155 | 156 |
|
156 | 157 | // Zhipu AI |
157 | | - 'chatglm-spider', |
158 | | - |
159 | | - // Zyte |
160 | | - 'scrapy' |
161 | | - |
162 | | - ].includes(String(toResult(resultOrUA, Bots).browser.name).toLowerCase()); |
| 158 | + Crawler.ZHIPU_CHATGLM_SPIDER |
| 159 | + ] |
| 160 | + .map((s) => s.toLowerCase()) |
| 161 | + .includes(String(toResult(resultOrUA, Bots).browser.name).toLowerCase()); |
163 | 162 |
|
164 | 163 | const isBot = (resultOrUA) => [ |
165 | 164 | 'cli', |
|
0 commit comments