# Classify requests by User-Agent: $denied_scraper is 1 when $http_user_agent
# matches one of the keys below and 0 (the default) otherwise.
# Keys starting with '~' are case-sensitive regular expressions; every other
# key is compared against the whole header value.
# NOTE(review): lines beginning with '+' or '-' look like unified-diff markers
# left in this text -- confirm against the deployed file.
map $http_user_agent $denied_scraper {
default 0; # Not denied
'' 1; # No User-Agent Set
+ '-' 1; # A literal hyphen sent as the User-Agent
# Library defaults
'~^Python\-urllib\/' 1;
'~^Microsoft-ATL-Native\/' 1;
'/n software IPWorks HTTP/S Component - www.nsoftware.com' 1;
'~^Wget\/' 1;
+ 'java' 1;
# Library defaults or fakes
'Android' 1;
'host' 1;
'~^maptestapp' 1;
'Other' 1;
+ 'osmdroid' 1;
+ '~^tilelive-http' 1;
+ '~^Java-http-client' 1;
# Fakes
'Mozilla/4.0' 1;
'br.com.concisoti.potybus' 1;
'com.soft373.taptaxi' 1;
'com.kradac.ktxcore' 1;
- 'ru.crowdsystems.topcontrol.knd' 1;
+ '~^ru.crowdsystems.topcontrol.knd' 1; # Now a prefix regex. NOTE(review): the dots are unescaped, so each matches any character -- confirm whether '\.' was intended
'pl.itaxi.driver' 1;
'net.uztaxi.driver' 1;
'OSMDroid/2.1 (its; rutaxi 3.28.0)' 1;
'ru.taximaster.www' 1;
'com.arobs.trackgps' 1;
'com.helleniccomms.asteras.driver' 1;
+
+ # Malware
+ 'Agent Smith' 1;
# Disabled rule: a UUID-shaped token (8-4-4-4-12 lowercase hex groups) anywhere in the User-Agent
# '~[a-f0-9]{8}-[a-f0-9]{4}-[a-f0-9]{4}-[a-f0-9]{12}' 1; # Fake UA
}
# Classify requests by Referer: $denied_referer is 1 when $http_referer matches
# one of the keys below and 0 (the default) otherwise.
# Plain keys must equal the whole header value, so the "faked" entries only
# cover bare site roots (with or without a trailing slash); keys starting with
# '~' are case-sensitive regular expressions anchored at the start of the URL.
# NOTE(review): lines beginning with '+' or '-' look like unified-diff markers
# left in this text -- confirm against the deployed file.
map $http_referer $denied_referer {
default 0; # Not denied
- 'http://www.openstreetmap.org/' 1; # Faked
- 'http://www.openstreetmap.org' 1; # Faked
- 'https://www.openstreetmap.org' 1; # Faked
- 'http://openstreetmap.org/' 1; # Faked
- 'http://openstreetmap.org' 1; # Faked
- 'https://openstreetmap.org' 1; # Faked
- 'http://www.osm.org/' 1; # Faked
- 'http://www.osm.org' 1; # Faked
- 'http://osm.org/' 1; # Faked
- 'http://osm.org' 1; # Faked
- 'http://google.com' 1; # Faked
- 'http://www.google.com' 1; # Faked
- 'http://google.com/' 1; # Faked
- 'http://www.google.com/' 1; # Faked
- 'https://google.com' 1; # Faked
- 'https://www.google.com' 1; # Faked
- 'https://google.com/' 1; # Faked
- 'https://www.google.com/' 1; # Faked
- 'http://www.microsoft.com/' 1; # Faked
- '~^https?://pmap\.kuku\.lu/' 1; # Too much traffic
- '~^https?://[^.]*\.pmap\.kuku\.lu/' 1; # Too much traffic
- '~^https?://fastpokemap\.com/' 1; # Too much traffic
- '~^https?://[^.]*\.fastpokemap\.com/' 1; # Too much traffic
- '~^https?://pkget\.com/' 1; # Too much traffic
- '~^https?://[^.]*\.pkget\.com/' 1; # Too much traffic
- '~^https?://twpkinfo\.com/' 1; # Too much traffic
- '~^https?://[^.]*\.twpkinfo\.com/' 1; # Too much traffic
- '~^https?://9db\.jp/' 1; # Too much traffic
- '~^https?://[^.]*\.9db\.jp/' 1; # Too much traffic
- '~^https?://clustrmaps\.com/' 1; # Too much traffic
- '~^https?://[^.]*\.clustrmaps\.com/' 1; # Too much traffic
- '~^https?://geoportal360\.pl/' 1; # Too much traffic
- '~^https?://skelbiu\.lt/' 1; # Too much traffic
- '~^https?://[^.]*\.skelbiu\.lt/' 1; # Too much traffic
- # '~^https?://[^.]*\.wialon.com/' 1; # Too much traffic (hold per 2020-04-10 email)
+ # Faked sites (exact Referer values only)
+ 'http://www.openstreetmap.org/' 1;
+ 'http://www.openstreetmap.org' 1;
+ 'https://www.openstreetmap.org' 1;
+ 'http://openstreetmap.org/' 1;
+ 'http://openstreetmap.org' 1;
+ 'https://openstreetmap.org' 1;
+ 'http://www.osm.org/' 1;
+ 'http://www.osm.org' 1;
+ 'http://osm.org/' 1;
+ 'http://osm.org' 1;
+ 'http://google.com' 1;
+ 'http://www.google.com' 1;
+ 'http://google.com/' 1;
+ 'http://www.google.com/' 1;
+ 'https://google.com' 1;
+ 'https://www.google.com' 1;
+ 'https://google.com/' 1;
+ 'https://www.google.com/' 1;
+ 'http://www.microsoft.com/' 1;
+
+ # Overusing websites: most are listed as the bare host plus a second pattern whose [^.]* prefix admits a dot-free subdomain label
+ '~^https?://pmap\.kuku\.lu/' 1;
+ '~^https?://[^.]*\.pmap\.kuku\.lu/' 1;
+ '~^https?://fastpokemap\.com/' 1;
+ '~^https?://[^.]*\.fastpokemap\.com/' 1;
+ '~^https?://pkget\.com/' 1;
+ '~^https?://[^.]*\.pkget\.com/' 1;
+ '~^https?://twpkinfo\.com/' 1;
+ '~^https?://[^.]*\.twpkinfo\.com/' 1;
+ '~^https?://9db\.jp/' 1;
+ '~^https?://[^.]*\.9db\.jp/' 1;
+ '~^https?://clustrmaps\.com/' 1;
+ '~^https?://[^.]*\.clustrmaps\.com/' 1;
+ '~^https?://geoportal360\.pl/' 1; # NOTE(review): no subdomain pattern for this host, unlike its neighbours -- confirm intended
+ '~^https?://skelbiu\.lt/' 1;
+ '~^https?://[^.]*\.skelbiu\.lt/' 1;
+ '~^https?://wialon\.[^.]*/' 1; # wialon has many domains, so block them all; NOTE(review): [^.]* after 'wialon.' cannot cross a dot, so multi-label suffixes (e.g. co.uk) would not match -- confirm
+ '~^https?://[^.]*\.wialon\.[^.]*/' 1;
+ '~^https?://gps-trace\.com/' 1;
+ '~^https?://[^.]*\.gps-trace\.com/' 1;
+ '~^https?://cellmapper\.net/' 1;
+ '~^https?://[^.]*\.cellmapper\.net/' 1;
}
map $http_referer $osm_referer {