From c84077d01eea17829e6296a843b3ad8e4f1c8169 Mon Sep 17 00:00:00 2001 From: Greg Bonnette Date: Fri, 18 Nov 2016 09:34:31 -0500 Subject: [PATCH 01/15] Adding new Outlook email referrer Added outlook.live.com to list of Outlook.com email referrers. --- resources/referers.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/resources/referers.yml b/resources/referers.yml index e1ecf54f..981f9ec5 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -107,6 +107,7 @@ email: Outlook.com: domains: - mail.live.com + - outlook.live.com QQ Mail: domains: From 10cb34f93a0dd1da55b9ef6b22dc0d3fdfcd4414 Mon Sep 17 00:00:00 2001 From: Daniel Morrison Date: Fri, 23 Sep 2016 12:51:30 +0100 Subject: [PATCH 02/15] Fix for ITU as it was incorrectly indented --- resources/referers.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/resources/referers.yml b/resources/referers.yml index 981f9ec5..a7f5001c 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -421,7 +421,7 @@ social: domains: - getpocket.com - ITU Sozluk: + ITU Sozluk: domains: - itusozluk.com From 0ea94956e9824bc8ed40ce6567cf627980b63add Mon Sep 17 00:00:00 2001 From: Daniel Morrison Date: Fri, 23 Sep 2016 13:45:53 +0100 Subject: [PATCH 03/15] Removed Comcast duplicated key --- resources/referers.yml | 6 ------ 1 file changed, 6 deletions(-) diff --git a/resources/referers.yml b/resources/referers.yml index a7f5001c..070ea258 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -779,12 +779,6 @@ search: domains: - pesquisa.clix.pt - Comcast: - parameters: - - q - domains: - - search.comcast.net - Conduit: parameters: - q From fc842de92f8c14070871c35d673bec8ee24a11b9 Mon Sep 17 00:00:00 2001 From: Robert Kingston Date: Sat, 6 Aug 2016 19:03:29 +1000 Subject: [PATCH 04/15] Adding paid sources and medium - Removed Taboola and Outbrain from "unknown" section - Preliminary list of paid sources added --- resources/referers.yml | 184 
+++++++++++++++++++++++++++++++++++++++-- 1 file changed, 176 insertions(+), 8 deletions(-) diff --git a/resources/referers.yml b/resources/referers.yml index 070ea258..9166fb21 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -8,6 +8,7 @@ # 2. Email providers # 3. Social providers # 4. Search providers +# 5. Paid media # ####################################################################################################### @@ -51,14 +52,6 @@ unknown: - omg.yahoo.com - match.yahoo.net - Taboola: - domains: - - trc.taboola.com - - api.taboola.com - - Outbrain: - domains: - - paid.outbrain.com # ####################################################################################################### @@ -3614,3 +3607,178 @@ search: - q domains: - zoohoo.cz + + + +# ####################################################################################################### +# +# PAID MEDIA + +paid: + + Acuity Ads: + domains: + - acuityplatform.com + + Adform: + domains: + - adform.net + + AdRoll: + domains: + - adroll.com + + AppNexus: + domains: + - ib.adnxs.com + - adnxs.com + - 247realmedia.com + + AudienceScience: + domains: + - wunderloop.net + + BidSwitch: + domains: + - bidswitch.net + + Casale Media: + domains: + - casalemedia.com + + Criteo: + domains: + - cas.jp.as.criteo.com + - cas.criteo.com + + Doubleclick: + domains: + - ad.doubleclick.net + - ad-apac.doubleclick.net + - s0.2mdn.net + - s1.2mdn.net + - dp.g.doubleclick.net + - pubads.g.doubleclick.net + + Eyeota: + domains: + - eyeota.net + + Flashtalking: + domains: + - flashtalking.com + - servedby.flashtalking.com + + Fluct: + domains: + - adingo.jp + + Google: + domains: + - www.googleadservices.com + - partner.googleadservices.com + - googleads.g.doubleclick.net + - tpc.googlesyndication.com + - googleadservices.com + - imasdk.googleapis.com + + LifeStreet: + domains: + - lfstmedia.com + + Jivox: + domains: + - jivox.com + + MicroAd: + domains: + - microad.jp + + Mixpo: + domains: + - 
mixpo.com + + Mozo: + domains: + - mozo.com.au + - a.mozo.com.au + + Neustar AdAdvisor: + domains: + - adadvisor.net + + ONE by AOL: + domains: + - nexage.com + + OpenX: + domains: + - us-ads.openx.net + - openx.net + - servedbyopenx.com + - openxenterprise.com + + Outbrain: + domains: + - paid.outbrain.com + + Plista: + domains: + - farm.plista.com + + PubMatic: + domains: + - sshowads.pubmatic.com + + Rubicon Project: + domains: + - optimized-by.rubiconproject.com + + Sizmek: + domains: + - bs.serving-sys.com + + Sociomantic Labs: + domains: + - sociomantic.com + + Sonobi: + domains: + - sonobi.com + + Sovrn: + domains: + - lijit.com + + SteelHouse: + domains: + - steelhousemedia.com + + StickyADS.tv: + domains: + - stickyadstv.com + - sfx.stickyadstv.com + + Taboola: + domains: + - trc.taboola.com + - api.taboola.com + - taboola.com + + Tribal Fusion: + domains: + - cdnx.tribalfusion.com + + White Pages: + domains: + - www.whitepages.com.au + - mobile.whitepages.com.au + + Yieldmo: + domains: + - yieldmo.com + + ZEDO: + domains: + - zedo.com + - z1.zedo.com From 4f1d8c7e4f98f40211e2835e3e3b4969559fc82d Mon Sep 17 00:00:00 2001 From: Robert Kingston Date: Sat, 6 Aug 2016 18:44:58 +1000 Subject: [PATCH 05/15] Updating search and mail referrers list - Adding some ANZ's largest ISPs' web mail domains and search engine domains (Dodo, Telstra, Optus, 2degrees, iiNet, Virgin, Vodafone etc) - Chinese Soso search engine merged under Sogou - Various other search engines added (SosoDesk - unrelated to Soso) - Moved a bunch of domains into alphabetical order to make management of the list a little easier in future --- resources/referers.yml | 149 ++++++++++++++++++++++++++++++++++++----- 1 file changed, 134 insertions(+), 15 deletions(-) diff --git a/resources/referers.yml b/resources/referers.yml index 9166fb21..619b3c77 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -68,6 +68,14 @@ email: domains: - mail.163.com + 2degrees: + domains: + - 
webmail.2degreesbroadband.co.nz + + Adam Internet: + domains: + - webmail.adam.com.au + AOL Mail: domains: - mail.aol.com @@ -76,22 +84,60 @@ email: domains: - webmail.bigpond.com - webmail2.bigpond.com + - email.telstra.com + - basic.messaging.bigpond.com + + Commander: + domains: + - webmail.commander.net.au Daum Mail: domains: - mail2.daum.net + - mail.daum.net + + Dodo: + domains: + - webmail.dodo.com.au + + Freenet: + domains: + - webmail.freenet.de Gmail: domains: - mail.google.com + - inbox.google.com + + iiNet: + domains: + - webmail.iinet.net.au + - mail.iinet.net.au + + Inbox.com: + domains: + - inbox.com + + iPrimus: + domains: + - webmail.iprimus.com.au + + Mynet Mail: + domains: + - mail.mynet.com Naver Mail: domains: - mail.naver.com + Netspace: + domains: + - webmail.netspace.net.au + Optus Zoo: domains: - - webmail.optuszoo.com.au + - webmail.optuszoo.com.au + - webmail.optusnet.com.au Orange Webmail: domains: @@ -108,7 +154,19 @@ email: Seznam Mail: domains: - - email.seznam.cz + - email.seznam.cz + + Virgin: + domains: + - webmail.virginbroadband.com.au + + Vodafone: + domains: + - webmail.vodafone.co.nz + + Westnet: + domains: + - webmail.westnet.com.au Yahoo! 
Mail: domains: @@ -116,11 +174,10 @@ email: - mail.yahoo.com - mail.yahoo.co.uk - mail.yahoo.co.jp - - Mynet Mail: - domains: - - mail.mynet.com + Zoho: + domains: + - mail.zoho.com # ####################################################################################################### # @@ -417,31 +474,31 @@ social: ITU Sozluk: domains: - itusozluk.com - + Instela: domains: - instela.com - + Eksi Sozluk: domains: - Sozluk.com - sourtimes.org - + Uludag Sozluk: domains: - uludagsozluk.com - ulusozluk.com - + Inci Sozluk: domains: - inci.sozlukspot.com - incisozluk.com - incisozluk.cc - + Hocam.com: domains: - hocam.com - + Donanimhaber: domains: - donanimhaber.com @@ -456,6 +513,10 @@ social: domains: - quora.com + Whirlpool: + domains: + - forums.whirlpool.net.au + # ####################################################################################################### # # SEARCH PROVIDERS @@ -470,6 +531,12 @@ search: # 123people TODO + 1&1: + parameters: + - q + domains: + - search.1and1.com + 1und1: parameters: - su @@ -741,6 +808,12 @@ search: domains: - search.bluewin.ch + British Telecommunications: + parameters: + - p + domains: + - search.bt.com + canoe.ca: parameters: - q @@ -858,6 +931,12 @@ search: - dmoz.org - editors.dmoz.org + Dodo: + parameters: + - q + domains: + - google.dodo.com.au + DuckDuckGo: parameters: - q @@ -940,6 +1019,12 @@ search: domains: - recherche.francite.com + Finderoo: + parameters: + - q + domains: + - www.finderoo.com + Findwide: parameters: - k @@ -2770,6 +2855,12 @@ search: domains: - www.ilse.nl + Inbox.com: + parameters: + - q + domains: + - inbox.com/search/ + InfoSpace: parameters: - q @@ -2789,6 +2880,12 @@ search: - search.searchcompletion.com - clusty.com + Flyingbird: + parameters: + - q + domains: + - inspsearch.com + Interia: parameters: - q @@ -3146,6 +3243,12 @@ search: # Add Scour.com + Search This: + parameters: + - q + domains: + - www.searchthis.com + Search.com: parameters: - q @@ -3196,11 +3299,20 @@ search: 
domains: - www.skynet.be + The Smart Search: + parameters: + - q + domains: + - thesmartsearch.net + - www.thesmartsearch.net + Sogou: parameters: - query + - w domains: - www.sougou.com + - www.soso.com Softonic: parameters: @@ -3208,11 +3320,12 @@ search: domains: - search.softonic.com - soso.com: + SoSoDesk: parameters: - - w + - q domains: - - www.soso.com + - sosodesktop.com + - search.sosodesktop.com Snapdo: parameters: @@ -3262,6 +3375,12 @@ search: domains: - technorati.com + Telstra: + parameters: + - find + domains: + - search.media.telstra.com.au + Teoma: parameters: - q From 331a55e62a16b44e1e1a59e30494f8f6c56a6b36 Mon Sep 17 00:00:00 2001 From: Victor Chima Date: Mon, 25 Jul 2016 17:51:45 +0200 Subject: [PATCH 06/15] Removed duplicate domains from referers.yml file --- resources/referers.yml | 20 ++------------------ 1 file changed, 2 insertions(+), 18 deletions(-) diff --git a/resources/referers.yml b/resources/referers.yml index 619b3c77..7bb4e9f1 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -30,7 +30,6 @@ unknown: - sites.google.com - groups.google.com - groups.google.co.uk - - news.google.co.uk Yahoo!: domains: @@ -424,7 +423,7 @@ social: Buzznet: domains: - - wayn.com + - buzznet.com Multiply: domains: @@ -1254,7 +1253,6 @@ search: - www.google.jo - www.google.co.jp - www.google.co.ke - - www.google.com.kh - www.google.ki - www.google.kg - www.google.co.kr @@ -1451,7 +1449,6 @@ search: - google.jo - google.co.jp - google.co.ke - - google.com.kh - google.ki - google.kg - google.co.kr @@ -1665,7 +1662,6 @@ search: - blogsearch.google.com.hk - blogsearch.google.com.jm - blogsearch.google.com.kh - - blogsearch.google.com.kh - blogsearch.google.com.kw - blogsearch.google.com.lb - blogsearch.google.com.lc @@ -2063,7 +2059,6 @@ search: - images.google.com.hk - images.google.com.jm - images.google.com.kh - - images.google.com.kh - images.google.com.kw - images.google.com.lb - images.google.com.lc @@ -2183,7 +2178,6 @@ search: - 
images.google.us - images.google.vg - images.google.vu - - images.google.ws Google News: parameters: @@ -2265,7 +2259,6 @@ search: - news.google.com.hk - news.google.com.jm - news.google.com.kh - - news.google.com.kh - news.google.com.kw - news.google.com.lb - news.google.com.lc @@ -2467,7 +2460,6 @@ search: - google.com.hk/products - google.com.jm/products - google.com.kh/products - - google.com.kh/products - google.com.kw/products - google.com.lb/products - google.com.lc/products @@ -2664,7 +2656,6 @@ search: - www.google.com.hk/products - www.google.com.jm/products - www.google.com.kh/products - - www.google.com.kh/products - www.google.com.kw/products - www.google.com.lb/products - www.google.com.lc/products @@ -3186,7 +3177,7 @@ search: parameters: - q domains: - - www.plazoo.com + - poisk.ru PriceRunner: parameters: @@ -3588,8 +3579,6 @@ search: - es.search.yahoo.com - es.yahoo.com - espanol.searchpanol.yahoo.com - - espanol.searchpanol.yahoo.com - - espanol.yahoo.com - espanol.yahoo.com - fr.search.yahoo.com - fr.yahoo.com @@ -3608,15 +3597,10 @@ search: - one.cn.yahoo.com - one.searchn.yahoo.com - qc.search.yahoo.com - - qc.search.yahoo.com - - qc.search.yahoo.com - - qc.yahoo.com - qc.yahoo.com - se.search.yahoo.com - - se.search.yahoo.com - se.yahoo.com - search.searcharch.yahoo.com - - search.yahoo.com - uk.search.yahoo.com - uk.yahoo.com - www.yahoo.co.jp From 55850229edfed8dfe623c15b9ee0794687a617dc Mon Sep 17 00:00:00 2001 From: "Andriy Kushnir (Orhideous)" Date: Tue, 24 May 2016 13:15:13 +0300 Subject: [PATCH 07/15] Add two popular ukrainian search providers: ukr.net and i.ua --- resources/referers.yml | 12 ++++++++++++ 1 file changed, 12 insertions(+) diff --git a/resources/referers.yml b/resources/referers.yml index 7bb4e9f1..1a033718 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -2889,6 +2889,12 @@ search: domains: - start.iplay.com + I.ua: + parameters: + - q + domains: + - search.i.ua + IXquick: parameters: - query @@ 
-3440,6 +3446,12 @@ search: domains: - www.twingly.com + UKR.net: + parameters: + - q + domains: + - search.ukr.net + uol.com.br: parameters: - q From 44615307eb22be1f01ef4f2dfa0d48eadccdb79e Mon Sep 17 00:00:00 2001 From: "Andriy Kushnir (Orhideous)" Date: Tue, 24 May 2016 13:15:47 +0300 Subject: [PATCH 08/15] Add belarusian search provider: tut.by --- resources/referers.yml | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/resources/referers.yml b/resources/referers.yml index 1a033718..f15e7215 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -3440,6 +3440,12 @@ search: domains: - www.trusted--search.com + Tut.by: + parameters: + - query + domains: + - search.tut.by + Twingly: parameters: - q From 519dadb53c72f64831cd9e6865c812579fdaded0 Mon Sep 17 00:00:00 2001 From: Alex Dean Date: Mon, 12 Jun 2017 00:32:46 +0300 Subject: [PATCH 09/15] Added kununu --- resources/referers.yml | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/resources/referers.yml b/resources/referers.yml index f15e7215..e7dd5f81 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -2944,6 +2944,12 @@ search: domains: - www.kvasir.no + kununu: + parameters: + - q + domains: + - kununu.com + Latne: parameters: - q From 54faaa1dad8b0097594462e63f35e5f3e08f5b03 Mon Sep 17 00:00:00 2001 From: Alex Dean Date: Mon, 12 Jun 2017 00:35:57 +0300 Subject: [PATCH 10/15] Add t.umblr domain to Tumblr --- resources/referers.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/resources/referers.yml b/resources/referers.yml index e7dd5f81..47c10621 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -400,6 +400,7 @@ social: Tumblr: domains: - tumblr.com + - t.umblr.com Nasza-klasa.pl: domains: From 9baaa2012467f4198ee96eb675b35c1d41bda85c Mon Sep 17 00:00:00 2001 From: jobartim44 Date: Mon, 4 Jan 2016 10:32:22 +0100 Subject: [PATCH 11/15] Update referers.yml MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 
Add different search engines found on our websites. --- resources/referers.yml | 12 ++++++++++++ 1 file changed, 12 insertions(+) diff --git a/resources/referers.yml b/resources/referers.yml index 47c10621..7af31043 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -636,6 +636,7 @@ search: - www.aolimages.aol.fr - aim.search.aol.com - www.recherche.aol.fr + - recherche.aol.fr - find.web.aol.com - recherche.aol.ca - aolsearch.aol.co.uk @@ -757,6 +758,7 @@ search: - tieba.baidu.com - news.baidu.com - web.gougou.com + - m.baidu.com Biglobe: parameters: @@ -1334,6 +1336,7 @@ search: - www.google.tm - www.google.to - www.google.com.tn + - www.google.tn - www.google.com.tr - www.google.tt - www.google.com.tw @@ -1551,6 +1554,7 @@ search: - google.co.za - google.co.zm - google.co.zw + - google.tn # powered by Google - search.avg.com - isearch.avg.com @@ -3158,9 +3162,11 @@ search: Orange: parameters: - q + - kw domains: - busca.orange.es - search.orange.co.uk + - lemoteur.orange.fr Paperball: parameters: @@ -3500,6 +3506,12 @@ search: - ricercanews.virgilio.it - mobile.virgilio.it + Vi-view + parameters: + - q + domains: + - viview.inspsearch.com + Voila: parameters: - rdata From e1fa00fc4b974dac0f29451b8b399315f1afcc95 Mon Sep 17 00:00:00 2001 From: Alex Dean Date: Mon, 12 Jun 2017 14:21:30 +0300 Subject: [PATCH 12/15] Moved Vi-view under Flyingbird --- resources/referers.yml | 7 +------ 1 file changed, 1 insertion(+), 6 deletions(-) diff --git a/resources/referers.yml b/resources/referers.yml index 7af31043..35577b65 100644 --- a/resources/referers.yml +++ b/resources/referers.yml @@ -2881,6 +2881,7 @@ search: - q domains: - inspsearch.com + - viview.inspsearch.com Interia: parameters: @@ -3506,12 +3507,6 @@ search: - ricercanews.virgilio.it - mobile.virgilio.it - Vi-view - parameters: - - q - domains: - - viview.inspsearch.com - Voila: parameters: - rdata From 57d9946874b4bb083a3d49d5cf415d43b6167488 Mon Sep 17 00:00:00 2001 From: Alex Dean Date: Mon,
12 Jun 2017 13:47:37 +0300 Subject: [PATCH 13/15] Documentation: correct authors in README (close #148) --- README.md | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/README.md b/README.md index 3cd568a1..91d353f8 100644 --- a/README.md +++ b/README.md @@ -12,7 +12,7 @@ _Note that we always use the original HTTP misspelling of 'referer' (and thus 'r * Java/Scala: [Snowplow Analytics Ltd] [snowplow-analytics] * Ruby: [Kelley Reynolds] [kreynolds] at Inside Systems, Inc -* Python: [Don Spaulding] [donspaulding] +* Python: [Don Spaulding] [donspaulding] * node.js (JavaScript): [Martin Katrenik] [mkatrenik] * .NET (C#): [Sepp Wijnands] [swijnands] at [iPerform Software] [iperform] * PHP: [Lars Strojny] [lstrojny] @@ -299,9 +299,9 @@ The node.js (JavaScript) port is copyright 2013-2014 [Martin Katrenik] [mkatreni The .NET (C#) port is copyright 2013-2014 [iPerform Software] [iperform] and is available under the [Apache License, Version 2.0] [apache-license]. -The PHP port is copyright 2013-2014 [Lars Strojny] [tsileo] and is available under the [MIT License] [mit-license]. +The PHP port is copyright 2013-2014 [Lars Strojny] [lstrojny] and is available under the [MIT License] [mit-license]. -The Go port is copyright 2014 [Thomas Sileo] [lstrojny] and is available under the [MIT License] [mit-license]. +The Go port is copyright 2014 [Thomas Sileo] [tsileo] and is available under the [MIT License] [mit-license]. 
[ua-parser]: https://github.com/tobie/ua-parser From 81fbf6892ebe6393dec3a195b19f0e0b8f84fabc Mon Sep 17 00:00:00 2001 From: Alex Dean Date: Mon, 12 Jun 2017 14:44:39 +0300 Subject: [PATCH 14/15] Documentation: add new section about hosted database (close #150) --- README.md | 16 +++++++++++++++- 1 file changed, 15 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 91d353f8..c8eb6884 100644 --- a/README.md +++ b/README.md @@ -2,12 +2,26 @@ Java/Scala: [![Build Status](https://travis-ci.org/snowplow/referer-parser.png)](https://travis-ci.org/snowplow/referer-parser) -referer-parser is a multi-language library for extracting marketing attribution data (such as search terms) from referer URLs, inspired by the [ua-parser] [ua-parser] project (an equivalent library for user agent parsing). +referer-parser is a database for extracting marketing attribution data (such as search terms) from referer URLs, inspired by the [ua-parser] [ua-parser] project (an equivalent library for user agent parsing). + +The referer-parser project also contains multiple libraries for working with the referer-parser database in different languages. referer-parser is a core component of [Snowplow] [snowplow], the open-source web-scale analytics platform powered by Hadoop and Redshift. _Note that we always use the original HTTP misspelling of 'referer' (and thus 'referal') in this project - never 'referrer'._ +## Database + +The latest database is always available on this URL: + +https://s3-eu-west-1.amazonaws.com/snowplow-hosted-assets/third-party/referer-parser/referers-latest.yml + +The database is updated at most once a month. Each new version of the database is also uploaded with a timestamp: + +https://s3-eu-west-1.amazonaws.com/snowplow-hosted-assets/third-party/referer-parser/referers-YYYY-MM.yml + +If there is an issue with the database necessitating a re-release within the month, the corresponding files will be overwritten. 
+ ## Maintainers * Java/Scala: [Snowplow Analytics Ltd] [snowplow-analytics] From e78a6521efd334d7f07ad9495cdbef97030509a7 Mon Sep 17 00:00:00 2001 From: Alex Dean Date: Mon, 12 Jun 2017 14:46:20 +0300 Subject: [PATCH 15/15] Prepared for release --- CHANGELOG | 17 +++++++++++++++++ 1 file changed, 17 insertions(+) create mode 100644 CHANGELOG diff --git a/CHANGELOG b/CHANGELOG new file mode 100644 index 00000000..4cacd6a7 --- /dev/null +++ b/CHANGELOG @@ -0,0 +1,17 @@ +Release June 2017 (2017-06-12) +------------------------------ +Documentation: correct authors in README (#148) +Documentation: add new section about hosted database (#150) +Database: add preliminary list of paid sources +Database: add some of ANZ's largest ISPs' web mail domains and search engine domains (Dodo, Telstra, Optus, 2degrees, iiNet, Virgin, Vodafone etc.) +Database: add various other search engines (SosoDesk - unrelated to Soso) +Database: add Ukrainian search providers ukr.net and i.ua +Database: add Belarusian search provider tut.by +Database: add kununu +Database: add outlook.live.com to list of Outlook.com email referers +Database: add t.umblr.com domain to Tumblr +Database: merge Chinese Soso search engine under Sogou +Database: fix indentation of ITU Sozluk +Database: remove duplicated domains and keys (e.g. Comcast) +Database: move Taboola and Outbrain from "unknown" section to paid sources +Database: move some domains into alphabetical order