Skip to content

Commit edc9fb1

Browse files
committed
exclude android.clients.google.com
1 parent 220d0b8 commit edc9fb1

3 files changed

Lines changed: 10 additions & 10 deletions

File tree

sql/2025/privacy/tracker_distribution.sql

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -26,14 +26,14 @@ tracker_counts AS (
2626
root_page,
2727
COUNT(DISTINCT tracker) AS number_of_trackers
2828
FROM `httparchive.crawl.requests`
29-
JOIN whotracksme
29+
LEFT JOIN whotracksme
3030
ON
3131
NET.HOST(url) = domain OR
3232
ENDS_WITH(NET.HOST(url), CONCAT('.', domain))
3333
WHERE
34-
date = '2025-07-01' AND
35-
--rank = 1000 AND
36-
NOT ENDS_WITH('.' || NET.HOST(root_page), '.' || NET.HOST(url)) -- third-party
34+
date = '2025-07-01'
35+
--AND rank = 1000
36+
AND url NOT IN ('https://android.clients.google.com/checkin', 'https://android.clients.google.com/c2dm/register3')
3737
GROUP BY
3838
client,
3939
root_page

sql/2025/privacy/whotracksme_categories_top.sql

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -30,8 +30,8 @@ tracker_categories AS (
3030
ENDS_WITH(NET.HOST(url), CONCAT('.', domain))
3131
)
3232
WHERE
33-
date = '2025-07-01' AND
34-
NOT ENDS_WITH('.' || NET.HOST(root_page), '.' || NET.HOST(url)) -- third party
33+
date = '2025-07-01'
34+
AND url NOT IN ('https://android.clients.google.com/checkin', 'https://android.clients.google.com/c2dm/register3')
3535
),
3636

3737
aggregated AS (
@@ -63,4 +63,4 @@ FROM aggregated
6363
FOR client IN ('desktop', 'mobile')
6464
)
6565
|> RENAME pct_mobile AS mobile, pct_desktop AS desktop
66-
|> ORDER BY websites_count_desktop + websites_count_mobile DESC
66+
|> ORDER BY COALESCE(websites_count_desktop, 0) + COALESCE(websites_count_mobile, 0) DESC

sql/2025/privacy/whotracksme_trackers_top.sql

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -22,8 +22,8 @@ FROM `httparchive.crawl.requests`
2222
ON NET.HOST(url) = domain OR
2323
ENDS_WITH(NET.HOST(url), '.' || domain)
2424
|> WHERE
25-
date = '2025-07-01' AND
26-
NOT ENDS_WITH('.' || NET.HOST(root_page), '.' || NET.HOST(url)) -- third party
25+
date = '2025-07-01'
26+
AND url NOT IN ('https://android.clients.google.com/checkin', 'https://android.clients.google.com/c2dm/register3')
2727
|> AGGREGATE COUNT(DISTINCT root_page) AS number_of_websites GROUP BY client, tracker
2828
|> JOIN base_totals USING (client)
2929
|> EXTEND number_of_websites / total_websites AS pct_websites
@@ -34,4 +34,4 @@ FROM `httparchive.crawl.requests`
3434
FOR client IN ('desktop', 'mobile')
3535
)
3636
|> RENAME pct_mobile AS mobile, pct_desktop AS desktop
37-
|> ORDER BY websites_count_desktop + websites_count_mobile DESC
37+
|> ORDER BY COALESCE(websites_count_desktop, 0) + COALESCE(websites_count_mobile, 0) DESC

0 commit comments

Comments
 (0)