<?xml version="1.0" encoding="UTF-8"?>
<!-- generator="FeedCreator 1.8" -->
<?xml-stylesheet href="https://measuretheweb.org/lib/exe/css.php?s=feed" type="text/css"?>
<rdf:RDF
    xmlns="http://purl.org/rss/1.0/"
    xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
    xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
    xmlns:dc="http://purl.org/dc/elements/1.1/">
    <channel rdf:about="https://measuretheweb.org/feed.php">
        <title>Measure The Web</title>
        <description></description>
        <link>https://measuretheweb.org/</link>
        <image rdf:resource="https://measuretheweb.org/_media/wiki/dokuwiki.svg" />
       <dc:date>2026-04-21T10:19:27+00:00</dc:date>
        <items>
            <rdf:Seq>
                <rdf:li rdf:resource="https://measuretheweb.org/start?rev=1774597921&amp;do=diff"/>
                <rdf:li rdf:resource="https://measuretheweb.org/programming/similarweb?rev=1774344851&amp;do=diff"/>
                <rdf:li rdf:resource="https://measuretheweb.org/privacy/requests?rev=1759994294&amp;do=diff"/>
                <rdf:li rdf:resource="https://measuretheweb.org/design/website_classification?rev=1750668644&amp;do=diff"/>
                <rdf:li rdf:resource="https://measuretheweb.org/research_journey?rev=1742380570&amp;do=diff"/>
                <rdf:li rdf:resource="https://measuretheweb.org/writing/conferences?rev=1742380068&amp;do=diff"/>
                <rdf:li rdf:resource="https://measuretheweb.org/programming/interaction?rev=1742374311&amp;do=diff"/>
                <rdf:li rdf:resource="https://measuretheweb.org/literature/bibliography?rev=1742373423&amp;do=diff"/>
                <rdf:li rdf:resource="https://measuretheweb.org/programming/stateful_stateless?rev=1742307641&amp;do=diff"/>
                <rdf:li rdf:resource="https://measuretheweb.org/design/archives?rev=1742306852&amp;do=diff"/>
                <rdf:li rdf:resource="https://measuretheweb.org/playground/playground?rev=1742306770&amp;do=diff"/>
                <rdf:li rdf:resource="https://measuretheweb.org/?image=privacy%3Aprivacy_cookies_cookieblock_vs_cookiepedia.png&amp;ns=privacy&amp;rev=1736271935&amp;tab_details=history&amp;media_do=diff&amp;do=media"/>
                <rdf:li rdf:resource="https://measuretheweb.org/?image=wiki%3Aprivacy%3Aprivacy_adgraph_performance_lists_iqbal2020_adgraph.png&amp;ns=wiki%3Aprivacy&amp;rev=1735924136&amp;tab_details=history&amp;media_do=diff&amp;do=media"/>
                <rdf:li rdf:resource="https://measuretheweb.org/?image=privacy%3Aprivacy_adgraph_performance_lists_iqbal2020_adgraph.png&amp;ns=privacy&amp;rev=1735924040&amp;tab_details=history&amp;media_do=diff&amp;do=media"/>
                <rdf:li rdf:resource="https://measuretheweb.org/?image=design%3Awebsite_ranking_list_popularity_scheitle2018.png&amp;ns=design&amp;rev=1735838037&amp;tab_details=history&amp;media_do=diff&amp;do=media"/>
                <rdf:li rdf:resource="https://measuretheweb.org/?image=design%3Awebsite_ranking_list_popularity_xie2022.png&amp;ns=design&amp;rev=1735838036&amp;tab_details=history&amp;media_do=diff&amp;do=media"/>
                <rdf:li rdf:resource="https://measuretheweb.org/?image=design%3Awebsite_classification_coverage_vallina2020.png&amp;ns=design&amp;rev=1735838030&amp;tab_details=history&amp;media_do=diff&amp;do=media"/>
                <rdf:li rdf:resource="https://measuretheweb.org/?image=design%3Awebsite_classification_popularity_vallina2020.png&amp;ns=design&amp;rev=1735838030&amp;tab_details=history&amp;media_do=diff&amp;do=media"/>
                <rdf:li rdf:resource="https://measuretheweb.org/?image=design%3Awebsite_ranking_list_manipulations_lepochat2019.png&amp;ns=design&amp;rev=1735838029&amp;tab_details=history&amp;media_do=diff&amp;do=media"/>
            </rdf:Seq>
        </items>
    </channel>
    <image rdf:about="https://measuretheweb.org/_media/wiki/dokuwiki.svg">
        <title>Measure The Web</title>
        <link>https://measuretheweb.org/</link>
        <url>https://measuretheweb.org/_media/wiki/dokuwiki.svg</url>
    </image>
    <item rdf:about="https://measuretheweb.org/start?rev=1774597921&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2026-03-27T07:52:01+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>start - [Outline] </title>
        <link>https://measuretheweb.org/start?rev=1774597921&amp;do=diff</link>
        <description>Welcome to Measure The Web

Empirical studies on the web require researchers to navigate a complex landscape of experimental design choices, ranging from selecting a representative sample of websites to choosing the appropriate crawling technology. Similarly, analyzing results involves critical decisions, such as website categorization and statistical methodology. Too often, these decisions are made based on limited guidance, informal advice, or trial and error, despite their profound impact on …</description>
    </item>
    <item rdf:about="https://measuretheweb.org/programming/similarweb?rev=1774344851&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2026-03-24T09:34:11+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>similarweb - Updated API against blocking</title>
        <link>https://measuretheweb.org/programming/similarweb?rev=1774344851&amp;do=diff</link>
        <description>While official API use is paid, Similarweb offers a browser extension, which uses an internal API to retrieve data. 

Methodology for Code Reproduction

To update the scraper logic when Similarweb changes their verification, follow these steps:

	*    Install the extension in a Chromium-based browser.</description>
    </item>
    <item rdf:about="https://measuretheweb.org/privacy/requests?rev=1759994294&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2025-10-09T07:18:14+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>requests - [Programming: Using Lists] added adblock-rust</title>
        <link>https://measuretheweb.org/privacy/requests?rev=1759994294&amp;do=diff</link>
        <description>Classifying Web Requests

A common task in web privacy measurements is to determine which web requests correspond to the benign loading of required web resources and which are used to track users. There are two main methods for such classification: matching requests against crowd-sourced lists (typically used in ad-blocking or tracking protection extensions) or using machine learning (</description>
    </item>
    <item rdf:about="https://measuretheweb.org/design/website_classification?rev=1750668644&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2025-06-23T08:50:44+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>website_classification - [Adult Websites, Security, and Privacy Protection] </title>
        <link>https://measuretheweb.org/design/website_classification?rev=1750668644&amp;do=diff</link>
        <description>Overview

Similarly to Website Selection, also the classification of websites according to their topic, properties of their companies (industry type, employees count) is often important step in results processing of web measurement studies. Awareness of the available services, their capabilities but also limitations is essential for high-quality research.</description>
    </item>
    <item rdf:about="https://measuretheweb.org/research_journey?rev=1742380570&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2025-03-19T10:36:10+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>research_journey - new links</title>
        <link>https://measuretheweb.org/research_journey?rev=1742380570&amp;do=diff</link>
        <description>Research Journey

At the moment, this page is WiP and only relevant to automated measurements. Maybe we have to create the same page for manual studies (I am not covering them at the wiki at all now). The plan is that each point links to some page.</description>
    </item>
    <item rdf:about="https://measuretheweb.org/writing/conferences?rev=1742380068&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2025-03-19T10:27:48+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>conferences - created</title>
        <link>https://measuretheweb.org/writing/conferences?rev=1742380068&amp;do=diff</link>
        <description>Conferences and Journals

This page should outline list of publication venues suitable for web measurement studies, typically with focus on security or privacy.

URLs to conferences were up to date in 2025, but year of conference is often embedded in the link and can be easily updated.</description>
    </item>
    <item rdf:about="https://measuretheweb.org/programming/interaction?rev=1742374311&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2025-03-19T08:51:51+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>interaction - Links and references</title>
        <link>https://measuretheweb.org/programming/interaction?rev=1742374311&amp;do=diff</link>
        <description>Interaction with website

This page only contains notes

Topics to cover (in separate pages):

	*  Input into website forms
	*  Interacting with consent
	*  Stateful and stateless crawling
		*  Urban et al.  studied crawling only index pages vs crawling multiple subpages of a website, showing significant increase in third-party requests and cookies when you browse also subpages. From 10 visited subpages is increase small.</description>
    </item>
    <item rdf:about="https://measuretheweb.org/literature/bibliography?rev=1742373423&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2025-03-19T08:37:03+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>bibliography - Polishing archives papers + new papers for website interaction topics</title>
        <link>https://measuretheweb.org/literature/bibliography?rev=1742373423&amp;do=diff</link>
        <description></description>
    </item>
    <item rdf:about="https://measuretheweb.org/programming/stateful_stateless?rev=1742307641&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2025-03-18T14:20:41+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>stateful_stateless - filled with references</title>
        <link>https://measuretheweb.org/programming/stateful_stateless?rev=1742307641&amp;do=diff</link>
        <description>Stateful and Stateless Crawling

This page only contains notes

Key message:

	*  Majority of web measurements studies use stateless crawls, as it is easy to associate events with the single browsed visited website. Also, stateless crawls do not depend on crawling order and are easier to parallelize.</description>
    </item>
    <item rdf:about="https://measuretheweb.org/design/archives?rev=1742306852&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2025-03-18T14:07:32+00:00</dc:date>
        <dc:creator>archives (archives@undisclosed.example.com)</dc:creator>
        <title>archives</title>
        <link>https://measuretheweb.org/design/archives?rev=1742306852&amp;do=diff</link>
        <description>Use of web archives for research

Various researchers have utilized web archives for longitudinal analyses of privacy  and security features . 
Using archives for research have several advantages. Their use helps towards solving the issue of reproducibility of research, given that a static snapshot is used for each page visit. It also eliminates the need to write project-specific crawlers. However, there are a number of pitfalls associated with the use of archives. Additionally, there are numero…</description>
    </item>
    <item rdf:about="https://measuretheweb.org/playground/playground?rev=1742306770&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2025-03-18T14:06:10+00:00</dc:date>
        <dc:creator>archives (archives@undisclosed.example.com)</dc:creator>
        <title>playground - removed</title>
        <link>https://measuretheweb.org/playground/playground?rev=1742306770&amp;do=diff</link>
        <description>PlayGround</description>
    </item>
    <item rdf:about="https://measuretheweb.org/?image=privacy%3Aprivacy_cookies_cookieblock_vs_cookiepedia.png&amp;ns=privacy&amp;rev=1736271935&amp;tab_details=history&amp;media_do=diff&amp;do=media">
        <dc:format>text/html</dc:format>
        <dc:date>2025-01-07T17:45:35+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>privacy_cookies_cookieblock_vs_cookiepedia.png - created</title>
        <link>https://measuretheweb.org/?image=privacy%3Aprivacy_cookies_cookieblock_vs_cookiepedia.png&amp;ns=privacy&amp;rev=1736271935&amp;tab_details=history&amp;media_do=diff&amp;do=media</link>
        <description>&lt;img src=&quot;https://measuretheweb.org/_media/privacy/privacy_cookies_cookieblock_vs_cookiepedia.png?w=500&amp;amp;h=500&amp;amp;tok=fc904a&quot; alt=&quot;privacy_cookies_cookieblock_vs_cookiepedia.png&quot; loading=&quot;lazy&quot; width=&quot;500&quot; height=&quot;500&quot; /&gt;</description>
    </item>
    <item rdf:about="https://measuretheweb.org/?image=wiki%3Aprivacy%3Aprivacy_adgraph_performance_lists_iqbal2020_adgraph.png&amp;ns=wiki%3Aprivacy&amp;rev=1735924136&amp;tab_details=history&amp;media_do=diff&amp;do=media">
        <dc:format>text/html</dc:format>
        <dc:date>2025-01-03T17:08:56+00:00</dc:date>
        <dc:creator>admin (admin@undisclosed.example.com)</dc:creator>
        <title>privacy_adgraph_performance_lists_iqbal2020_adgraph.png - removed</title>
        <link>https://measuretheweb.org/?image=wiki%3Aprivacy%3Aprivacy_adgraph_performance_lists_iqbal2020_adgraph.png&amp;ns=wiki%3Aprivacy&amp;rev=1735924136&amp;tab_details=history&amp;media_do=diff&amp;do=media</link>
        <description>&lt;img src=&quot;https://measuretheweb.org/_media/wiki/privacy/privacy_adgraph_performance_lists_iqbal2020_adgraph.png?w=500&amp;amp;h=500&amp;amp;tok=8dc038&quot; alt=&quot;privacy_adgraph_performance_lists_iqbal2020_adgraph.png&quot; loading=&quot;lazy&quot; width=&quot;500&quot; height=&quot;500&quot; /&gt;</description>
    </item>
    <item rdf:about="https://measuretheweb.org/?image=privacy%3Aprivacy_adgraph_performance_lists_iqbal2020_adgraph.png&amp;ns=privacy&amp;rev=1735924040&amp;tab_details=history&amp;media_do=diff&amp;do=media">
        <dc:format>text/html</dc:format>
        <dc:date>2025-01-03T17:07:20+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>privacy_adgraph_performance_lists_iqbal2020_adgraph.png - created</title>
        <link>https://measuretheweb.org/?image=privacy%3Aprivacy_adgraph_performance_lists_iqbal2020_adgraph.png&amp;ns=privacy&amp;rev=1735924040&amp;tab_details=history&amp;media_do=diff&amp;do=media</link>
        <description>&lt;img src=&quot;https://measuretheweb.org/_media/privacy/privacy_adgraph_performance_lists_iqbal2020_adgraph.png?w=500&amp;amp;h=500&amp;amp;tok=d3576d&quot; alt=&quot;privacy_adgraph_performance_lists_iqbal2020_adgraph.png&quot; loading=&quot;lazy&quot; width=&quot;500&quot; height=&quot;500&quot; /&gt;</description>
    </item>
    <item rdf:about="https://measuretheweb.org/?image=design%3Awebsite_ranking_list_popularity_scheitle2018.png&amp;ns=design&amp;rev=1735838037&amp;tab_details=history&amp;media_do=diff&amp;do=media">
        <dc:format>text/html</dc:format>
        <dc:date>2025-01-02T17:13:57+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>website_ranking_list_popularity_scheitle2018.png - created</title>
        <link>https://measuretheweb.org/?image=design%3Awebsite_ranking_list_popularity_scheitle2018.png&amp;ns=design&amp;rev=1735838037&amp;tab_details=history&amp;media_do=diff&amp;do=media</link>
        <description>&lt;img src=&quot;https://measuretheweb.org/_media/design/website_ranking_list_popularity_scheitle2018.png?w=500&amp;amp;h=500&amp;amp;tok=f313a7&quot; alt=&quot;website_ranking_list_popularity_scheitle2018.png&quot; loading=&quot;lazy&quot; width=&quot;500&quot; height=&quot;500&quot; /&gt;</description>
    </item>
    <item rdf:about="https://measuretheweb.org/?image=design%3Awebsite_ranking_list_popularity_xie2022.png&amp;ns=design&amp;rev=1735838036&amp;tab_details=history&amp;media_do=diff&amp;do=media">
        <dc:format>text/html</dc:format>
        <dc:date>2025-01-02T17:13:56+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>website_ranking_list_popularity_xie2022.png - created</title>
        <link>https://measuretheweb.org/?image=design%3Awebsite_ranking_list_popularity_xie2022.png&amp;ns=design&amp;rev=1735838036&amp;tab_details=history&amp;media_do=diff&amp;do=media</link>
        <description>&lt;img src=&quot;https://measuretheweb.org/_media/design/website_ranking_list_popularity_xie2022.png?w=500&amp;amp;h=500&amp;amp;tok=24e12f&quot; alt=&quot;website_ranking_list_popularity_xie2022.png&quot; loading=&quot;lazy&quot; width=&quot;500&quot; height=&quot;500&quot; /&gt;</description>
    </item>
    <item rdf:about="https://measuretheweb.org/?image=design%3Awebsite_classification_coverage_vallina2020.png&amp;ns=design&amp;rev=1735838030&amp;tab_details=history&amp;media_do=diff&amp;do=media">
        <dc:format>text/html</dc:format>
        <dc:date>2025-01-02T17:13:50+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>website_classification_coverage_vallina2020.png - created</title>
        <link>https://measuretheweb.org/?image=design%3Awebsite_classification_coverage_vallina2020.png&amp;ns=design&amp;rev=1735838030&amp;tab_details=history&amp;media_do=diff&amp;do=media</link>
        <description>&lt;img src=&quot;https://measuretheweb.org/_media/design/website_classification_coverage_vallina2020.png?w=500&amp;amp;h=500&amp;amp;tok=197176&quot; alt=&quot;website_classification_coverage_vallina2020.png&quot; loading=&quot;lazy&quot; width=&quot;500&quot; height=&quot;500&quot; /&gt;</description>
    </item>
    <item rdf:about="https://measuretheweb.org/?image=design%3Awebsite_classification_popularity_vallina2020.png&amp;ns=design&amp;rev=1735838030&amp;tab_details=history&amp;media_do=diff&amp;do=media">
        <dc:format>text/html</dc:format>
        <dc:date>2025-01-02T17:13:50+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>website_classification_popularity_vallina2020.png - created</title>
        <link>https://measuretheweb.org/?image=design%3Awebsite_classification_popularity_vallina2020.png&amp;ns=design&amp;rev=1735838030&amp;tab_details=history&amp;media_do=diff&amp;do=media</link>
        <description>&lt;img src=&quot;https://measuretheweb.org/_media/design/website_classification_popularity_vallina2020.png?w=500&amp;amp;h=500&amp;amp;tok=d062ce&quot; alt=&quot;website_classification_popularity_vallina2020.png&quot; loading=&quot;lazy&quot; width=&quot;500&quot; height=&quot;500&quot; /&gt;</description>
    </item>
    <item rdf:about="https://measuretheweb.org/?image=design%3Awebsite_ranking_list_manipulations_lepochat2019.png&amp;ns=design&amp;rev=1735838029&amp;tab_details=history&amp;media_do=diff&amp;do=media">
        <dc:format>text/html</dc:format>
        <dc:date>2025-01-02T17:13:49+00:00</dc:date>
        <dc:creator>karelkubicek (karelkubicek@undisclosed.example.com)</dc:creator>
        <title>website_ranking_list_manipulations_lepochat2019.png - created</title>
        <link>https://measuretheweb.org/?image=design%3Awebsite_ranking_list_manipulations_lepochat2019.png&amp;ns=design&amp;rev=1735838029&amp;tab_details=history&amp;media_do=diff&amp;do=media</link>
        <description>&lt;img src=&quot;https://measuretheweb.org/_media/design/website_ranking_list_manipulations_lepochat2019.png?w=500&amp;amp;h=500&amp;amp;tok=c4b64e&quot; alt=&quot;website_ranking_list_manipulations_lepochat2019.png&quot; loading=&quot;lazy&quot; width=&quot;500&quot; height=&quot;500&quot; /&gt;</description>
    </item>
</rdf:RDF>
