<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" lang="en">

<head>
  <title>[1805.12512] On the Origins of Memes by Means of Fringe Web Communities</title>
  <link rel="shortcut icon" href="/favicon.ico" type="image/x-icon" />
  <link rel="stylesheet" type="text/css" media="screen" href="//static.arxiv.org/css/arXiv.css?v=20190307" />
  
  <!-- Piwik -->
  <script type="text/javascript">
    // Queue of tracker commands; an already-defined global `_paq` is reused.
    var _paq = _paq || [];
    _paq.push(["setDomains", ["*.arxiv.org"]]);
    _paq.push(["trackPageView"]);
    _paq.push(["enableLinkTracking"]);
    (function (doc, baseUrl) {
      // Point the tracker at its endpoint and site id.
      _paq.push(["setTrackerUrl", baseUrl + "piwik.php"]);
      _paq.push(["setSiteId", 538]);

      // Build a script element for piwik.js and insert it ahead of the
      // first script element found in the document.
      var firstScript = doc.getElementsByTagName("script")[0];
      var loader = doc.createElement("script");
      loader.type = "text/javascript";
      loader.async = true;
      loader.defer = true;
      loader.src = baseUrl + "piwik.js";
      firstScript.parentNode.insertBefore(loader, firstScript);
    })(document, "//webanalytics.library.cornell.edu/");
  </script>
  <!-- End Piwik Code -->
  <script type="text/javascript" src="https://arxiv-org.atlassian.net/s/d41d8cd98f00b204e9800998ecf8427e-T/zca7yc/b/13/a44af77267a987a660377e5c46e0fb64/_/download/batch/com.atlassian.jira.collector.plugin.jira-issue-collector-plugin:issuecollector/com.atlassian.jira.collector.plugin.jira-issue-collector-plugin:issuecollector.js?locale=en-US&amp;collectorId=7a8da419"></script>
<!--
  Settings object for the feedback (issue collector) dialog.
  triggerFunction: receives the function that opens the dialog and binds it
                   to clicks on the #feedback-button element.
  fieldValues:     values pre-filled into the submitted issue.
-->
<script type="text/javascript">
  window.ATL_JQ_PAGE_PROPS = {
    "triggerFunction": function(showCollectorDialog) {
      // Requires that jQuery is available!
      jQuery("#feedback-button").click(function(e) {
        // Suppress the button's default action and open the dialog instead.
        e.preventDefault();
        showCollectorDialog();
      });
    },
    "fieldValues": {
      "components": ["15700"],  // Browse component.
      "versions": ["14132"],  // Release browse-0.1
      "customfield_11401": window.location.href  // URL of the page being reported.
    }
  };
</script>
  <link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/font-awesome/4.7.0/css/font-awesome.min.css" />
  <link rel="stylesheet" media="screen" type="text/css" href="/bibex/bibex.css?20181010"/>
  <script src="//static.arxiv.org/js/mathjaxToggle.min.js" type="text/javascript"></script>
  <meta name="citation_title" content="On the Origins of Memes by Means of Fringe Web Communities"/>
  <meta name="citation_author" content="Zannettou, Savvas"/>
  <meta name="citation_author" content="Caulfield, Tristan"/>
  <meta name="citation_author" content="Blackburn, Jeremy"/>
  <meta name="citation_author" content="De Cristofaro, Emiliano"/>
  <meta name="citation_author" content="Sirivianos, Michael"/>
  <meta name="citation_author" content="Stringhini, Gianluca"/>
  <meta name="citation_author" content="Suarez-Tangil, Guillermo"/>
  <meta name="citation_date" content="2018/05/31"/>
  <meta name="citation_online_date" content="2018/09/22"/>
  <meta name="citation_pdf_url" content="https://arxiv.org/pdf/1805.12512"/>
  <meta name="citation_arxiv_id" content="1805.12512"/><meta name="twitter:site" content="@arxiv"/>
    <meta property="twitter:title" content="On the Origins of Memes by Means of Fringe Web Communities"/>
    <meta property="twitter:description" content="Internet memes are increasingly used to sway and manipulate public opinion.
This prompts the need to study their propagation, evolution, and influence
across the Web. In this paper, we detect and..."/>
    <meta property="og:site_name" content="arXiv.org"/>
    <meta property="og:title" content="On the Origins of Memes by Means of Fringe Web Communities"/>
    <meta property="og:url" content="https://arxiv.org/abs/1805.12512v3"/>
    <meta property="og:description" content="Internet memes are increasingly used to sway and manipulate public opinion.
This prompts the need to study their propagation, evolution, and influence
across the Web. In this paper, we detect and measure the propagation of memes
across multiple Web communities, using a processing pipeline based on
perceptual hashing and clustering techniques, and a dataset of 160M images from
2.6B posts gathered from Twitter, Reddit, 4chan&#39;s Politically Incorrect board
(/pol/), and Gab, over the course of 13 months. We group the images posted on
fringe Web communities (/pol/, Gab, and The_Donald subreddit) into clusters,
annotate them using meme metadata obtained from Know Your Meme, and also map
images from mainstream communities (Twitter and Reddit) to the clusters.
  Our analysis provides an assessment of the popularity and diversity of memes
in the context of each community, showing, e.g., that racist memes are
extremely common in fringe Web communities. We also find a substantial number
of politics-related memes on both mainstream and fringe Web communities,
supporting media reports that memes might be used to enhance or harm
politicians. Finally, we use Hawkes processes to model the interplay between
Web communities and quantify their reciprocal influence, finding that /pol/
substantially influences the meme ecosystem with the number of memes it
produces, while The_Donald has a higher success rate in pushing them to other
communities."/>
</head>

<body  class="with-cu-identity">
  <noscript><img src="//webanalytics.library.cornell.edu/piwik.php?idsite=538&amp;rec=1" style="border:0;" alt="" /></noscript>
  <div id="cu-identity">
    <div id="cu-logo">
      <a href="https://www.cornell.edu/"><img src="//static.arxiv.org/icons/cu/cornell-reduced-white-SMALL.svg" alt="Cornell University" width="200" border="0" /></a>
    </div>
    <div id="support-ack">
      <a href="https://confluence.cornell.edu/x/ALlRF">We gratefully acknowledge support from<br/>the Simons Foundation and member institutions.</a>
    </div>
  </div>

  <div id="header" >
    
  <h1><a href="/">arXiv.org</a> &gt; <a href="/list/cs/recent">cs</a> &gt; arXiv:1805.12512</h1>
  <div id="search">
    <form id="search-arxiv" method="get" action="https://arxiv.org/search">

      <div class="wrapper-search-arxiv">
        <input class="keyword-field" type="text" name="query" placeholder="Search or Article ID" />

        <div class="filter-field">
          <select name="searchtype">
            <option value="all">All fields</option>
            <option value="title">Title</option>
            <option value="author">Author(s)</option>
            <option value="abstract">Abstract</option>
            <option value="comments">Comments</option>
            <option value="journal_ref">Journal reference</option>
            <option value="acm_class">ACM classification</option>
            <option value="msc_class">MSC classification</option>
            <option value="report_num">Report number</option>
            <option value="paper_id">arXiv identifier</option>
            <option value="doi">DOI</option>
            <option value="orcid">ORCID</option>
            <option value="author_id">arXiv author ID</option>
            <option value="help">Help pages</option>
            <option value="full_text">Full text</option>
          </select>
        </div>
        <input class="btn-search-arxiv" value="" type="submit" />
        <div class="links">(<a href="https://arxiv.org/help">Help</a> | <a href="https://arxiv.org/search/advanced">Advanced search</a>)</div>
      </div>
    </form>
  </div>

  </div>

  <div id="content">
    <!--
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
         xmlns:dc="http://purl.org/dc/elements/1.1/"
         xmlns:trackback="http://madskills.com/public/xml/rss/module/trackback/">
    <rdf:Description
        rdf:about="/abs/1805.12512"
        dc:identifier="/abs/1805.12512"
        dc:title="On the Origins of Memes by Means of Fringe Web Communities"
        trackback:ping="/trackback/1805.12512" />
    </rdf:RDF>
-->
<div id="abs">
  <div class="extra-services">
    <div class="full-text">
      <span class="descriptor">Full-text links:</span>
      <h2>Download:</h2>
      <ul>
  <li><a href="/pdf/1805.12512" accesskey="f">PDF</a></li>
  <li><a href="/format/1805.12512">Other formats</a></li></ul>
      <div class="abs-license">(<a href="http://arxiv.org/licenses/nonexclusive-distrib/1.0/" title="Rights to this article">license</a>)</div>
    </div>
    <!--end full-text-->
    <div class="browse">
    <h3>Current browse context:</h3>
  <div class="current">cs.SI</div>

  <div class="prevnext">

  <span class="arrow">
    <a href="/prevnext?site=arxiv.org&amp;id=1805.12512&amp;function=prev&amp;context=cs.SI"
       accesskey="p" title="previous in cs.SI (accesskey p)">&lt;&nbsp;prev</a>
  </span>&nbsp;|&nbsp;

  
  <span class="arrow">
    <a href="/prevnext?site=arxiv.org&amp;id=1805.12512&amp;function=next&amp;context=cs.SI" accesskey="n"
       title="next in cs.SI (accesskey n)">next&nbsp;&gt;</a>
  </span><br/>
  </div><div class="list">
    <a href="/list/cs.SI/new">new</a>&nbsp;|
    <a href="/list/cs.SI/recent">recent</a>&nbsp;|
    <a href="/list/cs.SI/1805">1805</a>
  </div><h3>Change to browse by:</h3>
  <div class="switch">
    
      <a href="/abs/1805.12512?context=cs">cs</a>
      
    <br/>
    
      <span class="subclass"><a href="/abs/1805.12512?context=cs.CY">cs.CY</a></span>
      
    <br/>
    
  </div>
  
    </div>

    <div class="extra-ref-cite">
      <h3>References &amp; Citations</h3>
      <ul>
        
        <li><a href="https://ui.adsabs.harvard.edu/#abs/arXiv:1805.12512">NASA ADS</a></li>
      </ul>
    </div>

    
    <div class="extra-general">
        <div class="what-is-this">
            <h3><a href="/tb/1805.12512"> 1 blog link</a></h3> (<a href="https://arxiv.org/help/trackback">what is this?</a>)
        </div>
    </div>
    <div class="dblp">
    <h3><a href="https://dblp.uni-trier.de">DBLP</a> - CS Bibliography</h3>
    <div class="list">
      <a href="https://dblp.uni-trier.de/db/journals/corr/corr1805.html#abs-1805-12512" title="listing on DBLP">listing</a> | <a href="https://dblp.uni-trier.de/rec/bibtex/journals/corr/abs-1805-12512" title="DBLP bibtex record">bibtex</a>
    </div>
    
    <div class="list">
      <a href="https://dblp.uni-trier.de/search/author?author=Savvas%20Zannettou" title="DBLP author search">Savvas Zannettou</a><br/><a href="https://dblp.uni-trier.de/search/author?author=Tristan%20Caulfield" title="DBLP author search">Tristan Caulfield</a><br/><a href="https://dblp.uni-trier.de/search/author?author=Jeremy%20Blackburn" title="DBLP author search">Jeremy Blackburn</a><br/><a href="https://dblp.uni-trier.de/search/author?author=Emiliano%20De%20Cristofaro" title="DBLP author search">Emiliano De Cristofaro</a><br/><a href="https://dblp.uni-trier.de/search/author?author=Michael%20Sirivianos" title="DBLP author search">Michael Sirivianos</a>
    
      <div class="list">&hellip;</div>
    
    </div>
    
  </div><div class="bookmarks">
  <div class="what-is-this"><h3>Bookmark</h3> (<a href="https://arxiv.org/help/social_bookmarking">what is this?</a>)</div><a href="/ct?url=http%3A%2F%2Fwww.citeulike.org%2Fposturl%3Furl%3Dhttps%3A%2F%2Farxiv.org%2Fabs%2F1805.12512&amp;v=64290903"
     title="Bookmark on CiteULike">
    <img src="//static.arxiv.org/icons/social/citeulike.png"
         alt="CiteULike logo" />
  </a>
  <a href="/ct?url=http%3A%2F%2Fwww.bibsonomy.org%2FBibtexHandler%3FrequTask%3Dupload%26url%3Dhttps%3A%2F%2Farxiv.org%2Fabs%2F1805.12512%26description%3DOn+the+Origins+of+Memes+by+Means+of+Fringe+Web+Communities&amp;v=e8a34bf4"
     title="Bookmark on BibSonomy">
    <img src="//static.arxiv.org/icons/social/bibsonomy.png"
         alt="BibSonomy logo"/>
  </a>
  <a href="/ct?url=https%3A%2F%2Fwww.mendeley.com%2Fimport%2F%3Furl%3Dhttps%3A%2F%2Farxiv.org%2Fabs%2F1805.12512&amp;v=4df657e4"
     title="Bookmark on Mendeley">
    <img src="//static.arxiv.org/icons/social/mendeley.png"
         alt="Mendeley logo"/>
  </a>
  <a href="/ct?url=https%3A%2F%2Freddit.com%2Fsubmit%3Furl%3Dhttps%3A%2F%2Farxiv.org%2Fabs%2F1805.12512%26title%3DOn+the+Origins+of+Memes+by+Means+of+Fringe+Web+Communities&amp;v=0a82ff47"
     title="Bookmark on Reddit">
    <img src="//static.arxiv.org/icons/social/reddit.png"
         alt="Reddit logo"/>
  </a>
  <a href="/ct?url=http%3A%2F%2Fsciencewise.info%2Fbookmarks%2Fadd%3Furl%3Dhttps%3A%2F%2Farxiv.org%2Fabs%2F1805.12512&amp;v=b3fe4936"
     title="Bookmark on ScienceWISE">
    <img src="//static.arxiv.org/icons/social/sciencewise.png"
         alt="ScienceWISE logo"/>
  </a>
</div>
  </div>
  <!--end extra-services-->

  <div class="leftcolumn">
    <div class="subheader">
      <h1>Computer Science &gt; Social and Information Networks</h1>
    </div>
    <h1 class="title mathjax"><span class="descriptor">Title:</span>On the Origins of Memes by Means of Fringe Web Communities</h1>
    <div class="authors"><span class="descriptor">Authors:</span><a href="https://arxiv.org/search/cs?searchtype=author&amp;query=Zannettou%2C+S">Savvas Zannettou</a>, <a href="https://arxiv.org/search/cs?searchtype=author&amp;query=Caulfield%2C+T">Tristan Caulfield</a>, <a href="https://arxiv.org/search/cs?searchtype=author&amp;query=Blackburn%2C+J">Jeremy Blackburn</a>, <a href="https://arxiv.org/search/cs?searchtype=author&amp;query=De+Cristofaro%2C+E">Emiliano De Cristofaro</a>, <a href="https://arxiv.org/search/cs?searchtype=author&amp;query=Sirivianos%2C+M">Michael Sirivianos</a>, <a href="https://arxiv.org/search/cs?searchtype=author&amp;query=Stringhini%2C+G">Gianluca Stringhini</a>, <a href="https://arxiv.org/search/cs?searchtype=author&amp;query=Suarez-Tangil%2C+G">Guillermo Suarez-Tangil</a>
    </div>

    <div class="dateline">(Submitted on 31 May 2018 (<a href="/abs/1805.12512v1">v1</a>), last revised 22 Sep 2018 (this version, v3))</div>

    
    <blockquote class="abstract mathjax"><span class="descriptor">Abstract:</span>  Internet memes are increasingly used to sway and manipulate public opinion.
This prompts the need to study their propagation, evolution, and influence
across the Web. In this paper, we detect and measure the propagation of memes
across multiple Web communities, using a processing pipeline based on
perceptual hashing and clustering techniques, and a dataset of 160M images from
2.6B posts gathered from Twitter, Reddit, 4chan&#39;s Politically Incorrect board
(/pol/), and Gab, over the course of 13 months. We group the images posted on
fringe Web communities (/pol/, Gab, and The_Donald subreddit) into clusters,
annotate them using meme metadata obtained from Know Your Meme, and also map
images from mainstream communities (Twitter and Reddit) to the clusters.
<br />Our analysis provides an assessment of the popularity and diversity of memes
in the context of each community, showing, e.g., that racist memes are
extremely common in fringe Web communities. We also find a substantial number
of politics-related memes on both mainstream and fringe Web communities,
supporting media reports that memes might be used to enhance or harm
politicians. Finally, we use Hawkes processes to model the interplay between
Web communities and quantify their reciprocal influence, finding that /pol/
substantially influences the meme ecosystem with the number of memes it
produces, while The_Donald has a higher success rate in pushing them to other
communities.
</blockquote>
    <!--CONTEXT-->
    <div class="metatable">
      <table summary="Additional metadata">
        <tr>
          <td class="tablecell label">Comments:</td>
          <td class="tablecell comments mathjax">A shorter version of this paper appears in the Proceedings of 18th ACM Internet Measurement Conference (IMC 2018). This is the full version</td>
        </tr>
        <tr>
          <td class="tablecell label">Subjects:</td>
          <td class="tablecell subjects"><span class="primary-subject">Social and Information Networks (cs.SI)</span>; Computers and Society (cs.CY)</td>
        </tr><tr>
          <td class="tablecell label">Cite as:</td>
          <td class="tablecell arxivid"><a href="https://arxiv.org/abs/1805.12512">arXiv:1805.12512</a> [cs.SI]</td>
        </tr>
        <tr>
          <td class="tablecell label">&nbsp;</td>
          <td class="tablecell arxividv">(or <span class="arxivid">
              <a href="https://arxiv.org/abs/1805.12512v3">arXiv:1805.12512v3</a> [cs.SI]</span> for this version)
          </td>
        </tr>
      </table>
    </div>
    <div class="submission-history">
      <h2>Submission history</h2> From: Emiliano De Cristofaro [<a href="/show-email/4dd3bc4c/1805.12512">view email</a>]
      <br/>
  <b><a href="/abs/1805.12512v1">[v1]</a></b>
  Thu, 31 May 2018 15:22:55 UTC (8,802 KB)<br/>
  <b><a href="/abs/1805.12512v2">[v2]</a></b>
  Tue, 24 Jul 2018 13:00:50 UTC (8,472 KB)<br/><b>[v3]</b>
Sat, 22 Sep 2018 21:02:03 UTC (9,390 KB)<br/></div>
  </div>
  <!--end leftcolumn-->
  <div class="endorsers"><a href="/auth/show-endorsers/1805.12512">Which authors of this paper are endorsers?</a> | <a id="mathjax_toggle" href="javascript:setMathjaxCookie()">Disable MathJax</a> (<a href="https://arxiv.org/help/mathjax">What is MathJax?</a>)
    <span class="help" style="display: inline-block; font-style: normal; float: right; margin-top: 0; margin-right: 1em;"><a href="https://confluence.cornell.edu/x/MjmLFQ">Browse v0.1 released 2018-10-22</a>&nbsp;&nbsp;<button class="button is-small" id="feedback-button">Feedback?</button></span>
  </div>
  <script type="text/javascript" language="javascript">mathjaxToggle();</script>
  <script src="/bibex/bibex.js?20181010" type="text/javascript" defer="defer"></script>
  
</div>

  </div>

  <footer style="clear: both;">
    <div class="columns is-desktop" role="navigation" aria-label="Secondary" style="margin: -0.75em -0.75em 0.75em -0.75em">
      <!-- Macro-Column 1 -->
      <div class="column" style="padding: 0;">
        <div class="columns">
          <div class="column">
            <ul style="list-style: none; line-height: 2;">
              <li><a href="https://arxiv.org/about">About arXiv</a></li>
              <li><a href="https://arxiv.org/about/people/leadership_team">Leadership Team</a></li>
            </ul>
          </div>
          <div class="column">
            <ul style="list-style: none; line-height: 2;">
              <li><span class="icon"><i class="fa fa-envelope"></i></span><a href="https://arxiv.org/help/contact"> Contact Us</a></li>
              <li><span class="icon"><i class="fa fa-twitter"></i></span><a href="https://twitter.com/arxiv"> Follow us on Twitter</a></li>
            </ul>
          </div>
        </div>
      </div>
      <!-- End Macro-Column 1 -->
      <!-- Macro-Column 2 -->
      <div class="column" style="padding: 0;">
        <div class="columns">
          <div class="column">
            <ul style="list-style: none; line-height: 2;">
              <li><a href="https://arxiv.org/help">Help</a></li>
              <li><a href="https://arxiv.org/help/policies/privacy_policy">Privacy Policy</a></li>
            </ul>
          </div>
          <div class="column">
            <ul style="list-style: none; line-height: 2;">
              <li><a href="https://blogs.cornell.edu/arxiv">Blog</a></li>
              <li><a href="https://arxiv.org/help/subscribe"> Subscribe</a></li>
            </ul>
          </div>
        </div>
      </div>
      <!-- End Macro-Column 2 -->
    </div>

    <div class="columns" style="border-top: 1px solid #979797; margin: -0.75em;">
      <div class="column">
        <p class="help" style="margin-bottom: 0;">arXiv&#174; is a registered trademark of Cornell University.</p>
      </div>
      <div class="column">
        <p class="help" style="margin-bottom: 0;">If you have a disability and are having trouble accessing information on this website or need materials in an alternate format,
        contact <a href="mailto:web-accessibility@cornell.edu">web-accessibility@cornell.edu</a> for assistance.</p>
      </div>
    </div>
  </footer>

</body>

</html>