<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title type="main" level="a">Semantic analysis of web archive historical data: 1983 “Marche pour l’égalité et contre le racisme”</title>
        <author>
          <persName n="1" ref="https://orcid.org/0009-0001-3001-8864" type="ORCID">
            <forename>Davide</forename>
            <surname>Rendina</surname>
            <placeName type="affiliation">Aix-Marseille University, France</placeName>
          </persName>
          <persName n="2" ref="https://orcid.org/0000-0002-9883-733X" type="ORCID">
            <forename>Sophie</forename>
            <surname>Gebeil</surname>
            <placeName type="affiliation">Aix-Marseille University, France</placeName>
          </persName>
          <persName n="3" ref="https://orcid.org/0000-0001-5492-8750" type="ORCID">
            <forename>Mathieu</forename>
            <surname>Génois</surname>
            <placeName type="affiliation">Aix-Marseille University, France</placeName>
          </persName>
          <persName n="4" ref="https://orcid.org/0000-0001-8698-5055" type="ORCID">
            <forename>Patrice</forename>
            <surname>Bellot</surname>
            <placeName type="affiliation">Aix-Marseille University, France</placeName>
          </persName>
        </author>
        <respStmt>
          <resp>This is a section of <title>Exploring the Archived Web during a Highly Transformative Age</title> (DOI: <idno type="DOI">10.36253/979-12-215-0413-2</idno>) by </resp>
          <name>Sophie Gebeil, Jean-Christophe Peyssard</name>
        </respStmt>
      </titleStmt>
      <publicationStmt>
        <publisher>Firenze University Press</publisher>
        <pubPlace>Florence</pubPlace>
        <date when="2024">2024</date>
        <idno type="DOI">https://doi.org/10.36253/979-12-215-0413-2.22</idno>
        <availability>
          <p>Available for academic research purposes</p>
          <p>Open Access</p>
          <p>Copyright Author(s)</p>
          <licence source="text" target="https://creativecommons.org/licenses/by/4.0/legalcode">
            <p>Content licence CC BY 4.0</p>
          </licence>
          <licence source="metadata" target="https://creativecommons.org/publicdomain/zero/1.0/legalcode">
            <p>Metadata licence CC0 1.0</p>
          </licence>
        </availability>
      </publicationStmt>
      <sourceDesc>
        <p>This is original content, published for academic research purposes</p>
      </sourceDesc>
    </fileDesc>
    <encodingDesc>
      <appInfo>
        <application version="2.2" ident="Booksflow">
          <desc>Digital edition XML powered by Booksflow</desc>
        </application>
      </appInfo>
    </encodingDesc>
    <profileDesc>
      <abstract xml:lang="en">
        <p>Based on a corpus composed of data obtained from the web archive of the French National Audiovisual Institute, including web pages referencing the history of the 1983 March for Equality and Against Racism, we explored how the memory of a historical event is built through the recounting of web media and the possibilities afforded by computational text analysis methods for the study of large corpuses of historical data from the archived web. This chapter presents the methodology and results of Davide Rendina's master's thesis in computer sciences under the supervision of Sophie Gebeil, Mathieu Génois, and Patrice Bellot. The objective is to demonstrate how historians can utilize archived HTML pages to study the media coverage of historical subjects on the web.</p>
      </abstract>
      <textClass>
        <keywords>
          <list>
            <item>anti-racism</item>
            <item>media web archive</item>
            <item>memory studies</item>
            <item>topic modeling</item>
            <item>1983</item>
          </list>
        </keywords>
      </textClass>
    </profileDesc>
  </teiHeader>
  <text>
    <body>
      <p>It is available online at <ref target="https://doi.org/10.36253/979-12-215-0413-2.22">https://doi.org/10.36253/979-12-215-0413-2.22</ref></p>
      <div>
        <listBibl>
          <head>References</head>
          <bibl n="154250">Davide Rendina, Sophie Gebeil, Mathieu Génois, Patrice Bellot. “Semantic analysis of web archive historical data: the 1983 'Marche pour l'égalité et contre le racisme'.” Master Thesis. Erasmus Mundus Joint Master's Degree in Big Data Management and Analytics (BDMA). Data Analysis, Statistics and Probability [physics.data-an]. 2023. ⟨dumas-04541382⟩</bibl>
          <bibl n="154425">
            <bibl>Davide Rendina, Sophie Gebeil, Mathieu Génois, Patrice Bellot. “Master Thesis Report - Semantic Analysis of Web Archive Historical Data the 1983 'Marche Pour L'égalité Et Contre Le Racisme'”. Zenodo, 10 août 2023.</bibl>
            <idno type="DOI">10.5281/zenodo.10972646</idno>
          </bibl>
          <bibl n="154612">De Lange, Sarah L., and Cas Mudde. “Political extremism in Europe.” European Political Science 4(4): 476–88 (2005). http://www.cambridge.org/9780521850810</bibl>
          <bibl n="154431">
            <bibl>Ehrmann, Maud, Ahmed Hamdi, Elvys Linhares Pontes, Matteo Romanello, and Antoine Doucet. 2024. “Named Entity Recognition and Classification on Historical Documents: A Survey”. ACM Computing Surveys 56 (2): 1‑47.</bibl>
            <idno type="DOI">10.1145/3604931</idno>
          </bibl>
          <bibl n="154759">
            <bibl>Fortunato, S. “Community detection in graphs.” Physics Reports, 486 (3–5), 75-174 (2009).</bibl>
            <idno type="DOI">10.1016/j.physrep.2009.11.002</idno>
          </bibl>
          <bibl n="154554">
            <bibl>Gimenez, Elsa, and Olivier Voirol. “Les agitateurs de la toile. L’Internet des droites extrêmes. Présentation du numéro.” Réseaux, vol. 202-203, no. 2–3, 2017, pp. 9-37.</bibl>
            <idno type="DOI">10.3917/res.202.0009</idno>
          </bibl>
          <bibl n="154692">Norris, Pippa. “Preaching to the converted?: Pluralism, participation and party websites”. Party Politics 9(1): 21–45 (2003).</bibl>
          <bibl n="154280">Röder, M., Both, A., and Hinneburg, A. “Exploring the space of topic coherence measures.” In Proceedings of the Eighth ACM International Conference on Web Search and Data Mining, WSDM 2015, Shanghai, China, February 2–6, 2015 (2015), X. Cheng, H. Li, E. Gabrilovich, and J. Tang, Eds., ACM, pp. 399–408.</bibl>
          <bibl n="154239">Tedeschi, S., Maiorca, V., Campolungo, N., Cecconi, F., and Navigli, R. “Wikineural: Combined neural and knowledge-based silver data creation for multilingual NER.” In Findings of the Association for Computational Linguistics: EMNLP 2021, Virtual Event / Punta Cana, Dominican Republic, 16–20 November, 2021 (2021), M. Moens, X. Huang, L. Specia, and S. W. Yih, Eds. Association for Computational Linguistics, pp. 2521–2533.</bibl>
        </listBibl>
      </div>
    </body>
  </text>
</TEI>