% Bibliography database: book chapters, journal articles, blog posts and
% conference talks dated 2011 to 2018, listed newest year first.
%
% Conventions used in this file:
%   * one field per line; personal names are written "Last, First";
%   * month uses the standard three-letter macros (jan ... dec), unquoted;
%     when the source record carried a full date, the day of month is kept in
%     a separate "day" field (not a standard BibTeX field: styles that do not
%     know it simply ignore it);
%   * page ranges use a double hyphen;
%   * acronyms and proper nouns in titles are braced so that styles applying
%     sentence casing keep their capitals;
%   * citation keys are the original record identifiers and must not change.

% ---------------------------------------------------------------- 2018 ----

@incollection{40533,
  author    = {Sandras, Agn{\`e}s and Stirling, Peter},
  title     = {Constituer une archive du web de la {Grande Guerre} et la rendre accessible aux chercheurs},
  booktitle = {Le web fran{\c c}ais de la Grande Guerre. R{\'e}seaux amateurs et institutionnels},
  editor    = {Beaudouin, Val{\'e}rie and Chevallier, Philippe and Maurel, Lionel},
  publisher = {Presses universitaires de Paris Nanterre},
  address   = {Nanterre},
  year      = {2018},
  pages     = {91--[105]},
}

@incollection{41681,
  author    = {Beaudouin, Val{\'e}rie and Pehlivan, Zeynep and Stirling, Peter},
  title     = {Exploring the Memory of the {First World War} Using Web Archives: Web Graphs Seen from Different Angles},
  booktitle = {The Sage Handbook of Web History},
  publisher = {Sage},
  address   = {London},
  year      = {2018},
  pages     = {441--453},
}

@inproceedings{40368,
  author    = {Stirling, Peter and Aubry, Sara},
  title     = {Meeting researchers' needs in mining web archives: the experience of the {National Library of France}},
  booktitle = {LIBER 2018 : 47th LIBER Annual Conference : Research Libraries as an Open Science Hub: from Strategy to Action},
  publisher = {LIBER},
  address   = {Villeneuve d'Ascq, Universit{\'e} de Lille, LILLIAD Learning center Innovation},
  year      = {2018},
  month     = jul,
  day       = {5},
  abstract  = {The digital legal deposit collections of the National Library of
    France (Biblioth{\`e}que nationale de France, BnF) cover a period of over
    twenty years and now represent almost a petabyte of data. Opened in 2008,
    access to the web archives is provided in the research reading rooms of
    the BnF and in a number of regional libraries, via the application
    Archives de l'internet, which allows researchers to search and view
    websites as they were at the moment of capture and navigate within these
    temporal collections. In recent years, an increasing number of
    researchers have sought to use these collections for analyses that employ
    innovative methods often grouped under the term `digital humanities',
    such as text and data mining (TDM) or link analysis. This paper will
    describe how the BnF has sought to respond to the needs of these
    researchers, based on three recent case studies: the creation of a web
    cartography of sites and the analysis of a discussion forum related to
    WWI; a study of the early French web from the 1990s; and a study of the
    use of neologisms in French based on news sites.
    The paper will concentrate not on the results of the projects but rather
    on the issues raised in allowing researchers to use such methods on the
    BnF web archives. This subject will be studied from three different
    angles:
    {\textbullet} Legal context and framework: intellectual property law and
    the specific context of legal deposit legislation set limits on the use
    of these collections, which are still protected under French copyright
    provisions. The use of text and data mining for research is also an area
    currently under discussion on a European level. The BnF uses research
    agreements to fix the conditions of usage of its collections for this
    kind of analysis while respecting the relevant legislation.
    {\textbullet} Organisational questions: it is necessary to find means of
    accompanying the research teams, in terms of physical reception and
    equipment, providing information on the available collections and
    facilitating exchanges on the needs of the study.
    {\textbullet} Technical aspects: each project has specific needs in terms
    of data and metadata, which in addition to the legal context require
    specific kinds of IT infrastructure and software. The BnF is
    experimenting with different technical solutions, including working in
    cooperation with the researchers to install, integrate or develop new
    tools.
    Finally, the paper will draw initial lessons from these three projects,
    which are carried out in the context of an internal four-year research
    programme called CORPUS, aimed at shaping a service to provide tools,
    corpora, and guidance to researchers who wish to apply TDM to analyse the
    Library's various digital collections.},
}

% ---------------------------------------------------------------- 2016 ----

@inproceedings{7191,
  author    = {Pehlivan, Zeynep and Stirling, Peter},
  title     = {Regards crois{\'e}s sur les outils d'acc{\`e}s {\`a} la {BnF} et {\`a} l'{Ina}},
  booktitle = {Il {\'e}tait une fois dans le web. 20 ans d'archives de l'internet en France},
  publisher = {Biblioth{\`e}que nationale de France ; Institut national de l'audiovisuel ; ANR Web90 ; Universit{\'e} Paris Lumi{\`e}res},
  address   = {Paris, Biblioth{\`e}que nationale de France, site Fran{\c c}ois-Mitterrand, Petit Auditorium},
  year      = {2016},
  month     = nov,
  day       = {23},
}

@inproceedings{6433,
  author    = {Stirling, Peter and Pehlivan, Zeynep},
  title     = {Web Graphs from Web Archives: Seen from Different Angles},
  booktitle = {IIPC Web Archiving Conference 2016},
  publisher = {International Internet Preservation Consortium ; Landsb{\'o}kasafn {\'I}slands -- H{\'a}sk{\'o}lab{\'o}kasafn / National and University Library of Iceland},
  address   = {Islande, Reykjav{\'\i}k, Radisson Blu Saga Hotel, Hekla},
  year      = {2016},
  month     = apr,
  day       = {14},
}

% ---------------------------------------------------------------- 2015 ----

@inproceedings{6435,
  author    = {Stirling, Peter},
  title     = {Using {WAT} at the {BnF} to map the {First World War}},
  booktitle = {IIPC General Assembly 2015},
  publisher = {International Internet Preservation Consortium},
  address   = {Etats-Unis, Silicon Valley, Stanford University campus, Li Ka Shing Conference Center (LKSC), Li Ka Shing Center Berg Hall A},
  year      = {2015},
  month     = apr,
  day       = {30},
  url       = {http://www.netpreserve.org/sites/default/files/attachments/Data_mining_and_WAT_files.pdf},
}

% ---------------------------------------------------------------- 2014 ----

% NOTE(review): the source record for 41735 has no booktitle (event name);
% standard styles will warn about the empty field until one is supplied.
@inproceedings{41735,
  author    = {Stirling, Peter and Versavel, Dominique},
  title     = {D{\'e}p{\^o}t l{\'e}gal de la photographie et images du web},
  publisher = {Ecole nationale sup{\'e}rieure Louis-Lumi{\`e}re},
  address   = {Saint-Denis, Ecole nationale sup{\'e}rieure Louis-Lumi{\`e}re},
  year      = {2014},
  month     = apr,
  day       = {3},
}

@online{6166,
  author  = {Stirling, Peter},
  title   = {La {BnF} rend accessibles les archives de l'internet en r{\'e}gion},
  journal = {Blog Lecteurs de la Biblioth{\`e}que nationale de France},
  year    = {2014},
  month   = nov,
  day     = {13},
  url     = {http://blog.bnf.fr/lecteurs/index.php/2014/11/la-bnf-rend-accessibles-les-archives-de-internet-en-region/},
}

@inproceedings{1841,
  author    = {Stirling, Peter and Maurel, Lionel and Auray, Nicolas},
  title     = {Le projet {\guillemotleft}{Le} devenir du patrimoine num{\'e}ris{\'e} en ligne{\guillemotright} : une proposition m{\'e}thodologique},
  booktitle = {Atelier n{\textdegree} 5 - Labex Les pass{\'e}s dans le pr{\'e}sent : Pour une {\'e}tude des usages du patrimoine num{\'e}ris{\'e}},
  publisher = {Labex Les pass{\'e}s dans le pr{\'e}sent},
  address   = {Nanterre, Universit{\'e} Paris Ouest Nanterre La D{\'e}fense ; MAE, Ren{\'e}-Ginouv{\`e}s, Salle du Conseil},
  year      = {2014},
  month     = nov,
  day       = {21},
  keywords  = {Bibli-Lab},
}

@online{6173,
  author  = {Stirling, Peter},
  title   = {Web scientifique : de la vulgarisation {\`a} la science participative},
  journal = {Blog Lecteurs de la Biblioth{\`e}que nationale de France},
  year    = {2014},
  month   = oct,
  day     = {13},
  url     = {http://blog.bnf.fr/lecteurs/index.php/2014/10/web-scientifique-de-la-vulgarisation-a-la-science-participative/},
}

% ---------------------------------------------------------------- 2013 ----

@article{3158,
  author  = {Lebailly, Guillaume and Stirling, Peter},
  title   = {Le d{\'e}p{\^o}t l{\'e}gal du web cartographique : rencontre avec {Guillaume Lebailly} et {Peter Stirling}},
  journal = {La G{\'e}ofeuille [publication {\'e}lectronique du ``G{\'e}oR{\'e}seau'', site des cartoth{\`e}ques et biblioth{\`e}ques universitaires]},
  volume  = {automne},
  year    = {2013},
  pages   = {5 p.},
  url     = {http://geographie.ipt.univ-paris8.fr/rubriks/carto/journalGR/photos/depotlegalweb.pdf},
}

% ---------------------------------------------------------------- 2012 ----

@inproceedings{2678,
  author    = {Oury, Cl{\'e}ment and Stirling, Peter},
  title     = {Actual and potential users of the {BnF} web archives. {Experiences} and expectations},
  booktitle = {International Internet Preservation Consortium (IIPC) General Assembly},
  publisher = {International Internet Preservation Consortium},
  address   = {Washington (USA)},
  year      = {2012},
  month     = apr,
  day       = {30},
  keywords  = {archivage du web, D{\'e}p{\^o}t l{\'e}gal de l'internet},
  url       = {http://netpreserve.org/sites/default/files/resources/Oury_stirling.pdf},
}

@article{stirling_state_2012,
  author  = {Stirling, Peter and Illien, Gildas and Sanz, Pascal and Sepetjan, Sophie},
  title   = {The state of e-legal deposit in {France}: Looking back at five years of putting new legislation into practice and envisioning the future},
  journal = {IFLA Journal},
  volume  = {38},
  number  = {1},
  year    = {2012},
  month   = mar,
  pages   = {5--24},
}

@article{stirling_web_2012,
  author   = {Stirling, Peter and Chevallier, Philippe and Illien, Gildas},
  title    = {Web Archives for Researchers: Representations, Expectations and Potential Uses},
  journal  = {D-Lib Magazine},
  volume   = {18},
  number   = {3/4},
  year     = {2012},
  month    = mar,
  pages    = {1},
  doi      = {10.1045/march2012-stirling},
  url      = {http://www.dlib.org/dlib/march12/stirling/03stirling.html},
  abstract = {The Internet has been covered by legal deposit legislation in
    France since 2006, making web archiving one of the missions of the
    Biblioth{\`e}que nationale de France (BnF).\ Access to the web archives
    has been provided in the library on an experimental basis since 2008. In
    the context of increasing interest in many countries in web archiving and
    how it may best serve the needs of researchers, especially in the
    expanding field of Internet studies for social sciences, a qualitative
    study was performed, based on interviews with potential users of the web
    archives held at the BnF, and particularly researchers working in various
    areas related to the Internet. The study aimed to explore their needs in
    terms of both content and services, and also to analyse different ways of
    representing the archives, in order to identify ways of increasing their
    use. While the interest of maintaining the ``memory'' of the web is
    obvious to the researchers, they are faced with the difficulty of
    defining, in what is a seemingly limitless space, meaningful collections
    of documents. Cultural heritage institutions such as national libraries
    are perceived as trusted third parties capable of creating
    rationally-constructed and well-documented collections, but such archives
    raise certain ethical and methodological questions.},
}

% ---------------------------------------------------------------- 2011 ----

@inproceedings{2145,
  author    = {Stirling, Peter and Illien, Gildas and Sanz, Pascal and Sepetjan, Sophie},
  title     = {The state of e-legal deposit in {France}: looking back at five years of putting new legislation into practice and envisioning the future},
  booktitle = {77th IFLA General Conference and Assembly : World Library and Information Congress : Libraries beyond libraries: Integration, Innovation and Information for all},
  publisher = {F{\'e}d{\'e}ration internationale des associations de biblioth{\'e}caires et d'institutions},
  address   = {San Juan, Puerto Rico},
  year      = {2011},
  month     = aug,
  day       = {13},
  url       = {http://conference.ifla.org/past/ifla77/193-stirling-en.pdf},
}