{"id":7783,"date":"2018-06-01T15:47:53","date_gmt":"2018-06-01T13:47:53","guid":{"rendered":"https:\/\/www.l3s.de\/?page_id=7783"},"modified":"2023-01-17T11:32:52","modified_gmt":"2023-01-17T10:32:52","slug":"big-data-and-the-lost-web","status":"publish","type":"page","link":"https:\/\/www.l3s.de\/de\/magazine\/binaire-articles\/big-data-and-the-lost-web\/","title":{"rendered":"Big Data und das verlorene Web"},"content":{"rendered":"<div data-colibri-id=\"7783-c1\" class=\"style-8242 style-local-7783-c1 position-relative\">\n  <!---->\n  <div data-colibri-component=\"section\" data-colibri-id=\"7783-c2\" id=\"reusable-sections\" class=\"h-section h-section-global-spacing d-flex align-items-lg-center align-items-md-center align-items-center style-8243 style-local-7783-c2 position-relative\">\n    <!---->\n    <!---->\n    <div class=\"h-section-grid-container h-section-boxed-container\">\n      <!---->\n      <div data-colibri-id=\"7783-c3\" class=\"h-row-container gutters-row-lg-3 gutters-row-md-3 gutters-row-0 gutters-row-v-lg-3 gutters-row-v-md-3 gutters-row-v-3 style-8244 style-local-7783-c3 position-relative\">\n        <div class=\"background-wrapper\">\n          <div class=\"background-layer background-layer-media-container-lg\">\n            <div data-enabled=\"true\" data-colibri-component=\"parallax\" class=\"background-layer paraxify lazyload\" model-id=\"7783-c3\" media=\"desktop\" is-preview=\"true\" style=\"background-image:inherit;\" data-bg-image=\"url(&quot;https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/09\/cropped-Fotolia_38582476_L.jpeg&quot;)\"><\/div>\n          <\/div>\n          <div class=\"background-layer background-layer-media-container-md\">\n            <div data-enabled=\"true\" data-colibri-component=\"parallax\" class=\"background-layer paraxify lazyload\" model-id=\"7783-c3\" media=\"tablet\" is-preview=\"true\" style=\"background-image:inherit;\" 
data-bg-image=\"url(&quot;https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/09\/cropped-Fotolia_38582476_L.jpeg&quot;)\"><\/div>\n          <\/div>\n          <div class=\"background-layer background-layer-media-container\">\n            <div data-enabled=\"true\" data-colibri-component=\"parallax\" class=\"background-layer paraxify lazyload\" model-id=\"7783-c3\" media=\"mobile\" is-preview=\"true\" style=\"background-image:inherit;\" data-bg-image=\"url(&quot;https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/09\/cropped-Fotolia_38582476_L.jpeg&quot;)\"><\/div>\n          <\/div>\n        <\/div>\n        <div class=\"h-row justify-content-lg-center justify-content-md-center justify-content-center align-items-lg-stretch align-items-md-stretch align-items-stretch gutters-col-lg-3 gutters-col-md-3 gutters-col-0 gutters-col-v-lg-3 gutters-col-v-md-3 gutters-col-v-3\">\n          <!---->\n          <div class=\"h-column h-column-container d-flex h-col-lg-auto h-col-md-auto h-col-auto style-8245-outer style-local-7783-c4-outer\">\n            <div data-colibri-id=\"7783-c4\" class=\"d-flex h-flex-basis h-column__inner h-ui-empty-state-container h-px-lg-3 h-px-md-3 h-px-3 v-inner-lg-3 v-inner-md-3 v-inner-3 style-8245 style-local-7783-c4 position-relative\">\n              <!---->\n              <!---->\n              <div class=\"w-100 h-y-container h-column__content h-column__v-align flex-basis-100\">\n                <!---->\n              <\/div>\n            <\/div>\n          <\/div>\n        <\/div>\n      <\/div>\n      <div data-colibri-id=\"7783-c40\" class=\"h-row-container gutters-row-lg-0 gutters-row-md-0 gutters-row-0 gutters-row-v-lg-0 gutters-row-v-md-0 gutters-row-v-0 style-11938 style-local-7783-c40 position-relative\">\n        <!---->\n        <div class=\"h-row justify-content-lg-center justify-content-md-center justify-content-center align-items-lg-stretch align-items-md-stretch align-items-stretch gutters-col-lg-0 gutters-col-md-0 gutters-col-0 
gutters-col-v-lg-0 gutters-col-v-md-0 gutters-col-v-0\">\n          <!---->\n          <div class=\"h-column h-column-container d-flex h-col-lg-auto h-col-md-auto h-col-auto style-11939-outer style-local-7783-c41-outer\">\n            <div data-colibri-id=\"7783-c41\" class=\"d-flex h-flex-basis h-column__inner h-px-lg-0 h-px-md-0 h-px-0 v-inner-lg-0 v-inner-md-0 v-inner-0 style-11939 style-local-7783-c41 position-relative\">\n              <!---->\n              <!---->\n              <div class=\"w-100 h-y-container h-column__content h-column__v-align flex-basis-100 align-self-lg-start align-self-md-start align-self-start\">\n                <!---->\n                <div data-colibri-id=\"7783-c42\" class=\"h-text h-text-component style-11940 style-local-7783-c42 position-relative h-element\">\n                  <!---->\n                  <!---->\n                  <div class=\"\">\n                    <p>Foto: <span style=\"font-weight: 300; font-size: 14px; font-family: &quot;Open Sans&quot;; color: rgb(0, 0, 0);\">\u00a9<\/span>senoldo &#8211; Fotolia.com<\/p>\n                  <\/div>\n                <\/div>\n              <\/div>\n            <\/div>\n          <\/div>\n        <\/div>\n      <\/div>\n      <div data-colibri-id=\"7783-c5\" class=\"h-row-container gutters-row-lg-2 gutters-row-md-2 gutters-row-0 gutters-row-v-lg-2 gutters-row-v-md-2 gutters-row-v-2 style-8246 style-local-7783-c5 position-relative\">\n        <!---->\n        <div class=\"h-row justify-content-lg-center justify-content-md-center justify-content-center align-items-lg-stretch align-items-md-stretch align-items-stretch gutters-col-lg-2 gutters-col-md-2 gutters-col-0 gutters-col-v-lg-2 gutters-col-v-md-2 gutters-col-v-2\">\n          <!---->\n          <div class=\"h-column h-column-container d-flex h-col-lg h-col-md-auto h-col-auto style-8247-outer style-local-7783-c6-outer\">\n            <div data-colibri-id=\"7783-c6\" class=\"d-flex h-flex-basis h-column__inner h-px-lg-0 
h-px-md-0 h-px-0 v-inner-lg-0 v-inner-md-0 v-inner-0 style-8247 style-local-7783-c6 position-relative\">\n              <!---->\n              <!---->\n              <div class=\"w-100 h-y-container h-column__content h-column__v-align flex-basis-100 align-self-lg-start align-self-md-start align-self-start\">\n                <!---->\n                <div data-colibri-id=\"7783-c7\" class=\"h-row-container gutters-row-lg-0 gutters-row-md-0 gutters-row-0 gutters-row-v-lg-0 gutters-row-v-md-0 gutters-row-v-0 style-8248 style-local-7783-c7 position-relative\">\n                  <!---->\n                  <div class=\"h-row justify-content-lg-center justify-content-md-center justify-content-center align-items-lg-stretch align-items-md-stretch align-items-stretch gutters-col-lg-0 gutters-col-md-0 gutters-col-0 gutters-col-v-lg-0 gutters-col-v-md-0 gutters-col-v-0\">\n                    <!---->\n                    <div class=\"h-column h-column-container d-flex h-col-lg-auto h-col-md-auto h-col-auto style-8249-outer style-local-7783-c8-outer\">\n                      <div data-colibri-id=\"7783-c8\" class=\"d-flex h-flex-basis h-column__inner h-px-lg-2 h-px-md-2 h-px-2 v-inner-lg-2 v-inner-md-2 v-inner-2 style-8249 style-local-7783-c8 position-relative\">\n                        <!---->\n                        <!---->\n                        <div class=\"w-100 h-y-container h-column__content h-column__v-align flex-basis-100 align-self-lg-start align-self-md-start align-self-start\">\n                          <!---->\n                          <div data-colibri-id=\"7783-c9\" class=\"h-text h-text-component style-8250 style-local-7783-c9 position-relative h-element\">\n                            <!---->\n                            <!---->\n                            <div class=\"\">\n                              <p>Ausgabe: 02\/2018<\/p>\n                            <\/div>\n                          <\/div>\n                          <div 
data-colibri-id=\"7783-c10\" class=\"h-x-container style-8251 style-local-7783-c10 position-relative h-element\">\n                            <!---->\n                            <div class=\"h-x-container-inner style-dynamic-7783-c10-group style-8251-spacing style-local-7783-c10-spacing\"><span class=\"h-link__outer style-8252-outer style-local-7783-c11-outer d-inline-flex h-element\"><a h-use-smooth-scroll=\"true\" href=\"https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/09\/L3S-Binaire-2-web.pdf\" target=\"_blank\" data-colibri-id=\"7783-c11\" class=\"d-flex w-100 align-items-center h-link style-8252 style-local-7783-c11 position-relative\" rel=\"noopener\"><!----><!----> <span>Maschinelles Lernen<\/span><\/a>\n                              <\/span>\n                            <\/div>\n                          <\/div>\n                          <div data-colibri-id=\"7783-c12\" class=\"style-8253 style-local-7783-c12 position-relative h-element\">\n                            <!---->\n                          <\/div>\n                        <\/div>\n                      <\/div>\n                    <\/div>\n                    <div class=\"h-column h-column-container d-flex h-col-lg-auto h-col-md-auto h-col-auto style-8254-outer style-local-7783-c13-outer\">\n                      <div data-colibri-id=\"7783-c13\" class=\"d-flex h-flex-basis h-column__inner h-px-lg-2 h-px-md-2 h-px-2 v-inner-lg-2 v-inner-md-2 v-inner-2 style-8254 style-local-7783-c13 position-relative\">\n                        <!---->\n                        <!---->\n                        <div class=\"w-100 h-y-container h-column__content h-column__v-align flex-basis-100 align-self-lg-start align-self-md-start align-self-start\">\n                          <!---->\n                          <div data-colibri-id=\"7783-c14\" class=\"h-global-transition-all h-heading style-8255 style-local-7783-c14 position-relative h-element\">\n                            <!---->\n                      
      <div class=\"h-heading__outer style-8255 style-local-7783-c14\">\n                              <!---->\n                              <!---->\n                              <h6 class=\"\">Web-Archive erm\u00f6glichen einen Blick in die Vergangenheit<\/h6>\n                            <\/div>\n                          <\/div>\n                          <div data-colibri-id=\"7783-c15\" class=\"h-global-transition-all h-heading style-8256 style-local-7783-c15 position-relative h-element\">\n                            <!---->\n                            <div class=\"h-heading__outer style-8256 style-local-7783-c15\">\n                              <!---->\n                              <!---->\n                              <h1 class=\"\">Big Data und das verlorene Web<\/h1>\n                            <\/div>\n                          <\/div>\n                          <div data-colibri-id=\"7783-c16\" class=\"style-8257 style-local-7783-c16 position-relative h-element\">\n                            <!---->\n                          <\/div>\n                          <div data-colibri-id=\"7783-c17\" class=\"h-row-container gutters-row-lg-0 gutters-row-md-0 gutters-row-0 gutters-row-v-lg-0 gutters-row-v-md-0 gutters-row-v-0 style-8258 style-local-7783-c17 position-relative\">\n                            <!---->\n                            <div class=\"h-row justify-content-lg-center justify-content-md-center justify-content-center align-items-lg-stretch align-items-md-stretch align-items-stretch gutters-col-lg-0 gutters-col-md-0 gutters-col-0 gutters-col-v-lg-0 gutters-col-v-md-0 gutters-col-v-0\">\n                              <!---->\n                              <div class=\"h-column h-column-container d-flex h-col-lg h-col-md h-col-auto style-8259-outer style-local-7783-c18-outer\">\n                                <div data-colibri-id=\"7783-c18\" class=\"d-flex h-flex-basis h-column__inner h-px-lg-0 h-px-md-0 h-px-0 v-inner-lg-0 v-inner-md-0 
v-inner-0 style-8259 style-local-7783-c18 position-relative\">\n                                  <!---->\n                                  <!---->\n                                  <div class=\"w-100 h-y-container h-column__content h-column__v-align flex-basis-100 align-self-lg-start align-self-md-start align-self-start\">\n                                    <!---->\n                                    <div data-colibri-id=\"7783-c19\" class=\"h-text h-text-component style-8260 style-local-7783-c19 position-relative h-element\">\n                                      <!---->\n                                      <!---->\n                                      <div class=\"\">\n                                        <p class=\"translation-block\">Das Internet vergisst nicht. Trotzdem sind viele Inhalte auf Anhieb unauffindbar &ndash; alte Webseiten zum Beispiel. Dabei gibt es Organisationen, die alte Seiten f&uuml;r die Nachwelt aufbewahren und zur Verf&uuml;gung stellen, allen voran das&nbsp;<em>Internet Archive<\/em>&nbsp;in Kalifornien. Am L3S besch&auml;ftigen sich Forscher bereits seit 2014 intensiv mit Web-Archiven und erarbeiten neue Anwendungsf&auml;lle, Zugriffsmethoden und Analyseverfahren f&uuml;r diese interessanten Datensammlungen. Das L3S hat Zugang zu einer lokalen Kopie des gesamten deutschen Webs unter der Dom&auml;ne&nbsp;<em>.de<\/em>, welches das&nbsp;<em>Internet Archive<\/em>&nbsp;bereits seit 1996 archiviert.<\/p>\n                                        <p class=\"translation-block\">Eine Fragestellung, die die Forscher dabei besch\u00e4ftigt: Wie kann der Zugang zu diesen archivierten Seiten f\u00fcr jeden von uns einfacher werden? Besonders durch den zeitlichen Aspekt, der im aktuellen Web kaum eine Rolle spielt, in einem Archiv jedoch h\u00f6chste Priorit\u00e4t hat, ergeben sich neue Anforderungen an Suchmaschinen. 
Es ist nicht mehr nur wichtig, eine m\u00f6glichst relevante Seite zu finden, sondern au\u00dferdem eine bestimmte Version einer Seite, die sich m\u00f6glicherweise in der Zwischenzeit ver\u00e4ndert hat oder gar nicht mehr verf\u00fcgbar ist. Zwei Suchmaschinen, die vor diesem Hintergrund als Prototypen entstanden sind, jedoch noch weiterentwickelt und verbessert werden, k\u00f6nnen unter\u00a0<a href=\"http:\/\/alexandria-project.eu\/archivesearch\">ArchiveSearch<\/a> sowie\u00a0<a href=\"http:\/\/tempas.l3s.de\/\">Tempas - Temporal Archive Search<\/a>\u00a0 bereits ausprobiert werden.<\/p>\n                                        <p class=\"translation-block\">Das Interesse an Web-Archiven nimmt auch in anderen Wissenschaftsdisziplinen zu. F&uuml;r Historiker, Politikwissenschaftler und andere, die fr&uuml;her weitestgehend mit analogen Daten gearbeitet haben, gewinnt das Web immer mehr an Bedeutung &ndash; und damit auch die archivierten Websites. Bei den riesigen Datenmengen ist es allerdings nicht mehr m&ouml;glich, alle Dokumente zu lesen. Also sind neue Datenverarbeitungsmethoden notwendig. Auch daran forscht das L3S und bietet mit ArchiveSpark eines der meistgenutzten Tools f&uuml;r den effizienten Zugriff auf &bdquo;historische&ldquo; Web-Kollektionen. Die Software entwickeln die Wissenschaftler am L3S gemeinsam mit dem&nbsp;<em>Internet Archive<\/em>, um auf m&ouml;glichst einfache Weise Datenanalysen jeglicher Art in Web-Archiven zu erm&ouml;glichen.<\/p>\n                                        <p class=\"translation-block\">Ein weiteres Projekt, das sich ebenfalls mit anderen gro&szlig;en Datenmengen besch&auml;ftigt, ist <a href=\"http:\/\/www.sobigdata.eu\" rel=\"nofollow noopener\" target=\"_blank\" class=\"customize-unpreviewable\">SoBigData<\/a>. 
Gemeinsam mit anderen Wissenschaftlern aus Italien, Gro&szlig;britannien, den Niederlanden, Estland, Finnland und der Schweiz entwickelt das L3S eine europ&auml;ische Forschungsinfrastruktur f&uuml;r Big Data. Dabei werden Datens&auml;tze aus unterschiedlichen Quellen sowie verschiedene Tools f&uuml;r die Arbeit mit diesen Daten in einer offenen Plattform integriert. Zus&auml;tzlich werden Leitf&auml;den sowohl f&uuml;r die praktische Arbeit mit den Daten als auch mit besonderem Fokus auf die rechtlichen und Datenschutz-relevanten Aspekte sowie umfassende Beispiele und Vorlagen &uuml;ber die SoBigData-Plattform geteilt. Auch die oben genannten Arbeiten zu Web-Archiven stellt das L3S anderen Wissenschaftlern aus ganz Europa auf diese Weise zur Verf&uuml;gung.<\/p>\n                                        <p>Die wachsende Rolle von Daten bzw. Big Data ist nicht nur in der Forschung, sondern insbesondere auch in Wirtschaft und Industrie sp&uuml;rbar. Das Forschungszentrum L3S bietet mit seinen Arbeiten aus den Projekten ALEXANDRIA und SoBigData dabei die optimale Grundlage f&uuml;r einen leichten Einstieg in dieses komplexe Themenfeld. Da das Web immer mehr zum prim&auml;ren Medium zum Teilen von Nachrichten, Informationen und Daten wird, wird auch die Bedeutung von Web-Archiven als Zeugen dieser Entwicklung weiter zunehmen und auch in Bereiche Einzug halten, wo dies heute noch gar nicht absehbar ist. Diesen Weg zu ebnen, ist das Ziel von ALEXANDRIA. 
Die SoBigData-Infrastruktur als zentraler Anlaufpunkt f&uuml;r alle Fragen rund um Big Data erm&ouml;glicht, die Forschungsergebnisse anderen zug&auml;nglich zu machen und gemeinsam in Europa Ans&auml;tze f&uuml;r die Arbeit mit diesen und anderen Daten zu erarbeiten.<\/p>\n                                      <\/div>\n                                    <\/div>\n                                  <\/div>\n                                <\/div>\n                              <\/div>\n                            <\/div>\n                          <\/div>\n                        <\/div>\n                      <\/div>\n                    <\/div>\n                  <\/div>\n                <\/div>\n              <\/div>\n            <\/div>\n          <\/div>\n        <\/div>\n      <\/div>\n    <\/div>\n  <\/div>\n  <div data-colibri-component=\"section\" data-colibri-id=\"7783-c20\" id=\"reusable-sections-2\" class=\"h-section h-section-global-spacing d-flex align-items-lg-center align-items-md-center align-items-center style-8264 style-local-7783-c20 position-relative\">\n    <!---->\n    <!---->\n    <div class=\"h-section-grid-container h-section-boxed-container\">\n      <!---->\n      <div data-colibri-id=\"7783-c21\" class=\"h-row-container gutters-row-lg-0 gutters-row-md-0 gutters-row-0 gutters-row-v-lg-0 gutters-row-v-md-0 gutters-row-v-0 style-8265 style-local-7783-c21 position-relative\">\n        <!---->\n        <div class=\"h-row justify-content-lg-center justify-content-md-center justify-content-center align-items-lg-stretch align-items-md-stretch align-items-stretch gutters-col-lg-0 gutters-col-md-0 gutters-col-0 gutters-col-v-lg-0 gutters-col-v-md-0 gutters-col-v-0\">\n          <!---->\n          <div class=\"h-column h-column-container d-flex h-col-lg-auto h-col-md-auto h-col-auto style-8266-outer style-local-7783-c22-outer\">\n            <div data-colibri-id=\"7783-c22\" class=\"d-flex h-flex-basis h-column__inner h-px-lg-0 h-px-md-0 h-px-0 
v-inner-lg-0 v-inner-md-0 v-inner-0 style-8266 style-local-7783-c22 position-relative\">\n              <!---->\n              <!---->\n              <div class=\"w-100 h-y-container h-column__content h-column__v-align flex-basis-100 align-self-lg-start align-self-md-start align-self-start\">\n                <!---->\n                <div data-colibri-id=\"7783-c23\" class=\"h-divider style-8267 style-local-7783-c23 position-relative h-element\">\n                  <!----><span class=\"h-divider__line style-8267-line style-local-7783-c23-line style-8267-line style-local-7783-c23-line\"><\/span><\/div>\n              <\/div>\n            <\/div>\n          <\/div>\n        <\/div>\n      <\/div>\n      <div data-colibri-id=\"7783-c24\" class=\"h-row-container gutters-row-lg-2 gutters-row-md-2 gutters-row-0 gutters-row-v-lg-2 gutters-row-v-md-2 gutters-row-v-2 style-8268 style-local-7783-c24 position-relative\">\n        <!---->\n        <div class=\"h-row justify-content-lg-center justify-content-md-center justify-content-center align-items-lg-stretch align-items-md-stretch align-items-stretch gutters-col-lg-2 gutters-col-md-2 gutters-col-0 gutters-col-v-lg-2 gutters-col-v-md-2 gutters-col-v-2\">\n          <!---->\n          <div class=\"h-column h-column-container d-flex h-col-lg-auto h-col-md-auto h-col-auto style-8269-outer style-local-7783-c25-outer\">\n            <div data-colibri-id=\"7783-c25\" class=\"d-flex h-flex-basis h-column__inner h-px-lg-2 h-px-md-2 h-px-2 v-inner-lg-2 v-inner-md-2 v-inner-2 style-8269 style-local-7783-c25 position-relative\">\n              <!---->\n              <!---->\n              <div class=\"w-100 h-y-container h-column__content h-column__v-align flex-basis-100 align-self-lg-start align-self-md-start align-self-start\">\n                <!---->\n                <div data-colibri-id=\"7783-c26\" class=\"h-global-transition-all h-heading style-8270 style-local-7783-c26 position-relative h-element\">\n                  
<!---->\n                  <div class=\"h-heading__outer style-8270 style-local-7783-c26\">\n                    <!---->\n                    <!---->\n                    <h6 class=\"\">Vorgestellte Projekte<\/h6>\n                  <\/div>\n                <\/div>\n                <div data-colibri-id=\"7783-c27\" class=\"d-block style-8272 style-local-7783-c27 position-relative h-element\">\n                  <!---->\n                  <div class=\"h-image__frame-container-outer\">\n                    <a href=\"http:\/\/alexandria-project.eu\/\" h-use-smooth-scroll=\"true\" class=\"image-link\">\n                      <div class=\"h-image__frame-container\">\n                        <!---->\n                        <!---->\n                        <img decoding=\"async\" width=\"237\" height=\"198\" data-src=\"https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/09\/cropped-alexandria_header_v4_cr.jpeg\" class=\"wp-image-7790 style-8272-image style-local-7783-c27-image lazyload\" alt=\"\" data-srcset=\"https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/09\/cropped-alexandria_header_v4_cr.jpeg 237w, https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/09\/cropped-alexandria_header_v4_cr-14x12.jpeg 14w\" data-sizes=\"(max-width: 237px) 100vw, 237px\" src=\"data:image\/svg+xml;base64,PHN2ZyB3aWR0aD0iMSIgaGVpZ2h0PSIxIiB4bWxucz0iaHR0cDovL3d3dy53My5vcmcvMjAwMC9zdmciPjwvc3ZnPg==\" style=\"--smush-placeholder-width: 237px; --smush-placeholder-aspect-ratio: 237\/198;\" \/>\n                        <div class=\"h-image__frame h-hide-lg h-hide-md h-hide-sm style-8272-frameImage style-local-7783-c27-frameImage\"><\/div>\n                      <\/div>\n                    <\/a>\n                  <\/div>\n                <\/div>\n                <div data-colibri-id=\"7783-c28\" class=\"d-block style-8271 style-local-7783-c28 position-relative h-element\">\n                  <!---->\n                  <div class=\"h-image__frame-container-outer\">\n                    <a 
href=\"http:\/\/www.sobigdata.eu\" h-use-smooth-scroll=\"true\" class=\"image-link\">\n                      <div class=\"h-image__frame-container\">\n                        <!---->\n                        <!---->\n                        <img decoding=\"async\" width=\"501\" height=\"227\" data-src=\"https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/09\/logo-SoBigData-DEFINITIVO_small_0.png\" class=\"wp-image-7788 style-8271-image style-local-7783-c28-image lazyload\" alt=\"\" data-srcset=\"https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/09\/logo-SoBigData-DEFINITIVO_small_0.png 501w, https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/09\/logo-SoBigData-DEFINITIVO_small_0-300x136.png 300w, https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/09\/logo-SoBigData-DEFINITIVO_small_0-18x8.png 18w\" data-sizes=\"(max-width: 501px) 100vw, 501px\" src=\"data:image\/svg+xml;base64,PHN2ZyB3aWR0aD0iMSIgaGVpZ2h0PSIxIiB4bWxucz0iaHR0cDovL3d3dy53My5vcmcvMjAwMC9zdmciPjwvc3ZnPg==\" style=\"--smush-placeholder-width: 501px; --smush-placeholder-aspect-ratio: 501\/227;\" \/>\n                        <div class=\"h-image__frame h-hide-lg h-hide-md h-hide-sm style-8271-frameImage style-local-7783-c28-frameImage\"><\/div>\n                      <\/div>\n                    <\/a>\n                  <\/div>\n                <\/div>\n              <\/div>\n            <\/div>\n          <\/div>\n          <div class=\"h-column h-column-container d-flex h-col-lg-auto h-col-md-auto h-col-auto style-8273-outer style-local-7783-c29-outer\">\n            <div data-colibri-id=\"7783-c29\" class=\"d-flex h-flex-basis h-column__inner h-px-lg-2 h-px-md-2 h-px-2 v-inner-lg-2 v-inner-md-2 v-inner-2 style-8273 style-local-7783-c29 position-relative\">\n              <!---->\n              <!---->\n              <div class=\"w-100 h-y-container h-column__content h-column__v-align flex-basis-100 align-self-lg-start align-self-md-start align-self-start\">\n                <!---->\n                <div 
data-colibri-id=\"7783-c30\" class=\"h-global-transition-all h-heading style-8270 style-local-7783-c30 position-relative h-element\">\n                  <!---->\n                  <div class=\"h-heading__outer style-8270 style-local-7783-c30\">\n                    <!---->\n                    <!---->\n                    <h6 class=\"\">Kontakt<\/h6>\n                  <\/div>\n                <\/div>\n                <div data-colibri-id=\"7783-c31\" class=\"h-row-container gutters-row-lg-2 gutters-row-md-2 gutters-row-0 gutters-row-v-lg-2 gutters-row-v-md-2 gutters-row-v-2 style-8274 style-local-7783-c31 position-relative\">\n                  <!---->\n                  <div class=\"h-row justify-content-lg-center justify-content-md-center justify-content-center align-items-lg-stretch align-items-md-stretch align-items-stretch gutters-col-lg-2 gutters-col-md-2 gutters-col-0 gutters-col-v-lg-2 gutters-col-v-md-2 gutters-col-v-2\">\n                    <!---->\n                    <div class=\"h-column h-column-container d-flex h-col-lg-auto h-col-md-auto h-col-auto style-8275-outer style-local-7783-c32-outer\">\n                      <div data-colibri-id=\"7783-c32\" class=\"d-flex h-flex-basis h-column__inner h-px-lg-2 h-px-md-2 h-px-2 v-inner-lg-2 v-inner-md-2 v-inner-2 style-8275 style-local-7783-c32 position-relative\">\n                        <!---->\n                        <!---->\n                        <div class=\"w-100 h-y-container h-column__content h-column__v-align flex-basis-100 align-self-lg-start align-self-md-start align-self-start\">\n                          <!---->\n                          <div data-colibri-id=\"7783-c33\" class=\"d-block style-8276 style-local-7783-c33 position-relative h-element\">\n                            <!---->\n                            <div class=\"h-image__frame-container-outer\">\n                              <div class=\"h-image__frame-container\">\n                                <!---->\n                
                <!---->\n                                <img decoding=\"async\" width=\"1024\" height=\"1024\" data-src=\"https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/08\/Anand-Avishek-3.jpg\" class=\"wp-image-4203 style-8276-image style-local-7783-c33-image lazyload\" alt=\"\" data-srcset=\"https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/08\/Anand-Avishek-3.jpg 1024w, https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/08\/Anand-Avishek-3-300x300.jpg 300w, https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/08\/Anand-Avishek-3-150x150.jpg 150w, https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/08\/Anand-Avishek-3-768x768.jpg 768w, https:\/\/www.l3s.de\/wp-content\/uploads\/2022\/08\/Anand-Avishek-3-12x12.jpg 12w\" data-sizes=\"(max-width: 1024px) 100vw, 1024px\" src=\"data:image\/svg+xml;base64,PHN2ZyB3aWR0aD0iMSIgaGVpZ2h0PSIxIiB4bWxucz0iaHR0cDovL3d3dy53My5vcmcvMjAwMC9zdmciPjwvc3ZnPg==\" style=\"--smush-placeholder-width: 1024px; --smush-placeholder-aspect-ratio: 1024\/1024;\" \/>\n                                <div class=\"h-image__frame h-hide-lg h-hide-md h-hide-sm style-8276-frameImage style-local-7783-c33-frameImage\"><\/div>\n                              <\/div>\n                            <\/div>\n                          <\/div>\n                          <div data-colibri-id=\"7783-c34\" class=\"h-row-container gutters-row-lg-0 gutters-row-md-0 gutters-row-0 gutters-row-v-lg-0 gutters-row-v-md-0 gutters-row-v-0 style-8277 style-local-7783-c34 position-relative\">\n                            <!---->\n                            <div class=\"h-row justify-content-lg-center justify-content-md-center justify-content-center align-items-lg-stretch align-items-md-stretch align-items-stretch gutters-col-lg-0 gutters-col-md-0 gutters-col-0 gutters-col-v-lg-0 gutters-col-v-md-0 gutters-col-v-0\">\n                              <!---->\n                              <div class=\"h-column h-column-container d-flex h-col-lg h-col-md h-col-auto style-8278-outer 
style-local-7783-c35-outer\">\n                                <div data-colibri-id=\"7783-c35\" class=\"d-flex h-flex-basis h-column__inner h-px-lg-0 h-px-md-0 h-px-0 v-inner-lg-0 v-inner-md-0 v-inner-0 style-8278 style-local-7783-c35 position-relative\">\n                                  <!---->\n                                  <!---->\n                                  <div class=\"w-100 h-y-container h-column__content h-column__v-align flex-basis-100 align-self-lg-start align-self-md-start align-self-start\">\n                                    <!---->\n                                    <div data-colibri-id=\"7783-c36\" class=\"h-global-transition-all h-heading style-8279 style-local-7783-c36 position-relative h-element\">\n                                      <!---->\n                                      <div class=\"h-heading__outer style-8279 style-local-7783-c36\">\n                                        <!---->\n                                        <!---->\n                                        <h4 class=\"\">Prof. Dr. 
Avishek Anand<\/h4>\n                                      <\/div>\n                                    <\/div>\n                                    <div data-colibri-id=\"7783-c37\" class=\"h-x-container style-8280 style-local-7783-c37 position-relative h-element\">\n                                      <!---->\n                                      <div class=\"h-x-container-inner style-dynamic-7783-c37-group style-8280-spacing style-local-7783-c37-spacing\"><span class=\"h-link__outer style-8281-outer style-local-7783-c38-outer d-inline-flex h-element\"><a h-use-smooth-scroll=\"true\" href=\"mailto:anand@l3s.de\"  data-colibri-id=\"7783-c38\" class=\"d-flex w-100 align-items-center h-link style-8281 style-local-7783-c38 position-relative\"><!----><!----> <span>anand@l3s.de<\/span><\/a>\n                                        <\/span>\n                                      <\/div>\n                                    <\/div>\n                                  <\/div>\n                                <\/div>\n                              <\/div>\n                            <\/div>\n                          <\/div>\n                          <div data-colibri-id=\"7783-c39\" class=\"h-text h-text-component style-8282 style-local-7783-c39 position-relative h-element\">\n                            <!---->\n                            <!---->\n                            <div class=\"\">\n                              <p>Avishek Anand leitet am L3S die Projekte ALEXANDRIA und SoBigData.<\/p>\n                            <\/div>\n                          <\/div>\n                        <\/div>\n                      <\/div>\n                    <\/div>\n                  <\/div>\n                <\/div>\n              <\/div>\n            <\/div>\n          <\/div>\n        <\/div>\n      <\/div>\n    <\/div>\n  <\/div>\n<\/div>","protected":false},"excerpt":{"rendered":"<p>Foto: \u00a9senoldo &#8211; Fotolia.com Issue: 02\/2018 Maschinelles Lernen Web archives 
allow a look into the past Big Data and the Lost Web The Internet doesn&#8217;t forget. Nevertheless many contents are untraceable at first attempt &#8211; old web pages for example. There are organizations that keep and make available old pages for posterity, especially the&nbsp;Internet Archive&nbsp;in [&hellip;]<\/p>","protected":false},"author":7,"featured_media":7784,"parent":2750,"menu_order":0,"comment_status":"closed","ping_status":"closed","template":"page-templates\/full-width-page.php","meta":{"_acf_changed":false,"footnotes":""},"categories":[],"tags":[28,90],"class_list":["post-7783","page","type-page","status-publish","has-post-thumbnail","hentry","tag-binaire","tag-binaire-2018-02"],"acf":[],"aioseo_notices":[],"publishpress_future_action":{"enabled":false,"date":"2026-05-27 02:06:02","action":"category","newStatus":"draft","terms":[75],"taxonomy":"category","extraData":[]},"publishpress_future_workflow_manual_trigger":{"enabledWorkflows":[]},"_links":{"self":[{"href":"https:\/\/www.l3s.de\/de\/wp-json\/wp\/v2\/pages\/7783","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.l3s.de\/de\/wp-json\/wp\/v2\/pages"}],"about":[{"href":"https:\/\/www.l3s.de\/de\/wp-json\/wp\/v2\/types\/page"}],"author":[{"embeddable":true,"href":"https:\/\/www.l3s.de\/de\/wp-json\/wp\/v2\/users\/7"}],"replies":[{"embeddable":true,"href":"https:\/\/www.l3s.de\/de\/wp-json\/wp\/v2\/comments?post=7783"}],"version-history":[{"count":0,"href":"https:\/\/www.l3s.de\/de\/wp-json\/wp\/v2\/pages\/7783\/revisions"}],"up":[{"embeddable":true,"href":"https:\/\/www.l3s.de\/de\/wp-json\/wp\/v2\/pages\/2750"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/www.l3s.de\/de\/wp-json\/wp\/v2\/media\/7784"}],"wp:attachment":[{"href":"https:\/\/www.l3s.de\/de\/wp-json\/wp\/v2\/media?parent=7783"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.l3s.de\/de\/wp-json\/wp\/v2\/categories?post=7783"},{"taxonomy":"post_tag","embeddable":true,"href
":"https:\/\/www.l3s.de\/de\/wp-json\/wp\/v2\/tags?post=7783"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}