diff --git a/404.html b/404.html index 699805b..1f05659 100644 --- a/404.html +++ b/404.html @@ -1,6 +1,6 @@ - +
@@ -793,25 +793,25 @@- © 2023. + © 2024.
diff --git a/categories/index.html b/categories/index.html index 5b43910..3ea18b4 100644 --- a/categories/index.html +++ b/categories/index.html @@ -1,6 +1,6 @@ - + @@ -860,7 +860,7 @@- © 2023. + © 2024.
diff --git a/event/index.html b/event/index.html index f4f7c14..0000025 100644 --- a/event/index.html +++ b/event/index.html @@ -1,6 +1,6 @@ - + @@ -1107,7 +1107,7 @@- © 2023. + © 2024.
diff --git a/index.html b/index.html index 7e9778e..0aed88e 100644 --- a/index.html +++ b/index.html @@ -1,6 +1,6 @@ - + @@ -346,7 +346,7 @@ - + @@ -1210,6 +1210,7 @@@@ -2039,13 +2034,19 @@
@@ -2112,7 +2109,7 @@
@@ -2189,7 +2190,7 @@
@@ -2270,7 +2277,7 @@
- © 2023. + © 2024.
diff --git a/index.json b/index.json index d5027a0..e102698 100644 --- a/index.json +++ b/index.json @@ -24,4 +24,10 @@ - [{"authors":null,"categories":null,"content":"I am a Fixed-term Researcher at the Department of Engineering “Enzo Ferrari”, where I am also part of Database Group (DBGroup).\nMy research interests lie in the area of data integration and big data management.\n","date":-62135596800,"expirydate":-62135596800,"kind":"term","lang":"en","lastmod":-62135596800,"objectID":"2525497d367e79493fd32b198b28f040","permalink":"","publishdate":"0001-01-01T00:00:00Z","relpermalink":"","section":"authors","summary":"I am a Fixed-term Researcher at the Department of Engineering “Enzo Ferrari”, where I am also part of Database Group (DBGroup).\nMy research interests lie in the area of data integration and big data management.","tags":null,"title":"Luca Gagliardelli","type":"authors"},{"authors":["Luca Gagliardelli","Luca Zecchini","Luca Ferretti","Domenico Beneventano","Giovanni Simonini","Sonia Bergamaschi","Mirko Orsini","Luca Magnotta","Emma Mescoli","Andrea Livaldi"," others"],"categories":[],"content":"","date":1672531200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1673862669,"objectID":"74a78c2a85bf951f8df0f0afabad4ec8","permalink":"http://www.lucagagliardelli.com/publication/gagliardelli-2023-big/","publishdate":"2023-01-16T09:51:08.647626Z","relpermalink":"/publication/gagliardelli-2023-big/","section":"publication","summary":"","tags":[],"title":"A big data platform exploiting auditable tokenization to promote good practices inside local energy communities","type":"publication"},{"authors":["Luca Gagliardelli","George Papadakis","Giovanni Simonini","Sonia Bergamaschi","Themis Palpanas"],"categories":[],"content":"","date":1672531200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1697440584,"objectID":"df54129f998567c74c30caa3846d7552","permalink":"http://www.lucagagliardelli.com/publication/dblp-confsebd-gagliardelli-0-sb-23/","publishdate":"2023-10-16T07:16:24.365699Z","relpermalink":"/publication/dblp-confsebd-gagliardelli-0-sb-23/","section":"publication","summary":"","tags":[],"title":"A general approach to Supervised Meta-Blocking","type":"publication"},{"authors":["Adeel Aslam","Giovanni Simonini","Luca Gagliardelli","Angelo Mozzillo","Sonia Bergamaschi"],"categories":[],"content":"","date":1672531200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1697440584,"objectID":"f31fe105153840832000d431e10f332d","permalink":"http://www.lucagagliardelli.com/publication/dblp-confdawak-aslam-sgmb-23/","publishdate":"2023-10-16T07:16:23.708311Z","relpermalink":"/publication/dblp-confdawak-aslam-sgmb-23/","section":"publication","summary":"","tags":[],"title":"HKS: Efficient Data Partitioning for Stateful Streaming","type":"publication"},{"authors":["Domenico Beneventano","Sonia Bergamaschi","Luca Gagliardelli","Francesco Guerra","Maurizio Vincini"],"categories":[],"content":"","date":1672531200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1697440644,"objectID":"5dacb18107011ec2806cc6a3d5c207c3","permalink":"http://www.lucagagliardelli.com/publication/basidati-2023/","publishdate":"2023-10-16T07:17:23.714477Z","relpermalink":"/publication/basidati-2023/","section":"publication","summary":"","tags":[],"title":"Progetto di Basi di Dati Relazionali","type":"publication"},{"authors":[],"categories":null,"content":"","date":1662616080,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1662616080,"objectID":"eb7ca127e6bed0c9c6039765ab83f13c","permalink":"http://www.lucagagliardelli.com/talk/generalized-supervised-meta-blocking-@-vldb-2022/","publishdate":"2022-09-08T05:48:00Z","relpermalink":"/talk/generalized-supervised-meta-blocking-@-vldb-2022/","section":"event","summary":"Presentation of \"Generalized Supervised Meta-blocking\" paper at VLDB 2022.","tags":[],"title":"Generalized Supervised Meta-blocking @ VLDB 2022","type":"event"},{"authors":[],"categories":null,"content":"","date":1648554900,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1648554900,"objectID":"a422385dbc14dbdb0b083e0f31466b0a","permalink":"http://www.lucagagliardelli.com/talk/ecdp-@-dataplat-2022/","publishdate":"2022-03-29T11:55:00Z","relpermalink":"/talk/ecdp-@-dataplat-2022/","section":"event","summary":"Presentation of \"ECDP: A Big Data Platform for the Smart Monitoring of Local Energy Communities\" paper at DataPlat 2022.","tags":[],"title":"ECDP @ DataPlat 2022","type":"event"},{"authors":["Luca Gagliardelli","Luca Zecchini","Domenico Beneventano","Giovanni Simonini","Sonia Bergamaschi","Mirko Orsini","Luca Magnotta","Emma Mescoli","Andrea Livaldi","Nicola Gessa","Piero De Sabbata","Gianluca D'Agosta","Fabrizio Paolucci"],"categories":[],"content":"","date":1640995200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769746,"objectID":"6d8d7f647e34d236c8541b09c493df25","permalink":"http://www.lucagagliardelli.com/publication/dblp-confedbt-gagliardelli-zbs-22/","publishdate":"2022-09-21T14:15:45.995014Z","relpermalink":"/publication/dblp-confedbt-gagliardelli-zbs-22/","section":"publication","summary":"","tags":[],"title":"ECDP: A Big Data Platform for the Smart Monitoring of Local Energy Communities","type":"publication"},{"authors":["Luca Gagliardelli","George Papadakis","Giovanni Simonini","Sonia Bergamaschi","Themis Palpanas"],"categories":[],"content":"","date":1640995200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769745,"objectID":"a11d0af9d9c8defec1527632e11e2c32","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalspvldb-gagliardelli-psb-22/","publishdate":"2022-09-21T14:15:45.498756Z","relpermalink":"/publication/dblp-journalspvldb-gagliardelli-psb-22/","section":"publication","summary":"","tags":[],"title":"Generalized Supervised Meta-blocking","type":"publication"},{"authors":["Luca Gagliardelli","George Papadakis","Giovanni Simonini","Sonia Bergamaschi","Themis Palpanas"],"categories":[],"content":"","date":1640995200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769747,"objectID":"d4594a1fb7a894c8e6dc7bda22f17787","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2204-08801/","publishdate":"2022-09-21T14:15:46.923621Z","relpermalink":"/publication/dblp-journalscorrabs-2204-08801/","section":"publication","summary":"","tags":[],"title":"Generalized Supervised Meta-blocking (technical report)","type":"publication"},{"authors":["Giovanni Simonini","Luca Gagliardelli","Michele Rinaldi","Luca Zecchini","Giulio De Sabbata","Adeel Aslam","Domenico Beneventano","Sonia Bergamaschi"],"categories":[],"content":"","date":1640995200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769746,"objectID":"b3732822915a3e6e494bdfb441b9d0c9","permalink":"http://www.lucagagliardelli.com/publication/dblp-confsebd-simonini-grzsabb-22/","publishdate":"2022-09-21T14:15:46.451318Z","relpermalink":"/publication/dblp-confsebd-simonini-grzsabb-22/","section":"publication","summary":"","tags":[],"title":"Progressive Entity Resolution with Node Embeddings","type":"publication"},{"authors":["Georgios M. Mandilaras","George Papadakis","Luca Gagliardelli","Giovanni Simonini","Emmanouil Thanos","George Giannakopoulos","Sonia Bergamaschi","Themis Palpanas","Manolis Koubarakis","Alicia Lara-Clares","Antonio Fariña"],"categories":[],"content":"","date":1609459200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769747,"objectID":"14e7bebd89f2f10b9e61609bae9aee89","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalsis-mandilaras-0-gstg-21/","publishdate":"2022-09-21T14:15:47.40018Z","relpermalink":"/publication/dblp-journalsis-mandilaras-0-gstg-21/","section":"publication","summary":"","tags":[],"title":"Reproducible experiments on Three-Dimensional Entity Resolution with JedAI","type":"publication"},{"authors":["Giovanni Simonini","Henrique Saccani","Luca Gagliardelli","Luca Zecchini","Domenico Beneventano","Sonia Bergamaschi"],"categories":[],"content":"","date":1609459200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769748,"objectID":"dd5d7bc65512cb261d5d8186f7955ca4","permalink":"http://www.lucagagliardelli.com/publication/dblp-confsebd-simonini-sgzbb-21/","publishdate":"2022-09-21T14:15:47.872122Z","relpermalink":"/publication/dblp-confsebd-simonini-sgzbb-21/","section":"publication","summary":"","tags":[],"title":"The Case for Multi-task Active Learning Entity Resolution (Discussion Paper)","type":"publication"},{"authors":["Domenico Beneventano","Sonia Bergamaschi","Luca Gagliardelli","Giovanni Simonini"],"categories":[],"content":"","date":1577836800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769749,"objectID":"91b01ed749421d01ea6d99e441eb86df","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalsjdiq-beneventano-bgs-20/","publishdate":"2022-09-21T14:15:48.78534Z","relpermalink":"/publication/dblp-journalsjdiq-beneventano-bgs-20/","section":"publication","summary":"","tags":[],"title":"emphBLAST2: An Efficient Technique for Loose Schema Information Extraction from Heterogeneous Big Data Sources","type":"publication"},{"authors":["Luca Gagliardelli","Giovanni Simonini","Sonia Bergamaschi"],"categories":[],"content":"","date":1577836800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769749,"objectID":"faa5c3fedf4f6ecf90d47a44fea52d4f","permalink":"http://www.lucagagliardelli.com/publication/dblp-confedbt-gagliardelli-sb-20/","publishdate":"2022-09-21T14:15:49.24102Z","relpermalink":"/publication/dblp-confedbt-gagliardelli-sb-20/","section":"publication","summary":"","tags":[],"title":"RulER: Scaling Up Record-level Matching Rules","type":"publication"},{"authors":["Luca Gagliardelli","Giovanni Simonini","Sonia Bergamaschi"],"categories":[],"content":"","date":1577836800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769750,"objectID":"a9adad9042ae4ac84d945a977cc59d9c","permalink":"http://www.lucagagliardelli.com/publication/dblp-confsebd-gagliardelli-sb-20/","publishdate":"2022-09-21T14:15:49.696323Z","relpermalink":"/publication/dblp-confsebd-gagliardelli-sb-20/","section":"publication","summary":"","tags":[],"title":"Scaling Up Record-level Matching Rules","type":"publication"},{"authors":["George Papadakis","Georgios M. Mandilaras","Luca Gagliardelli","Giovanni Simonini","Emmanouil Thanos","George Giannakopoulos","Sonia Bergamaschi","Themis Palpanas","Manolis Koubarakis"],"categories":[],"content":"","date":1577836800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769748,"objectID":"4cecfd89473b4a1fd03d3f4c03c533bc","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalsis-papadakis-mgstgb-20/","publishdate":"2022-09-21T14:15:48.318098Z","relpermalink":"/publication/dblp-journalsis-papadakis-mgstgb-20/","section":"publication","summary":"","tags":[],"title":"Three-dimensional Entity Resolution with JedAI","type":"publication"},{"authors":["Domenico Beneventano","Sonia Bergamaschi","Luca Gagliardelli","Giovanni Simonini"],"categories":[],"content":"","date":1546300800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769751,"objectID":"663cad9ba94e5874abc491955823013d","permalink":"http://www.lucagagliardelli.com/publication/dblp-confsebd-beneventano-bgs-19/","publishdate":"2022-09-21T14:15:51.075065Z","relpermalink":"/publication/dblp-confsebd-beneventano-bgs-19/","section":"publication","summary":"","tags":[],"title":"Entity Resolution and Data Fusion: An Integrated Approach","type":"publication"},{"authors":["Giovanni Simonini","Luca Gagliardelli","Sonia Bergamaschi","H. V. Jagadish"],"categories":[],"content":"","date":1546300800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769750,"objectID":"594e4e4d2e00aefe0b6e2a015bbee534","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalsis-simonini-gbj-19/","publishdate":"2022-09-21T14:15:50.160845Z","relpermalink":"/publication/dblp-journalsis-simonini-gbj-19/","section":"publication","summary":"","tags":[],"title":"Scaling entity resolution: A loosely schema-aware approach","type":"publication"},{"authors":["Luca Gagliardelli","Giovanni Simonini","Domenico Beneventano","Sonia Bergamaschi"],"categories":[],"content":"","date":1546300800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769751,"objectID":"84af9d2f803041d4ab63e0710db49a02","permalink":"http://www.lucagagliardelli.com/publication/dblp-confedbt-gagliardelli-sbb-19/","publishdate":"2022-09-21T14:15:50.620075Z","relpermalink":"/publication/dblp-confedbt-gagliardelli-sbb-19/","section":"publication","summary":"","tags":[],"title":"SparkER: Scaling Entity Resolution in Spark","type":"publication"},{"authors":["Giovanni Simonini","Luca Gagliardelli","Song Zhu","Sonia Bergamaschi"],"categories":[],"content":"","date":1514764800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769752,"objectID":"89d41483c731af7210fd57921c53c99d","permalink":"http://www.lucagagliardelli.com/publication/dblp-confieeehpcs-simonini-gzb-18/","publishdate":"2022-09-21T14:15:51.977706Z","relpermalink":"/publication/dblp-confieeehpcs-simonini-gzb-18/","section":"publication","summary":"","tags":[],"title":"Enhancing Loosely Schema-aware Entity Resolution with User Interaction","type":"publication"},{"authors":["Sonia Bergamaschi","Domenico Beneventano","Federica Mandreoli","Riccardo Martoglia","Francesco Guerra","Mirko Orsini","Laura Po","Maurizio Vincini","Giovanni Simonini","Song Zhu","Luca Gagliardelli","Luca Magnotta"],"categories":[],"content":"","date":1514764800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1516544152,"objectID":"2b2ba43e8ff94ef1c8f095350ab32ce2","permalink":"http://www.lucagagliardelli.com/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/","publishdate":"2022-09-21T14:15:52.445257Z","relpermalink":"/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/","section":"publication","summary":"","tags":[],"title":"From Data Integration to Big Data Integration","type":"publication"},{"authors":["Song Zhu","Luca Gagliardelli","Giovanni Simonini","Domenico Beneventano"],"categories":[],"content":"","date":1514764800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769751,"objectID":"4141944fb5eb9e2113361dd018504c3c","permalink":"http://www.lucagagliardelli.com/publication/dblp-confieeehpcs-zhu-gsb-18/","publishdate":"2022-09-21T14:15:51.538207Z","relpermalink":"/publication/dblp-confieeehpcs-zhu-gsb-18/","section":"publication","summary":"","tags":[],"title":"How Improve Set Similarity Join Based on Prefix Approach in Distributed Environment","type":"publication"},{"authors":["Mirko Orsini","Enrico Calanchi","Luca Magnotta","Luca Gagliardelli","Monica Govi","Fabiano Mele","Rossella Tuplert"],"categories":[],"content":"","date":1483228800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769753,"objectID":"60229854d55ee13b1bbe5cbad9fb5a2c","permalink":"http://www.lucagagliardelli.com/publication/dblp-confrtsi-orsini-cmggmt-17/","publishdate":"2022-09-21T14:15:52.9118Z","relpermalink":"/publication/dblp-confrtsi-orsini-cmggmt-17/","section":"publication","summary":"","tags":[],"title":"The Italian FSHD registry: An enhanced data integration and analytics framework for smart health care","type":"publication"},{"authors":["Domenico Beneventano","Sonia Bergamaschi","Luca Gagliardelli","Laura Po"],"categories":[],"content":"","date":1420070400,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769754,"objectID":"43b678003b927b8481e2a7b9002c4b79","permalink":"http://www.lucagagliardelli.com/publication/dblp-confic-3-k-beneventano-bgp-15-a/","publishdate":"2022-09-21T14:15:53.824148Z","relpermalink":"/publication/dblp-confic-3-k-beneventano-bgp-15-a/","section":"publication","summary":"","tags":[],"title":"Driving Innovation in Youth Policies with Open Data","type":"publication"},{"authors":["Domenico Beneventano","Sonia Bergamaschi","Luca Gagliardelli","Laura Po"],"categories":[],"content":"","date":1420070400,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769753,"objectID":"5f88e4cf7d96cb8e986a648c40e0cea1","permalink":"http://www.lucagagliardelli.com/publication/dblp-confic-3-k-beneventano-bgp-15/","publishdate":"2022-09-21T14:15:53.366405Z","relpermalink":"/publication/dblp-confic-3-k-beneventano-bgp-15/","section":"publication","summary":"","tags":[],"title":"Open Data for Improving Youth Policies","type":"publication"}] \ No newline at end of file + + + + + + + [{"authors":null,"categories":null,"content":"I am a Fixed-term Researcher at the Department of Engineering “Enzo Ferrari”, where I am also part of Database Group (DBGroup).\nMy research interests lie in the area of data integration and big data management.\n","date":-62135596800,"expirydate":-62135596800,"kind":"term","lang":"en","lastmod":-62135596800,"objectID":"2525497d367e79493fd32b198b28f040","permalink":"","publishdate":"0001-01-01T00:00:00Z","relpermalink":"","section":"authors","summary":"I am a Fixed-term Researcher at the Department of Engineering “Enzo Ferrari”, where I am also part of Database Group (DBGroup).\nMy research interests lie in the area of data integration and big data management.","tags":null,"title":"Luca Gagliardelli","type":"authors"},{"authors":["Sania Aftar","Luca Gagliardelli","Amina El Ganadi","Federico Ruozzi","Sonia Bergamaschi"],"categories":[],"content":"","date":1704067200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1720443836,"objectID":"161e280fc960f63de0e4a8a86b009fa4","permalink":"http://www.lucagagliardelli.com/publication/dblp-confircdl-aftar-ggrb-24/","publishdate":"2024-07-08T13:03:55.105438Z","relpermalink":"/publication/dblp-confircdl-aftar-ggrb-24/","section":"publication","summary":"","tags":[],"title":"A Novel Methodology for Topic Identification in Hadith","type":"publication"},{"authors":["Luca Gagliardelli","George Papadakis","Giovanni Simonini","Sonia Bergamaschi","Themis Palpanas"],"categories":[],"content":"","date":1704067200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1720443831,"objectID":"4d72d3156a0e48ddcf9033829f89a31d","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalsis-gagliardelli-psbp-24/","publishdate":"2024-07-08T13:03:50.345787Z","relpermalink":"/publication/dblp-journalsis-gagliardelli-psbp-24/","section":"publication","summary":"","tags":[],"title":"GSM: A generalized approach to Supervised Meta-blocking for scalable entity resolution","type":"publication"},{"authors":["Adeel Aslam","Giovanni Simonini","Luca Gagliardelli","Luca Zecchini","Sonia Bergamaschi"],"categories":[],"content":"","date":1704067200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1720444115,"objectID":"83b711df4f4f97c290210c45414e0272","permalink":"http://www.lucagagliardelli.com/publication/aslam-2024102425/","publishdate":"2024-07-08T13:08:33.787446Z","relpermalink":"/publication/aslam-2024102425/","section":"publication","summary":"Inequality join is an operator to join data on inequality conditions and it is a fundamental building block for applications. While methods and optimizations exist for efficient inequality join in batch processing, little attention has been given to its streaming version, particularly to large-scale data-intensive applications that run on Distributed Stream Processing Systems (DSPSs). Designing an inequality join in streaming and distributed settings is not an easy task: (i) indexes have to be employed to efficiently support inequality-based comparisons, but the continuous stream of data imposes continuous insertions, updates, and deletions of elements in the indexes—hence a huge overhead for the DSPSs; (ii) oftentimes real data is skewed, which makes indexing even more challenging. To address these challenges, we propose the Stream-Aware inequality join (STA), an indexing method that can reduce redundancy and index update overhead. STA builds a separate in-memory index structure for hotkeys, i.e., the most frequently used keys, which are automatically identified with an efficient data sketch. On the other hand, the cold keys are treated using a linked set of index structures. In this way, STA avoids many superfluous index updates for frequent items. Finally, we implement four state-of-the-art inequality join solutions for a widely employed DSPS (Apache Storm) and compare their performance with STA on four real-world data sets and a synthetic one. The results of our experimental evaluation reveal that our stream-aware approach outperforms existing solutions.","tags":["Distributed stream processing system","Inequality join","Btree indexing","Augmented sketch","Skewed data distribution"],"title":"Stream-aware indexing for distributed inequality join processing","type":"publication"},{"authors":["Luca Gagliardelli","Luca Zecchini","Luca Ferretti","Domenico Beneventano","Giovanni Simonini","Sonia Bergamaschi","Mirko Orsini","Luca Magnotta","Emma Mescoli","Andrea Livaldi"," others"],"categories":[],"content":"","date":1672531200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1673862669,"objectID":"74a78c2a85bf951f8df0f0afabad4ec8","permalink":"http://www.lucagagliardelli.com/publication/gagliardelli-2023-big/","publishdate":"2023-01-16T09:51:08.647626Z","relpermalink":"/publication/gagliardelli-2023-big/","section":"publication","summary":"","tags":[],"title":"A big data platform exploiting auditable tokenization to promote good practices inside local energy communities","type":"publication"},{"authors":["Sonia Bergamaschi","Luca Gagliardelli"],"categories":[],"content":"","date":1672531200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1720443829,"objectID":"0af0cec5560dfcfd0c36f5ad027bb184","permalink":"http://www.lucagagliardelli.com/publication/dblp-confbigdataconf-bergamaschi-g-23/","publishdate":"2024-07-08T13:03:46.229438Z","relpermalink":"/publication/dblp-confbigdataconf-bergamaschi-g-23/","section":"publication","summary":"","tags":[],"title":"A Big Data Platform for the Management of Local Energy Communities Data","type":"publication"},{"authors":["Luca Gagliardelli","George Papadakis","Giovanni Simonini","Sonia Bergamaschi","Themis Palpanas"],"categories":[],"content":"","date":1672531200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1697440584,"objectID":"df54129f998567c74c30caa3846d7552","permalink":"http://www.lucagagliardelli.com/publication/dblp-confsebd-gagliardelli-0-sb-23/","publishdate":"2023-10-16T07:16:24.365699Z","relpermalink":"/publication/dblp-confsebd-gagliardelli-0-sb-23/","section":"publication","summary":"","tags":[],"title":"A general approach to Supervised Meta-Blocking","type":"publication"},{"authors":["Luca Gagliardelli","Domenico Beneventano","Marco Esposito","Luca Zecchini","Giovanni Simonini","Sonia Bergamaschi","Fabio Miselli","Giuseppe Calogero Miano"],"categories":[],"content":"","date":1672531200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1720443834,"objectID":"6c970af3685110c8f12c9770538ee585","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-12902/","publishdate":"2024-07-08T13:03:53.519177Z","relpermalink":"/publication/dblp-journalscorrabs-2312-12902/","section":"publication","summary":"","tags":[],"title":"DXP: Billing Data Preparation for Big Data Analytics","type":"publication"},{"authors":["Angelo Mozzillo","Luca Zecchini","Luca Gagliardelli","Adeel Aslam","Sonia Bergamaschi","Giovanni Simonini"],"categories":[],"content":"","date":1672531200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1720443833,"objectID":"e85f9649ae6ab7de64eff19b56e3dc88","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-11122/","publishdate":"2024-07-08T13:03:52.038307Z","relpermalink":"/publication/dblp-journalscorrabs-2312-11122/","section":"publication","summary":"","tags":[],"title":"Evaluation of Dataframe Libraries for Data Preparation on a Single Machine","type":"publication"},{"authors":["Adeel Aslam","Giovanni Simonini","Luca Gagliardelli","Angelo Mozzillo","Sonia Bergamaschi"],"categories":[],"content":"","date":1672531200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1697440584,"objectID":"f31fe105153840832000d431e10f332d","permalink":"http://www.lucagagliardelli.com/publication/dblp-confdawak-aslam-sgmb-23/","publishdate":"2023-10-16T07:16:23.708311Z","relpermalink":"/publication/dblp-confdawak-aslam-sgmb-23/","section":"publication","summary":"","tags":[],"title":"HKS: Efficient Data Partitioning for Stateful Streaming","type":"publication"},{"authors":["Domenico Beneventano","Sonia Bergamaschi","Luca Gagliardelli","Francesco Guerra","Maurizio Vincini"],"categories":[],"content":"","date":1672531200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1697440644,"objectID":"5dacb18107011ec2806cc6a3d5c207c3","permalink":"http://www.lucagagliardelli.com/publication/basidati-2023/","publishdate":"2023-10-16T07:17:23.714477Z","relpermalink":"/publication/basidati-2023/","section":"publication","summary":"","tags":[],"title":"Progetto di Basi di Dati Relazionali","type":"publication"},{"authors":[],"categories":null,"content":"","date":1662616080,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1662616080,"objectID":"eb7ca127e6bed0c9c6039765ab83f13c","permalink":"http://www.lucagagliardelli.com/talk/generalized-supervised-meta-blocking-@-vldb-2022/","publishdate":"2022-09-08T05:48:00Z","relpermalink":"/talk/generalized-supervised-meta-blocking-@-vldb-2022/","section":"event","summary":"Presentation of \"Generalized Supervised Meta-blocking\" paper at VLDB 2022.","tags":[],"title":"Generalized Supervised Meta-blocking @ VLDB 2022","type":"event"},{"authors":[],"categories":null,"content":"","date":1648554900,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1648554900,"objectID":"a422385dbc14dbdb0b083e0f31466b0a","permalink":"http://www.lucagagliardelli.com/talk/ecdp-@-dataplat-2022/","publishdate":"2022-03-29T11:55:00Z","relpermalink":"/talk/ecdp-@-dataplat-2022/","section":"event","summary":"Presentation of \"ECDP: A Big Data Platform for the Smart Monitoring of Local Energy Communities\" paper at DataPlat 2022.","tags":[],"title":"ECDP @ DataPlat 2022","type":"event"},{"authors":["Luca Gagliardelli","Luca Zecchini","Domenico Beneventano","Giovanni Simonini","Sonia Bergamaschi","Mirko Orsini","Luca Magnotta","Emma Mescoli","Andrea Livaldi","Nicola Gessa","Piero De Sabbata","Gianluca D'Agosta","Fabrizio Paolucci"],"categories":[],"content":"","date":1640995200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769746,"objectID":"6d8d7f647e34d236c8541b09c493df25","permalink":"http://www.lucagagliardelli.com/publication/dblp-confedbt-gagliardelli-zbs-22/","publishdate":"2022-09-21T14:15:45.995014Z","relpermalink":"/publication/dblp-confedbt-gagliardelli-zbs-22/","section":"publication","summary":"","tags":[],"title":"ECDP: A Big Data Platform for the Smart Monitoring of Local Energy Communities","type":"publication"},{"authors":["Luca Gagliardelli","George Papadakis","Giovanni Simonini","Sonia Bergamaschi","Themis Palpanas"],"categories":[],"content":"","date":1640995200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769745,"objectID":"a11d0af9d9c8defec1527632e11e2c32","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalspvldb-gagliardelli-psb-22/","publishdate":"2022-09-21T14:15:45.498756Z","relpermalink":"/publication/dblp-journalspvldb-gagliardelli-psb-22/","section":"publication","summary":"","tags":[],"title":"Generalized Supervised Meta-blocking","type":"publication"},{"authors":["Luca Gagliardelli","George Papadakis","Giovanni Simonini","Sonia Bergamaschi","Themis Palpanas"],"categories":[],"content":"","date":1640995200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769747,"objectID":"d4594a1fb7a894c8e6dc7bda22f17787","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2204-08801/","publishdate":"2022-09-21T14:15:46.923621Z","relpermalink":"/publication/dblp-journalscorrabs-2204-08801/","section":"publication","summary":"","tags":[],"title":"Generalized Supervised Meta-blocking (technical report)","type":"publication"},{"authors":["Giovanni Simonini","Luca Gagliardelli","Michele Rinaldi","Luca Zecchini","Giulio De Sabbata","Adeel Aslam","Domenico Beneventano","Sonia Bergamaschi"],"categories":[],"content":"","date":1640995200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769746,"objectID":"b3732822915a3e6e494bdfb441b9d0c9","permalink":"http://www.lucagagliardelli.com/publication/dblp-confsebd-simonini-grzsabb-22/","publishdate":"2022-09-21T14:15:46.451318Z","relpermalink":"/publication/dblp-confsebd-simonini-grzsabb-22/","section":"publication","summary":"","tags":[],"title":"Progressive Entity Resolution with Node Embeddings","type":"publication"},{"authors":["Georgios M. Mandilaras","George Papadakis","Luca Gagliardelli","Giovanni Simonini","Emmanouil Thanos","George Giannakopoulos","Sonia Bergamaschi","Themis Palpanas","Manolis Koubarakis","Alicia Lara-Clares","Antonio Fariña"],"categories":[],"content":"","date":1609459200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769747,"objectID":"14e7bebd89f2f10b9e61609bae9aee89","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalsis-mandilaras-0-gstg-21/","publishdate":"2022-09-21T14:15:47.40018Z","relpermalink":"/publication/dblp-journalsis-mandilaras-0-gstg-21/","section":"publication","summary":"","tags":[],"title":"Reproducible experiments on Three-Dimensional Entity Resolution with JedAI","type":"publication"},{"authors":["Giovanni Simonini","Henrique Saccani","Luca Gagliardelli","Luca Zecchini","Domenico Beneventano","Sonia Bergamaschi"],"categories":[],"content":"","date":1609459200,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769748,"objectID":"dd5d7bc65512cb261d5d8186f7955ca4","permalink":"http://www.lucagagliardelli.com/publication/dblp-confsebd-simonini-sgzbb-21/","publishdate":"2022-09-21T14:15:47.872122Z","relpermalink":"/publication/dblp-confsebd-simonini-sgzbb-21/","section":"publication","summary":"","tags":[],"title":"The Case for Multi-task Active Learning Entity Resolution (Discussion Paper)","type":"publication"},{"authors":["Domenico Beneventano","Sonia Bergamaschi","Luca Gagliardelli","Giovanni Simonini"],"categories":[],"content":"","date":1577836800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769749,"objectID":"91b01ed749421d01ea6d99e441eb86df","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalsjdiq-beneventano-bgs-20/","publishdate":"2022-09-21T14:15:48.78534Z","relpermalink":"/publication/dblp-journalsjdiq-beneventano-bgs-20/","section":"publication","summary":"","tags":[],"title":"emphBLAST2: An Efficient Technique for Loose Schema Information Extraction from Heterogeneous Big Data Sources","type":"publication"},{"authors":["Luca Gagliardelli","Giovanni Simonini","Sonia Bergamaschi"],"categories":[],"content":"","date":1577836800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769749,"objectID":"faa5c3fedf4f6ecf90d47a44fea52d4f","permalink":"http://www.lucagagliardelli.com/publication/dblp-confedbt-gagliardelli-sb-20/","publishdate":"2022-09-21T14:15:49.24102Z","relpermalink":"/publication/dblp-confedbt-gagliardelli-sb-20/","section":"publication","summary":"","tags":[],"title":"RulER: Scaling Up Record-level Matching Rules","type":"publication"},{"authors":["Luca Gagliardelli","Giovanni Simonini","Sonia Bergamaschi"],"categories":[],"content":"","date":1577836800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769750,"objectID":"a9adad9042ae4ac84d945a977cc59d9c","permalink":"http://www.lucagagliardelli.com/publication/dblp-confsebd-gagliardelli-sb-20/","publishdate":"2022-09-21T14:15:49.696323Z","relpermalink":"/publication/dblp-confsebd-gagliardelli-sb-20/","section":"publication","summary":"","tags":[],"title":"Scaling Up Record-level Matching Rules","type":"publication"},{"authors":["George Papadakis","Georgios M. Mandilaras","Luca Gagliardelli","Giovanni Simonini","Emmanouil Thanos","George Giannakopoulos","Sonia Bergamaschi","Themis Palpanas","Manolis Koubarakis"],"categories":[],"content":"","date":1577836800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769748,"objectID":"4cecfd89473b4a1fd03d3f4c03c533bc","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalsis-papadakis-mgstgb-20/","publishdate":"2022-09-21T14:15:48.318098Z","relpermalink":"/publication/dblp-journalsis-papadakis-mgstgb-20/","section":"publication","summary":"","tags":[],"title":"Three-dimensional Entity Resolution with JedAI","type":"publication"},{"authors":["Domenico Beneventano","Sonia Bergamaschi","Luca Gagliardelli","Giovanni Simonini"],"categories":[],"content":"","date":1546300800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769751,"objectID":"663cad9ba94e5874abc491955823013d","permalink":"http://www.lucagagliardelli.com/publication/dblp-confsebd-beneventano-bgs-19/","publishdate":"2022-09-21T14:15:51.075065Z","relpermalink":"/publication/dblp-confsebd-beneventano-bgs-19/","section":"publication","summary":"","tags":[],"title":"Entity Resolution and Data Fusion: An Integrated Approach","type":"publication"},{"authors":["Giovanni Simonini","Luca Gagliardelli","Sonia Bergamaschi","H. V. Jagadish"],"categories":[],"content":"","date":1546300800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769750,"objectID":"594e4e4d2e00aefe0b6e2a015bbee534","permalink":"http://www.lucagagliardelli.com/publication/dblp-journalsis-simonini-gbj-19/","publishdate":"2022-09-21T14:15:50.160845Z","relpermalink":"/publication/dblp-journalsis-simonini-gbj-19/","section":"publication","summary":"","tags":[],"title":"Scaling entity resolution: A loosely schema-aware approach","type":"publication"},{"authors":["Luca Gagliardelli","Giovanni Simonini","Domenico Beneventano","Sonia Bergamaschi"],"categories":[],"content":"","date":1546300800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769751,"objectID":"84af9d2f803041d4ab63e0710db49a02","permalink":"http://www.lucagagliardelli.com/publication/dblp-confedbt-gagliardelli-sbb-19/","publishdate":"2022-09-21T14:15:50.620075Z","relpermalink":"/publication/dblp-confedbt-gagliardelli-sbb-19/","section":"publication","summary":"","tags":[],"title":"SparkER: Scaling Entity Resolution in Spark","type":"publication"},{"authors":["Giovanni Simonini","Luca Gagliardelli","Song Zhu","Sonia Bergamaschi"],"categories":[],"content":"","date":1514764800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769752,"objectID":"89d41483c731af7210fd57921c53c99d","permalink":"http://www.lucagagliardelli.com/publication/dblp-confieeehpcs-simonini-gzb-18/","publishdate":"2022-09-21T14:15:51.977706Z","relpermalink":"/publication/dblp-confieeehpcs-simonini-gzb-18/","section":"publication","summary":"","tags":[],"title":"Enhancing Loosely Schema-aware Entity Resolution with User Interaction","type":"publication"},{"authors":["Sonia Bergamaschi","Domenico Beneventano","Federica Mandreoli","Riccardo Martoglia","Francesco Guerra","Mirko Orsini","Laura Po","Maurizio Vincini","Giovanni Simonini","Song Zhu","Luca Gagliardelli","Luca Magnotta"],"categories":[],"content":"","date":1514764800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1516544152,"objectID":"2b2ba43e8ff94ef1c8f095350ab32ce2","permalink":"http://www.lucagagliardelli.com/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/","publishdate":"2022-09-21T14:15:52.445257Z","relpermalink":"/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/","section":"publication","summary":"","tags":[],"title":"From Data Integration to Big Data Integration","type":"publication"},{"authors":["Song Zhu","Luca Gagliardelli","Giovanni Simonini","Domenico Beneventano"],"categories":[],"content":"","date":1514764800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769751,"objectID":"4141944fb5eb9e2113361dd018504c3c","permalink":"http://www.lucagagliardelli.com/publication/dblp-confieeehpcs-zhu-gsb-18/","publishdate":"2022-09-21T14:15:51.538207Z","relpermalink":"/publication/dblp-confieeehpcs-zhu-gsb-18/","section":"publication","summary":"","tags":[],"title":"How Improve Set Similarity Join Based on Prefix Approach in Distributed Environment","type":"publication"},{"authors":["Mirko Orsini","Enrico Calanchi","Luca Magnotta","Luca Gagliardelli","Monica Govi","Fabiano Mele","Rossella Tuplert"],"categories":[],"content":"","date":1483228800,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769753,"objectID":"60229854d55ee13b1bbe5cbad9fb5a2c","permalink":"http://www.lucagagliardelli.com/publication/dblp-confrtsi-orsini-cmggmt-17/","publishdate":"2022-09-21T14:15:52.9118Z","relpermalink":"/publication/dblp-confrtsi-orsini-cmggmt-17/","section":"publication","summary":"","tags":[],"title":"The Italian FSHD registry: An enhanced data integration and analytics framework for smart health care","type":"publication"},{"authors":["Domenico Beneventano","Sonia Bergamaschi","Luca Gagliardelli","Laura Po"],"categories":[],"content":"","date":1420070400,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769754,"objectID":"43b678003b927b8481e2a7b9002c4b79","permalink":"http://www.lucagagliardelli.com/publication/dblp-confic-3-k-beneventano-bgp-15-a/","publishdate":"2022-09-21T14:15:53.824148Z","relpermalink":"/publication/dblp-confic-3-k-beneventano-bgp-15-a/","section":"publication","summary":"","tags":[],"title":"Driving Innovation in Youth Policies with Open Data","type":"publication"},{"authors":["Domenico Beneventano","Sonia Bergamaschi","Luca Gagliardelli","Laura Po"],"categories":[],"content":"","date":1420070400,"expirydate":-62135596800,"kind":"page","lang":"en","lastmod":1663769753,"objectID":"5f88e4cf7d96cb8e986a648c40e0cea1","permalink":"http://www.lucagagliardelli.com/publication/dblp-confic-3-k-beneventano-bgp-15/","publishdate":"2022-09-21T14:15:53.366405Z","relpermalink":"/publication/dblp-confic-3-k-beneventano-bgp-15/","section":"publication","summary":"","tags":[],"title":"Open Data for Improving Youth Policies","type":"publication"}] \ No newline at end of file diff --git a/index.xml b/index.xml index 1c652d2..8905080 100644 --- a/index.xml +++ b/index.xml @@ -5,13 +5,37 @@ http://www.lucagagliardelli.com/- © 2023. + © 2024.
diff --git a/publication-type/1/index.xml b/publication-type/1/index.xml index 92750c1..ade40d8 100644 --- a/publication-type/1/index.xml +++ b/publication-type/1/index.xml @@ -5,13 +5,29 @@ http://www.lucagagliardelli.com/publication-type/1/- © 2023. + © 2024.
diff --git a/publication-type/2/index.html b/publication-type/2/index.html index 75ba457..55629af 100644 --- a/publication-type/2/index.html +++ b/publication-type/2/index.html @@ -1,6 +1,6 @@ - + @@ -326,7 +326,7 @@ - + @@ -836,7 +836,7 @@- © 2023. + © 2024.
diff --git a/publication-type/2/index.xml b/publication-type/2/index.xml index c342870..ed28a7f 100644 --- a/publication-type/2/index.xml +++ b/publication-type/2/index.xml @@ -5,13 +5,29 @@ http://www.lucagagliardelli.com/publication-type/2/- © 2023. + © 2024.
diff --git a/publication-type/6/index.html b/publication-type/6/index.html index c88f6d5..01afa26 100644 --- a/publication-type/6/index.html +++ b/publication-type/6/index.html @@ -1,6 +1,6 @@ - + @@ -978,7 +978,7 @@- © 2023. + © 2024.
diff --git a/publication/aslam-2024102425/cite.bib b/publication/aslam-2024102425/cite.bib new file mode 100644 index 0000000..cd1861f --- /dev/null +++ b/publication/aslam-2024102425/cite.bib @@ -0,0 +1,13 @@ +@article{ASLAM2024102425, + abstract = {Inequality join is an operator to join data on inequality conditions and it is a fundamental building block for applications. While methods and optimizations exist for efficient inequality join in batch processing, little attention has been given to its streaming version, particularly to large-scale data-intensive applications that run on Distributed Stream Processing Systems (DSPSs). Designing an inequality join in streaming and distributed settings is not an easy task: (i) indexes have to be employed to efficiently support inequality-based comparisons, but the continuous stream of data imposes continuous insertions, updates, and deletions of elements in the indexes—hence a huge overhead for the DSPSs; (ii) oftentimes real data is skewed, which makes indexing even more challenging. To address these challenges, we propose the Stream-Aware inequality join (STA), an indexing method that can reduce redundancy and index update overhead. STA builds a separate in-memory index structure for hotkeys, i.e., the most frequently used keys, which are automatically identified with an efficient data sketch. On the other hand, the cold keys are treated using a linked set of index structures. In this way, STA avoids many superfluous index updates for frequent items. Finally, we implement four state-of-the-art inequality join solutions for a widely employed DSPS (Apache Storm) and compare their performance with STA on four real-world data sets and a synthetic one. The results of our experimental evaluation reveal that our stream-aware approach outperforms existing solutions.}, + author = {Adeel Aslam and Giovanni Simonini and Luca Gagliardelli and Luca Zecchini and Sonia Bergamaschi}, + doi = {https://doi.org/10.1016/j.is.2024.102425}, + issn = {0306-4379}, + journal = {Information Systems}, + keywords = {Distributed stream processing system, Inequality join, Btree indexing, Augmented sketch, Skewed data distribution}, + pages = {102425}, + title = {Stream-aware indexing for distributed inequality join processing}, + url = {https://www.sciencedirect.com/science/article/pii/S0306437924000838}, + year = {2024} +} + diff --git a/publication/aslam-2024102425/index.html b/publication/aslam-2024102425/index.html new file mode 100644 index 0000000..e5b4f53 --- /dev/null +++ b/publication/aslam-2024102425/index.html @@ -0,0 +1,1431 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +Inequality join is an operator to join data on inequality conditions and it is a fundamental building block for applications. While methods and optimizations exist for efficient inequality join in batch processing, little attention has been given to its streaming version, particularly to large-scale data-intensive applications that run on Distributed Stream Processing Systems (DSPSs). Designing an inequality join in streaming and distributed settings is not an easy task: (i) indexes have to be employed to efficiently support inequality-based comparisons, but the continuous stream of data imposes continuous insertions, updates, and deletions of elements in the indexes—hence a huge overhead for the DSPSs; (ii) oftentimes real data is skewed, which makes indexing even more challenging. To address these challenges, we propose the Stream-Aware inequality join (STA), an indexing method that can reduce redundancy and index update overhead. STA builds a separate in-memory index structure for hotkeys, i.e., the most frequently used keys, which are automatically identified with an efficient data sketch. On the other hand, the cold keys are treated using a linked set of index structures. In this way, STA avoids many superfluous index updates for frequent items. Finally, we implement four state-of-the-art inequality join solutions for a widely employed DSPS (Apache Storm) and compare their performance with STA on four real-world data sets and a synthetic one. The results of our experimental evaluation reveal that our stream-aware approach outperforms existing solutions.
+ + + + +- © 2023. + © 2024.
diff --git a/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/index.html b/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/index.html index d11bac7..fb5b6a4 100644 --- a/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/index.html +++ b/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/index.html @@ -1,6 +1,6 @@ - + @@ -1281,7 +1281,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confbigdataconf-bergamaschi-g-23/cite.bib b/publication/dblp-confbigdataconf-bergamaschi-g-23/cite.bib new file mode 100644 index 0000000..81a870f --- /dev/null +++ b/publication/dblp-confbigdataconf-bergamaschi-g-23/cite.bib @@ -0,0 +1,27 @@ +@inproceedings{DBLP:conf/bigdataconf/BergamaschiG23, + author = {Sonia Bergamaschi and +Luca Gagliardelli}, + bibsource = {dblp computer science bibliography, https://dblp.org}, + biburl = {https://dblp.org/rec/conf/bigdataconf/BergamaschiG23.bib}, + booktitle = {IEEE International Conference on Big Data, BigData 2023, Sorrento, +Italy, December 15-18, 2023}, + doi = {10.1109/BIGDATA59044.2023.10386905}, + editor = {Jingrui He and +Themis Palpanas and +Xiaohua Hu and +Alfredo Cuzzocrea and +Dejing Dou and +Dominik Slezak and +Wei Wang and +Aleksandra Gruca and +Jerry Chun-Wei Lin and +Rakesh Agrawal}, + pages = {3898--3903}, + publisher = {IEEE}, + timestamp = {Fri, 02 Feb 2024 12:00:39 +0100}, + title = {A Big Data Platform for the Management of Local Energy Communities +Data}, + url = {https://doi.org/10.1109/BigData59044.2023.10386905}, + year = {2023} +} + diff --git a/publication/dblp-confbigdataconf-bergamaschi-g-23/index.html b/publication/dblp-confbigdataconf-bergamaschi-g-23/index.html new file mode 100644 index 0000000..5e34df6 --- /dev/null +++ b/publication/dblp-confbigdataconf-bergamaschi-g-23/index.html @@ -0,0 +1,1393 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +- © 2023. + © 2024.
diff --git a/publication/dblp-confedbt-gagliardelli-sb-20/index.html b/publication/dblp-confedbt-gagliardelli-sb-20/index.html index c15fb76..490dd69 100644 --- a/publication/dblp-confedbt-gagliardelli-sb-20/index.html +++ b/publication/dblp-confedbt-gagliardelli-sb-20/index.html @@ -1,6 +1,6 @@ - + @@ -1234,7 +1234,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confedbt-gagliardelli-sbb-19/index.html b/publication/dblp-confedbt-gagliardelli-sbb-19/index.html index 65de544..61948e8 100644 --- a/publication/dblp-confedbt-gagliardelli-sbb-19/index.html +++ b/publication/dblp-confedbt-gagliardelli-sbb-19/index.html @@ -1,6 +1,6 @@ - + @@ -1233,7 +1233,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confedbt-gagliardelli-zbs-22/index.html b/publication/dblp-confedbt-gagliardelli-zbs-22/index.html index dd51770..fc95692 100644 --- a/publication/dblp-confedbt-gagliardelli-zbs-22/index.html +++ b/publication/dblp-confedbt-gagliardelli-zbs-22/index.html @@ -1,6 +1,6 @@ - + @@ -1284,7 +1284,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confic-3-k-beneventano-bgp-15-a/index.html b/publication/dblp-confic-3-k-beneventano-bgp-15-a/index.html index c141c80..08ba3c7 100644 --- a/publication/dblp-confic-3-k-beneventano-bgp-15-a/index.html +++ b/publication/dblp-confic-3-k-beneventano-bgp-15-a/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confic-3-k-beneventano-bgp-15/index.html b/publication/dblp-confic-3-k-beneventano-bgp-15/index.html index 1b56313..f259eec 100644 --- a/publication/dblp-confic-3-k-beneventano-bgp-15/index.html +++ b/publication/dblp-confic-3-k-beneventano-bgp-15/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confieeehpcs-simonini-gzb-18/index.html b/publication/dblp-confieeehpcs-simonini-gzb-18/index.html index b5f478b..530c71c 100644 --- a/publication/dblp-confieeehpcs-simonini-gzb-18/index.html +++ b/publication/dblp-confieeehpcs-simonini-gzb-18/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confieeehpcs-zhu-gsb-18/index.html b/publication/dblp-confieeehpcs-zhu-gsb-18/index.html index 9667af4..69b7ee8 100644 --- a/publication/dblp-confieeehpcs-zhu-gsb-18/index.html +++ b/publication/dblp-confieeehpcs-zhu-gsb-18/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confircdl-aftar-ggrb-24/cite.bib b/publication/dblp-confircdl-aftar-ggrb-24/cite.bib new file mode 100644 index 0000000..5266b1f --- /dev/null +++ b/publication/dblp-confircdl-aftar-ggrb-24/cite.bib @@ -0,0 +1,27 @@ +@inproceedings{DBLP:conf/ircdl/AftarGGRB24, + author = {Sania Aftar and +Luca Gagliardelli and +Amina El Ganadi and +Federico Ruozzi and +Sonia Bergamaschi}, + bibsource = {dblp computer science bibliography, https://dblp.org}, + biburl = {https://dblp.org/rec/conf/ircdl/AftarGGRB24.bib}, + booktitle = {Proceedings of the 20th Conference on Information and Research science +Connecting to Digital and Library science (formerly the Italian Research +Conference on Digital Libraries), Bressanone, Brixen, Italy - 22-23 +February 2024}, + editor = {Eleonora Bernasconi and +Andrea Mannocci and +Antonella Poggi and +Angelo A. Salatino and +Gianmaria Silvello}, + pages = {117--125}, + publisher = {CEUR-WS.org}, + series = {CEUR Workshop Proceedings}, + timestamp = {Fri, 01 Mar 2024 16:26:21 +0100}, + title = {A Novel Methodology for Topic Identification in Hadith}, + url = {https://ceur-ws.org/Vol-3643/paper12.pdf}, + volume = {3643}, + year = {2024} +} + diff --git a/publication/dblp-confircdl-aftar-ggrb-24/index.html b/publication/dblp-confircdl-aftar-ggrb-24/index.html new file mode 100644 index 0000000..33227ed --- /dev/null +++ b/publication/dblp-confircdl-aftar-ggrb-24/index.html @@ -0,0 +1,1402 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +- © 2023. + © 2024.
diff --git a/publication/dblp-confsebd-beneventano-bgs-19/index.html b/publication/dblp-confsebd-beneventano-bgs-19/index.html index d15610e..e5efd5c 100644 --- a/publication/dblp-confsebd-beneventano-bgs-19/index.html +++ b/publication/dblp-confsebd-beneventano-bgs-19/index.html @@ -1,6 +1,6 @@ - + @@ -1213,7 +1213,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confsebd-gagliardelli-0-sb-23/index.html b/publication/dblp-confsebd-gagliardelli-0-sb-23/index.html index 09777cc..70f1ae0 100644 --- a/publication/dblp-confsebd-gagliardelli-0-sb-23/index.html +++ b/publication/dblp-confsebd-gagliardelli-0-sb-23/index.html @@ -1,6 +1,6 @@ - + @@ -1228,7 +1228,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confsebd-gagliardelli-sb-20/index.html b/publication/dblp-confsebd-gagliardelli-sb-20/index.html index 7aef8cc..19c1e95 100644 --- a/publication/dblp-confsebd-gagliardelli-sb-20/index.html +++ b/publication/dblp-confsebd-gagliardelli-sb-20/index.html @@ -1,6 +1,6 @@ - + @@ -1206,7 +1206,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confsebd-simonini-grzsabb-22/index.html b/publication/dblp-confsebd-simonini-grzsabb-22/index.html index b39c53f..515eb21 100644 --- a/publication/dblp-confsebd-simonini-grzsabb-22/index.html +++ b/publication/dblp-confsebd-simonini-grzsabb-22/index.html @@ -1,6 +1,6 @@ - + @@ -1241,7 +1241,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-confsebd-simonini-sgzbb-21/index.html b/publication/dblp-confsebd-simonini-sgzbb-21/index.html index 2b019af..897981f 100644 --- a/publication/dblp-confsebd-simonini-sgzbb-21/index.html +++ b/publication/dblp-confsebd-simonini-sgzbb-21/index.html @@ -1,6 +1,6 @@ - + @@ -1227,7 +1227,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-journalscorrabs-2204-08801/index.html b/publication/dblp-journalscorrabs-2204-08801/index.html index 0de03c4..783d855 100644 --- a/publication/dblp-journalscorrabs-2204-08801/index.html +++ b/publication/dblp-journalscorrabs-2204-08801/index.html @@ -1,6 +1,6 @@ - + @@ -1232,7 +1232,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-journalscorrabs-2312-11122/cite.bib b/publication/dblp-journalscorrabs-2312-11122/cite.bib new file mode 100644 index 0000000..24e8b68 --- /dev/null +++ b/publication/dblp-journalscorrabs-2312-11122/cite.bib @@ -0,0 +1,21 @@ +@article{DBLP:journals/corr/abs-2312-11122, + author = {Angelo Mozzillo and +Luca Zecchini and +Luca Gagliardelli and +Adeel Aslam and +Sonia Bergamaschi and +Giovanni Simonini}, + bibsource = {dblp computer science bibliography, https://dblp.org}, + biburl = {https://dblp.org/rec/journals/corr/abs-2312-11122.bib}, + doi = {10.48550/ARXIV.2312.11122}, + eprint = {2312.11122}, + eprinttype = {arXiv}, + journal = {CoRR}, + timestamp = {Tue, 16 Jan 2024 11:57:42 +0100}, + title = {Evaluation of Dataframe Libraries for Data Preparation on a Single +Machine}, + url = {https://doi.org/10.48550/arXiv.2312.11122}, + volume = {abs/2312.11122}, + year = {2023} +} + diff --git a/publication/dblp-journalscorrabs-2312-11122/index.html b/publication/dblp-journalscorrabs-2312-11122/index.html new file mode 100644 index 0000000..b11f9d4 --- /dev/null +++ b/publication/dblp-journalscorrabs-2312-11122/index.html @@ -0,0 +1,1421 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +- © 2023. + © 2024.
diff --git a/publication/dblp-journalsis-papadakis-mgstgb-20/index.html b/publication/dblp-journalsis-papadakis-mgstgb-20/index.html index c4f7b04..7be4147 100644 --- a/publication/dblp-journalsis-papadakis-mgstgb-20/index.html +++ b/publication/dblp-journalsis-papadakis-mgstgb-20/index.html @@ -1,6 +1,6 @@ - + @@ -1260,7 +1260,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-journalsis-simonini-gbj-19/index.html b/publication/dblp-journalsis-simonini-gbj-19/index.html index 87485c5..0ee08cb 100644 --- a/publication/dblp-journalsis-simonini-gbj-19/index.html +++ b/publication/dblp-journalsis-simonini-gbj-19/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-journalsjdiq-beneventano-bgs-20/index.html b/publication/dblp-journalsjdiq-beneventano-bgs-20/index.html index 42e27ca..fc719b6 100644 --- a/publication/dblp-journalsjdiq-beneventano-bgs-20/index.html +++ b/publication/dblp-journalsjdiq-beneventano-bgs-20/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@- © 2023. + © 2024.
diff --git a/publication/dblp-journalspvldb-gagliardelli-psb-22/index.html b/publication/dblp-journalspvldb-gagliardelli-psb-22/index.html index 09edd2d..2e774c7 100644 --- a/publication/dblp-journalspvldb-gagliardelli-psb-22/index.html +++ b/publication/dblp-journalspvldb-gagliardelli-psb-22/index.html @@ -1,6 +1,6 @@ - + @@ -1236,7 +1236,7 @@- © 2023. + © 2024.
diff --git a/publication/gagliardelli-2023-big/index.html b/publication/gagliardelli-2023-big/index.html index b3f07ea..9ee1fa9 100644 --- a/publication/gagliardelli-2023-big/index.html +++ b/publication/gagliardelli-2023-big/index.html @@ -1,6 +1,6 @@ - + @@ -1260,7 +1260,7 @@- © 2023. + © 2024.
diff --git a/publication/index.html b/publication/index.html index 5aa90f6..30dc004 100644 --- a/publication/index.html +++ b/publication/index.html @@ -1,6 +1,6 @@ - + @@ -326,7 +326,7 @@ - + @@ -868,6 +868,24 @@+ + + + + + + + + + + + + + + + Cite + + + + + + + + + + + + + + + + DOI + + + + + + + + + + + + + + + + URL + +
+ + + ++ + + + + + + + + + + + + + + + Cite + + + + + + + + + + + + + + + + DOI + + + + + + + + + + + + + + + + URL + +
+ + + ++ + + + + + + + + + + + + + + + PDF + + + + + + Cite + + + + + + + + + + + + + + + +
+ + + ++ + + + + + + + + + + + + + + + Cite + + + + + + + + + + + + + + + + DOI + + + + + + + + + + + + + + + + URL + +
+ + + ++ + + + + + + + + + + + + + + + Cite + + + + + + + + + + + + + + + + DOI + + + + + + + + + + + + + + + + URL + +
+ + + ++ + + + + + + + + + + + + + + + Cite + + + + + + + + + + + + + + + + DOI + + + + + + + + + + + + + + + + URL + +
+ + + +- © 2023. + © 2024.
diff --git a/publication/index.xml b/publication/index.xml index 486797a..2f2dbc4 100644 --- a/publication/index.xml +++ b/publication/index.xml @@ -5,13 +5,37 @@ http://www.lucagagliardelli.com/publication/- © 2023. + © 2024.
diff --git a/publication_types/index.xml b/publication_types/index.xml index 67a4fea..4f874c1 100644 --- a/publication_types/index.xml +++ b/publication_types/index.xml @@ -5,7 +5,7 @@ http://www.lucagagliardelli.com/publication_types/- © 2023. + © 2024.
diff --git a/tags/index.xml b/tags/index.xml index 82a63ca..2752b07 100644 --- a/tags/index.xml +++ b/tags/index.xml @@ -5,7 +5,7 @@ http://www.lucagagliardelli.com/tags/- © 2023. + © 2024.
diff --git a/talk/generalized-supervised-meta-blocking-@-vldb-2022/index.html b/talk/generalized-supervised-meta-blocking-@-vldb-2022/index.html index fa4ad3d..49e9aab 100644 --- a/talk/generalized-supervised-meta-blocking-@-vldb-2022/index.html +++ b/talk/generalized-supervised-meta-blocking-@-vldb-2022/index.html @@ -1,6 +1,6 @@ - + @@ -1308,7 +1308,7 @@- © 2023. + © 2024.