diff --git a/404.html b/404.html index 699805b..1f05659 100644 --- a/404.html +++ b/404.html @@ -1,6 +1,6 @@ - + @@ -793,25 +793,25 @@

Page not found

Latest

@@ -858,7 +858,7 @@

Latest

diff --git a/categories/index.html b/categories/index.html index 5b43910..3ea18b4 100644 --- a/categories/index.html +++ b/categories/index.html @@ -1,6 +1,6 @@ - + @@ -860,7 +860,7 @@

Categories

diff --git a/event/index.html b/event/index.html index f4f7c14..0000025 100644 --- a/event/index.html +++ b/event/index.html @@ -1,6 +1,6 @@ - + @@ -1107,7 +1107,7 @@

2022

diff --git a/index.html b/index.html index 7e9778e..0aed88e 100644 --- a/index.html +++ b/index.html @@ -1,6 +1,6 @@ - + @@ -346,7 +346,7 @@ - + @@ -1210,6 +1210,7 @@

News

@@ -871,13 +871,19 @@

1

+ + + + PDF + + + data-filename="/publication/dblp-confircdl-aftar-ggrb-24/cite.bib"> Cite @@ -894,20 +900,6 @@

1

- - - - - - - - - - - - - URL - @@ -941,7 +933,7 @@

1

- HKS: Efficient Data Partitioning for Stateful Streaming + A Big Data Platform for the Management of Local Energy Communities Data
@@ -955,11 +947,8 @@

1

- Adeel Aslam, - Giovanni Simonini, - Luca Gagliardelli, - Angelo Mozzillo, - Sonia Bergamaschi + Sonia Bergamaschi, + Luca Gagliardelli
@@ -982,7 +971,7 @@

1

+ data-filename="/publication/dblp-confbigdataconf-bergamaschi-g-23/cite.bib"> Cite @@ -998,7 +987,7 @@

1

- + DOI @@ -1014,7 +1003,7 @@

1

- + URL @@ -1050,7 +1039,7 @@

1

- ECDP: A Big Data Platform for the Smart Monitoring of Local Energy Communities + A general approach to Supervised Meta-Blocking
@@ -1065,18 +1054,10 @@

1

Luca Gagliardelli, - Luca Zecchini, - Domenico Beneventano, + George Papadakis, Giovanni Simonini, Sonia Bergamaschi, - Mirko Orsini, - Luca Magnotta, - Emma Mescoli, - Andrea Livaldi, - Nicola Gessa, - Piero De Sabbata, - Gianluca D'Agosta, - Fabrizio Paolucci + Themis Palpanas
@@ -1093,19 +1074,13 @@

1

- - - - PDF - - + data-filename="/publication/dblp-confsebd-gagliardelli-0-sb-23/cite.bib"> Cite @@ -1119,16 +1094,22 @@

1

+ + + + - - Video - - - - + + + + + + + + URL @@ -1163,7 +1144,7 @@

1

- Progressive Entity Resolution with Node Embeddings + HKS: Efficient Data Partitioning for Stateful Streaming
@@ -1177,13 +1158,10 @@

1

+ Adeel Aslam, Giovanni Simonini, Luca Gagliardelli, - Michele Rinaldi, - Luca Zecchini, - Giulio De Sabbata, - Adeel Aslam, - Domenico Beneventano, + Angelo Mozzillo, Sonia Bergamaschi
@@ -1201,19 +1179,13 @@

1

- - - - - PDF - + data-filename="/publication/dblp-confdawak-aslam-sgmb-23/cite.bib"> Cite @@ -1229,6 +1201,24 @@

1

+ + DOI + + + + + + + + + + + + + + + + URL @@ -1263,7 +1253,7 @@

1

- The Case for Multi-task Active Learning Entity Resolution (Discussion Paper) + ECDP: A Big Data Platform for the Smart Monitoring of Local Energy Communities
@@ -1277,12 +1267,19 @@

1

- Giovanni Simonini, - Henrique Saccani, Luca Gagliardelli, Luca Zecchini, Domenico Beneventano, - Sonia Bergamaschi + Giovanni Simonini, + Sonia Bergamaschi, + Mirko Orsini, + Luca Magnotta, + Emma Mescoli, + Andrea Livaldi, + Nicola Gessa, + Piero De Sabbata, + Gianluca D'Agosta, + Fabrizio Paolucci
@@ -1304,14 +1301,14 @@

1

- + PDF + data-filename="/publication/dblp-confedbt-gagliardelli-zbs-22/cite.bib"> Cite @@ -1325,6 +1322,14 @@

1

+ + + + + + Video + + @@ -1361,7 +1366,7 @@

1

- RulER: Scaling Up Record-level Matching Rules + Progressive Entity Resolution with Node Embeddings
@@ -1375,8 +1380,13 @@

1

- Luca Gagliardelli, Giovanni Simonini, + Luca Gagliardelli, + Michele Rinaldi, + Luca Zecchini, + Giulio De Sabbata, + Adeel Aslam, + Domenico Beneventano, Sonia Bergamaschi
@@ -1394,25 +1404,23 @@

1

+ + + + PDF + + + data-filename="/publication/dblp-confsebd-simonini-grzsabb-22/cite.bib"> Cite - - - - - - Code - - @@ -1422,34 +1430,8 @@

1

- - - - - - Video - - - - DOI - - - - - - - - - - - - - - - - URL @@ -1484,7 +1466,7 @@

1

- Scaling Up Record-level Matching Rules + The Case for Multi-task Active Learning Entity Resolution (Discussion Paper)
@@ -1498,8 +1480,11 @@

1

- Luca Gagliardelli, Giovanni Simonini, + Henrique Saccani, + Luca Gagliardelli, + Luca Zecchini, + Domenico Beneventano, Sonia Bergamaschi
@@ -1522,14 +1507,14 @@

1

- + PDF + data-filename="/publication/dblp-confsebd-simonini-sgzbb-21/cite.bib"> Cite @@ -1579,7 +1564,7 @@

1

- Entity Resolution and Data Fusion: An Integrated Approach + RulER: Scaling Up Record-level Matching Rules
@@ -1593,10 +1578,9 @@

1

- Domenico Beneventano, - Sonia Bergamaschi, Luca Gagliardelli, - Giovanni Simonini + Giovanni Simonini, + Sonia Bergamaschi
@@ -1613,23 +1597,24 @@

1

- - - - PDF - - + data-filename="/publication/dblp-confedbt-gagliardelli-sb-20/cite.bib"> Cite + + + + + + Code + @@ -1640,9 +1625,36 @@

1

+ + + + + + Video + + + DOI + + + + + + + + + + + + + + + + URL + + @@ -1675,7 +1687,7 @@

1

- SparkER: Scaling Entity Resolution in Spark + Scaling Up Record-level Matching Rules
@@ -1691,7 +1703,6 @@

1

Luca Gagliardelli, Giovanni Simonini, - Domenico Beneventano, Sonia Bergamaschi
@@ -1709,24 +1720,23 @@

1

+ + + + PDF + + + data-filename="/publication/dblp-confsebd-gagliardelli-sb-20/cite.bib"> Cite - - - - - - Code - @@ -1739,25 +1749,6 @@

1

- - DOI - - - - - - - - - - - - - - - - URL - @@ -1791,7 +1782,7 @@

1

- Enhancing Loosely Schema-aware Entity Resolution with User Interaction + Entity Resolution and Data Fusion: An Integrated Approach
@@ -1805,10 +1796,10 @@

1

- Giovanni Simonini, + Domenico Beneventano, + Sonia Bergamaschi, Luca Gagliardelli, - Song Zhu, - Sonia Bergamaschi + Giovanni Simonini
@@ -1825,13 +1816,19 @@

1

+ + + + PDF + + + data-filename="/publication/dblp-confsebd-beneventano-bgs-19/cite.bib"> Cite @@ -1847,24 +1844,6 @@

1

- - DOI - - - - - - - - - - - - - - - - URL @@ -1934,7 +1913,7 @@

1

diff --git a/publication-type/1/index.xml b/publication-type/1/index.xml index 92750c1..ade40d8 100644 --- a/publication-type/1/index.xml +++ b/publication-type/1/index.xml @@ -5,13 +5,29 @@ http://www.lucagagliardelli.com/publication-type/1/ 1 - Wowchemy (https://wowchemy.com)en-usSun, 01 Jan 2023 00:00:00 +0000 + Wowchemy (https://wowchemy.com)en-usMon, 01 Jan 2024 00:00:00 +0000 http://www.lucagagliardelli.com/media/icon_hu0b7a4cb9992c9ac0e91bd28ffd38dd00_9727_512x512_fill_lanczos_center_3.png 1 http://www.lucagagliardelli.com/publication-type/1/ + + A Novel Methodology for Topic Identification in Hadith + http://www.lucagagliardelli.com/publication/dblp-confircdl-aftar-ggrb-24/ + Mon, 01 Jan 2024 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/dblp-confircdl-aftar-ggrb-24/ + + + + + A Big Data Platform for the Management of Local Energy Communities Data + http://www.lucagagliardelli.com/publication/dblp-confbigdataconf-bergamaschi-g-23/ + Sun, 01 Jan 2023 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/dblp-confbigdataconf-bergamaschi-g-23/ + + + A general approach to Supervised Meta-Blocking http://www.lucagagliardelli.com/publication/dblp-confsebd-gagliardelli-0-sb-23/ diff --git a/publication-type/1/page/2/index.html b/publication-type/1/page/2/index.html index 81bc7cb..f486e0c 100644 --- a/publication-type/1/page/2/index.html +++ b/publication-type/1/page/2/index.html @@ -1,6 +1,6 @@ - + @@ -326,7 +326,7 @@ - + @@ -828,6 +828,230 @@

1

+ + + + +
+
+ +
+ SparkER: Scaling Entity Resolution in Spark +
+ + + + + + + + + +
+
+ + +
+
+ + + + + + + + + + + + + + + + + + + +
+
+ +
+ Enhancing Loosely Schema-aware Entity Resolution with User Interaction +
+ + + + + + + + + +
+
+ + +
+
+ + + + + + + + + + + + + + + @@ -1306,7 +1530,7 @@

1

diff --git a/publication-type/2/index.html b/publication-type/2/index.html index 75ba457..55629af 100644 --- a/publication-type/2/index.html +++ b/publication-type/2/index.html @@ -1,6 +1,6 @@ - + @@ -326,7 +326,7 @@ - + @@ -836,7 +836,7 @@

2

- A big data platform exploiting auditable tokenization to promote good practices inside local energy communities + GSM: A generalized approach to Supervised Meta-blocking for scalable entity resolution
@@ -851,16 +851,10 @@

2

Luca Gagliardelli, - Luca Zecchini, - Luca Ferretti, - Domenico Beneventano, + George Papadakis, Giovanni Simonini, Sonia Bergamaschi, - Mirko Orsini, - Luca Magnotta, - Emma Mescoli, - Andrea Livaldi, - others + Themis Palpanas
@@ -883,7 +877,7 @@

2

+ data-filename="/publication/dblp-journalsis-gagliardelli-psbp-24/cite.bib"> Cite @@ -899,11 +893,25 @@

2

- + DOI + + + + + + + + + + + + + URL + @@ -932,15 +940,23 @@

2

+ +
- Generalized Supervised Meta-blocking + Stream-aware indexing for distributed inequality join processing
+ +
+ Inequality join is an operator to join data on inequality conditions and it is a fundamental building block for applications. While … +
+
+
@@ -972,33 +988,60 @@

2

- - - - PDF - - + data-filename="/publication/aslam-2024102425/cite.bib"> Cite + + + + + + + + + + + + + DOI + + + + - - Code - + + + + + + + + URL +
+ + + +
+ + +
+ + + @@ -1007,17 +1050,87 @@

2

- + + + + + + + + +
+
+ +
+ A big data platform exploiting auditable tokenization to promote good practices inside local energy communities +
+ + + + + + @@ -1050,7 +1163,7 @@

2

- Generalized Supervised Meta-blocking (technical report) + DXP: Billing Data Preparation for Big Data Analytics
@@ -1065,10 +1178,13 @@

2

Luca Gagliardelli, - George Papadakis, + Domenico Beneventano, + Marco Esposito, + Luca Zecchini, Giovanni Simonini, Sonia Bergamaschi, - Themis Palpanas + Fabio Miselli, + Giuseppe Calogero Miano
@@ -1091,7 +1207,7 @@

2

+ data-filename="/publication/dblp-journalscorrabs-2312-12902/cite.bib"> Cite @@ -1107,7 +1223,7 @@

2

- + DOI @@ -1123,7 +1239,7 @@

2

- + URL @@ -1159,7 +1275,7 @@

2

- Reproducible experiments on Three-Dimensional Entity Resolution with JedAI + Evaluation of Dataframe Libraries for Data Preparation on a Single Machine
@@ -1173,17 +1289,12 @@

2

- Georgios M. Mandilaras, - George Papadakis, + Angelo Mozzillo, + Luca Zecchini, Luca Gagliardelli, - Giovanni Simonini, - Emmanouil Thanos, - George Giannakopoulos, + Adeel Aslam, Sonia Bergamaschi, - Themis Palpanas, - Manolis Koubarakis, - Alicia Lara-Clares, - Antonio Fariña + Giovanni Simonini
@@ -1206,7 +1317,7 @@

2

+ data-filename="/publication/dblp-journalscorrabs-2312-11122/cite.bib"> Cite @@ -1222,7 +1333,7 @@

2

- + DOI @@ -1238,7 +1349,7 @@

2

- + URL @@ -1274,7 +1385,7 @@

2

- emphBLAST2: An Efficient Technique for Loose Schema Information Extraction from Heterogeneous Big Data Sources + Generalized Supervised Meta-blocking
@@ -1288,10 +1399,124 @@

2

- Domenico Beneventano, + Luca Gagliardelli, + George Papadakis, + Giovanni Simonini, Sonia Bergamaschi, + Themis Palpanas +
+ + + + + + + + +
+ + +
+ + + + + + + + + + + + + + + + + + + + +
+
+ +
+ Generalized Supervised Meta-blocking (technical report) +
+ + + + @@ -1314,7 +1539,7 @@

2

+ data-filename="/publication/dblp-journalscorrabs-2204-08801/cite.bib"> Cite @@ -1330,7 +1555,7 @@

2

- + DOI @@ -1346,7 +1571,7 @@

2

- + URL @@ -1382,7 +1607,7 @@

2

- Three-dimensional Entity Resolution with JedAI + Reproducible experiments on Three-Dimensional Entity Resolution with JedAI
@@ -1396,15 +1621,17 @@

2

- George Papadakis, Georgios M. Mandilaras, + George Papadakis, Luca Gagliardelli, Giovanni Simonini, Emmanouil Thanos, George Giannakopoulos, Sonia Bergamaschi, Themis Palpanas, - Manolis Koubarakis + Manolis Koubarakis, + Alicia Lara-Clares, + Antonio Fariña
@@ -1427,7 +1654,7 @@

2

+ data-filename="/publication/dblp-journalsis-mandilaras-0-gstg-21/cite.bib"> Cite @@ -1443,7 +1670,7 @@

2

- + DOI @@ -1459,7 +1686,7 @@

2

- + URL @@ -1495,7 +1722,7 @@

2

- Scaling entity resolution: A loosely schema-aware approach + emphBLAST2: An Efficient Technique for Loose Schema Information Extraction from Heterogeneous Big Data Sources
@@ -1509,10 +1736,123 @@

2

- Giovanni Simonini, + Domenico Beneventano, + Sonia Bergamaschi, + Luca Gagliardelli, + Giovanni Simonini +
+ +
+ + + + + + +
+ + +
+ + + + + + + + + + + + + + + + + + + + +
+
+ +
+ Three-dimensional Entity Resolution with JedAI +
+ + + + @@ -1535,7 +1875,7 @@

2

+ data-filename="/publication/dblp-journalsis-papadakis-mgstgb-20/cite.bib"> Cite @@ -1551,7 +1891,7 @@

2

- + DOI @@ -1567,7 +1907,7 @@

2

- + URL @@ -1586,6 +1926,15 @@

2

+ +
@@ -1629,7 +1978,7 @@

2

diff --git a/publication-type/2/index.xml b/publication-type/2/index.xml index c342870..ed28a7f 100644 --- a/publication-type/2/index.xml +++ b/publication-type/2/index.xml @@ -5,13 +5,29 @@ http://www.lucagagliardelli.com/publication-type/2/ 2 - Wowchemy (https://wowchemy.com)en-usSun, 01 Jan 2023 00:00:00 +0000 + Wowchemy (https://wowchemy.com)en-usMon, 01 Jan 2024 00:00:00 +0000 http://www.lucagagliardelli.com/media/icon_hu0b7a4cb9992c9ac0e91bd28ffd38dd00_9727_512x512_fill_lanczos_center_3.png 2 http://www.lucagagliardelli.com/publication-type/2/ + + GSM: A generalized approach to Supervised Meta-blocking for scalable entity resolution + http://www.lucagagliardelli.com/publication/dblp-journalsis-gagliardelli-psbp-24/ + Mon, 01 Jan 2024 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/dblp-journalsis-gagliardelli-psbp-24/ + + + + + Stream-aware indexing for distributed inequality join processing + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + Mon, 01 Jan 2024 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + + + A big data platform exploiting auditable tokenization to promote good practices inside local energy communities http://www.lucagagliardelli.com/publication/gagliardelli-2023-big/ @@ -20,6 +36,22 @@ + + DXP: Billing Data Preparation for Big Data Analytics + http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-12902/ + Sun, 01 Jan 2023 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-12902/ + + + + + Evaluation of Dataframe Libraries for Data Preparation on a Single Machine + http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-11122/ + Sun, 01 Jan 2023 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-11122/ + + + Generalized Supervised Meta-blocking http://www.lucagagliardelli.com/publication/dblp-journalspvldb-gagliardelli-psb-22/ diff --git a/publication-type/2/page/2/index.html b/publication-type/2/page/2/index.html new file mode 100644 index 0000000..9be566a --- /dev/null +++ b/publication-type/2/page/2/index.html @@ -0,0 +1,1161 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 2 | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + +
+

2

+ + + + +
+ + + +
+ + + + + + + + + + + + + + + + + + + + + + + + +
+
+ +
+ Scaling entity resolution: A loosely schema-aware approach +
+ + + + + + + + + +
+
+ + +
+
+ + + + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/publication-type/5/index.html b/publication-type/5/index.html index 2107a00..976932c 100644 --- a/publication-type/5/index.html +++ b/publication-type/5/index.html @@ -1,6 +1,6 @@ - + @@ -967,7 +967,7 @@

5

diff --git a/publication-type/6/index.html b/publication-type/6/index.html index c88f6d5..01afa26 100644 --- a/publication-type/6/index.html +++ b/publication-type/6/index.html @@ -1,6 +1,6 @@ - + @@ -978,7 +978,7 @@

6

diff --git a/publication/aslam-2024102425/cite.bib b/publication/aslam-2024102425/cite.bib new file mode 100644 index 0000000..cd1861f --- /dev/null +++ b/publication/aslam-2024102425/cite.bib @@ -0,0 +1,13 @@ +@article{ASLAM2024102425, + abstract = {Inequality join is an operator to join data on inequality conditions and it is a fundamental building block for applications. While methods and optimizations exist for efficient inequality join in batch processing, little attention has been given to its streaming version, particularly to large-scale data-intensive applications that run on Distributed Stream Processing Systems (DSPSs). Designing an inequality join in streaming and distributed settings is not an easy task: (i) indexes have to be employed to efficiently support inequality-based comparisons, but the continuous stream of data imposes continuous insertions, updates, and deletions of elements in the indexes—hence a huge overhead for the DSPSs; (ii) oftentimes real data is skewed, which makes indexing even more challenging. To address these challenges, we propose the Stream-Aware inequality join (STA), an indexing method that can reduce redundancy and index update overhead. STA builds a separate in-memory index structure for hotkeys, i.e., the most frequently used keys, which are automatically identified with an efficient data sketch. On the other hand, the cold keys are treated using a linked set of index structures. In this way, STA avoids many superfluous index updates for frequent items. Finally, we implement four state-of-the-art inequality join solutions for a widely employed DSPS (Apache Storm) and compare their performance with STA on four real-world data sets and a synthetic one. The results of our experimental evaluation reveal that our stream-aware approach outperforms existing solutions.}, + author = {Adeel Aslam and Giovanni Simonini and Luca Gagliardelli and Luca Zecchini and Sonia Bergamaschi}, + doi = {https://doi.org/10.1016/j.is.2024.102425}, + issn = {0306-4379}, + journal = {Information Systems}, + keywords = {Distributed stream processing system, Inequality join, Btree indexing, Augmented sketch, Skewed data distribution}, + pages = {102425}, + title = {Stream-aware indexing for distributed inequality join processing}, + url = {https://www.sciencedirect.com/science/article/pii/S0306437924000838}, + year = {2024} +} + diff --git a/publication/aslam-2024102425/index.html b/publication/aslam-2024102425/index.html new file mode 100644 index 0000000..e5b4f53 --- /dev/null +++ b/publication/aslam-2024102425/index.html @@ -0,0 +1,1431 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Stream-aware indexing for distributed inequality join processing | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + +
+

Stream-aware indexing for distributed inequality join processing

+ + + + + + + + + + + + + + + + + + +
+ + + +
+ + +

Abstract

+

Inequality join is an operator to join data on inequality conditions and it is a fundamental building block for applications. While methods and optimizations exist for efficient inequality join in batch processing, little attention has been given to its streaming version, particularly to large-scale data-intensive applications that run on Distributed Stream Processing Systems (DSPSs). Designing an inequality join in streaming and distributed settings is not an easy task: (i) indexes have to be employed to efficiently support inequality-based comparisons, but the continuous stream of data imposes continuous insertions, updates, and deletions of elements in the indexes—hence a huge overhead for the DSPSs; (ii) oftentimes real data is skewed, which makes indexing even more challenging. To address these challenges, we propose the Stream-Aware inequality join (STA), an indexing method that can reduce redundancy and index update overhead. STA builds a separate in-memory index structure for hotkeys, i.e., the most frequently used keys, which are automatically identified with an efficient data sketch. On the other hand, the cold keys are treated using a linked set of index structures. In this way, STA avoids many superfluous index updates for frequent items. Finally, we implement four state-of-the-art inequality join solutions for a widely employed DSPS (Apache Storm) and compare their performance with STA on four real-world data sets and a synthetic one. The results of our experimental evaluation reveal that our stream-aware approach outperforms existing solutions.

+ + + + +
+
+
+
+
Type
+ +
+
+
+
+
+ + + +
+
+
+
+
Publication
+
Information Systems
+
+
+
+
+
+ + +
+ +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/publication/basidati-2023/index.html b/publication/basidati-2023/index.html index 25aaaeb..1315fe2 100644 --- a/publication/basidati-2023/index.html +++ b/publication/basidati-2023/index.html @@ -1,6 +1,6 @@ - + @@ -1228,7 +1228,7 @@

Progetto di Basi di Dati Relazionali

diff --git a/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/index.html b/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/index.html index d11bac7..fb5b6a4 100644 --- a/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/index.html +++ b/publication/dblp-bookssp-18-bergamaschi-bmm-0-opvszgm-18/index.html @@ -1,6 +1,6 @@ - + @@ -1281,7 +1281,7 @@

From Data Integration to Big Data Integration

diff --git a/publication/dblp-confbigdataconf-bergamaschi-g-23/cite.bib b/publication/dblp-confbigdataconf-bergamaschi-g-23/cite.bib new file mode 100644 index 0000000..81a870f --- /dev/null +++ b/publication/dblp-confbigdataconf-bergamaschi-g-23/cite.bib @@ -0,0 +1,27 @@ +@inproceedings{DBLP:conf/bigdataconf/BergamaschiG23, + author = {Sonia Bergamaschi and +Luca Gagliardelli}, + bibsource = {dblp computer science bibliography, https://dblp.org}, + biburl = {https://dblp.org/rec/conf/bigdataconf/BergamaschiG23.bib}, + booktitle = {IEEE International Conference on Big Data, BigData 2023, Sorrento, +Italy, December 15-18, 2023}, + doi = {10.1109/BIGDATA59044.2023.10386905}, + editor = {Jingrui He and +Themis Palpanas and +Xiaohua Hu and +Alfredo Cuzzocrea and +Dejing Dou and +Dominik Slezak and +Wei Wang and +Aleksandra Gruca and +Jerry Chun-Wei Lin and +Rakesh Agrawal}, + pages = {3898--3903}, + publisher = {IEEE}, + timestamp = {Fri, 02 Feb 2024 12:00:39 +0100}, + title = {A Big Data Platform for the Management of Local Energy Communities +Data}, + url = {https://doi.org/10.1109/BigData59044.2023.10386905}, + year = {2023} +} + diff --git a/publication/dblp-confbigdataconf-bergamaschi-g-23/index.html b/publication/dblp-confbigdataconf-bergamaschi-g-23/index.html new file mode 100644 index 0000000..5e34df6 --- /dev/null +++ b/publication/dblp-confbigdataconf-bergamaschi-g-23/index.html @@ -0,0 +1,1393 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + A Big Data Platform for the Management of Local Energy Communities Data | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + +
+

A Big Data Platform for the Management of Local Energy Communities Data

+ + + + + + + + + + + + + + + + + + +
+ + + +
+ + + + + +
+
+
+
+
Type
+ +
+
+
+
+
+ + + +
+
+
+
+
Publication
+
IEEE International Conference on Big Data, BigData 2023, Sorrento, Italy, December 15-18, 2023
+
+
+
+
+
+ + +
+ +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/publication/dblp-confdawak-aslam-sgmb-23/index.html b/publication/dblp-confdawak-aslam-sgmb-23/index.html index 29a4060..1a03377 100644 --- a/publication/dblp-confdawak-aslam-sgmb-23/index.html +++ b/publication/dblp-confdawak-aslam-sgmb-23/index.html @@ -1,6 +1,6 @@ - + @@ -1232,7 +1232,7 @@

HKS: Efficient Data Partitioning for Stateful Streaming

diff --git a/publication/dblp-confedbt-gagliardelli-sb-20/index.html b/publication/dblp-confedbt-gagliardelli-sb-20/index.html index c15fb76..490dd69 100644 --- a/publication/dblp-confedbt-gagliardelli-sb-20/index.html +++ b/publication/dblp-confedbt-gagliardelli-sb-20/index.html @@ -1,6 +1,6 @@ - + @@ -1234,7 +1234,7 @@

RulER: Scaling Up Record-level Matching Rules

diff --git a/publication/dblp-confedbt-gagliardelli-sbb-19/index.html b/publication/dblp-confedbt-gagliardelli-sbb-19/index.html index 65de544..61948e8 100644 --- a/publication/dblp-confedbt-gagliardelli-sbb-19/index.html +++ b/publication/dblp-confedbt-gagliardelli-sbb-19/index.html @@ -1,6 +1,6 @@ - + @@ -1233,7 +1233,7 @@

SparkER: Scaling Entity Resolution in Spark

diff --git a/publication/dblp-confedbt-gagliardelli-zbs-22/index.html b/publication/dblp-confedbt-gagliardelli-zbs-22/index.html index dd51770..fc95692 100644 --- a/publication/dblp-confedbt-gagliardelli-zbs-22/index.html +++ b/publication/dblp-confedbt-gagliardelli-zbs-22/index.html @@ -1,6 +1,6 @@ - + @@ -1284,7 +1284,7 @@

ECDP: A Big Data Platform for the Smart Monitoring of Local Energy Communiti diff --git a/publication/dblp-confic-3-k-beneventano-bgp-15-a/index.html b/publication/dblp-confic-3-k-beneventano-bgp-15-a/index.html index c141c80..08ba3c7 100644 --- a/publication/dblp-confic-3-k-beneventano-bgp-15-a/index.html +++ b/publication/dblp-confic-3-k-beneventano-bgp-15-a/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@

Driving Innovation in Youth Policies with Open Data

diff --git a/publication/dblp-confic-3-k-beneventano-bgp-15/index.html b/publication/dblp-confic-3-k-beneventano-bgp-15/index.html index 1b56313..f259eec 100644 --- a/publication/dblp-confic-3-k-beneventano-bgp-15/index.html +++ b/publication/dblp-confic-3-k-beneventano-bgp-15/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@

Open Data for Improving Youth Policies

diff --git a/publication/dblp-confieeehpcs-simonini-gzb-18/index.html b/publication/dblp-confieeehpcs-simonini-gzb-18/index.html index b5f478b..530c71c 100644 --- a/publication/dblp-confieeehpcs-simonini-gzb-18/index.html +++ b/publication/dblp-confieeehpcs-simonini-gzb-18/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@

Enhancing Loosely Schema-aware Entity Resolution with User Interaction

diff --git a/publication/dblp-confieeehpcs-zhu-gsb-18/index.html b/publication/dblp-confieeehpcs-zhu-gsb-18/index.html index 9667af4..69b7ee8 100644 --- a/publication/dblp-confieeehpcs-zhu-gsb-18/index.html +++ b/publication/dblp-confieeehpcs-zhu-gsb-18/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@

How Improve Set Similarity Join Based on Prefix Approach in Distributed Envi diff --git a/publication/dblp-confircdl-aftar-ggrb-24/cite.bib b/publication/dblp-confircdl-aftar-ggrb-24/cite.bib new file mode 100644 index 0000000..5266b1f --- /dev/null +++ b/publication/dblp-confircdl-aftar-ggrb-24/cite.bib @@ -0,0 +1,27 @@ +@inproceedings{DBLP:conf/ircdl/AftarGGRB24, + author = {Sania Aftar and +Luca Gagliardelli and +Amina El Ganadi and +Federico Ruozzi and +Sonia Bergamaschi}, + bibsource = {dblp computer science bibliography, https://dblp.org}, + biburl = {https://dblp.org/rec/conf/ircdl/AftarGGRB24.bib}, + booktitle = {Proceedings of the 20th Conference on Information and Research science +Connecting to Digital and Library science (formerly the Italian Research +Conference on Digital Libraries), Bressanone, Brixen, Italy - 22-23 +February 2024}, + editor = {Eleonora Bernasconi and +Andrea Mannocci and +Antonella Poggi and +Angelo A. Salatino and +Gianmaria Silvello}, + pages = {117--125}, + publisher = {CEUR-WS.org}, + series = {CEUR Workshop Proceedings}, + timestamp = {Fri, 01 Mar 2024 16:26:21 +0100}, + title = {A Novel Methodology for Topic Identification in Hadith}, + url = {https://ceur-ws.org/Vol-3643/paper12.pdf}, + volume = {3643}, + year = {2024} +} + diff --git a/publication/dblp-confircdl-aftar-ggrb-24/index.html b/publication/dblp-confircdl-aftar-ggrb-24/index.html new file mode 100644 index 0000000..33227ed --- /dev/null +++ b/publication/dblp-confircdl-aftar-ggrb-24/index.html @@ -0,0 +1,1402 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + A Novel Methodology for Topic Identification in Hadith | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + +
+

A Novel Methodology for Topic Identification in Hadith

+ + + + + + + + + + + + + + + + + + +
+ + + +
+ + + + + +
+
+
+
+
Type
+ +
+
+
+
+
+ + + +
+
+
+
+
Publication
+
Proceedings of the 20th Conference on Information and Research science Connecting to Digital and Library science (formerly the Italian Research Conference on Digital Libraries), Bressanone, Brixen, Italy - 22-23 February 2024
+
+
+
+
+
+ + +
+ +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/publication/dblp-confrtsi-orsini-cmggmt-17/index.html b/publication/dblp-confrtsi-orsini-cmggmt-17/index.html index be4d83f..c575cef 100644 --- a/publication/dblp-confrtsi-orsini-cmggmt-17/index.html +++ b/publication/dblp-confrtsi-orsini-cmggmt-17/index.html @@ -1,6 +1,6 @@ - + @@ -1246,7 +1246,7 @@

The Italian FSHD registry: An enhanced data integration and analytics framew diff --git a/publication/dblp-confsebd-beneventano-bgs-19/index.html b/publication/dblp-confsebd-beneventano-bgs-19/index.html index d15610e..e5efd5c 100644 --- a/publication/dblp-confsebd-beneventano-bgs-19/index.html +++ b/publication/dblp-confsebd-beneventano-bgs-19/index.html @@ -1,6 +1,6 @@ - + @@ -1213,7 +1213,7 @@

Entity Resolution and Data Fusion: An Integrated Approach

diff --git a/publication/dblp-confsebd-gagliardelli-0-sb-23/index.html b/publication/dblp-confsebd-gagliardelli-0-sb-23/index.html index 09777cc..70f1ae0 100644 --- a/publication/dblp-confsebd-gagliardelli-0-sb-23/index.html +++ b/publication/dblp-confsebd-gagliardelli-0-sb-23/index.html @@ -1,6 +1,6 @@ - + @@ -1228,7 +1228,7 @@

A general approach to Supervised Meta-Blocking

diff --git a/publication/dblp-confsebd-gagliardelli-sb-20/index.html b/publication/dblp-confsebd-gagliardelli-sb-20/index.html index 7aef8cc..19c1e95 100644 --- a/publication/dblp-confsebd-gagliardelli-sb-20/index.html +++ b/publication/dblp-confsebd-gagliardelli-sb-20/index.html @@ -1,6 +1,6 @@ - + @@ -1206,7 +1206,7 @@

Scaling Up Record-level Matching Rules

diff --git a/publication/dblp-confsebd-simonini-grzsabb-22/index.html b/publication/dblp-confsebd-simonini-grzsabb-22/index.html index b39c53f..515eb21 100644 --- a/publication/dblp-confsebd-simonini-grzsabb-22/index.html +++ b/publication/dblp-confsebd-simonini-grzsabb-22/index.html @@ -1,6 +1,6 @@ - + @@ -1241,7 +1241,7 @@

Progressive Entity Resolution with Node Embeddings

diff --git a/publication/dblp-confsebd-simonini-sgzbb-21/index.html b/publication/dblp-confsebd-simonini-sgzbb-21/index.html index 2b019af..897981f 100644 --- a/publication/dblp-confsebd-simonini-sgzbb-21/index.html +++ b/publication/dblp-confsebd-simonini-sgzbb-21/index.html @@ -1,6 +1,6 @@ - + @@ -1227,7 +1227,7 @@

The Case for Multi-task Active Learning Entity Resolution (Discussion Paper) diff --git a/publication/dblp-journalscorrabs-2204-08801/index.html b/publication/dblp-journalscorrabs-2204-08801/index.html index 0de03c4..783d855 100644 --- a/publication/dblp-journalscorrabs-2204-08801/index.html +++ b/publication/dblp-journalscorrabs-2204-08801/index.html @@ -1,6 +1,6 @@ - + @@ -1232,7 +1232,7 @@

Generalized Supervised Meta-blocking (technical report)

diff --git a/publication/dblp-journalscorrabs-2312-11122/cite.bib b/publication/dblp-journalscorrabs-2312-11122/cite.bib new file mode 100644 index 0000000..24e8b68 --- /dev/null +++ b/publication/dblp-journalscorrabs-2312-11122/cite.bib @@ -0,0 +1,21 @@ +@article{DBLP:journals/corr/abs-2312-11122, + author = {Angelo Mozzillo and +Luca Zecchini and +Luca Gagliardelli and +Adeel Aslam and +Sonia Bergamaschi and +Giovanni Simonini}, + bibsource = {dblp computer science bibliography, https://dblp.org}, + biburl = {https://dblp.org/rec/journals/corr/abs-2312-11122.bib}, + doi = {10.48550/ARXIV.2312.11122}, + eprint = {2312.11122}, + eprinttype = {arXiv}, + journal = {CoRR}, + timestamp = {Tue, 16 Jan 2024 11:57:42 +0100}, + title = {Evaluation of Dataframe Libraries for Data Preparation on a Single +Machine}, + url = {https://doi.org/10.48550/arXiv.2312.11122}, + volume = {abs/2312.11122}, + year = {2023} +} + diff --git a/publication/dblp-journalscorrabs-2312-11122/index.html b/publication/dblp-journalscorrabs-2312-11122/index.html new file mode 100644 index 0000000..b11f9d4 --- /dev/null +++ b/publication/dblp-journalscorrabs-2312-11122/index.html @@ -0,0 +1,1421 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Evaluation of Dataframe Libraries for Data Preparation on a Single Machine | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + +
+

Evaluation of Dataframe Libraries for Data Preparation on a Single Machine

+ + + + + + + + + + + + + + + + + + +
+ + + +
+ + + + + +
+
+
+
+
Type
+ +
+
+
+
+
+ + + +
+
+
+
+
Publication
+
CoRR
+
+
+
+
+
+ + +
+ +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/publication/dblp-journalscorrabs-2312-12902/cite.bib b/publication/dblp-journalscorrabs-2312-12902/cite.bib new file mode 100644 index 0000000..1fe7214 --- /dev/null +++ b/publication/dblp-journalscorrabs-2312-12902/cite.bib @@ -0,0 +1,22 @@ +@article{DBLP:journals/corr/abs-2312-12902, + author = {Luca Gagliardelli and +Domenico Beneventano and +Marco Esposito and +Luca Zecchini and +Giovanni Simonini and +Sonia Bergamaschi and +Fabio Miselli and +Giuseppe Calogero Miano}, + bibsource = {dblp computer science bibliography, https://dblp.org}, + biburl = {https://dblp.org/rec/journals/corr/abs-2312-12902.bib}, + doi = {10.48550/ARXIV.2312.12902}, + eprint = {2312.12902}, + eprinttype = {arXiv}, + journal = {CoRR}, + timestamp = {Wed, 17 Jan 2024 15:55:49 +0100}, + title = {DXP: Billing Data Preparation for Big Data Analytics}, + url = {https://doi.org/10.48550/arXiv.2312.12902}, + volume = {abs/2312.12902}, + year = {2023} +} + diff --git a/publication/dblp-journalscorrabs-2312-12902/index.html b/publication/dblp-journalscorrabs-2312-12902/index.html new file mode 100644 index 0000000..b6fc827 --- /dev/null +++ b/publication/dblp-journalscorrabs-2312-12902/index.html @@ -0,0 +1,1435 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + DXP: Billing Data Preparation for Big Data Analytics | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + +
+

DXP: Billing Data Preparation for Big Data Analytics

+ + + + + + + + + + + + + + + + + + +
+ + + +
+ + + + + +
+
+
+
+
Type
+ +
+
+
+
+
+ + + +
+
+
+
+
Publication
+
CoRR
+
+
+
+
+
+ + +
+ +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/publication/dblp-journalsis-gagliardelli-psbp-24/cite.bib b/publication/dblp-journalsis-gagliardelli-psbp-24/cite.bib new file mode 100644 index 0000000..c430da2 --- /dev/null +++ b/publication/dblp-journalsis-gagliardelli-psbp-24/cite.bib @@ -0,0 +1,19 @@ +@article{DBLP:journals/is/GagliardelliPSBP24, + author = {Luca Gagliardelli and +George Papadakis and +Giovanni Simonini and +Sonia Bergamaschi and +Themis Palpanas}, + bibsource = {dblp computer science bibliography, https://dblp.org}, + biburl = {https://dblp.org/rec/journals/is/GagliardelliPSBP24.bib}, + doi = {10.1016/J.IS.2023.102307}, + journal = {Inf. Syst.}, + pages = {102307}, + timestamp = {Sat, 08 Jun 2024 13:15:20 +0200}, + title = {GSM: A generalized approach to Supervised Meta-blocking for scalable +entity resolution}, + url = {https://doi.org/10.1016/j.is.2023.102307}, + volume = {120}, + year = {2024} +} + diff --git a/publication/dblp-journalsis-gagliardelli-psbp-24/index.html b/publication/dblp-journalsis-gagliardelli-psbp-24/index.html new file mode 100644 index 0000000..32059fc --- /dev/null +++ b/publication/dblp-journalsis-gagliardelli-psbp-24/index.html @@ -0,0 +1,1414 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + GSM: A generalized approach to Supervised Meta-blocking for scalable entity resolution | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + +
+

GSM: A generalized approach to Supervised Meta-blocking for scalable entity resolution

+ + + + + + + + + + + + + + + + + + +
+ + + +
+ + + + + +
+
+
+
+
Type
+ +
+
+
+
+
+ + + +
+
+
+
+
Publication
+
Information Systems
+
+
+
+
+
+ + +
+ +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/publication/dblp-journalsis-mandilaras-0-gstg-21/index.html b/publication/dblp-journalsis-mandilaras-0-gstg-21/index.html index 4d4ad2b..9e35e2a 100644 --- a/publication/dblp-journalsis-mandilaras-0-gstg-21/index.html +++ b/publication/dblp-journalsis-mandilaras-0-gstg-21/index.html @@ -1,6 +1,6 @@ - + @@ -1274,7 +1274,7 @@

Reproducible experiments on Three-Dimensional Entity Resolution with JedAI - © 2023. + © 2024.

diff --git a/publication/dblp-journalsis-papadakis-mgstgb-20/index.html b/publication/dblp-journalsis-papadakis-mgstgb-20/index.html index c4f7b04..7be4147 100644 --- a/publication/dblp-journalsis-papadakis-mgstgb-20/index.html +++ b/publication/dblp-journalsis-papadakis-mgstgb-20/index.html @@ -1,6 +1,6 @@ - + @@ -1260,7 +1260,7 @@

Three-dimensional Entity Resolution with JedAI

diff --git a/publication/dblp-journalsis-simonini-gbj-19/index.html b/publication/dblp-journalsis-simonini-gbj-19/index.html index 87485c5..0ee08cb 100644 --- a/publication/dblp-journalsis-simonini-gbj-19/index.html +++ b/publication/dblp-journalsis-simonini-gbj-19/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@

Scaling entity resolution: A loosely schema-aware approach

diff --git a/publication/dblp-journalsjdiq-beneventano-bgs-20/index.html b/publication/dblp-journalsjdiq-beneventano-bgs-20/index.html index 42e27ca..fc719b6 100644 --- a/publication/dblp-journalsjdiq-beneventano-bgs-20/index.html +++ b/publication/dblp-journalsjdiq-beneventano-bgs-20/index.html @@ -1,6 +1,6 @@ - + @@ -1225,7 +1225,7 @@

emphBLAST2: An Efficient Technique for Loose Schema Information Extraction f diff --git a/publication/dblp-journalspvldb-gagliardelli-psb-22/index.html b/publication/dblp-journalspvldb-gagliardelli-psb-22/index.html index 09edd2d..2e774c7 100644 --- a/publication/dblp-journalspvldb-gagliardelli-psb-22/index.html +++ b/publication/dblp-journalspvldb-gagliardelli-psb-22/index.html @@ -1,6 +1,6 @@ - + @@ -1236,7 +1236,7 @@

Generalized Supervised Meta-blocking

diff --git a/publication/gagliardelli-2023-big/index.html b/publication/gagliardelli-2023-big/index.html index b3f07ea..9ee1fa9 100644 --- a/publication/gagliardelli-2023-big/index.html +++ b/publication/gagliardelli-2023-big/index.html @@ -1,6 +1,6 @@ - + @@ -1260,7 +1260,7 @@

A big data platform exploiting auditable tokenization to promote good practi diff --git a/publication/index.html b/publication/index.html index 5aa90f6..30dc004 100644 --- a/publication/index.html +++ b/publication/index.html @@ -1,6 +1,6 @@ - + @@ -326,7 +326,7 @@ - + @@ -868,6 +868,24 @@

Publications

+ + + + + + + + + + + + + + + + + + @@ -921,6 +939,10 @@

Publications

+ + @@ -965,6 +987,261 @@

Publications

+
+ + + +
+ + + + + + + (2024). + Stream-aware indexing for distributed inequality join processing. + Information Systems. + +

+ + + + + + + + + + + + + + + + Cite + + + + + + + + + + + + + + + + DOI + + + + + + + + + + + + + + + + URL + +

+ + + +
+ +
+ + + + + + + +
+ + + +
+ + + + + + + (2024). + GSM: A generalized approach to Supervised Meta-blocking for scalable entity resolution. + Information Systems. + +

+ + + + + + + + + + + + + + + + Cite + + + + + + + + + + + + + + + + DOI + + + + + + + + + + + + + + + + URL + +

+ + + +
+ +
+ + + + + + + +
+ + + +
+ + + + + + + (2024). + A Novel Methodology for Topic Identification in Hadith. + Proceedings of the 20th Conference on Information and Research science Connecting to Digital and Library science (formerly the Italian Research Conference on Digital Libraries), Bressanone, Brixen, Italy - 22-23 February 2024. + +

+ + + + + + + + + + + + + + + + PDF + + + + + + Cite + + + + + + + + + + + + + + + +

+ + + +
+ +
+ + + + + + +
@@ -1139,6 +1416,188 @@

Publications

+
+ + + +
+ + + + + + + (2023). + Evaluation of Dataframe Libraries for Data Preparation on a Single Machine. + CoRR. + +

+ + + + + + + + + + + + + + + + Cite + + + + + + + + + + + + + + + + DOI + + + + + + + + + + + + + + + + URL + +

+ + + +
+ +
+ + + + + + + +
+ + + +
+ + + + + + + (2023). + DXP: Billing Data Preparation for Big Data Analytics. + CoRR. + +

+ + + + + + + + + + + + + + + + Cite + + + + + + + + + + + + + + + + DOI + + + + + + + + + + + + + + + + URL + +

+ + + +
+ +
+ + + + + + +
@@ -1224,6 +1683,92 @@

Publications

+
+ + + +
+ + + + + + + (2023). + A Big Data Platform for the Management of Local Energy Communities Data. + IEEE International Conference on Big Data, BigData 2023, Sorrento, Italy, December 15-18, 2023. + +

+ + + + + + + + + + + + + + + + Cite + + + + + + + + + + + + + + + + DOI + + + + + + + + + + + + + + + + URL + +

+ + + +
+ +
+ + + + + + +
@@ -3032,7 +3577,7 @@

Publications

diff --git a/publication/index.xml b/publication/index.xml index 486797a..2f2dbc4 100644 --- a/publication/index.xml +++ b/publication/index.xml @@ -5,13 +5,37 @@ http://www.lucagagliardelli.com/publication/ Publications - Wowchemy (https://wowchemy.com)en-usSun, 01 Jan 2023 00:00:00 +0000 + Wowchemy (https://wowchemy.com)en-usMon, 01 Jan 2024 00:00:00 +0000 http://www.lucagagliardelli.com/media/icon_hu0b7a4cb9992c9ac0e91bd28ffd38dd00_9727_512x512_fill_lanczos_center_3.png Publications http://www.lucagagliardelli.com/publication/ + + A Novel Methodology for Topic Identification in Hadith + http://www.lucagagliardelli.com/publication/dblp-confircdl-aftar-ggrb-24/ + Mon, 01 Jan 2024 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/dblp-confircdl-aftar-ggrb-24/ + + + + + GSM: A generalized approach to Supervised Meta-blocking for scalable entity resolution + http://www.lucagagliardelli.com/publication/dblp-journalsis-gagliardelli-psbp-24/ + Mon, 01 Jan 2024 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/dblp-journalsis-gagliardelli-psbp-24/ + + + + + Stream-aware indexing for distributed inequality join processing + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + Mon, 01 Jan 2024 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + + + A big data platform exploiting auditable tokenization to promote good practices inside local energy communities http://www.lucagagliardelli.com/publication/gagliardelli-2023-big/ @@ -20,6 +44,14 @@ + + A Big Data Platform for the Management of Local Energy Communities Data + http://www.lucagagliardelli.com/publication/dblp-confbigdataconf-bergamaschi-g-23/ + Sun, 01 Jan 2023 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/dblp-confbigdataconf-bergamaschi-g-23/ + + + A general approach to Supervised Meta-Blocking http://www.lucagagliardelli.com/publication/dblp-confsebd-gagliardelli-0-sb-23/ @@ -28,6 +60,22 @@ + + DXP: Billing Data Preparation for Big Data Analytics + http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-12902/ + Sun, 01 Jan 2023 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-12902/ + + + + + Evaluation of Dataframe Libraries for Data Preparation on a Single Machine + http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-11122/ + Sun, 01 Jan 2023 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-11122/ + + + HKS: Efficient Data Partitioning for Stateful Streaming http://www.lucagagliardelli.com/publication/dblp-confdawak-aslam-sgmb-23/ diff --git a/publication_types/index.html b/publication_types/index.html index de5a2eb..67caba6 100644 --- a/publication_types/index.html +++ b/publication_types/index.html @@ -1,6 +1,6 @@ - + @@ -326,7 +326,7 @@ - + @@ -858,7 +858,7 @@

Publication_types

- Oct 16, 2023 + Jul 8, 2024 @@ -932,7 +932,7 @@

Publication_types

- Jan 16, 2023 + Jul 8, 2024 @@ -1158,7 +1158,7 @@

Publication_types

diff --git a/publication_types/index.xml b/publication_types/index.xml index 67a4fea..4f874c1 100644 --- a/publication_types/index.xml +++ b/publication_types/index.xml @@ -5,7 +5,7 @@ http://www.lucagagliardelli.com/publication_types/ Publication_types - Wowchemy (https://wowchemy.com)en-usSun, 01 Jan 2023 00:00:00 +0000 + Wowchemy (https://wowchemy.com)en-usMon, 01 Jan 2024 00:00:00 +0000 http://www.lucagagliardelli.com/media/icon_hu0b7a4cb9992c9ac0e91bd28ffd38dd00_9727_512x512_fill_lanczos_center_3.png Publication_types diff --git a/sitemap.xml b/sitemap.xml index 1b75d2b..2200352 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -3,11 +3,59 @@ xmlns:xhtml="http://www.w3.org/1999/xhtml"> http://www.lucagagliardelli.com/publication-type/1/ - 2023-10-16T09:16:24+02:00 + 2024-07-08T15:03:56+02:00 weekly http://www.lucagagliardelli.com/publication-type/2/ - 2023-01-16T10:51:09+01:00 + 2024-07-08T15:08:35+02:00 + weekly + + http://www.lucagagliardelli.com/publication/dblp-confircdl-aftar-ggrb-24/ + 2024-07-08T15:03:56+02:00 + weekly + + http://www.lucagagliardelli.com/tag/augmented-sketch/ + 2024-07-08T15:08:35+02:00 + weekly + + http://www.lucagagliardelli.com/tag/btree-indexing/ + 2024-07-08T15:08:35+02:00 + weekly + + http://www.lucagagliardelli.com/tag/distributed-stream-processing-system/ + 2024-07-08T15:08:35+02:00 + weekly + + http://www.lucagagliardelli.com/publication/dblp-journalsis-gagliardelli-psbp-24/ + 2024-07-08T15:03:51+02:00 + weekly + + http://www.lucagagliardelli.com/tag/inequality-join/ + 2024-07-08T15:08:35+02:00 + weekly + + http://www.lucagagliardelli.com/ + 2024-07-08T15:08:35+02:00 + weekly + + http://www.lucagagliardelli.com/publication_types/ + 2024-07-08T15:08:35+02:00 + weekly + + http://www.lucagagliardelli.com/publication/ + 2024-07-08T15:08:35+02:00 + weekly + + http://www.lucagagliardelli.com/tag/skewed-data-distribution/ + 2024-07-08T15:08:35+02:00 + weekly + + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + 2024-07-08T15:08:35+02:00 + weekly + + http://www.lucagagliardelli.com/tags/ + 2024-07-08T15:08:35+02:00 weekly http://www.lucagagliardelli.com/publication-type/5/ @@ -18,27 +66,27 @@ 2023-01-16T10:51:09+01:00 weekly - http://www.lucagagliardelli.com/publication/dblp-confsebd-gagliardelli-0-sb-23/ - 2023-10-16T09:16:24+02:00 + http://www.lucagagliardelli.com/publication/dblp-confbigdataconf-bergamaschi-g-23/ + 2024-07-08T15:03:49+02:00 weekly - http://www.lucagagliardelli.com/publication/dblp-confdawak-aslam-sgmb-23/ + http://www.lucagagliardelli.com/publication/dblp-confsebd-gagliardelli-0-sb-23/ 2023-10-16T09:16:24+02:00 weekly - http://www.lucagagliardelli.com/ - 2023-10-16T09:17:24+02:00 + http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-12902/ + 2024-07-08T15:03:54+02:00 weekly - http://www.lucagagliardelli.com/publication/basidati-2023/ - 2023-10-16T09:17:24+02:00 + http://www.lucagagliardelli.com/publication/dblp-journalscorrabs-2312-11122/ + 2024-07-08T15:03:53+02:00 weekly - http://www.lucagagliardelli.com/publication_types/ - 2023-10-16T09:17:24+02:00 + http://www.lucagagliardelli.com/publication/dblp-confdawak-aslam-sgmb-23/ + 2023-10-16T09:16:24+02:00 weekly - http://www.lucagagliardelli.com/publication/ + http://www.lucagagliardelli.com/publication/basidati-2023/ 2023-10-16T09:17:24+02:00 weekly @@ -139,8 +187,5 @@ http://www.lucagagliardelli.com/categories/ weekly - - http://www.lucagagliardelli.com/tags/ - weekly diff --git a/tag/augmented-sketch/index.html b/tag/augmented-sketch/index.html new file mode 100644 index 0000000..4b27e83 --- /dev/null +++ b/tag/augmented-sketch/index.html @@ -0,0 +1,1161 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Augmented sketch | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + +
+

Augmented sketch

+ + + + +
+ + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+ +
+ Stream-aware indexing for distributed inequality join processing +
+ + + +
+ Inequality join is an operator to join data on inequality conditions and it is a fundamental building block for applications. While … +
+
+ + + + + + + + +
+
+ + +
+
+ + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/tag/augmented-sketch/index.xml b/tag/augmented-sketch/index.xml new file mode 100644 index 0000000..714bd66 --- /dev/null +++ b/tag/augmented-sketch/index.xml @@ -0,0 +1,24 @@ + + + + Augmented sketch | Luca Gagliardelli + http://www.lucagagliardelli.com/tag/augmented-sketch/ + + Augmented sketch + Wowchemy (https://wowchemy.com)en-usMon, 01 Jan 2024 00:00:00 +0000 + + http://www.lucagagliardelli.com/media/icon_hu0b7a4cb9992c9ac0e91bd28ffd38dd00_9727_512x512_fill_lanczos_center_3.png + Augmented sketch + http://www.lucagagliardelli.com/tag/augmented-sketch/ + + + + Stream-aware indexing for distributed inequality join processing + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + Mon, 01 Jan 2024 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + + + + + diff --git a/tag/augmented-sketch/page/1/index.html b/tag/augmented-sketch/page/1/index.html new file mode 100644 index 0000000..973a2c5 --- /dev/null +++ b/tag/augmented-sketch/page/1/index.html @@ -0,0 +1,10 @@ + + + + http://www.lucagagliardelli.com/tag/augmented-sketch/ + + + + + + diff --git a/tag/btree-indexing/index.html b/tag/btree-indexing/index.html new file mode 100644 index 0000000..f87c974 --- /dev/null +++ b/tag/btree-indexing/index.html @@ -0,0 +1,1161 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Btree indexing | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + +
+

Btree indexing

+ + + + +
+ + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+ +
+ Stream-aware indexing for distributed inequality join processing +
+ + + +
+ Inequality join is an operator to join data on inequality conditions and it is a fundamental building block for applications. While … +
+
+ + + + + + + + +
+
+ + +
+
+ + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/tag/btree-indexing/index.xml b/tag/btree-indexing/index.xml new file mode 100644 index 0000000..be42d7c --- /dev/null +++ b/tag/btree-indexing/index.xml @@ -0,0 +1,24 @@ + + + + Btree indexing | Luca Gagliardelli + http://www.lucagagliardelli.com/tag/btree-indexing/ + + Btree indexing + Wowchemy (https://wowchemy.com)en-usMon, 01 Jan 2024 00:00:00 +0000 + + http://www.lucagagliardelli.com/media/icon_hu0b7a4cb9992c9ac0e91bd28ffd38dd00_9727_512x512_fill_lanczos_center_3.png + Btree indexing + http://www.lucagagliardelli.com/tag/btree-indexing/ + + + + Stream-aware indexing for distributed inequality join processing + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + Mon, 01 Jan 2024 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + + + + + diff --git a/tag/btree-indexing/page/1/index.html b/tag/btree-indexing/page/1/index.html new file mode 100644 index 0000000..b063878 --- /dev/null +++ b/tag/btree-indexing/page/1/index.html @@ -0,0 +1,10 @@ + + + + http://www.lucagagliardelli.com/tag/btree-indexing/ + + + + + + diff --git a/tag/distributed-stream-processing-system/index.html b/tag/distributed-stream-processing-system/index.html new file mode 100644 index 0000000..e4d653a --- /dev/null +++ b/tag/distributed-stream-processing-system/index.html @@ -0,0 +1,1161 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Distributed stream processing system | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + +
+

Distributed stream processing system

+ + + + +
+ + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+ +
+ Stream-aware indexing for distributed inequality join processing +
+ + + +
+ Inequality join is an operator to join data on inequality conditions and it is a fundamental building block for applications. While … +
+
+ + + + + + + + +
+
+ + +
+
+ + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/tag/distributed-stream-processing-system/index.xml b/tag/distributed-stream-processing-system/index.xml new file mode 100644 index 0000000..d359d83 --- /dev/null +++ b/tag/distributed-stream-processing-system/index.xml @@ -0,0 +1,24 @@ + + + + Distributed stream processing system | Luca Gagliardelli + http://www.lucagagliardelli.com/tag/distributed-stream-processing-system/ + + Distributed stream processing system + Wowchemy (https://wowchemy.com)en-usMon, 01 Jan 2024 00:00:00 +0000 + + http://www.lucagagliardelli.com/media/icon_hu0b7a4cb9992c9ac0e91bd28ffd38dd00_9727_512x512_fill_lanczos_center_3.png + Distributed stream processing system + http://www.lucagagliardelli.com/tag/distributed-stream-processing-system/ + + + + Stream-aware indexing for distributed inequality join processing + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + Mon, 01 Jan 2024 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + + + + + diff --git a/tag/distributed-stream-processing-system/page/1/index.html b/tag/distributed-stream-processing-system/page/1/index.html new file mode 100644 index 0000000..d4eab87 --- /dev/null +++ b/tag/distributed-stream-processing-system/page/1/index.html @@ -0,0 +1,10 @@ + + + + http://www.lucagagliardelli.com/tag/distributed-stream-processing-system/ + + + + + + diff --git a/tag/inequality-join/index.html b/tag/inequality-join/index.html new file mode 100644 index 0000000..bc95c75 --- /dev/null +++ b/tag/inequality-join/index.html @@ -0,0 +1,1161 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Inequality join | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + +
+

Inequality join

+ + + + +
+ + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+ +
+ Stream-aware indexing for distributed inequality join processing +
+ + + +
+ Inequality join is an operator to join data on inequality conditions and it is a fundamental building block for applications. While … +
+
+ + + + + + + + +
+
+ + +
+
+ + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/tag/inequality-join/index.xml b/tag/inequality-join/index.xml new file mode 100644 index 0000000..c4874a6 --- /dev/null +++ b/tag/inequality-join/index.xml @@ -0,0 +1,24 @@ + + + + Inequality join | Luca Gagliardelli + http://www.lucagagliardelli.com/tag/inequality-join/ + + Inequality join + Wowchemy (https://wowchemy.com)en-usMon, 01 Jan 2024 00:00:00 +0000 + + http://www.lucagagliardelli.com/media/icon_hu0b7a4cb9992c9ac0e91bd28ffd38dd00_9727_512x512_fill_lanczos_center_3.png + Inequality join + http://www.lucagagliardelli.com/tag/inequality-join/ + + + + Stream-aware indexing for distributed inequality join processing + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + Mon, 01 Jan 2024 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + + + + + diff --git a/tag/inequality-join/page/1/index.html b/tag/inequality-join/page/1/index.html new file mode 100644 index 0000000..ac8ad84 --- /dev/null +++ b/tag/inequality-join/page/1/index.html @@ -0,0 +1,10 @@ + + + + http://www.lucagagliardelli.com/tag/inequality-join/ + + + + + + diff --git a/tag/skewed-data-distribution/index.html b/tag/skewed-data-distribution/index.html new file mode 100644 index 0000000..a7ad1e8 --- /dev/null +++ b/tag/skewed-data-distribution/index.html @@ -0,0 +1,1161 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Skewed data distribution | Luca Gagliardelli + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + +
+

Skewed data distribution

+ + + + +
+ + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+ +
+ Stream-aware indexing for distributed inequality join processing +
+ + + +
+ Inequality join is an operator to join data on inequality conditions and it is a fundamental building block for applications. While … +
+
+ + + + + + + + +
+
+ + +
+
+ + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/tag/skewed-data-distribution/index.xml b/tag/skewed-data-distribution/index.xml new file mode 100644 index 0000000..8edf039 --- /dev/null +++ b/tag/skewed-data-distribution/index.xml @@ -0,0 +1,24 @@ + + + + Skewed data distribution | Luca Gagliardelli + http://www.lucagagliardelli.com/tag/skewed-data-distribution/ + + Skewed data distribution + Wowchemy (https://wowchemy.com)en-usMon, 01 Jan 2024 00:00:00 +0000 + + http://www.lucagagliardelli.com/media/icon_hu0b7a4cb9992c9ac0e91bd28ffd38dd00_9727_512x512_fill_lanczos_center_3.png + Skewed data distribution + http://www.lucagagliardelli.com/tag/skewed-data-distribution/ + + + + Stream-aware indexing for distributed inequality join processing + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + Mon, 01 Jan 2024 00:00:00 +0000 + http://www.lucagagliardelli.com/publication/aslam-2024102425/ + + + + + diff --git a/tag/skewed-data-distribution/page/1/index.html b/tag/skewed-data-distribution/page/1/index.html new file mode 100644 index 0000000..723887b --- /dev/null +++ b/tag/skewed-data-distribution/page/1/index.html @@ -0,0 +1,10 @@ + + + + http://www.lucagagliardelli.com/tag/skewed-data-distribution/ + + + + + + diff --git a/tags/index.html b/tags/index.html index d858362..7e252a1 100644 --- a/tags/index.html +++ b/tags/index.html @@ -1,6 +1,6 @@ - + @@ -326,6 +326,8 @@ + + @@ -813,6 +815,376 @@

Tags

+ + + + + + + + + + + + + + + +
+
+ +
+ Augmented sketch +
+ + + + + + + +
+
+ + +
+
+ + + + + + + + + + + + + + + + + +
+
+ +
+ Btree indexing +
+ + + + + + + +
+
+ + +
+
+ + + + + + + + + + + + + + + + + +
+
+ +
+ Distributed stream processing system +
+ + + + + + + +
+
+ + +
+
+ + + + + + + + + + + + + + + + + +
+
+ +
+ Inequality join +
+ + + + + + + +
+
+ + +
+
+ + + + + + + + + + + + + + + + + +
+
+ +
+ Skewed data distribution +
+ + + + + + + +
+
+ + +
+
+ + @@ -860,7 +1232,7 @@

Tags

diff --git a/tags/index.xml b/tags/index.xml index 82a63ca..2752b07 100644 --- a/tags/index.xml +++ b/tags/index.xml @@ -5,7 +5,7 @@ http://www.lucagagliardelli.com/tags/ Tags - Wowchemy (https://wowchemy.com)en-us + Wowchemy (https://wowchemy.com)en-usMon, 01 Jan 2024 00:00:00 +0000 http://www.lucagagliardelli.com/media/icon_hu0b7a4cb9992c9ac0e91bd28ffd38dd00_9727_512x512_fill_lanczos_center_3.png Tags diff --git a/talk/ecdp-@-dataplat-2022/index.html b/talk/ecdp-@-dataplat-2022/index.html index 5bb031f..2f9eab2 100644 --- a/talk/ecdp-@-dataplat-2022/index.html +++ b/talk/ecdp-@-dataplat-2022/index.html @@ -1,6 +1,6 @@ - + @@ -1300,7 +1300,7 @@
Fixed-term Researcher
diff --git a/talk/generalized-supervised-meta-blocking-@-vldb-2022/index.html b/talk/generalized-supervised-meta-blocking-@-vldb-2022/index.html index fa4ad3d..49e9aab 100644 --- a/talk/generalized-supervised-meta-blocking-@-vldb-2022/index.html +++ b/talk/generalized-supervised-meta-blocking-@-vldb-2022/index.html @@ -1,6 +1,6 @@ - + @@ -1308,7 +1308,7 @@
Fixed-term Researcher