From 8e08154ada0d1bb24fdc9ef50b6d78be1989e42d Mon Sep 17 00:00:00 2001
From: svaderia
Date: Tue, 7 Oct 2025 07:21:47 -0400
Subject: [PATCH 1/7] Lemire's Range Mapping trick

---
Notes:
    Review: year set to 2016 so that it agrees with the post date in the
    URL (2016/06/27) and with the citation key.
    Line breaks and indentation of this series were reconstructed; if the
    hunk context does not match ref.bib, apply with
    `git am --ignore-whitespace`. Blob ids on the index line predate this
    edit.

 ref.bib | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/ref.bib b/ref.bib
index 6177b32..9420fa1 100644
--- a/ref.bib
+++ b/ref.bib
@@ -33742,3 +33742,11 @@ @article{wang:pacmdata2023
   address = {New York, NY, USA},
   numpages = 23
 }
+
+@misc{www-lemire-fastmodulo2016,
+  author = {Lemire, Daniel},
+  title = {A fast alternative to the modulo reduction},
+  year = 2016,
+  month = jun,
+  howpublished = {\url{https://lemire.me/blog/2016/06/27/a-fast-alternative-to-the-modulo-reduction/}},
+}

From aff2cdee0f7772f2b55c65f8a994be929be9f185 Mon Sep 17 00:00:00 2001
From: svaderia
Date: Mon, 10 Nov 2025 07:52:45 -0500
Subject: [PATCH 2/7] Bitonic sort reference

---
Notes:
    Review: added the period after the author's middle initial.
    Blob ids on the index line predate this edit.

 ref.bib | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/ref.bib b/ref.bib
index 9420fa1..1d3b03f 100644
--- a/ref.bib
+++ b/ref.bib
@@ -33750,3 +33750,11 @@ @misc{www-lemire-fastmodulo2016
   month = jun,
   howpublished = {\url{https://lemire.me/blog/2016/06/27/a-fast-alternative-to-the-modulo-reduction/}},
 }
+
+@inproceedings{batcher1968sorting,
+  title={Sorting networks and their applications},
+  author={Batcher, Kenneth E.},
+  booktitle={Proceedings of the April 30--May 2, 1968, spring joint computer conference},
+  pages={307--314},
+  year={1968}
+}

From c1c3c2b4b65b8c8032a0cb9efb11ed631c70c47f Mon Sep 17 00:00:00 2001
From: svaderia
Date: Tue, 18 Nov 2025 20:22:55 -0500
Subject: [PATCH 3/7] Recent Bloom tutorial reference

---
 ref.bib | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)

diff --git a/ref.bib b/ref.bib
index 1d3b03f..2d07694 100644
--- a/ref.bib
+++ b/ref.bib
@@ -33758,3 +33758,25 @@ @inproceedings{batcher1968sorting
   pages={307--314},
   year={1968}
 }
+
+@inproceedings{pandey2024bloom,
+  author = {Prashant Pandey and
+            Mart{\'{\i}}n Farach{-}Colton and
+            Niv Dayan and
+            Huanchen Zhang},
+  editor = {Pablo Barcel{\'{o}} and
+            Nayat S{\'{a}}nchez Pi and
+            Alexandra Meliou and
+            S. Sudarshan},
+  title = {Beyond Bloom: {A} Tutorial on Future Feature-Rich Filters},
+  booktitle = {Companion of the 2024 International Conference on Management of Data,
+               {SIGMOD/PODS} 2024, Santiago AA, Chile, June 9-15, 2024},
+  pages = {636--644},
+  publisher = {{ACM}},
+  year = {2024},
+  url = {https://doi.org/10.1145/3626246.3654681},
+  doi = {10.1145/3626246.3654681},
+  timestamp = {Fri, 31 May 2024 21:05:26 +0200},
+  biburl = {https://dblp.org/rec/conf/sigmod/0001FDZ24.bib},
+  bibsource = {dblp computer science bibliography, https://dblp.org}
+}

From 929242526613eca268ce59d9a3525d27966c16a3 Mon Sep 17 00:00:00 2001
From: svaderia
Date: Thu, 20 Nov 2025 18:43:05 -0500
Subject: [PATCH 4/7] (cob) Cache oblivious literature

---
Notes:
    Review: page ranges now use `--`; glued author initials expanded to
    full names so abbreviating styles keep the middle initial; `B-trees`
    brace-protected in the title.
    Deliberately kept: the key `Bender2004` (the paper is from 2000, but
    renaming would break existing citations), the empty volume/number
    fields (removing them would shift later hunk offsets), and the missing
    comma after `Brodal2002` (patch 5/7 fixes it).
    Blob ids on the index line predate this edit.

 ref.bib | 37 +++++++++++++++++++++++++++++++++++++
 1 file changed, 37 insertions(+)

diff --git a/ref.bib b/ref.bib
index 2d07694..78a5caf 100644
--- a/ref.bib
+++ b/ref.bib
@@ -33780,3 +33780,40 @@ @inproceedings{pandey2024bloom
   biburl = {https://dblp.org/rec/conf/sigmod/0001FDZ24.bib},
   bibsource = {dblp computer science bibliography, https://dblp.org}
 }
+
+@inproceedings{frigo1999oblivious,
+  author={Frigo, Matteo and Leiserson, Charles E. and Prokop, Harald and Ramachandran, Sridhar},
+  booktitle={40th Annual Symposium on Foundations of Computer Science (Cat. No.99CB37039)},
+  title={Cache-oblivious algorithms},
+  year={1999},
+  volume={},
+  number={},
+  pages={285--297},
+  keywords={Sorting;Algorithm design and analysis;Strontium;Laboratories;Hardware;Central Processing Unit;Banking},
+  doi={10.1109/SFFCS.1999.814600}
+}
+
+@inproceedings{Bender2004,
+  author={Bender, Michael A. and Demaine, Erik D. and Farach-Colton, Martin},
+  booktitle={Proceedings 41st Annual Symposium on Foundations of Computer Science},
+  title={Cache-oblivious {B-trees}},
+  year={2000},
+  volume={},
+  number={},
+  pages={399--409},
+  keywords={Data structures;Computer science;Computer networks;Registers;Network-on-a-chip;Algorithm design and analysis;Laboratories;Costs;Central Processing Unit;Clustering algorithms},
+  doi={10.1109/SFCS.2000.892128}
+}
+
+@inproceedings{Brodal2002
+  author = {Brodal, Gerth St\o{}lting and Fagerberg, Rolf},
+  title = {Funnel Heap - A Cache Oblivious Priority Queue},
+  year = {2002},
+  isbn = {3540001425},
+  publisher = {Springer-Verlag},
+  address = {Berlin, Heidelberg},
+  booktitle = {Proceedings of the 13th International Symposium on Algorithms and Computation},
+  pages = {219--228},
+  numpages = {10},
+  series = {ISAAC '02}
+}

From a1a030c23c434bcc783de81dfd0d5dd722c14d36 Mon Sep 17 00:00:00 2001
From: svaderia
Date: Thu, 20 Nov 2025 18:46:43 -0500
Subject: [PATCH 5/7] (chore) fix missing ,

---
 ref.bib | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/ref.bib b/ref.bib
index 78a5caf..cf68384 100644
--- a/ref.bib
+++ b/ref.bib
@@ -33805,7 +33805,7 @@ @inproceedings{Bender2004
   doi={10.1109/SFCS.2000.892128}
 }
 
-@inproceedings{Brodal2002
+@inproceedings{Brodal2002,
   author = {Brodal, Gerth St\o{}lting and Fagerberg, Rolf},
   title = {Funnel Heap - A Cache Oblivious Priority Queue},
   year = {2002},

From b2f45434d3e19e127d9fc4bce5fbb882ffc7ff88 Mon Sep 17 00:00:00 2001
From: svaderia
Date: Fri, 21 Nov 2025 07:23:26 -0500
Subject: [PATCH 6/7] Filter literature

---
Notes:
    Review: page ranges now use `--` (one was a Unicode en dash); accents
    in surnames rewritten as BibTeX special characters ({\"u}, {\c{c}});
    `Bloom` brace-protected in titles and the lowercased Prefix-filter
    title restored to title case; fields of evne2022prefix indented like
    the other entries.
    Deliberately kept: the key `evne2022prefix` (typo for "even"), because
    renaming would break existing citations.
    Blob ids on the index line predate this edit.

 ref.bib | 84 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 84 insertions(+)

diff --git a/ref.bib b/ref.bib
index cf68384..0d1b8d4 100644
--- a/ref.bib
+++ b/ref.bib
@@ -33817,3 +33817,87 @@ @inproceedings{Brodal2002
   numpages = {10},
   series = {ISAAC '02}
 }
+
+@article{Lemire2020xor,
+  author = {Graf, Thomas Mueller and Lemire, Daniel},
+  title = {Xor Filters: Faster and Smaller Than {Bloom} and Cuckoo Filters},
+  year = {2020},
+  issue_date = {2020},
+  publisher = {Association for Computing Machinery},
+  address = {New York, NY, USA},
+  volume = {25},
+  issn = {1084-6654},
+  url = {https://doi.org/10.1145/3376122},
+  doi = {10.1145/3376122},
+  journal = {ACM J. Exp. Algorithmics},
+  month = mar,
+  articleno = {1.5},
+  numpages = {16},
+  keywords = {Bloom filters, approximate set membership, cuckoo filters}
+}
+
+@InProceedings{dillinger2022ribbon,
+  author = {Dillinger, Peter C. and H{\"u}bschle-Schneider, Lorenz and Sanders, Peter and Walzer, Stefan},
+  title = {{Fast Succinct Retrieval and Approximate Membership Using Ribbon}},
+  booktitle = {20th International Symposium on Experimental Algorithms (SEA 2022)},
+  pages = {4:1--4:20},
+  series = {Leibniz International Proceedings in Informatics (LIPIcs)},
+  ISBN = {978-3-95977-251-8},
+  ISSN = {1868-8969},
+  year = {2022},
+  volume = {233},
+  editor = {Schulz, Christian and U{\c{c}}ar, Bora},
+  publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
+  address = {Dagstuhl, Germany},
+  URL = {https://drops.dagstuhl.de/entities/document/10.4230/LIPIcs.SEA.2022.4},
+  URN = {urn:nbn:de:0030-drops-165385},
+  doi = {10.4230/LIPIcs.SEA.2022.4},
+  annote = {Keywords: AMQ, Bloom filter, dictionary, linear algebra, randomized algorithm, retrieval data structure, static function data structure, succinct data structure, perfect hashing}
+}
+
+@article{evne2022prefix,
+  author = {Even, Tomer and Even, Guy and Morrison, Adam},
+  title = {Prefix Filter: Practically and Theoretically Better Than {Bloom}},
+  year = {2022},
+  issue_date = {March 2022},
+  publisher = {VLDB Endowment},
+  volume = {15},
+  number = {7},
+  issn = {2150-8097},
+  url = {https://doi.org/10.14778/3523210.3523211},
+  doi = {10.14778/3523210.3523211},
+  journal = {Proc. VLDB Endow.},
+  month = mar,
+  pages = {1311--1323},
+  numpages = {13}
+}
+
+@inproceedings{Bender2018adaptive,
+  author={Bender, Michael A. and Farach-Colton, Martin and Goswami, Mayank and Johnson, Rob and McCauley, Samuel and Singh, Shikha},
+  booktitle={2018 IEEE 59th Annual Symposium on Foundations of Computer Science (FOCS)},
+  title={Bloom Filters, Adaptivity, and the Dictionary Problem},
+  year={2018},
+  volume={},
+  number={},
+  pages={182--193},
+  keywords={Dictionaries;Data structures;Games;Probabilistic logic;Measurement;Computer science;Random access memory;Bloom filters;approximate membership query data structures;adaptive data structures;dictionary data structures},
+  doi={10.1109/FOCS.2018.00026}
+}
+
+@article{mitzenmacher2020adaptivecuckoo,
+  author = {Mitzenmacher, Michael and Pontarelli, Salvatore and Reviriego, Pedro},
+  title = {Adaptive Cuckoo Filters},
+  year = {2020},
+  issue_date = {2020},
+  publisher = {Association for Computing Machinery},
+  address = {New York, NY, USA},
+  volume = {25},
+  issn = {1084-6654},
+  url = {https://doi.org/10.1145/3339504},
+  doi = {10.1145/3339504},
+  journal = {ACM J. Exp. Algorithmics},
+  month = mar,
+  articleno = {1.1},
+  numpages = {20},
+  keywords = {false positive rate, adaptive, Markov chains, Cuckoo hashing, Bloom filters}
+}

From ff050820713dacf4dce29b174f32ef67d4a949f8 Mon Sep 17 00:00:00 2001
From: svaderia
Date: Thu, 18 Dec 2025 15:22:35 -0500
Subject: [PATCH 7/7] PBF and cache tech report

---
Notes:
    Review: page ranges now use `--` (one was a Unicode en dash); the
    non-ASCII letter in the Almeida author name is written as {\'e} for
    classic BibTeX; `Bloom` brace-protected in titles and the lowercased
    Mullin title restored to title case.
    Blob ids on the index line predate this edit.

 ref.bib | 53 +++++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 53 insertions(+)

diff --git a/ref.bib b/ref.bib
index 0d1b8d4..c37c8a7 100644
--- a/ref.bib
+++ b/ref.bib
@@ -33901,3 +33901,56 @@ @article{mitzenmacher2020adaptivecuckoo
   numpages = {20},
   keywords = {false positive rate, adaptive, Markov chains, Cuckoo hashing, Bloom filters}
 }
+
+@article{Mullin1983pbf,
+  author = {Mullin, James K.},
+  title = {A Second Look at {Bloom} Filters},
+  year = {1983},
+  issue_date = {Aug. 1983},
+  publisher = {Association for Computing Machinery},
+  address = {New York, NY, USA},
+  volume = {26},
+  number = {8},
+  issn = {0001-0782},
+  url = {https://doi.org/10.1145/358161.358167},
+  doi = {10.1145/358161.358167},
+  journal = {Commun. ACM},
+  month = aug,
+  pages = {570--571},
+  numpages = {2},
+  keywords = {bloom, differential file, filter}
+}
+
+@article{Almeida2023pbf,
+  author={Almeida, Paulo S{\'e}rgio},
+  journal={IEEE Transactions on Computers},
+  title={A Case for Partitioned {Bloom} Filters},
+  year={2023},
+  volume={72},
+  number={6},
+  pages={1681--1691},
+  keywords={Standards;Hash functions;Proposals;Indexes;Hardware;Testing;Libraries;Information filtering;partitioned bloom filters;probabilistic data structures},
+  doi={10.1109/TC.2022.3218995}
+}
+
+@inproceedings{Sanchez2007pbf,
+  author={Sanchez, Daniel and Yen, Luke and Hill, Mark D. and Sankaralingam, Karthikeyan},
+  booktitle={40th Annual IEEE/ACM International Symposium on Microarchitecture (MICRO 2007)},
+  title={Implementing Signatures for Transactional Memory},
+  year={2007},
+  volume={},
+  number={},
+  pages={123--133},
+  keywords={Filters;Hardware;Read-write memory;Performance analysis;Hydrogen;Costs;System testing;Degradation;Space exploration;Dynamic programming},
+  doi={10.1109/MICRO.2007.24}
+}
+
+@techreport{Cooper2011PortableTT,
+  author = "Keith D. Cooper and Jeffrey A. Sandoval",
+  title = "Portable Techniques to Find Effective Memory Hierarchy Parameters",
+  institution = "Rice University",
+  year = 2011,
+  month = dec,
+  number = "TR-11-06",
+  type = "Technical Report"
+}