The following team members were involved in the SFB 876:
Erich Schubert Room: OH14 R334 Phone: +49 231/755-7876 erich schubert () tu-dortmund de
Professor of data mining, working on cluster analysis, outlier detection, change detection.
Andreas Lang Room: OH14 R336 Phone: +49 231/755-6093 andreas lang () tu-dortmund de
PhD student working on tree-based acceleration of cluster analysis.
Lars Lenssen Room: OH14 R335 Phone: +49 231/755-8254 lars lenssen () tu-dortmund de
PhD student working on clustering objectives.
Erik Thordsen Room: OH14 R335 Phone: +49 231/755-8255 erik thordsen () tu-dortmund de
PhD student working on intrinsic dimensionality of data.
Project publications
Publications from our subproject:
Lars Lenssen and Erich Schubert. Sparse Partitioning Around Medoids In: Machine Learning under Resource Constraints -- Fundamentals 1, 182-196, 2023.
[DOI: 10.1515/9783110785944-005] | [BibTeX]
@incollection{LenssenSchubert23a,
  author    = {Lars Lenssen and Erich Schubert},
  title     = {Sparse Partitioning Around Medoids},
  booktitle = {Machine Learning under Resource Constraints -- Fundamentals},
  editor    = {Katharina Morik and Peter Marwedel},
  volume    = {1},
  chapter   = {5.1},
  pages     = {182--196},
  publisher = {De Gruyter},
  year      = {2023},
  doi       = {10.1515/9783110785944-005},
}
Erich Schubert and Andreas Lang. Data Aggregation for Hierarchical Clustering In: Machine Learning under Resource Constraints -- Fundamentals 1, 215-226, 2023.
[DOI: 10.1515/9783110785944-005] | [BibTeX]
@incollection{LangSchubert23a,
  author    = {Erich Schubert and Andreas Lang},
  title     = {Data Aggregation for Hierarchical Clustering},
  booktitle = {Machine Learning under Resource Constraints -- Fundamentals},
  editor    = {Katharina Morik and Peter Marwedel},
  volume    = {1},
  chapter   = {5.3},
  pages     = {215--226},
  publisher = {De Gruyter},
  year      = {2023},
  doi       = {10.1515/9783110785944-005},
}
Franka Bause, Erich Schubert and Nils M. Kriege. EmbAssi: embedding assignment costs for similarity search in large graph databases In: Data Min. Knowl. Discov. 36, 1728-1755, 2022.
[DOI: 10.1007/s10618-022-00850-3] | [BibTeX]
@article{DBLP:journals/datamine/BauseSK22,
author = {Franka Bause and Erich Schubert and Nils M. Kriege},
doi = {10.1007/s10618-022-00850-3},
journal = {Data Min. Knowl. Discov.},
number = {5},
pages = {1728--1755},
title = {{EmbAssi}: embedding assignment costs for similarity search in large graph databases},
volume = {36},
year = {2022}
}
Erik Thordsen and Erich Schubert. ABID: Angle Based Intrinsic Dimensionality - Theory and analysis In: Inf. Syst. 108, 101989, 2022.
[DOI: 10.1016/j.is.2022.101989] | [BibTeX]
@article{DBLP:journals/is/ThordsenS22,
  author  = {Erik Thordsen and Erich Schubert},
  title   = {{ABID:} Angle Based Intrinsic Dimensionality - Theory and analysis},
  journal = {Inf. Syst.},
  volume  = {108},
  pages   = {101989},
  year    = {2022},
  doi     = {10.1016/j.is.2022.101989},
}
Andreas Lang and Erich Schubert. BETULA: Fast clustering of large data with improved BIRCH CF-Trees In: Inf. Syst. 108, 101918, 2022.
[DOI: 10.1016/j.is.2021.101918] | [BibTeX]
@article{DBLP:journals/is/LangS22,
author = {Andreas Lang and Erich Schubert},
doi = {10.1016/j.is.2021.101918},
journal = {Inf. Syst.},
pages = {101918},
title = {{BETULA:} Fast clustering of large data with improved {BIRCH} {CF}-Trees},
volume = {108},
year = {2022}
}
Erich Schubert and Lars Lenssen. Fast k-medoids Clustering in Rust and Python In: J. Open Source Softw. 7, 4183, 2022.
[DOI: 10.21105/joss.04183] | [BibTeX]
@article{DBLP:journals/jossw/SchubertL22,
author = {Erich Schubert and Lars Lenssen},
doi = {10.21105/joss.04183},
journal = {J. Open Source Softw.},
number = {75},
pages = {4183},
title = {Fast k-medoids Clustering in {Rust} and {Python}},
volume = {7},
year = {2022}
}
Schubert, Erich and Lenssen, Lars. Fast k-medoids Clustering in Rust and Python Open-Source software, Zenodo, 2022.
[DOI: 10.5281/zenodo.6802320] | [BibTeX]
@misc{zenodo/SchubertL22,
author = {Schubert, Erich and Lenssen, Lars},
doi = {10.5281/zenodo.6802320},
month = jul,
publisher = {Zenodo},
howpublished = {Open-source software, Zenodo},
title = {Fast k-medoids Clustering in {Rust} and {Python}},
version = {0.3.3},
year = {2022}
}
Lars Lenssen and Erich Schubert. Clustering by Direct Optimization of the Medoid Silhouette In: Similarity Search and Applications - 15th International Conference, SISAP 2022, Bologna, Italy, October 5-7, 2022, Proceedings, 190-204, 2022.
[Preprint (arXiv)] | [DOI: 10.1007/978-3-031-17849-8_15] | [BibTeX]
@inproceedings{DBLP:conf/sisap/LenssenS22,
author = {Lars Lenssen and Erich Schubert},
booktitle = {Similarity Search and Applications - 15th International Conference, {SISAP} 2022, Bologna, Italy, October
5-7, 2022, Proceedings},
doi = {10.1007/978-3-031-17849-8_15},
pages = {190--204},
title = {Clustering by Direct Optimization of the Medoid Silhouette},
year = {2022}
}
Erich Schubert and Peter J. Rousseeuw. Fast and eager k-medoids clustering: O(k) runtime improvement of the PAM, CLARA, and CLARANS algorithms In: Inf. Syst. 101, 101804, 2021.
[DOI: 10.1016/j.is.2021.101804] | [BibTeX]
@article{DBLP:journals/is/SchubertR21,
author = {Erich Schubert and Peter J. Rousseeuw},
doi = {10.1016/j.is.2021.101804},
journal = {Inf. Syst.},
pages = {101804},
title = {Fast and eager k-medoids clustering: {O(k)} runtime improvement of the {PAM}, {CLARA}, and {CLARANS} algorithms},
volume = {101},
year = {2021}
}
Erich Schubert, Andreas Lang and Gloria Feher. Accelerating Spherical k-Means In: Similarity Search and Applications - 14th International Conference, SISAP 2021, Dortmund, Germany, September 29 - October 1, 2021, Proceedings, 217-231, 2021.
[Preprint (arXiv)] | [DOI: 10.1007/978-3-030-89657-7_17] | [BibTeX]
@inproceedings{DBLP:conf/sisap/SchubertLF21,
author = {Erich Schubert and Andreas Lang and Gloria Feher},
booktitle = {Similarity Search and Applications - 14th International Conference, {SISAP} 2021, Dortmund, Germany, September
29 - October 1, 2021, Proceedings},
doi = {10.1007/978-3-030-89657-7_17},
pages = {217--231},
title = {Accelerating Spherical k-Means},
year = {2021}
}
Erich Schubert. A Triangle Inequality for Cosine Similarity In: Similarity Search and Applications - 14th International Conference, SISAP 2021, Dortmund, Germany, September 29 - October 1, 2021, Proceedings, 32-44, 2021.
[Preprint (arXiv)] | [DOI: 10.1007/978-3-030-89657-7_3] | [BibTeX]
@inproceedings{DBLP:conf/sisap/Schubert21,
author = {Erich Schubert},
booktitle = {Similarity Search and Applications - 14th International Conference, {SISAP} 2021, Dortmund, Germany, September
29 - October 1, 2021, Proceedings},
doi = {10.1007/978-3-030-89657-7_3},
pages = {32--44},
title = {A Triangle Inequality for Cosine Similarity},
year = {2021}
}
Franka Bause, David B. Blumenthal, Erich Schubert and Nils M. Kriege. Metric Indexing for Graph Similarity Search In: Similarity Search and Applications - 14th International Conference, SISAP 2021, Dortmund, Germany, September 29 - October 1, 2021, Proceedings, 323-336, 2021.
[Preprint (arXiv)] | [DOI: 10.1007/978-3-030-89657-7_24] | [BibTeX]
@inproceedings{DBLP:conf/sisap/BauseBSK21,
author = {Franka Bause and David B. Blumenthal and Erich Schubert and Nils M. Kriege},
booktitle = {Similarity Search and Applications - 14th International Conference, {SISAP} 2021, Dortmund, Germany, September
29 - October 1, 2021, Proceedings},
doi = {10.1007/978-3-030-89657-7_24},
pages = {323--336},
title = {Metric Indexing for Graph Similarity Search},
url = {https://doi.org/10.1007/978-3-030-89657-7_24},
year = {2021}
}
Andreas Lang and Erich Schubert. BETULA: Numerically Stable CF-Trees for BIRCH Clustering In: Similarity Search and Applications - 13th International Conference, SISAP 2020, Copenhagen, Denmark, September 30 - October 2, 2020, Proceedings, 281-296, 2020.
[Preprint (arXiv)] | [DOI: 10.1007/978-3-030-60936-8_22] | [BibTeX]
@inproceedings{DBLP:conf/sisap/LangS20,
author = {Andreas Lang and Erich Schubert},
booktitle = {Similarity Search and Applications - 13th International Conference, {SISAP} 2020, Copenhagen, Denmark, September
30 - October 2, 2020, Proceedings},
doi = {10.1007/978-3-030-60936-8_22},
pages = {281--296},
title = {{BETULA:} Numerically Stable {CF}-Trees for {BIRCH} Clustering},
year = {2020}
}