@comment{
  Workshop paper (IPAW 2008) published in a Springer LNCS proceedings volume.
  Names are stored in "Last, First" form so any style can parse and abbreviate them.
  The editor list holds each editor exactly once (duplicate names from the export were removed).
  NOTE(review): series is given without a volume number; add a volume field after
  confirming the LNCS number against the publisher record.
}
@inproceedings{3800c19ed6ae4e04b46b275110a7e969,
  author    = {Santos, Emanuele and Lins, Lauro and Ahrens, James P. and Freire, Juliana and Silva, Cl{\'a}udio T.},
  title     = {A first study on clustering collections of workflow graphs},
  booktitle = {Provenance and Annotation of Data and Processes - 2nd International Provenance and Annotation Workshop, IPAW 2008, Revised Selected Papers},
  editor    = {Freire, Juliana and Koop, David and Moreau, Luc},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer Verlag},
  year      = {2008},
  pages     = {160--173},
  doi       = {10.1007/978-3-540-89965-5_18},
  isbn      = {9783540899648},
  language  = {English (US)},
  note      = {Publisher Copyright: {\textcopyright} Springer-Verlag Berlin Heidelberg 2008.; 2nd International Provenance and Annotation Workshop, IPAW 2008 ; Conference date: 17-06-2008 Through 18-06-2008},
  abstract  = {As workflow systems get more widely used, the number of workflows and the volume of provenance they generate has grown considerably. New tools and infrastructure are needed to allow users to interact with, reason about, and re-use this information. In this paper, we explore the use of clustering techniques to organize large collections of workflow and provenance graphs. We propose two different representations for these graphs and present an experimental evaluation, using a collection of 1,700 workflow graphs, where we study the trade-offs of these representations and the effectiveness of alternative clustering techniques.},
}