Web Science requires efficient techniques for analysing large datasets. Many Semantic Web problems are difficult to solve through common divide-and-conquer strategies, since they are hard to partition. We present MARVIN, a parallel and distributed platform for processing large amounts of RDF data, on a network of loosely-coupled peers. We present our divide-conquer-swap strategy and show that this model converges towards completeness. We evaluate performance, load balancing and efficiency of our system.
@inproceedings{WebScience09,
author = {Eyal Oren and Spyros Kotoulas and George Anadiotis and Ronny Siebes and
Annette ten Teije and and Frank van Harmelen},
title = {MARVIN: A platform for large-scale analysis of Semantic Web data},
booktitle = {Proceedings of the WebScience '09},
year = {2009},
publisher = {Society On-Line},
keywords = {Semantic Web},
urlPaper = "http://www.cs.vu.nl/~frankh/postscript/WebScience09.pdf"
}
Back to list of papers