// Report the 100 largest (host, userid, project, extension) groups of
// `file` nodes, ranked by the sum of their scaled `filesize` values.
//
// Output columns: host, userid, project, ext, total_size.
MATCH (file_node:file)

// The non-aggregated expressions below act as the implicit grouping key
// for sum(); each output row is one distinct combination of them.
WITH
    file_node.host      AS host,
    file_node.userid    AS userid,
    file_node.project   AS project,
    file_node.extension AS ext,
    // Each filesize is divided by 1024 * 1024 before summing.
    // NOTE(review): presumably filesize is in bytes, making total_size
    // mebibytes -- confirm against whatever loads the `file` nodes.
    sum(file_node.filesize / (1024.0 * 1024.0)) AS total_size

// Applied after aggregation: keep only groups whose summed size exceeds 1.
WHERE total_size > 1

RETURN
    host,
    userid,
    project,
    ext,
    total_size
ORDER BY total_size DESC
LIMIT 100
