Papers | Parallel Computing
2024
Gianluca Mittone, Giulio Malenza, Marco Aldinucci, Robert Birke
Distributed Edge Inference: an Experimental Study on Multiview Detection Proceedings Article
In: Proc. of the 16th IEEE/ACM Intl. Conference on Utility and Cloud Computing Companion (UCC), pp. 1-6, ACM, Taormina, Italy, 2024, (eupilot, icsc).
Abstract | Links | BibTeX | Tags: ai, eupilot, icsc
@inproceedings{23:mittone:multiview,
  title = {Distributed Edge Inference: an Experimental Study on Multiview Detection},
  author = {Gianluca Mittone and Giulio Malenza and Marco Aldinucci and Robert Birke},
  url = {https://iris.unito.it/handle/2318/1950083},
  doi = {10.1145/3603166.3632561},
  year = {2024},
  date = {2024-12-01},
  booktitle = {Proc. of the 16th IEEE/ACM Intl. Conference on Utility and Cloud Computing Companion (UCC)},
  volume = {30},
  pages = {1--6},
  publisher = {ACM},
  address = {Taormina, Italy},
  institution = {Computer Science Department, University of Torino},
  abstract = {Computing is evolving rapidly to cater to the increasing demand for sophisticated services, and Cloud computing lays a solid foundation for flexible on-demand provisioning. However, as the size of applications grows, the centralised client-server approach used by Cloud computing increasingly limits the applications' scalability. To achieve ultra-scalability, cloud/edge/fog computing converges into the compute continuum, completely decentralising the infrastructure to encompass universal, pervasive resources. The compute continuum makes devising applications benefitting from this complex environment a challenging research problem. We put the opportunities the compute continuum offers to the test through a real-world multi-view detection model (MvDet) implemented with the FastFL C/C++ high-performance edge inference framework. Computational performance is discussed considering many experimental scenarios, encompassing different edge computational capabilities and network bandwidths. We obtain up to 1.92x speedup in inference time over a centralised solution using the same devices.},
  note = {eupilot, icsc},
  keywords = {ai, eupilot, icsc},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Bruno Casella, Alessio Barbaro Chisari, Marco Aldinucci, Sebastiano Battiato, Mario Valerio Giuffrida
Federated Learning in a Semi-Supervised Environment for Earth Observation Data Proceedings Article
In: Proceedings of the 32nd European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning, ESANN, Bruges, Belgium, 2024.
Abstract | Links | BibTeX | Tags: ai, epi, icsc
@inproceedings{24:casella:fedrec,
  author    = {Bruno Casella and Alessio Barbaro Chisari and Marco Aldinucci and Sebastiano Battiato and Mario Valerio Giuffrida},
  title     = {Federated Learning in a Semi-Supervised Environment for Earth Observation Data},
  booktitle = {Proceedings of the 32nd European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning, ESANN},
  address   = {Bruges, Belgium},
  year      = {2024},
  date      = {2024-10-01},
  doi       = {10.14428/esann/2024.es2024-214},
  url       = {https://iris.unito.it/retrieve/a798d7b8-6b98-48c2-92f4-327d2aaa8788/ES2024-214.pdf},
  keywords  = {ai, epi, icsc},
  pubstate  = {published},
  tppubtype = {inproceedings},
  abstract  = {We propose FedRec, a federated learning workflow taking advantage of unlabelled data in a semi-supervised environment to assist in the training of a supervised aggregated model. In our proposed method, an encoder architecture extracting features from unlabelled data is aggregated with the feature extractor of a classification model via weight averaging. The fully connected layers of the supervised models are also averaged in a federated fashion. We show the effectiveness of our approach by comparing it with the state-of-the-art federated algorithm, an isolated and a centralised baseline, on novel cloud detection datasets.}
}
Bruno Casella, Matthias Jakobs, Marco Aldinucci, Sebastian Buschjäger
Federated Time Series Classification with ROCKET features Proceedings Article
In: Proceedings of the 32nd European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning, ESANN, Bruges, Belgium, 2024.
Abstract | Links | BibTeX | Tags: ai, epi, icsc
@inproceedings{24:casella:frocks,
  title = {Federated Time Series Classification with {ROCKET} features},
  author = {Bruno Casella and Matthias Jakobs and Marco Aldinucci and Sebastian Buschjäger},
  url = {https://iris.unito.it/retrieve/51b63fc1-3e22-4ad4-8926-84af69cde739/ES2024-61.pdf},
  doi = {10.14428/esann/2024.es2024-61},
  year = {2024},
  date = {2024-10-01},
  booktitle = {Proceedings of the 32nd European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning, ESANN},
  address = {Bruges, Belgium},
  abstract = {This paper proposes FROCKS, a federated time series classification method using ROCKET features. Our approach dynamically adapts the models’ features by selecting and exchanging the best-performing ROCKET kernels from a federation of clients. Specifically, the server gathers the best-performing kernels of the clients together with the associated model parameters, and it performs a weighted average if a kernel is best-performing for more than one client. We compare the proposed method with state-of-the-art approaches on the UCR archive binary classification datasets and show superior performance on most datasets.},
  keywords = {ai, epi, icsc},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Samuele Fonio, Mirko Polato, Roberto Esposito
FedHP: Federated Learning with Hyperspherical Prototypical Regularization Proceedings Article
In: 32nd European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning, (ESANN), Bruges, Belgium, 2024.
Abstract | Links | BibTeX | Tags: ai, icsc
@inproceedings{24:esann:fonio:fedhp,
  title = {{FedHP}: Federated Learning with Hyperspherical Prototypical Regularization},
  author = {Samuele Fonio and Mirko Polato and Roberto Esposito},
  url = {https://www.esann.org/sites/default/files/proceedings/2024/ES2024-183.pdf},
  year = {2024},
  date = {2024-10-01},
  booktitle = {32nd European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning (ESANN)},
  address = {Bruges, Belgium},
  abstract = {This paper presents FedHP, an algorithm that amalgamates federated learning, hyperspherical geometries, and prototype learning. Federated Learning (FL) has garnered attention as a privacy-preserving method for constructing robust models across distributed datasets. Traditionally, FL involves exchanging model parameters to uphold data privacy; however, in scenarios with costly data communication, exchanging large neural network models becomes impractical. In such instances, prototype learning provides a feasible solution by necessitating the exchange of a few class prototypes instead of entire deep learning models. Motivated by these considerations, our approach leverages recent advancements in prototype learning, particularly the benefits offered by non-Euclidean geometries. Alongside introducing FedHP, we provide empirical evidence demonstrating its comparable performance to other state-of-the-art approaches while significantly reducing communication costs.},
  keywords = {ai, icsc},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Iacopo Colonnelli, Doriana Medić, Alberto Mulone, Viviana Bono, Luca Padovani, Marco Aldinucci
Introducing SWIRL: An Intermediate Representation Language for Scientific Workflows Proceedings Article
In: Platzer, André, Rozier, Kristin Yvonne, Pradella, Matteo, Rossi, Matteo (Ed.): Formal Methods. FM 2024, pp. 226–244, Springer Nature Switzerland, Milano, Italy, 2024.
Abstract | Links | BibTeX | Tags: eupex, icsc
@inproceedings{24:fm:swirl,
  title = {Introducing {SWIRL}: An Intermediate Representation Language for Scientific Workflows},
  author = {Iacopo Colonnelli and Doriana Medić and Alberto Mulone and Viviana Bono and Luca Padovani and Marco Aldinucci},
  editor = {André Platzer and Kristin Yvonne Rozier and Matteo Pradella and Matteo Rossi},
  url = {https://iris.unito.it/retrieve/b39a6f09-a8d3-4974-abf6-c109916694fa/PDFEditoriale.pdf},
  doi = {10.1007/978-3-031-71162-6_12},
  year = {2024},
  date = {2024-09-01},
  booktitle = {Formal Methods. FM 2024},
  volume = {14933},
  pages = {226--244},
  publisher = {Springer Nature Switzerland},
  address = {Milano, Italy},
  series = {Lecture Notes in Computer Science},
  abstract = {In the ever-evolving landscape of scientific computing, properly supporting the modularity and complexity of modern scientific applications requires new approaches to workflow execution, like seamless interoperability between different workflow systems, distributed-by-design workflow models, and automatic optimisation of data movements. In order to address this need, this article introduces SWIRL, an intermediate representation language for scientific workflows. In contrast with other product-agnostic workflow languages, SWIRL is not designed for human interaction but to serve as a low-level compilation target for distributed workflow execution plans. The main advantages of SWIRL semantics are low-level primitives based on the send/receive programming model and a formal framework ensuring the consistency of the semantics and the specification of translating workflow models represented by Directed Acyclic Graphs (DAGs) into SWIRL workflow descriptions. Additionally, SWIRL offers rewriting rules designed to optimise execution traces, accompanied by corresponding equivalence. An open-source SWIRL compiler toolchain has been developed using the ANTLR Python3 bindings.},
  keywords = {eupex, icsc},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Simone Leo, Michael R. Crusoe, Laura Rodríguez-Navas, Raül Sirvent, Alexander Kanitz, Paul De Geest, Rudolf Wittner, Luca Pireddu, Daniel Garijo, José M. Fernández, Iacopo Colonnelli, Matej Gallo, Tazro Ohta, Hirotaka Suetake, Salvador Capella-Gutierrez, Renske de Wit, Bruno P. Kinoshita, Stian Soiland-Reyes
Recording provenance of workflow runs with RO-Crate Journal Article
In: PLoS ONE, vol. 19, no. 9, pp. 1–35, 2024.
Abstract | Links | BibTeX | Tags: across, eupex, icsc, streamflow
@article{24:pone:wfrunrocrate,
  title = {Recording provenance of workflow runs with {RO-Crate}},
  author = {Simone Leo and Michael R. Crusoe and Laura Rodríguez-Navas and Raül Sirvent and Alexander Kanitz and De Geest, Paul and Rudolf Wittner and Luca Pireddu and Daniel Garijo and José M. Fernández and Iacopo Colonnelli and Matej Gallo and Tazro Ohta and Hirotaka Suetake and Salvador Capella-Gutierrez and Renske de Wit and Bruno P. Kinoshita and Stian Soiland-Reyes},
  url = {https://iris.unito.it/retrieve/57752f7b-9f8f-4013-8cef-5b498703d882/journal.pone.0309210.pdf},
  doi = {10.1371/journal.pone.0309210},
  year = {2024},
  date = {2024-09-01},
  journal = {PLoS ONE},
  volume = {19},
  number = {9},
  pages = {1--35},
  publisher = {Public Library of Science},
  abstract = {Recording the provenance of scientific computation results is key to the support of traceability, reproducibility and quality assessment of data products. Several data models have been explored to address this need, providing representations of workflow plans and their executions as well as means of packaging the resulting information for archiving and sharing. However, existing approaches tend to lack interoperable adoption across workflow management systems. In this work we present Workflow Run RO-Crate, an extension of RO-Crate (Research Object Crate) and Schema.org to capture the provenance of the execution of computational workflows at different levels of granularity and bundle together all their associated objects (inputs, outputs, code, etc.). The model is supported by a diverse, open community that runs regular meetings, discussing development, maintenance and adoption aspects. Workflow Run RO-Crate is already implemented by several workflow management systems, allowing interoperable comparisons between workflow runs from heterogeneous systems. We describe the model, its alignment to standards such as W3C PROV, and its implementation in six workflow systems. Finally, we illustrate the application of Workflow Run RO-Crate in two use cases of machine learning in the digital image analysis domain.},
  keywords = {across, eupex, icsc, streamflow},
  pubstate = {published},
  tppubtype = {article}
}
Alberto Mulone, Doriana Medić, Marco Aldinucci
A Fault Tolerance mechanism for Hybrid Scientific Workflows Proceedings Article
In: 1st workshop about High-Performance e-Science (HiPES), Madrid, Spain, 2024.
Abstract | BibTeX | Tags: eupex, icsc, streamflow
@inproceedings{24:madrid:hipes,
  author    = {Alberto Mulone and Doriana Medić and Marco Aldinucci},
  title     = {A Fault Tolerance mechanism for Hybrid Scientific Workflows},
  booktitle = {1st workshop about High-Performance e-Science (HiPES)},
  address   = {Madrid, Spain},
  year      = {2024},
  date      = {2024-08-01},
  keywords  = {eupex, icsc, streamflow},
  pubstate  = {published},
  tppubtype = {inproceedings},
  abstract  = {In large distributed systems, failures are a daily event occurring frequently, especially with growing numbers of computation tasks and locations on which they are deployed. The advantage of representing an application as a workflow is possibility to utilize the Workflow Management Systems which are reliable systems guaranteeing the correct execution of the application and providing the features such as portability, scalability, and fault tolerance. Over recent years, the emergence of hybrid workflows has posed new and intriguing challenges by increasing the possibility of distributing computations involving heterogeneous and independent environments. As a consequence, the number of possible points of failure in the execution augmented, creating different important challenges interesting to study.}
}
Alessia Antelmi, Massimo Torquati, Giacomo Corridori, Daniele Gregori, Francesco Polzella, Gianmarco Spinatelli, Marco Aldinucci
Analyzing FOSS license usage in publicly available software at scale via the SWH-analytics framework Journal Article
In: The Journal of Supercomputing, vol. 80, no. 11, pp. 15799-15833, 2024, ISSN: 1573-0484.
Abstract | Links | BibTeX | Tags: analytics, icsc
@article{Antelmi_JSUPE_2024,
  title = {Analyzing {FOSS} license usage in publicly available software at scale via the {SWH-analytics} framework},
  author = {Alessia Antelmi and Massimo Torquati and Giacomo Corridori and Daniele Gregori and Francesco Polzella and Gianmarco Spinatelli and Marco Aldinucci},
  url = {https://doi.org/10.1007/s11227-024-06069-x},
  doi = {10.1007/s11227-024-06069-x},
  issn = {1573-0484},
  year = {2024},
  date = {2024-07-01},
  journal = {The Journal of Supercomputing},
  volume = {80},
  number = {11},
  pages = {15799--15833},
  abstract = {The Software Heritage (SWH) dataset represents an invaluable source of open-source code as it aims to collect, preserve, and share all publicly available software in source code form ever produced by humankind. Although designed to archive deduplicated small files thanks to the use of a Merkle tree as the underlying data structure, querying the SWH dataset presents challenges due to the nature of these structures, which organize content based on hash values rather than any locality principle. The magnitude of the repository, coupled with the resource-intensive nature of the download process, highlights the need for specialized infrastructure and computational resources to effectively handle and study the extensive dataset housed within SWH. Currently, there is a lack of infrastructures specifically tailored for running analytics on the SWH dataset, leaving users to handle these issues manually. To address these challenges, we implemented the SWH-Analytics (SWHA) framework, a development environment that transparently runs custom analytic applications on publicly available software data preserved over time by SWH. Specifically, this work shows how SWHA can be effectively exploited to study usage patterns of free and open-source software licenses, highlighting the need to improve license literacy among developers.},
  keywords = {analytics, icsc},
  pubstate = {published},
  tppubtype = {article}
}
Miruna Bețianu, Abele Mălan, Marco Aldinucci, Robert Birke, Lydia Chen
DALLMi: Domain Adaption for LLM-based Multi-label Classifier Proceedings Article
In: Yang, De-Nian, Xie, Xing, Tseng, Vincent S., Pei, Jian, Huang, Jen-Wei, Lin, Jerry Chun-Wei (Ed.): Proceedings of the 28th Pacific-Asia Conference on Knowledge Discovery and Data Mining, pp. 277–289, Springer, Taipei, Taiwan, 2024.
Abstract | Links | BibTeX | Tags: ai, eupilot, icsc
@inproceedings{24:betianu:llm,
  title = {{DALLMi}: Domain Adaption for {LLM-based} Multi-label Classifier},
  author = {Miruna Bețianu and Abele Mălan and Marco Aldinucci and Robert Birke and Lydia Chen},
  editor = {De-Nian Yang and Xing Xie and Vincent S. Tseng and Jian Pei and Jen-Wei Huang and Jerry Chun-Wei Lin},
  url = {https://hdl.handle.net/2318/1976672},
  doi = {10.1007/978-981-97-2259-4_21},
  year = {2024},
  date = {2024-05-01},
  booktitle = {Proceedings of the 28th Pacific-Asia Conference on Knowledge Discovery and Data Mining},
  volume = {14647},
  pages = {277--289},
  publisher = {Springer},
  address = {Taipei, Taiwan},
  series = {Lecture Notes in Computer Science},
  abstract = {Large language models (LLMs) increasingly serve as the backbone for classifying text associated with distinct domains and simultaneously several labels (classes). When encountering domain shifts, e.g., classifier of movie reviews from IMDb to Rotten Tomatoes, adapting such an LLM-based multi-label classifier is challenging due to incomplete label sets at the target domain and daunting training overhead. The existing domain adaptation methods address either image multi-label classifiers or text binary classifiers. In this paper, we design DALLMi, Domain Adaptation Large Language Model interpolator, a first-of-its-kind semi-supervised domain adaptation method for text data models based on LLMs, specifically BERT. The core of DALLMi is the novel variation loss and MixUp regularization, which jointly leverage the limited positively labeled and large quantity of unlabeled text and, importantly, their interpolation from the BERT word embeddings. DALLMi also introduces a label-balanced sampling strategy to overcome the imbalance between labeled and unlabeled data. We evaluate DALLMi against the partial-supervised and unsupervised approach on three datasets under different scenarios of label availability for the target domain. Our results show that DALLMi achieves higher mAP than unsupervised and partially-supervised approaches by 19.9\% and 52.2\%, respectively.},
  keywords = {ai, eupilot, icsc},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Chi Hong, Robert Birke, Pin-Yu Chen, Lydia Chen
On Dark Knowledge for Distilling Generators Proceedings Article
In: Yang, De-Nian, Xie, Xing, Tseng, Vincent S., Pei, Jian, Huang, Jen-Wei, Lin, Jerry Chun-Wei (Ed.): Proceedings of the 28th Pacific-Asia Conference on Knowledge Discovery and Data Mining, pp. 235–247, Springer, Taipei, Taiwan, 2024.
Abstract | Links | BibTeX | Tags: ai, epi, icsc
@inproceedings{24:chen:llm,
  title = {On Dark Knowledge for Distilling Generators},
  author = {Chi Hong and Robert Birke and Pin-Yu Chen and Lydia Chen},
  editor = {De-Nian Yang and Xing Xie and Vincent S. Tseng and Jian Pei and Jen-Wei Huang and Jerry Chun-Wei Lin},
  url = {https://hdl.handle.net/2318/1976671},
  doi = {10.1007/978-981-97-2253-2_19},
  year = {2024},
  date = {2024-05-01},
  booktitle = {Proceedings of the 28th Pacific-Asia Conference on Knowledge Discovery and Data Mining},
  volume = {14646},
  pages = {235--247},
  publisher = {Springer},
  address = {Taipei, Taiwan},
  series = {Lecture Notes in Computer Science},
  abstract = {Knowledge distillation has been applied on generative models, such as Variational Autoencoder (VAE) and Generative Adversarial Networks (GANs). To distill the knowledge, the synthetic outputs of a teacher generator are used to train a student model. While the dark knowledge, i.e., the probabilistic output, is well explored in distilling classifiers, little is known about the existence of an equivalent dark knowledge for generative models and its extractability. In this paper, we derive the first kind of empirical risk bound for distilling generative models from a Bayesian perspective. Through our analysis, we show the existence of the dark knowledge for generative models, i.e., Bayes probability distribution of a synthetic output from a given input, which achieves lower empirical risk bound than merely using the synthetic output of the generators. Furthermore, we propose a Dark Knowledge based Distillation, DKtill, which trains the student generator based on the (approximate) dark knowledge. Our extensive evaluation on distilling VAE, conditional GANs, and translation GANs on Facades and CelebA datasets show that the FID of student generators trained by DKtill combining dark knowledge are lower than student generators trained only by the synthetic outputs by up to 42.66\%, and 78.99\%, respectively.},
  keywords = {ai, epi, icsc},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Bruno Casella, Iacopo Colonnelli, Gianluca Mittone, Robert Birke, Walter Riviera, Antonio Sciarappa, Carlo Cavazzoni, Marco Aldinucci
A Performance Analysis for Confidential Federated Learning Proceedings Article
In: Proceedings of the 2024 Deep Learning Security and Privacy Workshop, IEEE Symposium on Security and Privacy 2024, San Francisco, CA, 2024.
Abstract | Links | BibTeX | Tags: ai, confidential, epi, icsc
@inproceedings{24:casella:sgx,
  title = {A Performance Analysis for Confidential Federated Learning},
  author = {Bruno Casella and Iacopo Colonnelli and Gianluca Mittone and Robert Birke and Walter Riviera and Antonio Sciarappa and Carlo Cavazzoni and Marco Aldinucci},
  url = {https://iris.unito.it/retrieve/b5877a97-2d8d-4e95-8791-0aa4a1b953b3/DLSP___CONFIDENTIAL_FL.pdf},
  doi = {10.1109/SPW63631.2024.00009},
  year = {2024},
  date = {2024-05-01},
  booktitle = {Proceedings of the 2024 Deep Learning Security and Privacy Workshop, IEEE Symposium on Security and Privacy 2024},
  address = {San Francisco, CA},
  abstract = {Federated Learning (FL) has emerged as a solution to preserve data privacy by keeping the data locally on each participant's device. However, FL alone is still vulnerable to attacks that can cause privacy leaks. Therefore, it becomes necessary to take additional security measures at the cost of increasing runtimes. The Trusted Execution Environment (TEE) approach promises to offer the highest degree of security during execution. However, TEEs suffer from memory limits which prevent safe end-to-end FL training of modern deep models. State-of-the-art approaches limit secure training to selected layers, failing to avert the full spectrum of attacks or adopt layer-wise training affecting model performance. We benchmark the usage of a library OS (LibOS) to run the full, unmodified end-to-end FL training inside the TEE. We extensively evaluate and model the overhead of the different security mechanisms needed to protect the data and model during computation (TEE), communication (TLS), and storage (disk encryption). The obtained results across three datasets and two models demonstrate that LibOSes are a viable way to seamlessly inject security into FL with limited overhead (at most 2x), offering valuable guidance for researchers and developers aiming to apply FL in data-security-focused contexts.},
  keywords = {ai, confidential, epi, icsc},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Giulio Malenza, Valentina Cesare, Marco Aldinucci, Ugo Becciani, Alberto Vecchiato
Toward HPC application portability via C++ PSTL: the Gaia AVU-GSR code assessment Journal Article
In: The Journal of Supercomputing, 2024, ISSN: 0920-8542.
Abstract | Links | BibTeX | Tags: eupex, HPC, icsc
@article{24:jsupe:Gaia,
  title = {Toward {HPC} application portability via {C++} {PSTL}: the {Gaia} {AVU-GSR} code assessment},
  author = {Giulio Malenza and Valentina Cesare and Marco Aldinucci and Ugo Becciani and Alberto Vecchiato},
  doi = {10.1007/s11227-024-06011-1},
  issn = {0920-8542},
  year = {2024},
  date = {2024-03-01},
  journal = {The Journal of Supercomputing},
  publisher = {Springer},
  abstract = {The computing capacity needed to process the data generated in modern scientific experiments is approaching ExaFLOPs. Currently, achieving such performances is only feasible through GPU-accelerated supercomputers. Different languages were developed to program GPUs at different levels of abstraction. Typically, the more abstract the languages, the more portable they are across different GPUs. However, the less abstract and co-designed with the hardware, the more room for code optimization and, eventually, the more performance. In the HPC context, portability and performance are a fairly traditional dichotomy. The current C++ Parallel Standard Template Library (PSTL) has the potential to go beyond this dichotomy. In this work, we analyze the main performance benefits and limitations of PSTL using as a use-case the Gaia Astrometric Verification Unit-Global Sphere Reconstruction parallel solver developed by the European Space Agency Gaia mission. The code aims to find the astrometric parameters of $\sim 10^8$ stars in the Milky Way by iteratively solving a linear system of equations with the LSQR algorithm, originally GPU-ported with the CUDA language. We show that the performance obtained with the PSTL version, which is intrinsically more portable than CUDA, is comparable to the CUDA one on NVIDIA GPU architecture.},
  keywords = {eupex, HPC, icsc},
  pubstate = {published},
  tppubtype = {article}
}
Marco Edoardo Santimaria, Samuele Fonio, Giulio Malenza, Iacopo Colonnelli, Marco Aldinucci
Benchmarking Parallelization Models through Karmarkar Interior-point method Proceedings Article
In: González-Vélez, Horacio, Chis, Adriana E. (Ed.): Proc. of 32nd Euromicro intl. Conference on Parallel, Distributed and Network-based Processing (PDP), pp. 1-8, IEEE, Dublin, Ireland, 2024, ISSN: 2377-5750.
Abstract | Links | BibTeX | Tags: HPC, icsc
@inproceedings{24:pdp:karmarkar,
  title = {Benchmarking Parallelization Models through {Karmarkar} Interior-point method},
  author = {Marco Edoardo Santimaria and Samuele Fonio and Giulio Malenza and Iacopo Colonnelli and Marco Aldinucci},
  editor = {Horacio González-Vélez and Adriana E. Chis},
  url = {https://hdl.handle.net/2318/1964571},
  doi = {10.1109/PDP62718.2024.00010},
  issn = {2377-5750},
  year = {2024},
  date = {2024-03-01},
  booktitle = {Proc. of 32nd Euromicro intl. Conference on Parallel, Distributed and Network-based Processing (PDP)},
  pages = {1--8},
  publisher = {IEEE},
  address = {Dublin, Ireland},
  abstract = {Optimization problems are one of the main focus of scientific research. Their computational-intensive nature makes them prone to be parallelized with consistent improvements in performance. This paper sheds light on different parallel models for accelerating Karmarkar's Interior-point method. To do so, we assess parallelization strategies for individual operations within the aforementioned Karmarkar's algorithm using OpenMP, GPU acceleration with CUDA, and the recent Parallel Standard C++ Linear Algebra library (PSTL) executing both on GPU and CPU. Our different implementations yield interesting benchmark results that show the optimal approach for parallelizing interior point algorithms for general Linear Programming (LP) problems. In addition, we propose a more theoretical perspective of the parallelization of this algorithm, with a detailed study of our OpenMP implementation, showing the limits of optimizing the single operations.},
  keywords = {HPC, icsc},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Bruno Casella, Roberto Esposito, Antonio Sciarappa, Carlo Cavazzoni, Marco Aldinucci
Experimenting With Normalization Layers in Federated Learning on Non-IID Scenarios Journal Article
In: IEEE Access, vol. 12, pp. 47961-47971, 2024.
Links | BibTeX | Tags: epi, icsc
@article{24:casella:normalization,
  title = {Experimenting With Normalization Layers in Federated Learning on {Non-IID} Scenarios},
  author = {Bruno Casella and Roberto Esposito and Antonio Sciarappa and Carlo Cavazzoni and Marco Aldinucci},
  doi = {10.1109/ACCESS.2024.3383783},
  year = {2024},
  date = {2024-01-01},
  journal = {IEEE Access},
  volume = {12},
  pages = {47961--47971},
  keywords = {epi, icsc},
  pubstate = {published},
  tppubtype = {article}
}
Lorenzo Brescia, Marco Aldinucci
Secure Generic Remote Workflow Execution with TEEs Proceedings Article
In: Proc. of the 2nd Workshop on Workflows in Distributed Environments (WiDE), pp. 8-13, ACM, Athens, Greece, 2024.
Abstract | Links | BibTeX | Tags: confidential, icsc
@inproceedings{23:brescia:wide,
  title = {Secure Generic Remote Workflow Execution with {TEEs}},
  author = {Lorenzo Brescia and Marco Aldinucci},
  doi = {10.1145/3642978.3652834},
  year = {2024},
  date = {2024-01-01},
  booktitle = {Proc. of the 2nd Workshop on Workflows in Distributed Environments (WiDE)},
  pages = {8--13},
  publisher = {ACM},
  address = {Athens, Greece},
  abstract = {In scientific environments, the frequent need to process substantial volumes of data poses a common challenge. Individuals tasked with executing these computations frequently encounter a deficit in local computational resources, leading them to opt for the facilities of a Cloud Service Provider (CSP) for data processing. However, the data subjected to these calculations may be subject to confidentiality constraints. This paper introduces a proof-of-concept framework that leverages Gramine LibOS and Intel SGX, enabling the protection of generic remote workflow computations through SGX enclaves as Trusted Execution Environments (TEEs). The framework entails the delineation of user and CSP behavior and has been implemented using Bash scripts. Furthermore, an infrastructure has been designed for the Data Center Attestation Primitives (DCAP) remote attestation mechanism, wherein the user gains trust in the proper instantiation of the enclave within the CSP. To assess the framework efficacy, it has been tested on two distinct workflows, one trivial and the other involving real-world bioinformatics applications for processing DNA data. The performance study revealed that the framework incurred an acceptable overhead, ranging from a factor of x1.4 to x1.8 compared to unsafe execution practice.},
  howpublished = {Proceedings of the 2nd Workshop on Workflows in Distributed Environments},
  keywords = {confidential, icsc},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Simon Queyrut, Robert Birke, Pascal Felber, Valerio Schiavoni
CLUES: Collusive Theft of Conditional Generative Adversarial Networks Proceedings Article
In: 43rd International Symposium on Reliable Distributed Systems SRDS, 2024.
@inproceedings{24:queyrut:srds,
  title = {{CLUES}: Collusive Theft of Conditional Generative Adversarial Networks},
  author = {Simon Queyrut and Robert Birke and Pascal Felber and Valerio Schiavoni},
  year = {2024},
  date = {2024-01-01},
  booktitle = {43rd International Symposium on Reliable Distributed Systems (SRDS)},
  keywords = {ai, icsc},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Daniele De Vinco, Alessia Antelmi, Carmine Spagnuolo, Luca Maria Aiello
Deciphering Conversational Networks: Stance Detection via Hypergraphs and LLMs Proceedings Article
In: Companion Publication of the 16th ACM Web Science Conference, pp. 3–4, Association for Computing Machinery, Stuttgart, Germany, 2024, ISBN: 9798400704536.
Abstract | Links | BibTeX | Tags: analytics, icsc
@inproceedings{Antelmi_WebSci_2024,
title = {Deciphering Conversational Networks: Stance Detection via Hypergraphs and LLMs},
author = {Daniele De Vinco and Alessia Antelmi and Carmine Spagnuolo and Luca Maria Aiello},
url = {https://doi.org/10.1145/3630744.3658418},
doi = {10.1145/3630744.3658418},
isbn = {9798400704536},
year = {2024},
date = {2024-01-01},
booktitle = {Companion Publication of the 16th ACM Web Science Conference},
pages = {3--4},
publisher = {Association for Computing Machinery},
address = {Stuttgart, Germany},
series = {Websci Companion '24},
abstract = {Understanding the structural and linguistic properties of conversational data in social media is crucial for extracting meaningful insights to understand opinion dynamics, (mis-)information spreading, and the evolution of harmful behavior. Current state-of-the-art mathematical frameworks, such as hypergraphs and linguistic tools, such as large language models (LLMs), offer robust methodologies for modeling high-order group interactions and unprecedented capabilities for dealing with natural language-related tasks. In this study, we propose an innovative approach that blends these worlds by abstracting conversational networks via hypergraphs and analyzing their dynamics through LLMs. Our aim is to enhance the stance detection task by incorporating the high-order interactions naturally embedded within a conversation, thereby enriching the contextual understanding of LLMs regarding the intricate human dynamics underlying social media data.},
keywords = {analytics, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Alessia Antelmi, Daniele De Vinco, Carmine Spagnuolo
HypergraphRepository: A Community-Driven and Interactive Hypernetwork Data Collection Proceedings Article
In: Dewar, Megan, Kamiński, Bogumił, Kaszyński, Daniel, Kraiński, Łukasz, Prałat, Paweł, Théberge, François, Wrzosek, Małgorzata (Ed.): Modelling and Mining Networks, pp. 159–173, Springer Nature Switzerland, Cham, 2024, ISBN: 978-3-031-59205-8.
Abstract | Links | BibTeX | Tags: analytics, icsc
@inproceedings{Antelmi_WAW_2024,
title = {HypergraphRepository: A Community-Driven and Interactive Hypernetwork Data Collection},
author = {Alessia Antelmi and Daniele De Vinco and Carmine Spagnuolo},
editor = {Megan Dewar and Bogumił Kamiński and Daniel Kaszyński and Łukasz Kraiński and Paweł Prałat and François Théberge and Małgorzata Wrzosek},
doi = {10.1007/978-3-031-59205-8_11},
isbn = {978-3-031-59205-8},
year = {2024},
date = {2024-01-01},
booktitle = {Modelling and Mining Networks},
pages = {159--173},
publisher = {Springer Nature Switzerland},
address = {Cham},
abstract = {Hypergraph research has been thriving over the past few years, with a growing interest in a plethora of domains. Despite this remarkable surge, the lack of a comprehensive platform for searching and downloading diverse and well-curated datasets poses a significant obstacle to the continued advancement of the field. This absence hinders the ability of researchers and practitioners to validate and benchmark their hypergraph algorithms and models effectively.},
keywords = {analytics, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Alessia Antelmi, Pasquale Caramante, Gennaro Cordasco, Giuseppe D'Ambrosio, Daniele De Vinco, Francesco Foglia, Luca Postiglione, Carmine Spagnuolo
Reliable and Efficient Agent-Based Modeling and Simulation Journal Article
In: Journal of Artificial Societies and Social Simulation, vol. 27, no. 2, pp. 4, 2024, ISSN: 1460-7425.
Abstract | Links | BibTeX | Tags: analytics, icsc
@article{Antelmi_JASSS_2024,
  author    = {Alessia Antelmi and Pasquale Caramante and Gennaro Cordasco and Giuseppe D'Ambrosio and Daniele De Vinco and Francesco Foglia and Luca Postiglione and Carmine Spagnuolo},
  title     = {Reliable and Efficient Agent-Based Modeling and Simulation},
  journal   = {Journal of Artificial Societies and Social Simulation},
  volume    = {27},
  number    = {2},
  pages     = {4},
  year      = {2024},
  date      = {2024-01-01},
  issn      = {1460-7425},
  doi       = {10.18564/jasss.5300},
  url       = {http://jasss.soc.surrey.ac.uk/27/2/4.html},
  abstract  = {Agent-based models represent a primary methodology to untangle and study complex systems. Over the last decade, the need for more elaborate computing-demanding models gave rise to many frameworks and tools to run ABM simulations. Current state-of-the-art ABM tools either focus on ease of use, performance, or a trade-off between these two elements. Still, efficiency-oriented solutions (required for both large and small-scale simulations) are vulnerable to memory flaws which could invalidate the experiment results. This work aims to merge efficiency, reliability, and safeness under an innovative ABM software framework based on the Rust programming language. Our framework, krABMaga, is an open-source library that offers a high-level environment by exploiting metaprogramming and expandable visualization features. We equipped our library with a dynamic simulation monitoring system and model exploration and optimization capabilities over parallel, distributed, and cloud architectures. After having presented the overall architecture and functionalities of krABMaga, we discuss a performance comparison of our framework against the mostly adopted ABM software and the scalability potential of our simulation engine on a model calibration experiment running over an AWS EC2 virtual cluster machine. All code and examples models are available on GitHub.},
  keywords  = {analytics, icsc},
  pubstate  = {published},
  tppubtype = {article},
}
Raffaele Mineo, Federica Salanitri Proietto, Giovanni Bellitto, Isaak Kavasidis, Ovidio De Filippo, Michele Millesimo, Gaetano Maria De Ferrari, Marco Aldinucci, Daniela Giordano, Simone Palazzo, Fabrizio D’Ascenzo, Concetto Spampinato
A Convolutional-Transformer Model for FFR and iFR Assessment from Coronary Angiography Journal Article
In: IEEE Transactions on Medical Imaging, vol. 43, no. 8, pp. 2866-2877, 2024.
Abstract | Links | BibTeX | Tags: ai
@article{angiography:TMI:24,
title = {A Convolutional-Transformer Model for FFR and iFR Assessment from Coronary Angiography},
author = {Raffaele Mineo and Federica Salanitri Proietto and Giovanni Bellitto and Isaak Kavasidis and Ovidio De Filippo and Michele Millesimo and Gaetano Maria De Ferrari and Marco Aldinucci and Daniela Giordano and Simone Palazzo and Fabrizio D'Ascenzo and Concetto Spampinato},
url = {https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=10582501},
doi = {10.1109/TMI.2024.3383283},
year = {2024},
date = {2024-01-01},
journal = {IEEE Transactions on Medical Imaging},
volume = {43},
number = {8},
pages = {2866--2877},
publisher = {IEEE},
abstract = {The quantification of stenosis severity from X-ray catheter angiography is a challenging task. Indeed, this requires to fully understand the lesion's geometry by analyzing dynamics of the contrast material, only relying on visual observation by clinicians. To support decision making for cardiac intervention, we propose a hybrid CNN-Transformer model for the assessment of angiography-based non-invasive fractional flow-reserve (FFR) and instantaneous wave-free ratio (iFR) of intermediate coronary stenosis. Our approach predicts whether a coronary artery stenosis is hemodynamically significant and provides direct FFR and iFR estimates. This is achieved through a combination of regression and classification branches that forces the model to focus on the cut-off region of FFR (around 0.8 FFR value), which is highly critical for decision-making. We also propose a spatio-temporal factorization mechanisms that redesigns the transformer's self-attention mechanism to capture both local spatial and temporal interactions between vessel geometry, blood flow dynamics, and lesion morphology. The proposed method achieves state-of-the-art performance on a dataset of 778 exams from 389 patients. Unlike existing methods, our approach employs a single angiography view and does not require knowledge of the key frame; supervision at training time is provided by a classification loss (based on a threshold of the FFR/iFR values) and a regression loss for direct estimation. Finally, the analysis of model interpretability and calibration shows that, in spite of the complexity of angiographic imaging data, our method can robustly identify the location of the stenosis and correlate prediction uncertainty to the provided output scores.},
keywords = {ai},
pubstate = {published},
tppubtype = {article}
}
Raffaele Mineo, Federica Salanitri Proietto, Giovanni Bellitto, Isaak Kavasidis, Ovidio De Filippo, Michele Millesimo, Gaetano Maria De Ferrari, Marco Aldinucci, Daniela Giordano, Simone Palazzo, Fabrizio D'Ascenzo, Concetto Spampinato
A Convolutional-Transformer Model for FFR and iFR Assessment from Coronary Angiography Journal Article
In: IEEE Transactions on Medical Imaging, vol. 43, no. 8, pp. 2866-2877, 2024.
Abstract | Links | BibTeX | Tags: ai, cardio
@article{24:angiography:TMI,
title = {A Convolutional-Transformer Model for FFR and iFR Assessment from Coronary Angiography},
author = {Raffaele Mineo and Federica Salanitri Proietto and Giovanni Bellitto and Isaak Kavasidis and Ovidio De Filippo and Michele Millesimo and Gaetano Maria De Ferrari and Marco Aldinucci and Daniela Giordano and Simone Palazzo and Fabrizio D'Ascenzo and Concetto Spampinato},
url = {https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=10582501},
doi = {10.1109/TMI.2024.3383283},
year = {2024},
date = {2024-01-01},
journal = {IEEE Transactions on Medical Imaging},
volume = {43},
number = {8},
pages = {2866--2877},
publisher = {IEEE},
abstract = {The quantification of stenosis severity from X-ray catheter angiography is a challenging task. Indeed, this requires to fully understand the lesion's geometry by analyzing dynamics of the contrast material, only relying on visual observation by clinicians. To support decision making for cardiac intervention, we propose a hybrid CNN-Transformer model for the assessment of angiography-based non-invasive fractional flow-reserve (FFR) and instantaneous wave-free ratio (iFR) of intermediate coronary stenosis. Our approach predicts whether a coronary artery stenosis is hemodynamically significant and provides direct FFR and iFR estimates. This is achieved through a combination of regression and classification branches that forces the model to focus on the cut-off region of FFR (around 0.8 FFR value), which is highly critical for decision-making. We also propose a spatio-temporal factorization mechanisms that redesigns the transformer's self-attention mechanism to capture both local spatial and temporal interactions between vessel geometry, blood flow dynamics, and lesion morphology. The proposed method achieves state-of-the-art performance on a dataset of 778 exams from 389 patients. Unlike existing methods, our approach employs a single angiography view and does not require knowledge of the key frame; supervision at training time is provided by a classification loss (based on a threshold of the FFR/iFR values) and a regression loss for direct estimation. Finally, the analysis of model interpretability and calibration shows that, in spite of the complexity of angiographic imaging data, our method can robustly identify the location of the stenosis and correlate prediction uncertainty to the provided output scores.},
keywords = {ai, cardio},
pubstate = {published},
tppubtype = {article}
}
Iacopo Colonnelli, Robert Birke, Giulio Malenza, Gianluca Mittone, Alberto Mulone, Jeroen Galjaard, Lydia Y. Chen, Sanzio Bassini, Gabriella Scipione, Jan Martinovič, Vit Vondrák, Marco Aldinucci
Cross-Facility Federated Learning Journal Article
In: Procedia Computer Science, vol. 240, pp. 3–12, 2024, ISSN: 1877-0509.
Abstract | Links | BibTeX | Tags: icsc, space, streamflow
@article{24:eurohpc:xffl,
title = {Cross-Facility Federated Learning},
author = {Iacopo Colonnelli and Robert Birke and Giulio Malenza and Gianluca Mittone and Alberto Mulone and Jeroen Galjaard and Lydia Y. Chen and Sanzio Bassini and Gabriella Scipione and Jan Martinovič and Vit Vondrák and Marco Aldinucci},
url = {https://www.sciencedirect.com/science/article/pii/S1877050924016909},
doi = {10.1016/j.procs.2024.07.003},
issn = {1877-0509},
year = {2024},
date = {2024-01-01},
booktitle = {Proceedings of the First EuroHPC user day},
journal = {Procedia Computer Science},
volume = {240},
pages = {3--12},
publisher = {Elsevier},
address = {Bruxelles, Belgium},
abstract = {In a decade, AI frontier research transitioned from the researcher's workstation to thousands of high-end hardware-accelerated compute nodes. This rapid evolution shows no signs of slowing down in the foreseeable future. While top cloud providers may be able to keep pace with this growth rate, obtaining and efficiently exploiting computing resources at that scale is a daunting challenge for universities and SMEs. This work introduces the Cross-Facility Federated Learning (XFFL) framework to bridge this compute divide, extending the opportunity to efficiently exploit multiple independent data centres for extreme-scale deep learning tasks to data scientists and domain experts. XFFL relies on hybrid workflow abstractions to decouple tasks from environment-specific technicalities, reducing complexity and enhancing reusability. In addition, Federated Learning (FL) algorithms eliminate the need to move large amounts of data between different facilities, reducing time-to-solution and preserving data privacy. The XFFL approach is empirically evaluated by training a full LLaMAv2 7B instance on two facilities of the EuroHPC JU, showing how the increased computing power completely compensates for the additional overhead introduced by two data centres.},
keywords = {icsc, space, streamflow},
pubstate = {published},
tppubtype = {article}
}
Emilio Sulis, Ilaria Angela Amantea, Marco Aldinucci, Guido Boella, Renata Marinello, Marco Grosso, Paolo Platter, Serena Ambrosini
An ambient assisted living architecture for hospital at home coupled with a process-oriented perspective Journal Article
In: Journal of Ambient Intelligence and Humanized Computing, vol. 15, no. 5, pp. 2727-2735, 2024.
Abstract | Links | BibTeX | Tags: ai
@article{22:Sulis,
title = {An ambient assisted living architecture for hospital at home coupled with a process-oriented perspective},
author = {Emilio Sulis and Ilaria Angela Amantea and Marco Aldinucci and Guido Boella and Renata Marinello and Marco Grosso and Paolo Platter and Serena Ambrosini},
url = {https://iris.unito.it/retrieve/c7eaab0b-f78b-4af0-8c17-fa5479d776e6/jaihc2021-preprint.pdf},
doi = {10.1007/s12652-022-04388-6},
year = {2024},
date = {2024-01-01},
journal = {Journal of Ambient Intelligence and Humanized Computing},
volume = {15},
number = {5},
pages = {2727--2735},
abstract = {The growing number of next-generation applications offers a relevant opportunity for healthcare services, generating an urgent need for architectures for systems integration. Moreover, the huge amount of stored information related to events can be explored by adopting a process-oriented perspective. This paper discusses an Ambient Assisted Living healthcare architecture to manage hospital home-care services. The proposed solution relies on adopting an event manager to integrate sources ranging from personal devices to web-based applications. Data are processed on a federated cloud platform offering computing infrastructure and storage resources to improve scientific research. In a second step, a business process analysis of telehealth and telemedicine applications is considered. An initial study explored the business process flow to capture the main sequences of tasks, activities, events. This step paves the way for the integration of process mining techniques to compliance monitoring in an AAL architecture framework.},
keywords = {ai},
pubstate = {published},
tppubtype = {article}
}
Sunwoo Kim, Soo Yong Lee, Yue Gao, Alessia Antelmi, Mirko Polato, Kijung Shin
A Survey on Hypergraph Neural Networks: An In-Depth and Step-By-Step Guide Proceedings Article
In: Proceedings of the 30th ACM SIGKDD Conference on Knowledge Discovery and Data Mining, pp. 6534–6544, Association for Computing Machinery, Barcelona, Spain, 2024, ISBN: 9798400704901.
Abstract | Links | BibTeX | Tags: ai, analytics, icsc
@inproceedings{Antelmi_KDD_2024,
title = {A Survey on Hypergraph Neural Networks: An In-Depth and Step-By-Step Guide},
author = {Sunwoo Kim and Soo Yong Lee and Yue Gao and Alessia Antelmi and Mirko Polato and Kijung Shin},
url = {https://doi.org/10.1145/3637528.3671457},
doi = {10.1145/3637528.3671457},
isbn = {9798400704901},
year = {2024},
date = {2024-01-01},
booktitle = {Proceedings of the 30th ACM SIGKDD Conference on Knowledge Discovery and Data Mining},
pages = {6534--6544},
publisher = {Association for Computing Machinery},
address = {Barcelona, Spain},
series = {KDD '24},
abstract = {Higher-order interactions (HOIs) are ubiquitous in real-world complex systems and applications. Investigation of deep learning for HOIs, thus, has become a valuable agenda for the data mining and machine learning communities. As networks of HOIs are expressed mathematically as hypergraphs, hypergraph neural networks (HNNs) have emerged as a powerful tool for representation learning on hypergraphs. Given the emerging trend, we present the first survey dedicated to HNNs, with an in-depth and step-by-step guide. Broadly, the present survey overviews HNN architectures, training strategies, and applications. First, we break existing HNNs down into four design components: (i) input features, (ii) input structures, (iii) message-passing schemes, and (iv) training strategies. Second, we examine how HNNs address and learn HOIs with each of their components. Third, we overview the recent applications of HNNs in recommendation, bioinformatics and medical science, time series analysis, and computer vision. Lastly, we conclude with a discussion on limitations and future directions.},
keywords = {ai, analytics, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Lorenzo Brescia, Iacopo Colonnelli, Marco Aldinucci
Performance Analysis on DNA Alignment Workload with Intel SGX Multithreading Proceedings Article
In: Antelmi, Alessia, Carlini, Emanuele, Dazzi, Patrizio (Ed.): Proceedings of BigHPC2024: Special Track on Big Data and High-Performance Computing, co-located with the 3rd Italian Conference on Big Data and Data Science, ITADATA2024, CEUR-WS.org, 2024.
Abstract | Links | BibTeX | Tags: confidential, icsc
@inproceedings{24:brescia:itadata,
title = {Performance Analysis on DNA Alignment Workload with Intel SGX Multithreading},
author = {Lorenzo Brescia and Iacopo Colonnelli and Marco Aldinucci},
editor = {Alessia Antelmi and Emanuele Carlini and Patrizio Dazzi},
url = {https://ceur-ws.org/Vol-3785/paper107.pdf},
year = {2024},
date = {2024-01-01},
booktitle = {Proceedings of BigHPC2024: Special Track on Big Data and High-Performance Computing, co-located with the 3\textsuperscript{rd} Italian Conference on Big Data and Data Science, ITADATA2024},
volume = {3785},
publisher = {CEUR-WS.org},
series = {CEUR Workshop Proceedings},
abstract = {Data confidentiality is a critical issue in the digital age, impacting interactions between users and public services and between scientific computing organizations and Cloud and HPC providers. Performance in parallel computing is essential, yet techniques for establishing Trusted Execution Environments (TEEs) to ensure privacy in remote environments often negatively impact execution time. This paper aims to analyze the performance of a parallel bioinformatics workload for DNA alignment (Bowtie2) executed within the confidential enclaves of Intel SGX processors. The results provide encouraging insights regarding the feasibility of using SGX-based TEEs for parallel computing on large datasets. The findings indicate that, under conditions of high parallelization and with twice as many threads, workloads executed within SGX enclaves perform, on average, 15% faster than non-confidential execution. This empirical demonstration supports the potential of SGX-based TEEs to effectively balance the need for privacy with the demands of high-performance computing.},
keywords = {confidential, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Adriano Marques Garcia, Giulio Malenza, Robert Birke, Marco Aldinucci
Assessing Large Language Models Inference Performance on a 64-core RISC-V CPU with Silicon-Enabled Vectors Proceedings Article
In: Antelmi, Alessia, Carlini, Emanuele, Dazzi, Patrizio (Ed.): Proceedings of BigHPC2024: Special Track on Big Data and High-Performance Computing, co-located with the 3rd Italian Conference on Big Data and Data Science, ITADATA2024, pp. 1-9, CEUR-WS.org, Pisa, Italy, 2024.
Abstract | Links | BibTeX | Tags: eupilot, icsc
@inproceedings{24:garcia:itadata,
title = {Assessing Large Language Models Inference Performance on a 64-core RISC-V CPU with Silicon-Enabled Vectors},
author = {Adriano Marques Garcia and Giulio Malenza and Robert Birke and Marco Aldinucci},
editor = {Alessia Antelmi and Emanuele Carlini and Patrizio Dazzi},
url = {https://iris.unito.it/retrieve/1540f675-5e88-4f57-95e7-df8e0fe5f1df/paper110.pdf},
year = {2024},
date = {2024-01-01},
booktitle = {Proceedings of BigHPC2024: Special Track on Big Data and High-Performance Computing, co-located with the 3\textsuperscript{rd} Italian Conference on Big Data and Data Science, ITADATA2024},
volume = {3785},
pages = {1--9},
publisher = {CEUR-WS.org},
address = {Pisa, Italy},
series = {CEUR Workshop Proceedings},
abstract = {The rising usage of compute-intensive AI applications with fast response time requirements, such as text generation using large language models, underscores the need for more efficient and versatile hardware solutions. This drives the exploration of emerging architectures like RISC-V, which has the potential to deliver strong performance within tight power constraints. The recent commercial release of processors with RISC-V Vector (RVV) silicon-enabled extensions further amplifies the significance of RISC-V architectures, offering enhanced capabilities for parallel processing and accelerating tasks critical to large language models and other AI applications. This work aims to evaluate the BERT and GPT-2 language models inference performance on the SOPHON SG2042 64-core RISC-V architecture with silicon-enabled RVV v0.7.1. We benchmarked the models with and without RVV, using OpenBLAS and BLIS as BLAS backends for PyTorch to enable vectorization. Enabling RVV in OpenBLAS improved the inference performance by up to 40% in some cases.},
keywords = {eupilot, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Oussama Harrak, Bruno Casella, Samuele Fonio, Piero Fariselli, Gianluca Mittone, Tiziana Sanavia, Marco Aldinucci
Federated AdaBoost for Survival Analysis Proceedings Article
In: Proceedings of the ECML-PKDD Workshop, 2nd workshop on advancements in Federated Learning, Vilnius, Lithuania, 2024.
Abstract | BibTeX | Tags: epi, icsc
@inproceedings{harrak2024fedsurvboost,
  author    = {Oussama Harrak and Bruno Casella and Samuele Fonio and Piero Fariselli and Gianluca Mittone and Tiziana Sanavia and Marco Aldinucci},
  title     = {Federated AdaBoost for Survival Analysis},
  booktitle = {Proceedings of the ECML-PKDD Workshop, 2nd workshop on advancements in Federated Learning},
  address   = {Vilnius, Lithuania},
  year      = {2024},
  date      = {2024-01-01},
  abstract  = {This work proposes FedSurvBoost, a federated learning pipeline for survival analysis based on the AdaBoost.F algorithm, which iteratively aggregates the best local weak hypotheses. Our method extends AdaBoost.F by removing the dependence on the number of classes coefficient from the computation of the weights of the best model. This makes it suitable for regression tasks, such as survival analysis. We show the effectiveness of our approach by comparing it with state-of-the-art methods, specifically developed for survival analysis problems, on two common survival datasets. Our code is available at https://github.com/oussamaHarrak/FedSurvBoost.},
  keywords  = {epi, icsc},
  pubstate  = {published},
  tppubtype = {inproceedings},
}
Zilong Zhao, Aditya Kunar, Robert Birke, Hiek Van Scheer, Lydia Y. Chen
CTAB-GAN+: enhancing tabular data synthesis Journal Article
In: Frontiers in Big Data, vol. 6, 2024.
@article{24:fdata:zhao,
title = {CTAB-GAN+: enhancing tabular data synthesis},
author = {Zilong Zhao and Aditya Kunar and Robert Birke and Hiek Van Scheer and Lydia Y. Chen},
url = {https://doi.org/10.3389/fdata.2023.1296508},
doi = {10.3389/fdata.2023.1296508},
year = {2024},
date = {2024-01-01},
journal = {Frontiers in Big Data},
volume = {6},
keywords = {ai},
pubstate = {published},
tppubtype = {article}
}
Nur Zincir-Heywood, Robert Birke, Elias Bou-Harb, Takeru Inoue, Neeraj Kumar, Hanan Lutfiyya, Deepak Puthal, Abdallah Shami, Natalia Stakhanova
Guest Editorial: Special section on Networks, Systems, and Services Operations and Management Through Intelligence Journal Article
In: IEEE Trans. Netw. Serv. Manag., vol. 21, no. 3, pp. 2608–2612, 2024.
@article{24:tnsm:nur,
title = {Guest Editorial: Special section on Networks, Systems, and Services Operations and Management Through Intelligence},
author = {Nur Zincir-Heywood and Robert Birke and Elias Bou-Harb and Takeru Inoue and Neeraj Kumar and Hanan Lutfiyya and Deepak Puthal and Abdallah Shami and Natalia Stakhanova},
url = {https://doi.org/10.1109/TNSM.2024.3416861},
doi = {10.1109/TNSM.2024.3416861},
year = {2024},
date = {2024-01-01},
journal = {IEEE Transactions on Network and Service Management},
volume = {21},
number = {3},
pages = {2608--2612},
keywords = {ai},
pubstate = {published},
tppubtype = {article}
}
Alessia Antelmi, Vincenzo Offertucci, Maria Angela Pellegrino
High-Performance Computation on a Rust-based distributed ABM engine Proceedings Article
In: Proceedings of the 9th International Workshop on the Visualization and Interaction for Ontologies, Linked Data and Knowledge Graphs co-located with the 23rd International Semantic Web Conference (ISWC 2024), CEUR-WS.org, 2024.
Abstract | Links | BibTeX | Tags: analytics
@comment{NOTE(review): the title of Antelmi_ISWCWrks_24 is identical to that of Antelmi_BigHPC_24, while its abstract describes KGSnap!, a visual SPARQL query builder. The title looks copy-pasted from the other entry -- TODO confirm the real title against the paper linked in the url field.}
@inproceedings{Antelmi_ISWCWrks_24,
  author    = {Alessia Antelmi and Vincenzo Offertucci and Maria Angela Pellegrino},
  title     = {High-Performance Computation on a Rust-based distributed ABM engine},
  booktitle = {Proceedings of the 9th International Workshop on the Visualization and Interaction for Ontologies, Linked Data and Knowledge Graphs co-located with the 23rd International Semantic Web Conference (ISWC 2024)},
  series    = {CEUR Workshop Proceedings},
  volume    = {3773},
  publisher = {CEUR-WS.org},
  year      = {2024},
  date      = {2024-01-01},
  url       = {https://ceur-ws.org/Vol-3773/paper6.pdf},
  abstract  = {The growing availability of (linked) open data requires lay users to master how to deal with data effectively, yet SPARQL presents a barrier to leveraging data represented as knowledge graphs. As the block programming paradigm has been successfully used to teach programming skills, we demonstrate how to use KGSnap!, an extension of the block-based programming environment Snap!, to foster knowledge graph literacy among individuals lacking expertise in query languages. This work mainly focuses on the visualization and interaction aspects of KGSnap!, a visual SPARQL query builder, when experienced by users without expertise in the Semantic Web technologies. The reported experience is discussed as a learning-by-doing protocol aimed at facilitating the reproducibility and transparency of the performed evaluation. KGSnap! ease of use has been verified by 14 Snap! experts and 24 high-school learners. The findings indicate that lay users perceived it as a promising approach to acquaint themselves with knowledge graphs.},
  keywords  = {analytics},
  pubstate  = {published},
  tppubtype = {inproceedings},
}
Daniele De Vinco, Andrea Tranquillo, Alessia Antelmi, Carmine Spagnuolo, Vittorio Scarano
High-Performance Computation on a Rust-based distributed ABM engine Proceedings Article
In: Antelmi, Alessia, Carlini, Emanuele, Dazzi, Patrizio (Ed.): Proceedings of BigHPC2024: Special Track on Big Data and High-Performance Computing, co-located with the 3rd Italian Conference on Big Data and Data Science, ITADATA2024, CEUR-WS.org, 2024.
Abstract | Links | BibTeX | Tags: analytics, icsc
@inproceedings{Antelmi_BigHPC_24,
title = {High-Performance Computation on a Rust-based distributed ABM engine},
author = {Daniele De Vinco and Andrea Tranquillo and Alessia Antelmi and Carmine Spagnuolo and Vittorio Scarano},
editor = {Alessia Antelmi and Emanuele Carlini and Patrizio Dazzi},
url = {https://ceur-ws.org/Vol-3785/paper124.pdf},
year = {2024},
date = {2024-01-01},
booktitle = {Proceedings of BigHPC2024: Special Track on Big Data and High-Performance Computing, co-located with the 3\textsuperscript{rd} Italian Conference on Big Data and Data Science, ITADATA2024},
volume = {3785},
publisher = {CEUR-WS.org},
series = {CEUR Workshop Proceedings},
abstract = {An agent-based model (ABM) is a computational model for simulating autonomous agents' actions and interactions to understand a system's behavior and what governs its outcomes. When the data or number of agents grow or multiple runs are necessary, agent-based simulations are generally computationally costly. Therefore, adopting different computing paradigms, such as the distributed one, is essential to manage long-running simulations. The main problem with this approach is finding a way to distribute and balance the simulation field so that the agents can move from one machine to another with the least amount of synchronization overhead. Based on our experiences, we present a Rust-based ABM engine capable of distributing models on high-performance computing resources, gaining remarkable speedup against the sequential version.},
keywords = {analytics, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Bruno Casella, Walter Riviera, Marco Aldinucci, Gloria Menegaz
Protocol for training MERGE: A federated multi-input neural network for COVID-19 prognosis Journal Article
In: STAR Protocols, 2024, (https://prod-shared-star-protocols.s3.amazonaws.com/protocols/3225.pdf).
Abstract | Links | BibTeX | Tags: epi, icsc
@article{24:casella:starprotocol,
  author      = {Bruno Casella and Walter Riviera and Marco Aldinucci and Gloria Menegaz},
  title       = {Protocol for training MERGE: A federated multi-input neural network for COVID-19 prognosis},
  journal     = {STAR Protocols},
  institution = {Computer Science Department, University of Torino},
  year        = {2024},
  date        = {2024-01-01},
  doi         = {10.1016/j.xpro.2023.102812},
  url         = {https://prod-shared-star-protocols.s3.amazonaws.com/protocols/3225.pdf},
  note        = {https://prod-shared-star-protocols.s3.amazonaws.com/protocols/3225.pdf},
  abstract    = {Federated learning is a cooperative learning approach that has emerged as an effective way to address privacy concerns. Here, we present a protocol for training MERGE: a federated multi-input neural network (NN) for COVID-19 prognosis. We describe steps for collecting and preprocessing datasets. We then detail the process of training a multi-input NN. This protocol can be adapted for use with datasets containing both image- and table-based input sources.},
  keywords    = {epi, icsc},
  pubstate    = {published},
  tppubtype   = {article},
}
Adriano Marques Garcia, Dalvan Griebler, Claudio Schepke, José Daniel García, Javier Fernández Muñoz, Luiz Gustavo Fernandes
Performance and programmability of GrPPI for parallel stream processing on multi-cores Journal Article
In: The Journal of Supercomputing, In press, pp. 1-35, 2024, ISSN: 1573-0484.
Abstract | Links | BibTeX | Tags: admire
@article{GARCIA:JSuper:24,
title = {Performance and programmability of {GrPPI} for parallel stream processing on multi-cores},
author = {Adriano Marques Garcia and Dalvan Griebler and Claudio Schepke and José Daniel García and Javier Fernández Muñoz and Luiz Gustavo Fernandes},
url = {https://iris.unito.it/retrieve/fff66640-fcbe-4080-a4f1-3279c9fadafb/s11227-024-05934-z.pdf},
doi = {10.1007/s11227-024-05934-z},
issn = {1573-0484},
year = {2024},
date = {2024-01-01},
journal = {The Journal of Supercomputing},
pages = {1--35},
publisher = {Springer},
abstract = {GrPPI library aims to simplify the burdening task of parallel programming. It provides a unified, abstract, and generic layer while promising minimal overhead on performance. Although it supports stream parallelism, GrPPI lacks an evaluation regarding representative performance metrics for this domain, such as throughput and latency. This work evaluates GrPPI focused on parallel stream processing. We compare the throughput and latency performance, memory usage, and programmability of GrPPI against handwritten parallel code. For this, we use the benchmarking framework SPBench to build custom GrPPI benchmarks and benchmarks with handwritten parallel code using the same backends supported by GrPPI. The basis of the benchmarks is real applications, such as Lane Detection, Bzip2, Face Recognizer, and Ferret. Experiments show that while performance is often competitive with handwritten parallel code, the infeasibility of fine-tuning GrPPI is a crucial drawback for emerging applications. Despite this, programmability experiments estimate that GrPPI can potentially reduce the development time of parallel applications by about three times.},
note = {In press},
keywords = {admire},
pubstate = {published},
tppubtype = {article}
}
2023
Alberto Riccardo Martinelli, Massimo Torquati, Marco Aldinucci, Iacopo Colonnelli, Barbara Cantalupo
CAPIO: a Middleware for Transparent I/O Streaming in Data-Intensive Workflows Proceedings Article
In: 2023 IEEE 30th International Conference on High Performance Computing, Data, and Analytics (HiPC), IEEE, Goa, India, 2023.
Abstract | Links | BibTeX | Tags: admire, capio, eupex, icsc
@inproceedings{23:hipc:capio,
title = {{CAPIO}: a Middleware for Transparent {I/O} Streaming in Data-Intensive Workflows},
author = {Alberto Riccardo Martinelli and Massimo Torquati and Marco Aldinucci and Iacopo Colonnelli and Barbara Cantalupo},
url = {https://iris.unito.it/retrieve/27380f37-0978-409e-a9d8-2b5e95a4bb85/CAPIO-HiPC23-preprint.pdf},
doi = {10.1109/HiPC58850.2023.00031},
year = {2023},
date = {2023-12-01},
booktitle = {2023 IEEE 30th International Conference on High Performance Computing, Data, and Analytics (HiPC)},
publisher = {IEEE},
address = {Goa, India},
abstract = {With the increasing amount of digital data available for analysis and simulation, the class of I/O-intensive HPC workflows is fated to quickly expand, further exacerbating the performance gap between computing, memory, and storage technologies. This paper introduces CAPIO (Cross-Application Programmable I/O), a middleware capable of injecting I/O streaming capabilities into file-based workflows, improving the computation-I/O overlap without the need to change the application code. The contribution is twofold: 1) at design time, a new I/O coordination language allows users to annotate workflow data dependencies with synchronization semantics; 2) at run time, a user-space middleware automatically and transparently to the user turns a workflow batch execution into a streaming execution according to the semantics expressed in the configuration file. CAPIO has been tested on synthetic benchmarks simulating typical workflow I/O patterns and two real-world workflows. Experiments show that CAPIO reduces the execution time by 10% to 66% for data-intensive workflows that use the file system as a communication medium.},
keywords = {admire, capio, eupex, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Elena Maria Baralis, Valeria Cardellini, Iacopo Colonnelli, Marco Danelutto, Sergio Decherchi, Giuseppe Di Modica, Luca Ferrucci, Marco Gribaudo, Francesco Iannone, Marco Lapegna, Doriana Medic, Giuseppa Muscianisi, Francesca Righetti, Eva Sciacca, Nicola Tonellotto, Mauro Tortonesi, Paolo Trunfio, Tullio Vardanega
A Systematic Mapping Study of Italian Research on Workflows Proceedings Article
In: Proceedings of the SC '23 Workshops of The International Conference on High Performance Computing, Network, Storage, and Analysis, SC-W 2023, pp. 2065–2076, ACM, Denver, CO, USA, 2023.
Abstract | Links | BibTeX | Tags: icsc, jupyter-workflow, streamflow
@inproceedings{WORKS2023,
title = {A Systematic Mapping Study of {Italian} Research on Workflows},
author = {Marco Aldinucci and Elena Maria Baralis and Valeria Cardellini and Iacopo Colonnelli and Marco Danelutto and Sergio Decherchi and Giuseppe Di Modica and Luca Ferrucci and Marco Gribaudo and Francesco Iannone and Marco Lapegna and Doriana Medic and Giuseppa Muscianisi and Francesca Righetti and Eva Sciacca and Nicola Tonellotto and Mauro Tortonesi and Paolo Trunfio and Tullio Vardanega},
url = {https://doi.org/10.1145/3624062.3624285},
doi = {10.1145/3624062.3624285},
year = {2023},
date = {2023-11-01},
booktitle = {Proceedings of the SC '23 Workshops of The International Conference on High Performance Computing, Network, Storage, and Analysis, SC-W 2023},
pages = {2065--2076},
publisher = {ACM},
address = {Denver, CO, USA},
abstract = {An entire ecosystem of methodologies and tools revolves around scientific workflow management. They cover crucial non-functional requirements that standard workflow models fail to target, such as interactive execution, energy efficiency, performance portability, Big Data management, and intelligent orchestration in the Computing Continuum. Characterizing and monitoring this ecosystem is crucial to develop an informed view of current and future research directions. This work conducts a systematic mapping study of the Italian workflow research community, collecting and analyzing 25 tools and 10 applications from several scientific domains in the context of the ``National Research Centre for HPC, Big Data, and Quantum Computing'' (ICSC). The study aims to outline the main current research directions and determine how they address the critical needs of modern scientific applications. The findings highlight a variegated research ecosystem of tools, with a prominent interest in advanced workflow orchestration and still immature but promising efforts toward energy efficiency.},
keywords = {icsc, jupyter-workflow, streamflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Zilong Zhao, Robert Birke, Lydia Y. Chen
FCT-GAN: Enhancing Global Correlation of Table Synthesis via Fourier Transform Proceedings Article
In: 32nd ACM International Conference on Information and Knowledge Management (CIKM '23), ACM, Birmingham, United Kingdom, 2023.
Abstract | Links | BibTeX | Tags: icsc
@inproceedings{23:zhao:fctgan,
title = {{FCT-GAN}: Enhancing Global Correlation of Table Synthesis via {Fourier} Transform},
author = {Zilong Zhao and Robert Birke and Lydia Y. Chen},
url = {https://iris.unito.it/retrieve/966ba767-dbbd-41e1-b4e3-7ab7ba09303f/FCT-GAN.pdf},
doi = {10.1145/3583780.3615202},
year = {2023},
date = {2023-10-01},
booktitle = {32nd ACM International Conference on Information and Knowledge Management (CIKM '23)},
publisher = {ACM},
address = {Birmingham, United Kingdom},
abstract = {An alternative method for sharing knowledge while complying with strict data access regulations, such as the European General Data Protection Regulation (GDPR), is the emergence of synthetic tabular data. Mainstream table synthesizers utilize methodologies derived from Generative Adversarial Networks (GAN). Although several state-of-the-art (SOTA) tabular GAN algorithms inherit Convolutional Neural Network (CNN)-based architectures, which have proven effective for images, they tend to overlook two critical properties of tabular data: (i) the global correlation across columns, and (ii) the semantic invariance to the column order. Permuting columns in a table does not alter the semantic meaning of the data, but features extracted by CNNs can change significantly due to their limited convolution filter kernel size. To address the above problems, we propose FCT-GAN – the first conditional tabular GAN to adopt Fourier networks into table synthesis. FCT-GAN enhances permutation invariant GAN training by strengthening the learning of global correlations via Fourier layers. Extensive evaluation on benchmarks and real-world datasets show that FCT-GAN can synthesize tabular data with better (up to 27.8%) machine learning utility (i.e. a proxy of global correlations) and higher (up to 26.5%) statistical similarity to real data. FCT-GAN also has the least variation on synthetic data quality among 7 SOTA baselines on 3 different training-data column orders.},
keywords = {icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Samuele Fonio, Lorenzo Paletto, Mattia Cerrato, Dino Ienco, Roberto Esposito
Hierarchical priors for Hyperspherical Prototypical Networks Proceedings Article
In: 31st European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning, ESANN, Bruges, Belgium, 2023, (In print).
Abstract | Links | BibTeX | Tags: ai, icsc
@inproceedings{23:esann:fonio,
title = {Hierarchical priors for Hyperspherical Prototypical Networks},
author = {Samuele Fonio and Lorenzo Paletto and Mattia Cerrato and Dino Ienco and Roberto Esposito},
url = {https://www.esann.org/sites/default/files/proceedings/2023/ES2023-65.pdf},
year = {2023},
date = {2023-10-01},
booktitle = {31st European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning, ESANN},
address = {Bruges, Belgium},
abstract = {In this paper, we explore the usage of hierarchical priors to improve learning in contexts where the number of available examples is extremely low. Specifically, we consider a Prototype Learning setting where deep neural networks are used to embed data in hyperspherical geometries. In this scenario, we propose an innovative way to learn the prototypes by combining class separation and hierarchical information. In addition, we introduce a contrastive loss function capable of balancing the exploitation of prototypes through a prototype pruning mechanism. We compare the proposed method with state-of-the-art approaches on two public datasets.},
note = {In print},
keywords = {ai, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Samuele Fonio
Benchmarking Federated Learning Frameworks for Medical Imaging Tasks Proceedings Article
In: Foresti, G. L., Fusiello, A., Hancock, E. (Ed.): Image Analysis and Processing - ICIAP 2023 Workshops. ICIAP 2023, Springer, Cham, Udine, Italy, 2023, (In print).
Abstract | Links | BibTeX | Tags: ai, eupilot, icsc
@inproceedings{23:iciap:fedmed:ws:fonio,
title = {Benchmarking Federated Learning Frameworks for Medical Imaging Tasks},
author = {Samuele Fonio},
editor = {G. L. Foresti and A. Fusiello and E. Hancock},
url = {https://link.springer.com/chapter/10.1007/978-3-031-51026-7_20},
doi = {10.1007/978-3-031-51026-7_20},
year = {2023},
date = {2023-09-01},
booktitle = {Image Analysis and Processing - ICIAP 2023 Workshops. ICIAP 2023},
series = {Lecture Notes in Computer Science},
volume = {14366},
publisher = {Springer},
address = {Udine, Italy},
abstract = {This paper presents a comprehensive benchmarking study of various Federated Learning (FL) frameworks applied to the task of Medical Image Classification. The research specifically addresses the often neglected and complex aspects of scalability and usability in off-the-shelf FL frameworks. Through experimental validation using real case deployments, we provide empirical evidence of the performance and practical relevance of open source FL frameworks. Our findings contribute valuable insights for anyone interested in deploying a FL system, with a particular focus on the healthcare domain—an increasingly attractive field for FL applications.},
note = {In print},
keywords = {ai, eupilot, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Gianluca Mittone, Samuele Fonio
Benchmarking Federated Learning Scalability Proceedings Article
In: Proceedings of the 2nd Italian Conference on Big Data and Data Science, ITADATA 2023, September 11-13, 2023, CEUR, Naples, Italy, 2023.
Abstract | Links | BibTeX | Tags: eupilot, HPC, icsc
@inproceedings{23:itadata:extabstract:mittone:fonio,
  author    = {Gianluca Mittone and Samuele Fonio},
  title     = {Benchmarking Federated Learning Scalability},
  booktitle = {Proceedings of the 2nd Italian Conference on Big Data and Data Science, ITADATA 2023, September 11-13, 2023},
  publisher = {CEUR},
  address   = {Naples, Italy},
  year      = {2023},
  date      = {2023-09-01},
  url       = {https://hdl.handle.net/2318/1933852},
  keywords  = {eupilot, HPC, icsc},
  abstract  = {Federated Learning (FL) is a widespread Machine Learning paradigm handling distributed Big Data. In this work, we demonstrate that different FL frameworks expose different scaling performances despite adopting the same technologies, highlighting the need for a more comprehensive study on the topic.},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Chi Hong, Jiyue Huang, Robert Birke, Lydia Y. Chen
Exploring and Exploiting Data-Free Model Stealing Proceedings Article
In: European Conference on Machine Learning and Principles and Practice of Knowledge Discovery in Databases (ECML PKDD), Turin, Italy, 2023.
Abstract | Links | BibTeX | Tags: eupilot, icsc
@inproceedings{23:hong:datafree,
title = {Exploring and Exploiting Data-Free Model Stealing},
author = {Chi Hong and Jiyue Huang and Robert Birke and Lydia Y. Chen},
url = {https://iris.unito.it/retrieve/ce44dec6-12c9-443d-99e7-f1141e50aa3a/Data-free%20Model%20Stealing.pdf},
doi = {10.1007/978-3-031-43424-2_2},
year = {2023},
date = {2023-09-01},
booktitle = {European Conference on Machine Learning and Principles and Practice of Knowledge Discovery in Databases (ECML PKDD)},
address = {Turin, Italy},
abstract = {Deep machine learning models, e.g., image classifier, are increasingly deployed in the wild to provide services to users. Adversaries are shown capable of stealing the knowledge of these models by sending inference queries and then training substitute models based on query results. The availability and quality of adversarial query inputs are undoubtedly crucial in the stealing process. The recent prior art demonstrates the feasibility of replacing real data by exploring the synthetic adversarial queries, so called data-free attacks, under strong adversarial assumptions, i.e., the deployed classifier returns not only class labels but also class probabilities. In this paper, we consider a general adversarial model and propose an effective data-free stealing algorithm, TandemGAN, which not only explores synthetic queries but also explicitly exploits the high quality ones. The core of TandemGAN is composed of (i) substitute model which imitates the target model through synthetic queries and their inferred labels; and (ii) a tandem generator consisting of two networks, Gx and Ge, which first explores the synthetic data space via Gx and then exploits high-quality examples via Ge to maximize the knowledge transfer from the target to the substitute model. Our results on four datasets show that the accuracy of our trained substitute model ranges between 96-67% of the target model and outperforms the existing state-of-the-art data-free model stealing approach by up to 2.5X.},
keywords = {eupilot, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Valentina Cesare, Ugo Becciani, Alberto Vecchiato, Mario Gilberto Lattanzi, Fabio Pitari, Marco Aldinucci, Beatrice Bucciarelli
The MPI + CUDA Gaia AVU–GSR Parallel Solver Toward Next-generation Exascale Infrastructures Journal Article
In: Publications of the Astronomical Society of the Pacific, vol. 135, no. 1049, 2023.
Abstract | Links | BibTeX | Tags: HPC
@article{23:GAIAMPI_PASP,
title = {The {MPI} + {CUDA} {Gaia} {AVU–GSR} Parallel Solver Toward Next-generation Exascale Infrastructures},
author = {Valentina Cesare and Ugo Becciani and Alberto Vecchiato and Mario Gilberto Lattanzi and Fabio Pitari and Marco Aldinucci and Beatrice Bucciarelli},
url = {https://iopscience.iop.org/article/10.1088/1538-3873/acdf1e/pdf},
doi = {10.1088/1538-3873/acdf1e},
year = {2023},
date = {2023-08-01},
journal = {Publications of the Astronomical Society of the Pacific},
volume = {135},
number = {1049},
abstract = {We ported to the GPU with CUDA the Astrometric Verification Unit–Global Sphere Reconstruction (AVU–GSR) Parallel Solver developed for the ESA Gaia mission, by optimizing a previous OpenACC porting of this application. The code aims to find, with a [10, 100] μarcsec precision, the astrometric parameters of about 10^8 stars, the attitude and instrumental settings of the Gaia satellite, and the global parameter γ of the parametrized Post-Newtonian formalism, by solving a system of linear equations, A × x = b, with the LSQR iterative algorithm. The coefficient matrix A of the final Gaia data set is large, with ∼10^11 × 10^8 elements, and sparse, reaching a size of ∼10–100 TB, typical for the Big Data analysis, which requires an efficient parallelization to obtain scientific results in reasonable timescales. The speedup of the CUDA code over the original AVU–GSR solver, parallelized on the CPU with MPI + OpenMP, increases with the system size and the number of resources, reaching a maximum of ∼14×, >9× over the OpenACC application. This result is obtained by comparing the two codes on the CINECA cluster Marconi100, with 4 V100 GPUs per node. After verifying the agreement between the solutions of a set of systems with different sizes computed with the CUDA and the OpenMP codes and that the solutions showed the required precision, the CUDA code was put in production on Marconi100, essential for an optimal AVU–GSR pipeline and the successive Gaia Data Releases. This analysis represents a first step to understand the (pre-)Exascale behavior of a class of applications that follow the same structure of this code. In the next months, we plan to run this code on the pre-Exascale platform Leonardo of CINECA, with 4 next-generation A200 GPUs per node, toward a porting on this infrastructure, where we expect to obtain even higher performances.},
keywords = {HPC, icsc, eupex},
pubstate = {published},
tppubtype = {article}
}
Gianluca Mittone, Walter Riviera, Iacopo Colonnelli, Robert Birke, Marco Aldinucci
Model-Agnostic Federated Learning Proceedings Article
In: Euro-Par 2023: Parallel Processing, pp. 383–396, Springer, Limassol, Cyprus, 2023.
Abstract | Links | BibTeX | Tags: ai, confidential, eupilot, icsc, riscv
@inproceedings{23:mittone:mafl,
title = {Model-Agnostic Federated Learning},
author = {Gianluca Mittone and Walter Riviera and Iacopo Colonnelli and Robert Birke and Marco Aldinucci},
url = {https://doi.org/10.1007/978-3-031-39698-4_26},
doi = {10.1007/978-3-031-39698-4_26},
year = {2023},
date = {2023-08-01},
booktitle = {Euro-Par 2023: Parallel Processing},
series = {Lecture Notes in Computer Science},
volume = {14100},
pages = {383--396},
publisher = {Springer},
address = {Limassol, Cyprus},
institution = {Computer Science Department, University of Torino},
abstract = {Since its debut in 2016, Federated Learning (FL) has been tied to the inner workings of Deep Neural Networks (DNNs). On the one hand, this allowed its development and widespread use as DNNs proliferated. On the other hand, it neglected all those scenarios in which using DNNs is not possible or advantageous. The fact that most current FL frameworks only allow training DNNs reinforces this problem. To address the lack of FL solutions for non-DNN-based use cases, we propose MAFL (Model-Agnostic Federated Learning). MAFL marries a model-agnostic FL algorithm, AdaBoost.F, with an open industry-grade FL framework: Intel OpenFL. MAFL is the first FL system not tied to any specific type of machine learning model, allowing exploration of FL scenarios beyond DNNs and trees. We test MAFL from multiple points of view, assessing its correctness, flexibility and scaling properties up to 64 nodes. We optimised the base software achieving a 5.5x speedup on a standard FL scenario. MAFL is compatible with x86-64, ARM-v8, Power and RISC-V.},
keywords = {ai, confidential, eupilot, icsc, riscv},
pubstate = {published},
tppubtype = {inproceedings}
}
Zilong Zhao, Robert Birke, Lydia Y. Chen
GDTS: GAN-based Distributed Tabular Synthesizer Proceedings Article
In: 16th IEEE International Conference on Cloud Computing (CLOUD), IEEE, Chicago, USA, 2023.
Abstract | Links | BibTeX | Tags: ai
@inproceedings{23:cloud:gdts,
title = {{GDTS}: {GAN-based} Distributed Tabular Synthesizer},
author = {Zilong Zhao and Robert Birke and Lydia Y. Chen},
url = {https://iris.unito.it/retrieve/8bc610de-3ccd-4a0a-b97f-ee329e487b76/GDTS_IEEE_CLOUD_preprint.pdf},
doi = {10.1109/CLOUD60044.2023.00078},
year = {2023},
date = {2023-07-01},
booktitle = {16th IEEE International Conference on Cloud Computing (CLOUD)},
publisher = {IEEE},
address = {Chicago, USA},
abstract = {Generative Adversarial Networks (GANs) are typically trained to synthesize data, from images and more recently tabular data, under the assumption of directly accessible training data. While learning image GANs on Federated Learning (FL) and Multi-Discriminator (MD) systems has just been demonstrated, it is unknown if tabular GANs can be learned from decentralized data sources. Different from image GANs, state-of-the-art tabular GANs require prior knowledge on the data distribution of each (discrete and continuous) column to agree on a common encoding – risking privacy guarantees. In this paper, we propose GDTS, a distributed framework for GAN-based tabular synthesizer. GDTS provides different system architectures to match the two training paradigms termed GDTS FL and GDTS MD. Key to enable learning on distributed data is the proposed novel privacy-preserving multi-source feature encoding to capture the global data properties. In addition GDTS encompasses a weighting strategy based on table similarity to counter the detrimental effects of non-IID data and a validation pipeline to easily assess and compare the performance of different paradigms and hyper parameters. We evaluate the effectiveness of GDTS in terms of synthetic data quality, and overall training scalability. Experiments show that GDTS FL achieves better statistical similarity and machine learning utility between generated and original data compared to GDTS MD.},
keywords = {ai},
pubstate = {published},
tppubtype = {inproceedings}
}
Iacopo Colonnelli, Robert Birke, Marco Aldinucci
Experimenting with PyTorch on RISC-V Proceedings Article
In: RISC-V Summit Europe 2023, Barcelona, Spain, 2023, (Poster).
Abstract | Links | BibTeX | Tags: eupilot, icsc, riscv
@inproceedings{23:risc-v-summit,
title = {Experimenting with {PyTorch} on {RISC-V}},
author = {Iacopo Colonnelli and Robert Birke and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/429bf344-9090-42c3-809c-1b8ac320a930/2023-06-08-Iacopo-COLONNELLI-abstract.pdf},
year = {2023},
date = {2023-06-01},
booktitle = {RISC-V Summit Europe 2023},
address = {Barcelona, Spain},
abstract = {RISC-V is an emerging instruction set architecture. Its modular and extensible open-source royalty-free design is increasingly attracting interest from both research and industry. Nowadays, different RISC-V-based boards can be bought off the shelf. However, software availability is equivalently vital in guaranteeing the RISC-V ecosystem's success. Here we contribute with the first publicly available port of PyTorch. PyTorch is one of the most popular Deep Learning libraries available today. As such, it is a crucial enabler in running state-of-the-art AI applications on RISC-V-based systems and a first step towards a fully democratic end-to-end codesign process.},
note = {Poster},
keywords = {eupilot, icsc, riscv},
pubstate = {published},
tppubtype = {inproceedings}
}
Alessia Antelmi, Gennaro Cordasco, Mirko Polato, Vittorio Scarano, Carmine Spagnuolo, Dingqi Yang
A Survey on Hypergraph Representation Learning Journal Article
In: ACM Comput. Surv., 2023, ISSN: 0360-0300.
Abstract | Links | BibTeX | Tags: analytics
@article{Antelmi_CSUR_23,
title = {A Survey on Hypergraph Representation Learning},
author = {Alessia Antelmi and Gennaro Cordasco and Mirko Polato and Vittorio Scarano and Carmine Spagnuolo and Dingqi Yang},
url = {https://doi.org/10.1145/3605776},
doi = {10.1145/3605776},
issn = {0360-0300},
year = {2023},
date = {2023-06-01},
journal = {ACM Computing Surveys},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
abstract = {Hypergraphs have attracted increasing attention in recent years thanks to their flexibility in naturally modeling a broad range of systems where high-order relationships exist among their interacting parts. This survey reviews the newly born hypergraph representation learning problem, whose goal is to learn a function to project objects - most commonly nodes - of an input hyper-network into a latent space such that both the structural and relational properties of the network can be encoded and preserved. We provide a thorough overview of existing literature and offer a new taxonomy of hypergraph embedding methods by identifying three main families of techniques, i.e., spectral, proximity-preserving, and (deep) neural networks. For each family, we describe its characteristics and our insights in a single yet flexible framework and then discuss the peculiarities of individual methods, as well as their pros and cons. We then review the main tasks, datasets, and settings in which hypergraph embeddings are typically used. We finally identify and discuss open challenges that would inspire further research in this field.},
keywords = {analytics},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Robert Birke, Antonio Brogi, Emanuele Carlini, Massimo Coppola, Marco Danelutto, Patrizio Dazzi, Luca Ferrucci, Stefano Forti, Hanna Kavalionak, Gabriele Mencagli, Matteo Mordacchini, Marcelo Pasin, Federica Paganelli, Massimo Torquati
A Proposal for a Continuum-aware Programming Model: From Workflows to Services Autonomously Interacting in the Compute Continuum Proceedings Article
In: 2023 IEEE 47th Annual Computers, Software, and Applications Conference (COMPSAC), IEEE, Turin, Italy, 2023.
Abstract | Links | BibTeX | Tags: icsc
@inproceedings{23:aldinucci:continuum,
title = {A Proposal for a Continuum-aware Programming Model: From Workflows to Services Autonomously Interacting in the Compute Continuum},
author = {Marco Aldinucci and Robert Birke and Antonio Brogi and Emanuele Carlini and Massimo Coppola and Marco Danelutto and Patrizio Dazzi and Luca Ferrucci and Stefano Forti and Hanna Kavalionak and Gabriele Mencagli and Matteo Mordacchini and Marcelo Pasin and Federica Paganelli and Massimo Torquati},
url = {https://iris.unito.it/retrieve/2ae13a33-5814-43da-8ea6-2d3e8b122384/Continuum-aware-PM.pdf},
doi = {10.1109/COMPSAC57700.2023.00287},
year = {2023},
date = {2023-06-01},
booktitle = {2023 IEEE 47th Annual Computers, Software, and Applications Conference (COMPSAC)},
publisher = {IEEE},
address = {Turin, Italy},
abstract = {This paper proposes a continuum-aware programming model enabling the execution of application workflows across the compute continuum: cloud, fog and edge resources. It simplifies the management of heterogeneous nodes while alleviating the burden of programmers and unleashing innovation. This model optimizes the continuum through advanced development experiences by transforming workflows into autonomous service collaborations. It reduces complexity in positioning/interconnecting services across the continuum. A meta-model introduces high-level workflow descriptions as service networks with defined contracts and quality of service, thus enabling the deployment/management of workflows as first-class entities. It also provides automation based on policies, monitoring and heuristics. Tailored mechanisms orchestrate/manage services across the continuum, optimizing performance, cost, data protection and sustainability while managing risks. This model facilitates incremental development with visibility of design impacts and seamless evolution of applications and infrastructures. In this work, we explore this new computing paradigm showing how it can trigger the development of a new generation of tools to support the compute continuum progress.},
keywords = {icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Jani Valtari, Anna Kulmala, Sandro Schönborn, David Kozhaya, Robert Birke, Jyrki Reikko
Real-life Pilot of Virtual Protection and Control - Experiences and Performance Analysis Proceedings Article
In: 27th International Conference on Electricity Distribution (CIRED), Rome, Italy, 2023.
Abstract | Links | BibTeX | Tags: RT
@inproceedings{23:valtari:pilot,
title = {Real-life Pilot of Virtual Protection and Control - Experiences and Performance Analysis},
author = {Jani Valtari and Anna Kulmala and Sandro Schönborn and David Kozhaya and Robert Birke and Jyrki Reikko},
url = {https://iris.unito.it/retrieve/5de5fb00-02bf-4ba8-a4db-5876415d5105/virtualization_full_paper_cired2023_submitted.pdf},
doi = {10.1049/icp.2023.1219},
year = {2023},
date = {2023-06-01},
booktitle = {27th International Conference on Electricity Distribution (CIRED)},
address = {Rome, Italy},
abstract = {Virtualized protection and control (VPC) is seen as a promising evolution for the centralized protection and control (CPC) concept. Centralization of protection functions consolidates the functions of multiple traditional relays into one device. This consolidation reduces communications network complexity and offers effective ways to manage protection applications of the substation. Making the CPC available as a VPC software image instead of a dedicated device creates yet another degree of freedom. The solution becomes hardware independent, bringing more flexibility and scalability to the solution. ABB and Caruna together wanted to explore these possibilities in a real-life substation pilot. This paper describes the piloted VPC environment and the results from the piloting period. The results show that virtualization technology is suitable for time critical protection and control applications, with real-time performance comparable to existing non-virtualized solutions.},
keywords = {RT},
pubstate = {published},
tppubtype = {inproceedings}
}
Sandro Schönborn, Robert Birke, David Kozhaya, Thanikesavan Sivanthi
Real-Time Performance of Virtualised Protection and Control Software Proceedings Article
In: 27th International Conference on Electricity Distribution (CIRED), Rome, Italy, 2023.
Abstract | Links | BibTeX | Tags: RT
@inproceedings{23:schoenborn:vipac,
title = {Real-Time Performance of Virtualised Protection and Control Software},
author = {Sandro Schönborn and Robert Birke and David Kozhaya and Thanikesavan Sivanthi},
url = {https://iris.unito.it/retrieve/eb610327-6e38-4f5e-8673-e62f2d956821/10702-Scho%cc%88nborn.pdf},
doi = {10.1049/icp.2023.1028},
year = {2023},
date = {2023-06-01},
booktitle = {27th International Conference on Electricity Distribution (CIRED)},
address = {Rome, Italy},
abstract = {Substation automation is ever challenged by the integration of distributed energy resources which imposes higher deployment flexibility and adaptability for protection and control. Although virtualization helps to run software applications independent of the underlying platform in IT infrastructures and cloud computing, it is still not commonly used in the field of substation automation. This is mainly due to the real-time performance demands of substation automation protection and control applications. In this article, we present an approach for running substation automation protection and control software in virtual environments. We contrast the real-time performance of different virtualization technologies under different workloads and focus on the performance evaluation of protection and control software in container-based solutions running on Linux with PREEMPT RT. We also present additional results for performance achieved in virtual machines. Our results clearly demonstrate that it is possible to run substation automation protection and control software in virtual environments while still providing the necessary performance. This paves the way for the deployment of substation protection and control software in virtualisation environments.},
keywords = {RT},
pubstate = {published},
tppubtype = {inproceedings}
}
Jesus Carretero, Javier Garcia-Blas, Marco Aldinucci, Jean Baptiste Besnard, Jean-Thomas Acquaviva, André Brinkmann, Marc-André Vef, Emmanuel Jeannot, Alberto Miranda, Ramon Nou, Morris Riedel, Massimo Torquati, Felix Wolf
Adaptive multi-tier intelligent data manager for Exascale Proceedings Article
In: 20th ACM International Conference on Computing Frontiers (CF '23), ACM, Bologna, Italy, 2023.
Abstract | Links | BibTeX | Tags: admire
@inproceedings{23:admire:cf,
  title     = {Adaptive multi-tier intelligent data manager for Exascale},
  author    = {Jesus Carretero and Javier Garcia-Blas and Marco Aldinucci and Jean Baptiste Besnard and Jean-Thomas Acquaviva and André Brinkmann and Marc-André Vef and Emmanuel Jeannot and Alberto Miranda and Ramon Nou and Morris Riedel and Massimo Torquati and Felix Wolf},
  url       = {https://dl.acm.org/doi/pdf/10.1145/3587135.3592174},
  doi       = {10.1145/3587135.3592174},
  year      = {2023},
  date      = {2023-05-01},
  booktitle = {20th ACM International Conference on Computing Frontiers (CF '23)},
  publisher = {ACM},
  address   = {Bologna, Italy},
  abstract  = {The main objective of the ADMIRE project is the creation of an active I/O stack that dynamically adjusts computation and storage requirements through intelligent global coordination, the elasticity of computation and I/O, and the scheduling of storage resources along all levels of the storage hierarchy, while offering quality-of-service (QoS), energy efficiency, and resilience for accessing extremely large data sets in very heterogeneous computing and storage environments. We have developed a framework prototype that is able to dynamically adjust computation and storage requirements through intelligent global coordination, separated control, and data paths, the malleability of computation and I/O, the scheduling of storage resources along all levels of the storage hierarchy, and scalable monitoring techniques. The leading idea in ADMIRE is to co-design applications with ad-hoc storage systems that can be deployed with the application and adapt their computing and I/O behaviour on runtime, using malleability techniques, to increase the performance of applications and the throughput of the applications.},
  keywords  = {admire},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Gianluca Mittone, Nicolò Tonci, Robert Birke, Iacopo Colonnelli, Doriana Medić, Andrea Bartolini, Roberto Esposito, Emanuele Parisi, Francesco Beneventi, Mirko Polato, Massimo Torquati, Luca Benini, Marco Aldinucci
Experimenting with Emerging RISC-V Systems for Decentralised Machine Learning Proceedings Article
In: 20th ACM International Conference on Computing Frontiers (CF '23), ACM, Bologna, Italy, 2023, ISBN: 979-8-4007-0140-5/23/05, (https://arxiv.org/abs/2302.07946).
Abstract | Links | BibTeX | Tags: ai, confidential, eupilot, HPC, icsc, riscv
@inproceedings{23:mittone:fl-riscv,
  title       = {Experimenting with Emerging {RISC-V} Systems for Decentralised Machine Learning},
  author      = {Gianluca Mittone and Nicolò Tonci and Robert Birke and Iacopo Colonnelli and Doriana Medić and Andrea Bartolini and Roberto Esposito and Emanuele Parisi and Francesco Beneventi and Mirko Polato and Massimo Torquati and Luca Benini and Marco Aldinucci},
  url         = {https://dl.acm.org/doi/pdf/10.1145/3587135.3592211},
  doi         = {10.1145/3587135.3592211},
  isbn        = {979-8-4007-0140-5},
  eprint      = {2302.07946},
  eprinttype  = {arXiv},
  year        = {2023},
  date        = {2023-05-01},
  booktitle   = {20th ACM International Conference on Computing Frontiers (CF '23)},
  publisher   = {ACM},
  address     = {Bologna, Italy},
  institution = {Computer Science Department, University of Torino},
  abstract    = {Decentralised Machine Learning (DML) enables collaborative machine learning without centralised input data. Federated Learning (FL) and Edge Inference are examples of DML. While tools for DML (especially FL) are starting to flourish, many are not flexible and portable enough to experiment with novel systems (e.g., RISC-V), non-fully connected topologies, and asynchronous collaboration schemes. We overcome these limitations via a domain-specific language allowing to map DML schemes to an underlying middleware, i.e. the FastFlow parallel programming library. We experiment with it by generating different working DML schemes on two emerging architectures (ARM-v8, RISC-V) and the x86-64 platform. We characterise the performance and energy efficiency of the presented schemes and systems. As a byproduct, we introduce a RISC-V porting of the PyTorch framework, the first publicly available to our knowledge.},
  keywords    = {ai, confidential, eupilot, HPC, icsc, riscv},
  pubstate    = {published},
  tppubtype   = {inproceedings}
}
Gianluca Mittone, Filip Svoboda, Marco Aldinucci, Nicholas D. Lane, Pietro Lio
A Federated Learning Benchmark for Drug-Target Interaction Proceedings Article
In: Companion Proceedings of the ACM Web Conference 2023 (WWW '23 Companion), ACM, Austin, Texas, 2023, ISBN: 978-1-4503-9419-2/23/04, (https://arxiv.org/abs/2302.07684).
Abstract | Links | BibTeX | Tags: ai, confidential, eupilot, icsc
@inproceedings{23:mittone:dti,
  title       = {A Federated Learning Benchmark for Drug-Target Interaction},
  author      = {Gianluca Mittone and Filip Svoboda and Marco Aldinucci and Nicholas D. Lane and Pietro Lio},
  url         = {https://hdl.handle.net/2318/1898472},
  doi         = {10.1145/3543873.3587687},
  isbn        = {978-1-4503-9419-2},
  eprint      = {2302.07684},
  eprinttype  = {arXiv},
  year        = {2023},
  date        = {2023-04-01},
  booktitle   = {Companion Proceedings of the ACM Web Conference 2023 (WWW '23 Companion)},
  publisher   = {ACM},
  address     = {Austin, Texas},
  institution = {Computer Science Department, University of Torino},
  abstract    = {Aggregating pharmaceutical data in the drug-target interaction (DTI) domain has the potential to deliver life-saving breakthroughs. It is, however, notoriously difficult due to regulatory constraints and commercial interests. This work proposes the application of federated learning, which we argue to be reconcilable with the industry's constraints, as it does not require sharing of any information that would reveal the entities' data or any other high-level summary of it. When used on a representative GraphDTA model and the KIBA dataset it achieves up to 15 percent improved performance relative to the best available non-privacy preserving alternative. Our extensive battery of experiments shows that, unlike in other domains, the non-IID data distribution in the DTI datasets does not deteriorate FL performance. Additionally, we identify a material trade-off between the benefits of adding new data, and the cost of adding more clients.},
  keywords    = {ai, confidential, eupilot, icsc},
  pubstate    = {published},
  tppubtype   = {inproceedings}
}
Adriano Marques Garcia, Dalvan Griebler, Claudio Schepke, André Sacilotto Santos, José Daniel García, Javier Fernández Muñoz, Luiz Gustavo Fernandes
A Latency, Throughput, and Programmability Perspective of GrPPI for Streaming on Multi-cores Proceedings Article
In: 31st Euromicro International Conference on Parallel, Distributed and Network-Based Processing (PDP), pp. 164-168, IEEE, Naples, Italy, 2023.
Abstract | Links | BibTeX | Tags: admire
@inproceedings{GARCIA:PDP:23,
  title     = {A Latency, Throughput, and Programmability Perspective of {GrPPI} for Streaming on Multi-cores},
  author    = {Adriano Marques Garcia and Dalvan Griebler and Claudio Schepke and André Sacilotto Santos and José Daniel García and Javier Fernández Muñoz and Luiz Gustavo Fernandes},
  url       = {https://iris.unito.it/retrieve/9165d2ef-7140-4645-87cc-269050341c1d/PDP_2023_SPbench_with_GrPPI.pdf},
  doi       = {10.1109/PDP59025.2023.00033},
  year      = {2023},
  date      = {2023-03-01},
  booktitle = {31st Euromicro International Conference on Parallel, Distributed and Network-Based Processing (PDP)},
  pages     = {164--168},
  publisher = {IEEE},
  address   = {Naples, Italy},
  series    = {PDP'23},
  abstract  = {Several solutions aim to simplify the burdening task of parallel programming. The GrPPI library is one of them. It allows users to implement parallel code for multiple backends through a unified, abstract, and generic layer while promising minimal overhead on performance. An outspread evaluation of GrPPI regarding stream parallelism with representative metrics for this domain, such as throughput and latency, was not yet done. In this work, we evaluate GrPPI focused on stream processing. We evaluate performance, memory usage, and programming effort and compare them against handwritten parallel code. For this, we use the benchmarking framework SPBench to build custom GrPPI benchmarks. The basis of the benchmarks is real applications, such as Lane Detection, Bzip2, Face Recognizer, and Ferret. Experiments show that while performance is competitive with handwritten code in some cases, in other cases, the infeasibility of fine-tuning GrPPI is a crucial drawback. Despite this, programmability experiments estimate that GrPPI has the potential to reduce by about three times the development time of parallel applications.},
  keywords  = {admire},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Alberto Mulone, Sherine Awad, Davide Chiarugi, Marco Aldinucci
Porting the Variant Calling Pipeline for NGS data in cloud-HPC environment Proceedings Article
In: Shahriar, Hossain, Teranishi, Yuuichi, Cuzzocrea, Alfredo, Sharmin, Moushumi, Towey, Dave, Majumder, A. K. M. Jahangir Alam, Kashiwazaki, Hiroki, Yang, Ji-Jiang, Takemoto, Michiharu, Sakib, Nazmus, Banno, Ryohei, Ahamed, Sheikh Iqbal (Ed.): 47th IEEE Annual Computers, Software, and Applications Conference, COMPSAC 2023, pp. 1858–1863, IEEE, Torino, Italy, 2023.
Abstract | Links | BibTeX | Tags: across, icsc, streamflow
@inproceedings{23:mulone:wide:vcp,
  title     = {Porting the Variant Calling Pipeline for {NGS} data in {cloud-HPC} environment},
  author    = {Alberto Mulone and Sherine Awad and Davide Chiarugi and Marco Aldinucci},
  editor    = {Hossain Shahriar and Yuuichi Teranishi and Alfredo Cuzzocrea and Moushumi Sharmin and Dave Towey and A. K. M. Jahangir Alam Majumder and Hiroki Kashiwazaki and Ji-Jiang Yang and Michiharu Takemoto and Nazmus Sakib and Ryohei Banno and Sheikh Iqbal Ahamed},
  url       = {https://iris.unito.it/bitstream/2318/1919364/1/paper.pdf},
  doi       = {10.1109/COMPSAC57700.2023.00288},
  year      = {2023},
  date      = {2023-01-01},
  booktitle = {47th IEEE Annual Computers, Software, and Applications Conference, COMPSAC 2023},
  pages     = {1858--1863},
  publisher = {IEEE},
  address   = {Torino, Italy},
  abstract  = {In recent years we have understood the importance of analyzing and sequencing human genetic variation. A relevant aspect that emerged from the Covid-19 pandemic was the need to obtain results very quickly; this involved using High-Performance Computing (HPC) environments to execute the Next Generation Sequencing (NGS) pipeline. However, HPC is not always the most suitable environment for the entire execution of a pipeline, especially when it involves many heterogeneous tools. The ability to execute parts of the pipeline on different environments can lead to higher performance but also cheaper executions. This work shows the design and optimization process that led us to a state-of-the-art Variant Calling hybrid workflow based on the StreamFlow Workflow Management System (WfMS). We also compare StreamFlow with Snakemake, an established WfMS targeting HPC facilities, observing comparable performance on single environments and satisfactory improvements with a hybrid cloud-HPC configuration.},
  keywords  = {across, icsc, streamflow},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Iacopo Colonnelli, Bruno Casella, Gianluca Mittone, Yasir Arfat, Barbara Cantalupo, Roberto Esposito, Alberto Riccardo Martinelli, Doriana Medić, Marco Aldinucci
Federated Learning meets HPC and cloud Proceedings Article
In: Bufano, Filomena, Riggi, Simone, Sciacca, Eva, Schillirò, Francesco (Ed.): Astrophysics and Space Science Proceedings, pp. 193–199, Springer, Catania, Italy, 2023, ISBN: 978-3-031-34167-0, (Keynote talk).
Abstract | Links | BibTeX | Tags: across, eupilot, streamflow
@inproceedings{22:ml4astro,
  title     = {Federated Learning meets {HPC} and cloud},
  author    = {Iacopo Colonnelli and Bruno Casella and Gianluca Mittone and Yasir Arfat and Barbara Cantalupo and Roberto Esposito and Alberto Riccardo Martinelli and Doriana Medić and Marco Aldinucci},
  editor    = {Filomena Bufano and Simone Riggi and Eva Sciacca and Francesco Schillirò},
  url       = {https://iris.unito.it/retrieve/3ac66baa-9d9a-4e9f-94a5-13700694d8aa/ML4Astro.pdf},
  doi       = {10.1007/978-3-031-34167-0_39},
  isbn      = {978-3-031-34167-0},
  year      = {2023},
  date      = {2023-01-01},
  booktitle = {Machine Learning for Astrophysics (ML4ASTRO)},
  series    = {Astrophysics and Space Science Proceedings},
  volume    = {60},
  pages     = {193--199},
  publisher = {Springer},
  address   = {Catania, Italy},
  abstract  = {HPC and AI are fated to meet for several reasons. This article will discuss some of them and argue why this will happen through the set of methods and technologies that underpin cloud computing. As a paradigmatic example, we present a new federated learning system that collaboratively trains a deep learning model in different supercomputing centers. The system is based on the StreamFlow workflow manager designed for hybrid cloud-HPC infrastructures.},
  note      = {Keynote talk},
  keywords  = {across, eupilot, streamflow},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Alessia Antelmi, Luca La Cava, Arianna Pera
Tell Me Who You Are and I Will Predict Your Vulnerability to Political Persuasion Techniques Proceedings Article
In: The 12th International Conference on Complex Networks and their Applications-Book of Abstracts, 2023.
Abstract | Links | BibTeX | Tags: analytics, icsc
@inproceedings{Antelmi_CNA1_2023,
  title     = {Tell Me Who You Are and I Will Predict Your Vulnerability to Political Persuasion Techniques},
  author    = {Alessia Antelmi and Luca {La Cava} and Arianna Pera},
  url       = {https://iris.unito.it/bitstream/2318/1949370/1/_CNA__23__Personality_vs_propaganda.pdf},
  year      = {2023},
  date      = {2023-01-01},
  booktitle = {The 12th International Conference on Complex Networks and their Applications-Book of Abstracts},
  abstract  = {Given the evolving role of social media in political communication and the strategic use of these platforms by politicians to shape public opinion, research has commonly focused on investigating computational propaganda as a means for automated information diffusion. Focusing on a less explored yet promising line, we aim to assess political persuasion in digital contexts by introducing a computational framework that combines Natural Language Processing and Network Science methods to investigate the linkage between persuasion techniques on social media and personality traits of online political audiences. Our final goal is to enhance public awareness of political tactics and encourage critical thinking in response to the online spread of political information.},
  keywords  = {analytics, icsc},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Alessia Antelmi, Luca La Cava, Arianna Pera
Finding Hidden Swingers in the 2022 Italian Elections Twitter Discourse Proceedings Article
In: The 12th International Conference on Complex Networks and their Applications-Book of Abstracts, 2023.
Abstract | Links | BibTeX | Tags: analytics, icsc
@inproceedings{Antelmi_CNA_2023,
  title     = {Finding Hidden Swingers in the 2022 {Italian} Elections {Twitter} Discourse},
  author    = {Alessia Antelmi and Luca {La Cava} and Arianna Pera},
  url       = {https://iris.unito.it/bitstream/2318/1949354/1/_CNA__23__TweetYourMind.pdf},
  year      = {2023},
  date      = {2023-01-01},
  booktitle = {The 12th International Conference on Complex Networks and their Applications-Book of Abstracts},
  abstract  = {The volume of the Italian online political discourse on social media has recently increased, but the coverage level does not compare with other Countries such as the US. Nonetheless, researchers focused on studying polarization and homophily with respect to political debates or investigating the role of populism in online engagement. In this research landscape, the analysis of political preference shifts through social media remains to be explored. We aim to bridge this gap by examining the Twitter discourse during the 2022 Italian general elections, with a specific emphasis on political "swingers". In particular, our findings indicate a stable political discourse in Italy, yet they also uncover a growing presence of political swingers willing to shift their support to significantly different factions.},
  keywords  = {analytics, icsc},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Alessia Antelmi, Massimo Torquati, Daniele Gregori, Francesco Polzella, Gianmarco Spinatelli, Marco Aldinucci
The SWH-Analytics Framework Proceedings Article
In: Bena, Nicola, Di Martino, Beniamino, Maratea, Antonio, Sperduti, Alessandro, Di Nardo, Emanuel, Ciaramella, Angelo, Montella, Raffaele, Ardagna, Claudio A. (Ed.): Proceedings of the 2nd Italian Conference on Big Data and Data Science (ITADATA 2023), Naples, Italy, September 11-13, 2023, CEUR-WS.org, 2023.
Abstract | Links | BibTeX | Tags: admire, analytics, icsc
@inproceedings{Antelmi_ITADATA_2023,
  title     = {The {SWH-Analytics} Framework},
  author    = {Alessia Antelmi and Massimo Torquati and Daniele Gregori and Francesco Polzella and Gianmarco Spinatelli and Marco Aldinucci},
  editor    = {Nicola Bena and Beniamino {Di Martino} and Antonio Maratea and Alessandro Sperduti and Emanuel {Di Nardo} and Angelo Ciaramella and Raffaele Montella and Claudio A. Ardagna},
  url       = {https://ceur-ws.org/Vol-3606/paper76.pdf},
  year      = {2023},
  date      = {2023-01-01},
  booktitle = {Proceedings of the 2nd Italian Conference on Big Data and Data Science (ITADATA 2023), Naples, Italy, September 11-13, 2023},
  volume    = {3606},
  publisher = {CEUR-WS.org},
  series    = {CEUR Workshop Proceedings},
  abstract  = {The Software Heritage (SWH) dataset serves as a vast repository for open-source code, with the ambitious goal of preserving all publicly available open-source projects. Despite being designed to effectively archive project files, its size of nearly 1 petabyte presents challenges in efficiently supporting Big Data MapReduce or AI systems. To address this disparity and enable seamless custom analytics on the SWH dataset, we present the SWH-Analytics (SWHA) architecture. This development environment quickly and transparently runs custom analytic applications on open-source software data preserved over time by SWH.},
  keywords  = {admire, analytics, icsc},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Iacopo Colonnelli
Workflow Models for Heterogeneous Distributed Systems Proceedings Article
In: Bena, Nicola, Di Martino, Beniamino, Maratea, Antonio, Sperduti, Alessandro, Di Nardo, Emanuel, Ciaramella, Angelo, Montella, Raffaele, Ardagna, Claudio A. (Ed.): Proceedings of the 2nd Italian Conference on Big Data and Data Science (ITADATA 2023), Naples, Italy, September 11-13, 2023, CEUR-WS.org, 2023.
Abstract | Links | BibTeX | Tags: across, eupex, icsc, jupyter-workflow, streamflow
@inproceedings{23:colonnelli:itadata,
  title     = {Workflow Models for Heterogeneous Distributed Systems},
  author    = {Iacopo Colonnelli},
  editor    = {Nicola Bena and Beniamino {Di Martino} and Antonio Maratea and Alessandro Sperduti and Emanuel {Di Nardo} and Angelo Ciaramella and Raffaele Montella and Claudio A. Ardagna},
  url       = {https://ceur-ws.org/Vol-3606/invited77.pdf},
  year      = {2023},
  date      = {2023-01-01},
  booktitle = {Proceedings of the 2nd Italian Conference on Big Data and Data Science (ITADATA 2023), Naples, Italy, September 11-13, 2023},
  volume    = {3606},
  publisher = {CEUR-WS.org},
  series    = {CEUR Workshop Proceedings},
  abstract  = {This article introduces a novel hybrid workflow abstraction that injects topology awareness directly into the definition of a distributed workflow model. In particular, the article briefly discusses the advantages brought by this approach to the design and orchestration of large-scale data-oriented workflows, the current level of support from state-of-the-art workflow systems, and some future research directions.},
  keywords  = {across, eupex, icsc, jupyter-workflow, streamflow},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Bruno Casella, Lorenzo Paletto
Predicting Cryptocurrencies Market Phases through On-Chain Data Long-Term Forecasting Proceedings Article
In: Proceedings of the 2023 IEEE International Conference on Blockchain and Cryptocurrency (ICBC), 1-5 May 2023, Dubai, 2023, (https://ieeexplore.ieee.org/document/10174989).
Abstract | Links | BibTeX | Tags: epi, icsc
@inproceedings{23:casella:onchain,
  title     = {Predicting Cryptocurrencies Market Phases through On-Chain Data Long-Term Forecasting},
  author    = {Bruno Casella and Lorenzo Paletto},
  url       = {https://iris.unito.it/bitstream/2318/1902652/1/6.%20ICBC23%20-%20PREDICTING%20BTC.pdf},
  doi       = {10.1109/ICBC56567.2023.10174989},
  year      = {2023},
  date      = {2023-01-01},
  booktitle = {Proceedings of the 2023 IEEE International Conference on Blockchain and Cryptocurrency (ICBC), 1-5 May 2023, Dubai},
  abstract  = {Blockchain, the underlying technology of Bitcoin and several other cryptocurrencies, like Ethereum, produces a massive amount of open-access data that can be analyzed, providing important information about the network's activity and its respective token. The on-chain data have extensively been used as input to Machine Learning algorithms for predicting cryptocurrencies' future prices; however, there is a lack of study in predicting the future behaviour of on-chain data. This study aims to show how on-chain data can be used to detect cryptocurrency market regimes, like minimum and maximum, bear and bull market phases, and how forecasting these data can provide an optimal asset allocation for long-term investors.},
  keywords  = {epi, icsc},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Bruno Casella, Samuele Fonio
Architecture-Based FedAvg for Vertical Federated Learning Proceedings Article
In: Proceedings of the 3rd Workshop on Distributed Machine Learning for the Intelligent Computing Continuum (DML-ICC), IEEE/ACM UCC 2023, Taormina, Italy, 4 December 2023, 2023, (https://iris.unito.it/bitstream/2318/1949730/1/HALF_HVL_for_DML_ICC23___Taormina-2.pdf).
Abstract | Links | BibTeX | Tags: ai, epi, icsc
@inproceedings{23:casella:architecturalfedavg,
  title     = {Architecture-Based {FedAvg} for Vertical Federated Learning},
  author    = {Bruno Casella and Samuele Fonio},
  url       = {https://iris.unito.it/retrieve/173d9960-8531-419d-9bd5-5acce6694c4e/Aggregation%20Based%20VFL.pdf},
  doi       = {10.1145/3603166.3632559},
  year      = {2023},
  date      = {2023-01-01},
  booktitle = {Proceedings of the 3rd Workshop on Distributed Machine Learning for the Intelligent Computing Continuum (DML-ICC), IEEE/ACM UCC 2023, Taormina, Italy, 4 December 2023},
  abstract  = {Federated Learning (FL) has emerged as a promising solution to address privacy concerns by collaboratively training Deep Learning (DL) models across distributed parties. This work proposes an architecture-based aggregation strategy in Vertical FL, where parties hold data with different attributes but shared instances. Our approach leverages the identical architectural parts, i.e. neural network layers, of different models to selectively aggregate weights, which is particularly relevant when collaborating with institutions holding different types of datasets, i.e., image, text, or tabular datasets. In a scenario where two entities train DL models, such as a Convolutional Neural Network (CNN) and a Multi-Layer Perceptron (MLP), our strategy computes the average only for architecturally identical segments. This preserves data-specific features learned from demographic and clinical data. We tested our approach on two clinical datasets, i.e., the COVID-CXR dataset and the ADNI study. Results show that our method achieves comparable results with the centralized scenario, in which all the data are collected in a single data lake, and benefits from FL generalizability. In particular, compared to the non-federated models, our proposed proof-of-concept model exhibits a slight performance loss on the COVID-CXR dataset (less than 8%), but outperforms ADNI models by up to 12%. Moreover, communication costs between training rounds are minimized by exchanging only the dense layer parameters.},
  note      = {https://iris.unito.it/bitstream/2318/1949730/1/HALF_HVL_for_DML_ICC23___Taormina-2.pdf},
  keywords  = {ai, epi, icsc},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Matteo Pennisi, Federica Proietto Salanitri, Giovanni Bellitto, Bruno Casella, Marco Aldinucci, Simone Palazzo, Concetto Spampinato
Experience Replay as an Effective Strategy for Optimizing Decentralized Federated Learning Proceedings Article
In: Proceedings of the 1st Workshop on Visual Continual Learning, ICCV 2023, Paris, France, 2 October 2023, 2023, (https://ieeexplore.ieee.org/document/10350429).
Abstract | Links | BibTeX | Tags: ai
@inproceedings{23:casella:ERGANs,
  title     = {Experience Replay as an Effective Strategy for Optimizing Decentralized Federated Learning},
  author    = {Matteo Pennisi and Federica {Proietto Salanitri} and Giovanni Bellitto and Bruno Casella and Marco Aldinucci and Simone Palazzo and Concetto Spampinato},
  url       = {https://openaccess.thecvf.com/content/ICCV2023W/VCL/papers/Pennisi_Experience_Replay_as_an_Effective_Strategy_for_Optimizing_Decentralized_Federated_ICCVW_2023_paper.pdf},
  doi       = {10.1109/ICCVW60793.2023.00362},
  year      = {2023},
  date      = {2023-01-01},
  booktitle = {Proceedings of the 1st Workshop on Visual Continual Learning, ICCV 2023, Paris, France, 2 October 2023},
  abstract  = {Federated and continual learning are training paradigms addressing data distribution shift in space and time. More specifically, federated learning tackles non-i.i.d data in space as information is distributed in multiple nodes, while continual learning faces with temporal aspect of training as it deals with continuous streams of data. Distribution shifts over space and time is what it happens in real federated learning scenarios that show multiple challenges. First, the federated model needs to learn sequentially while retaining knowledge from the past training rounds. Second, the model has also to deal with concept drift from the distributed data distributions. To address these complexities, we attempt to combine continual and federated learning strategies by proposing a solution inspired by experience replay and generative adversarial concepts for supporting decentralized distributed training. In particular, our approach relies on using limited memory buffers of synthetic privacy-preserving samples and interleaving training on local data and on buffer data. By translating the CL formulation into the task of integrating distributed knowledge with local knowledge, our method enables models to effectively integrate learned representation from local nodes, providing models the capability to generalize across multiple datasets. We test our integrated strategy on two realistic medical image analysis tasks — tuberculosis and melanoma classification — using multiple datasets in order to simulate realistic non-i.i.d. medical data scenarios. Results show that our approach achieves performance comparable to standard (non-federated) learning and significantly outperforms state-of-the-art federated methods in their centralized (thus, more favourable) formulation.},
  note      = {https://ieeexplore.ieee.org/document/10350429},
  keywords  = {ai},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Giorgio Audrito, Alberto Riccardo Martinelli, Gianluca Torta
Parallelising an Aggregate Programming Framework with Message-Passing Interface Proceedings Article
In: 2023 IEEE International Conference on Autonomic Computing and Self-Organizing Systems Companion (ACSOS-C), pp. 140–145, 2023.
@inproceedings{23:acsos:fcppmpi,
  title     = {Parallelising an Aggregate Programming Framework with Message-Passing Interface},
  author    = {Giorgio Audrito and Alberto Riccardo Martinelli and Gianluca Torta},
  doi       = {10.1109/ACSOS-C58168.2023.00054},
  year      = {2023},
  date      = {2023-01-01},
  booktitle = {2023 IEEE International Conference on Autonomic Computing and Self-Organizing Systems Companion (ACSOS-C)},
  pages     = {140--145},
  publisher = {IEEE},
  keywords  = {HPC},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Matteo Pennisi, Federica Proietto Salanitri, Giovanni Bellitto, Bruno Casella, Marco Aldinucci, Simone Palazzo, Concetto Spampinato
FedER: Federated Learning through Experience Replay and Privacy-Preserving Data Synthesis Journal Article
In: Computer Vision and Image Understanding, vol. 238, pp. 103882, 2023.
Abstract | Links | BibTeX | Tags: ai
@article{23:casella:FedER,
  title       = {{FedER}: Federated Learning through Experience Replay and Privacy-Preserving Data Synthesis},
  author      = {Matteo Pennisi and Federica {Proietto Salanitri} and Giovanni Bellitto and Bruno Casella and Marco Aldinucci and Simone Palazzo and Concetto Spampinato},
  url         = {https://www.sciencedirect.com/science/article/pii/S107731422300262X?via%3Dihub},
  doi         = {10.1016/j.cviu.2023.103882},
  year        = {2023},
  date        = {2023-01-01},
  journal     = {Computer Vision and Image Understanding},
  volume      = {238},
  pages       = {103882},
  institution = {Computer Science Department, University of Torino},
  abstract    = {In the medical field, multi-center collaborations are often sought to yield more generalizable findings by leveraging the heterogeneity of patient and clinical data. However, recent privacy regulations hinder the possibility to share data, and consequently, to come up with machine learning-based solutions that support diagnosis and prognosis. Federated learning (FL) aims at sidestepping this limitation by bringing AI-based solutions to data owners and only sharing local AI models, or parts thereof, that need then to be aggregated. However, most of the existing federated learning solutions are still at their infancy and show several shortcomings, from the lack of a reliable and effective aggregation scheme able to retain the knowledge learned locally to weak privacy preservation as real data may be reconstructed from model updates. Furthermore, the majority of these approaches, especially those dealing with medical data, relies on a centralized distributed learning strategy that poses robustness, scalability and trust issues. In this paper we present a federated and decentralized learning strategy, FedER, that, exploiting experience replay and generative adversarial concepts, effectively integrates features from local nodes, providing models able to generalize across multiple datasets while maintaining privacy. FedER is tested on two tasks — tuberculosis and melanoma classification — using multiple datasets in order to simulate realistic non-i.i.d. medical data scenarios. Results show that our approach achieves performance comparable to standard (non-federated) learning and significantly outperforms state-of-the-art federated methods in their centralized (thus, more favourable) formulation. Code is available at https://github.com/perceivelab/FedER},
  keywords    = {ai},
  pubstate    = {published},
  tppubtype   = {article}
}
Bruno Casella, Walter Riviera, Marco Aldinucci, Gloria Menegaz
MERGE: A model for multi-input biomedical federated learning Journal Article
In: Patterns, pp. 100856, 2023, ISSN: 2666-3899.
Abstract | Links | BibTeX | Tags: ai, epi, icsc
@article{23:fl:patterns,
  title     = {{MERGE}: A model for multi-input biomedical federated learning},
  author    = {Bruno Casella and Walter Riviera and Marco Aldinucci and Gloria Menegaz},
  url       = {https://www.sciencedirect.com/science/article/pii/S2666389923002404},
  doi       = {10.1016/j.patter.2023.100856},
  issn      = {2666-3899},
  year      = {2023},
  date      = {2023-01-01},
  journal   = {Patterns},
  pages     = {100856},
  abstract  = {Driven by the deep learning (DL) revolution, artificial intelligence (AI) has become a fundamental tool for many biomedical tasks, including analyzing and classifying diagnostic images. Imaging, however, is not the only source of information. Tabular data, such as personal and genomic data and blood test results, are routinely collected but rarely considered in DL pipelines. Nevertheless, DL requires large datasets that often must be pooled from different institutions, raising non-trivial privacy concerns. Federated learning (FL) is a cooperative learning paradigm that aims to address these issues by moving models instead of data across different institutions. Here, we present a federated multi-input architecture using images and tabular data as a methodology to enhance model performance while preserving data privacy. We evaluated it on two showcases: the prognosis of COVID-19 and patients' stratification in Alzheimer's disease, providing evidence of enhanced accuracy and F1 scores against single-input models and improved generalizability against non-federated models.},
  keywords  = {ai, epi, icsc},
  pubstate  = {published},
  tppubtype = {article}
}
Javier Garcia-Blas, Genaro Sanchez-Gallegos, Cosmin Petre, Alberto Riccardo Martinelli, Marco Aldinucci, Jesus Carretero
Hercules: Scalable and Network Portable In-Memory Ad-Hoc File System for Data-Centric and High-Performance Applications Proceedings Article
In: Cano, José, Dikaiakos, Marios D., Papadopoulos, George A., Pericàs, Miquel, Sakellariou, Rizos (Ed.): Euro-Par 2023: Parallel Processing, pp. 679–693, Springer Nature Switzerland, Cham, 2023, ISBN: 978-3-031-39698-4.
Abstract | BibTeX | Tags: admire, HPC
@inproceedings{10.1007/978-3-031-39698-4_46,
title = {Hercules: Scalable and Network Portable In-Memory Ad-Hoc File System for Data-Centric and High-Performance Applications},
author = {Javier Garcia-Blas and Genaro Sanchez-Gallegos and Cosmin Petre and Alberto Riccardo Martinelli and Marco Aldinucci and Jesus Carretero},
editor = {José Cano and Marios D. Dikaiakos and George A. Papadopoulos and Miquel Pericàs and Rizos Sakellariou},
doi = {10.1007/978-3-031-39698-4_46},
isbn = {978-3-031-39698-4},
year = {2023},
date = {2023-01-01},
booktitle = {Euro-Par 2023: Parallel Processing},
pages = {679--693},
publisher = {Springer Nature Switzerland},
address = {Cham},
abstract = {The growing demands for data processing by new data-intensive applications are putting pressure on the performance and capacity of HPC storage systems. The advancement in storage technologies, such as NVMe and persistent memory, are aimed at meeting these demands. However, relying solely on ultra-fast storage devices is not cost-effective, leading to the need for multi-tier storage hierarchies to move data based on its usage. To address this issue, ad-hoc file systems have been proposed as a solution. They utilise the available storage of compute nodes, such as memory and persistent storage, to create a temporary file system that adapts to the application behaviour in the HPC environment. This work presents the design, implementation, and evaluation of a distributed ad-hoc in-memory storage system (Hercules), highlighting the new communication model included in Hercules. This communication model takes advantage of the Unified Communication X framework (UCX). This solution leverages the capabilities of RDMA protocols, including Infiniband, Onmipath, shared memory, and zero-copy transfers. The preliminary evaluation results show excellent network utilisation compared with other existing technologies.},
keywords = {admire, HPC},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Mirko Polato, Roberto Esposito
Boosting Methods for Federated Learning Proceedings Article
In: Calvanese, Diego, Diamantini, Claudia, Ferro, Nicola, Marchesin, Stefano, Silvello, Gianmaria, Tanca, Letizia (Ed.): Proc. of the 31st Italian Symposium on Advanced Database Systems, SEBD 2023, pp. 439–448, CEUR-WS.org, 2023.
Abstract | Links | BibTeX | Tags: eupilot
@inproceedings{DBLP:conf/sebd/Esposito23,
title = {Boosting Methods for Federated Learning},
author = {Marco Aldinucci and Mirko Polato and Roberto Esposito},
editor = {Diego Calvanese and Claudia Diamantini and Nicola Ferro and Stefano Marchesin and Gianmaria Silvello and Letizia Tanca},
url = {https://ceur-ws.org/Vol-3478/paper48.pdf},
year = {2023},
date = {2023-01-01},
booktitle = {Proc. of the 31st Italian Symposium on Advanced Database Systems, SEBD 2023},
volume = {3478},
pages = {439--448},
publisher = {CEUR-WS.org},
series = {CEUR Workshop Proceedings},
abstract = {Federated Learning (FL) has been proposed to develop better AI systems without compromising the privacy of final users and the legitimate interests of private companies. Initially deployed by Google to predict text input on mobile devices, FL has been deployed in many other industries. Since its introduction, Federated Learning mainly exploited the inner working of neural networks and other gradient descent-based algorithms by either exchanging the weights of the model or the gradients computed during learning. While this approach has been very successful, it rules out applying FL in contexts where other models are preferred, e.g., easier to interpret or known to work better. This paper proposes to leverage distributed versions of the AdaBoost algorithm to acquire strong federated models. In contrast with previous approaches, our proposal does not put any constraint on the client-side learning models and does not rely on inner workings of the learning algorithms used in the clients. We perform a large set of experiments on ten UCI datasets, comparing the algorithms in six non-iidness settings. Results show that the approach is effective, in the case of an IID setting, results are often near to the theoretical optimum (i.e., the performances of AdaBoost on the complete dataset). In case of non-IID settings, results very much depend on the severity of the non-IIDness.},
keywords = {eupilot},
pubstate = {published},
tppubtype = {inproceedings}
}
Pedro Ângelo, Viviana Bono, Mariangiola Dezani-Ciancaglini, Mário Florido
Gradual Guarantee for FJ with lambda-Expressions Proceedings Article
In: Tomb, Aaron (Ed.): Proceedings of the 25th ACM International Workshop on Formal Techniques for Java-like Programs, FTfJP 2023, Seattle, WA, USA, 18 July 2023, pp. 32–38, ACM, 2023.
Links | BibTeX | Tags: admire, icsc
@inproceedings{DBLP:conf/ftfjp/AngeloBDF23,
title = {Gradual Guarantee for {FJ} with lambda-Expressions},
author = {Pedro Ângelo and Viviana Bono and Mariangiola Dezani-Ciancaglini and Mário Florido},
editor = {Aaron Tomb},
url = {https://doi.org/10.1145/3605156.3606453},
doi = {10.1145/3605156.3606453},
year = {2023},
date = {2023-01-01},
booktitle = {Proceedings of the 25th ACM International Workshop on Formal Techniques for Java-like Programs, FTfJP 2023, Seattle, WA, USA, 18 July 2023},
pages = {32--38},
publisher = {ACM},
keywords = {admire, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
William Fornaciari, Federico Reghenzani, Federico Terraneo, Davide Baroffio, Cecilia Metra, Martin Omana, Josie E. Rodriguez Condia, Matteo Sonza Reorda, Robert Birke, Iacopo Colonnelli, Gianluca Mittone, Marco Aldinucci, Gabriele Mencagli, Francesco Iannone, Filippo Palombi, Giuseppe Zummo, Daniele Cesarini, Federico Tesser
RISC-V-based Platforms for HPC: Analyzing Non-functional Properties for Future HPC and Big-Data Clusters Proceedings Article
In: Embedded Computer Systems: Architectures, Modeling, and Simulation - 23rd International Conference, SAMOS 2023, Samos, Greece, 2023, (icsc).
Abstract | Links | BibTeX | Tags: icsc, riscv
@inproceedings{23:SAMOS,
title = {{RISC-V}-based Platforms for {HPC}: Analyzing Non-functional Properties for Future {HPC} and Big-Data Clusters},
author = {William Fornaciari and Federico Reghenzani and Federico Terraneo and Davide Baroffio and Cecilia Metra and Martin Omana and Josie E. Rodriguez Condia and Matteo Sonza Reorda and Robert Birke and Iacopo Colonnelli and Gianluca Mittone and Marco Aldinucci and Gabriele Mencagli and Francesco Iannone and Filippo Palombi and Giuseppe Zummo and Daniele Cesarini and Federico Tesser},
url = {https://iris.unito.it/retrieve/b627eab0-3aa1-4fd7-8685-f47c62c792b3/SAMOS_2023_CN_HPC_FL1.pdf},
doi = {10.1007/978-3-031-46077-7_26},
year = {2023},
date = {2023-01-01},
booktitle = {Embedded Computer Systems: Architectures, Modeling, and Simulation - 23rd International Conference, SAMOS 2023},
address = {Samos, Greece},
abstract = {High-Performance Computing (HPC) have evolved to be used to perform simulations of systems where physical experimentation is prohibitively impractical, expensive, or dangerous. This paper provides a general overview and showcases the analysis of non-functional properties in RISC-V-based platforms for HPCs. In particular, our analyses target the evaluation of power and energy control, thermal management, and reliability assessment of promising systems, structures, and technologies devised for current and future generation of HPC machines. The main set of design methodologies and technologies developed within the activities of the Future and HPC & Big Data spoke of the National Centre of HPC, Big Data and Quantum Computing project are described along with the description of the testbed for experimenting two-phase cooling approaches.},
note = {icsc},
keywords = {icsc, riscv},
pubstate = {published},
tppubtype = {inproceedings}
}
Alessia Antelmi, Daniele De Vinco, Gennaro Cordasco, Carmine Spagnuolo
Towards Unraveling Developers Communities in Stack Overflow and Reddit Proceedings Article
In: International Conference on Computational Social Science 2023, 2023.
Abstract | Links | BibTeX | Tags: analytics, icsc
@inproceedings{Antelmi_IC2S2_2023,
title = {Towards Unraveling Developers Communities in {Stack Overflow} and {Reddit}},
author = {Alessia Antelmi and Daniele De Vinco and Gennaro Cordasco and Carmine Spagnuolo},
url = {https://openreview.net/forum?id=WP5ZaAFP19},
year = {2023},
date = {2023-01-01},
booktitle = {International Conference on Computational Social Science 2023},
abstract = {This work investigates the developers' behavior and community formation around the twenty most popular programming languages. We examined two consecutive years of programming-related questions from Stack Overflow and Reddit, performing a longitudinal study on users' posting activity and their high-order interaction patterns abstracted via hypergraphs. Our analysis highlighted crucial differences in how these QA platforms are utilized by their users. In line with previous literature, it emphasized the constant decline of Stack Overflow in favor of more community-friendly platforms, such as Reddit, which has been growing rapidly lately.},
keywords = {analytics, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Alessia Antelmi
Engagement in Open Data Workshops: The dark side of remote settings Proceedings Article
In: Methodologies and Intelligent Systems for Technology Enhanced Learning, 12th International Conference, Springer International Publishing, Cham, 2023.
Abstract | Links | BibTeX | Tags: analytics, icsc
@inproceedings{Antelmi_TEL4FC_2023,
title = {Engagement in Open Data Workshops: The dark side of remote settings},
author = {Alessia Antelmi},
url = {https://link.springer.com/chapter/10.1007/978-3-031-42134-1_33},
doi = {10.1007/978-3-031-42134-1_33},
year = {2023},
date = {2023-01-01},
booktitle = {Methodologies and Intelligent Systems for Technology Enhanced Learning, 12th International Conference},
publisher = {Springer International Publishing},
address = {Cham},
abstract = {The increasing availability of Open Data gives birth to a fertile field for interested stakeholders to create value out of them; however, limited technical expertise and poor awareness are crucial barriers to their exploitation. Because of these reasons, there is an urge for learners to acquire data and information literacy competencies, which are essential for 21st-century skills, and become familiar with available Open Data sources and their potential uses. To promote the dialogue around activities to boost recognition of Open Data and improve users' skills to work with them, we proposed a series of workshops to introduce Italian high school learners to searching for, authoring, and building effective communication based on Open Data. This article describes an ongoing activity and details its organization, reports preliminary results on learners' engagement, and discusses both challenges of the remote setting as well as promising learning outcomes.},
keywords = {analytics, icsc},
pubstate = {published},
tppubtype = {inproceedings}
}
Doriana Medić, Marco Aldinucci
Towards formal model for location aware workflows Proceedings Article
In: Shahriar, Hossain, Teranishi, Yuuichi, Cuzzocrea, Alfredo, Sharmin, Moushumi, Towey, Dave, Majumder, A. K. M. Jahangir Alam, Kashiwazaki, Hiroki, Yang, Ji-Jiang, Takemoto, Michiharu, Sakib, Nazmus, Banno, Ryohei, Ahamed, Sheikh Iqbal (Ed.): 47th IEEE Annual Computers, Software, and Applications Conference, COMPSAC 2023, pp. 1864–1869, IEEE, Torino, Italy, 2023.
Abstract | Links | BibTeX | Tags: eupex, icsc, semantics
@inproceedings{23:medic:formal-model,
title = {Towards formal model for location aware workflows},
author = {Doriana Medić and Marco Aldinucci},
editor = {Hossain Shahriar and Yuuichi Teranishi and Alfredo Cuzzocrea and Moushumi Sharmin and Dave Towey and A. K. M. Jahangir Alam Majumder and Hiroki Kashiwazaki and Ji-Jiang Yang and Michiharu Takemoto and Nazmus Sakib and Ryohei Banno and Sheikh Iqbal Ahamed},
url = {https://iris.unito.it/retrieve/1f9f959c-cd88-4d9c-90ea-54f1c86a15bc/6210-medic.pdf},
doi = {10.1109/COMPSAC57700.2023.00289},
year = {2023},
date = {2023-01-01},
booktitle = {47th IEEE Annual Computers, Software, and Applications Conference, COMPSAC 2023},
pages = {1864--1869},
publisher = {IEEE},
address = {Torino, Italy},
abstract = {Designing complex applications and executing them on large-scale topologies of heterogeneous architectures is becoming increasingly crucial in many scientific domains. As a result, diverse workflow modelling paradigms are developed, most of them with no formalisation provided. In these circumstances, comparing two different models or switching from one system to the other becomes a hard nut to crack. This paper investigates the capability of process algebra to model a location aware workflow system. Distributed π-calculus is considered as the base of the formal model due to its ability to describe the communicating components that change their structure as an outcome of the communication. Later, it is discussed how the base model could be extended or modified to capture different features of location aware workflow system. The intention of this paper is to highlight the fact that due to its flexibility, π-calculus, could be a good candidate to represent the behavioural perspective of the workflow system.},
keywords = {eupex, icsc, semantics},
pubstate = {published},
tppubtype = {inproceedings}
}
Ovidio Filippo, Francesco Bruno, Tineke H. Pinxterhuis, Mariusz Gasior, Leor Perl, Luca Gaido, Domenico Tuttolomondo, Antonio Greco, Roberto Verardi, Gianluca Lo Martire, Mario Iannaccone, Attilio Leone, Gaetano Liccardo, Serena Caglioni, Rocio González Ferreiro, Giulio Rodinò, Giuseppe Musumeci, Giuseppe Patti, Irene Borzillo, Giuseppe Tarantini, Wojciech Wańha, Bruno Casella, Eline H Ploumen, Lukasz Pyka, Ran Kornowski, Andrea Gagnor, Raffaele Piccolo, Sergio Raposeiras Roubin, Davide Capodanno, Paolo Zocca, Federico Conrotto, Gaetano M De Ferrari, Clemens Birgelen, Fabrizio D'Ascenzo
In: Catheterization and Cardiovascular Interventions, 2023.
Abstract | Links | BibTeX | Tags: ai, cardio
@article{23:casella:ultra,
title = {Predictors of target lesion failure after treatment of left main, bifurcation, or chronic total occlusion lesions with ultrathin-strut drug-eluting coronary stents in the {ULTRA} registry},
author = {Ovidio Filippo and Francesco Bruno and Tineke H. Pinxterhuis and Mariusz Gasior and Leor Perl and Luca Gaido and Domenico Tuttolomondo and Antonio Greco and Roberto Verardi and Gianluca Lo Martire and Mario Iannaccone and Attilio Leone and Gaetano Liccardo and Serena Caglioni and Rocio González Ferreiro and Giulio Rodinò and Giuseppe Musumeci and Giuseppe Patti and Irene Borzillo and Giuseppe Tarantini and Wojciech Wańha and Bruno Casella and Eline H Ploumen and Lukasz Pyka and Ran Kornowski and Andrea Gagnor and Raffaele Piccolo and Sergio Raposeiras Roubin and Davide Capodanno and Paolo Zocca and Federico Conrotto and Gaetano M De Ferrari and Clemens Birgelen and Fabrizio D'Ascenzo},
url = {https://onlinelibrary.wiley.com/doi/full/10.1002/ccd.30696},
doi = {10.1002/ccd.30696},
year = {2023},
date = {2023-01-01},
journal = {Catheterization and Cardiovascular Interventions},
abstract = {Background: Data about the long-term performance of new-generation ultrathin-strut drug-eluting stents (DES) in challenging coronary lesions, such as left main (LM), bifurcation, and chronic total occlusion (CTO) lesions are scant. Methods: The international multicenter retrospective observational ULTRA study included consecutive patients treated from September 2016 to August 2021 with ultrathin-strut (<70µm) DES in challenging de novo lesions. Primary endpoint was target lesion failure (TLF): composite of cardiac death, target-lesion revascularization (TLR), target-vessel myocardial infarction (TVMI), or definite stent thrombosis (ST). Secondary endpoints included all-cause death, acute myocardial infarction (AMI), target vessel revascularization, and TLF components. TLF predictors were assessed with Cox multivariable analysis. Results: Of 1801 patients (age: 66.6$±$11.2 years; male: 1410 [78.3%]), 170 (9.4%) experienced TLF during follow-up of 3.1$±$1.4 years. In patients with LM, CTO, and bifurcation lesions, TLF rates were 13.5%, 9.9%, and 8.9%, respectively. Overall, 160 (8.9%) patients died (74 [4.1%] from cardiac causes). AMI and TVMI rates were 6.0% and 3.2%, respectively. ST occurred in 11 (1.1%) patients while 77 (4.3%) underwent TLR. Multivariable analysis identified the following predictors of TLF: age, STEMI with cardiogenic shock, impaired left ventricular ejection fraction, diabetes, and renal dysfunction. Among the procedural variables, total stent length increased TLF risk (HR: 1.01, 95% CI: 1-1.02 per mm increase), while intracoronary imaging reduced the risk substantially (HR: 0.35, 95% CI: 0.12-0.82). Conclusions: Ultrathin-strut DES showed high efficacy and satisfactory safety, even in patients with challenging coronary lesions. Yet, despite using contemporary gold-standard DES, the association persisted between established patient- and procedure-related features of risk and impaired 3-year clinical outcome.},
keywords = {ai, cardio},
pubstate = {published},
tppubtype = {article}
}
Bruno Casella, Roberto Esposito, Antonio Sciarappa, Carlo Cavazzoni, Marco Aldinucci
Experimenting with Normalization Layers in Federated Learning on non-IID scenarios Technical Report
Computer Science Department, University of Torino 2023.
Abstract | Links | BibTeX | Tags: confidential, epi, icsc
@techreport{23:casella:normalization,
title = {Experimenting with Normalization Layers in Federated Learning on non-{IID} scenarios},
author = {Bruno Casella and Roberto Esposito and Antonio Sciarappa and Carlo Cavazzoni and Marco Aldinucci},
url = {https://arxiv.org/pdf/2303.10630.pdf},
eprint = {2303.10630},
eprinttype = {arXiv},
year = {2023},
date = {2023-01-01},
institution = {Computer Science Department, University of Torino},
abstract = {Training Deep Learning (DL) models require large, high-quality datasets, often assembled with data from different institutions. Federated Learning (FL) has been emerging as a method for privacy-preserving pooling of datasets employing collaborative training from different institutions by iteratively globally aggregating locally trained models. One critical performance challenge of FL is operating on datasets not independently and identically distributed (non-IID) among the federation participants. Even though this fragility cannot be eliminated, it can be debunked by a suitable optimization of two hyperparameters: layer normalization methods and collaboration frequency selection. In this work, we benchmark five different normalization layers for training Neural Networks (NNs), two families of non-IID data skew, and two datasets. Results show that Batch Normalization, widely employed for centralized DL, is not the best choice for FL, whereas Group and Layer Normalization consistently outperform Batch Normalization. Similarly, frequent model aggregation decreases convergence speed and mode quality.},
keywords = {confidential, epi, icsc},
pubstate = {published},
tppubtype = {techreport}
}
Yasir Arfat, Gianluca Mittone, Iacopo Colonnelli, Fabrizio D'Ascenzo, Roberto Esposito, Marco Aldinucci
Pooling critical datasets with Federated Learning Proceedings Article
In: 31st Euromicro International Conference on Parallel, Distributed and Network-Based Processing, PDP 2023, pp. 329–337, IEEE, Napoli, Italy, 2023.
Abstract | Links | BibTeX | Tags: admire, ai, cardio, confidential, hpc4ai
@inproceedings{23:praise-fl:pdp,
title = {Pooling critical datasets with Federated Learning},
author = {Yasir Arfat and Gianluca Mittone and Iacopo Colonnelli and Fabrizio D'Ascenzo and Roberto Esposito and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/491e22ec-3db5-4989-a063-085a199edd20/23_pdp_fl.pdf},
doi = {10.1109/PDP59025.2023.00057},
year = {2023},
date = {2023-01-01},
booktitle = {31st Euromicro International Conference on Parallel, Distributed and Network-Based Processing, PDP 2023},
pages = {329--337},
publisher = {IEEE},
address = {Napoli, Italy},
abstract = {Federated Learning (FL) is becoming popular in different industrial sectors where data access is critical for security, privacy and the economic value of data itself. Unlike traditional machine learning, where all the data must be globally gathered for analysis, FL makes it possible to extract knowledge from data distributed across different organizations that can be coupled with different Machine Learning paradigms. In this work, we replicate, using Federated Learning, the analysis of a pooled dataset (with AdaBoost) that has been used to define the PRAISE score, which is today among the most accurate scores to evaluate the risk of a second acute myocardial infarction. We show that thanks to the extended-OpenFL framework, which implements AdaBoost.F, we can train a federated PRAISE model that exhibits comparable accuracy and recall as the centralised model. We achieved F1 and F2 scores which are consistently comparable to the PRAISE score study of a 16-parties federation but within an order of magnitude less time.},
keywords = {admire, ai, cardio, confidential, hpc4ai},
pubstate = {published},
tppubtype = {inproceedings}
}
Sandro Gepiro Contaldo, Luca Alessandri, Iacopo Colonnelli, Marco Beccuti, Marco Aldinucci
Bringing Cell Subpopulation Discovery on a Cloud-HPC Using rCASC and StreamFlow Book Chapter
In: Calogero, Raffaele Adolfo, Benes, Vladimir (Ed.): Single Cell Transcriptomics: Methods and Protocols, pp. 337–345, Springer US, New York, NY, 2023, ISBN: 978-1-0716-2756-3.
Abstract | Links | BibTeX | Tags: streamflow
@inbook{Contaldo2023,
title = {Bringing Cell Subpopulation Discovery on a {Cloud-HPC} Using {rCASC} and {StreamFlow}},
author = {Sandro Gepiro Contaldo and Luca Alessandri and Iacopo Colonnelli and Marco Beccuti and Marco Aldinucci},
editor = {Raffaele Adolfo Calogero and Vladimir Benes},
url = {https://datacloud.di.unito.it/index.php/s/KMfKo4m7GTGdZmF},
doi = {10.1007/978-1-0716-2756-3_17},
isbn = {978-1-0716-2756-3},
year = {2023},
date = {2023-01-01},
booktitle = {Single Cell Transcriptomics: Methods and Protocols},
pages = {337--345},
publisher = {Springer US},
address = {New York, NY},
abstract = {The idea behind novel single-cell RNA sequencing (scRNA-seq) pipelines is to isolate single cells through microfluidic approaches and generate sequencing libraries in which the transcripts are tagged to track their cell of origin. Modern scRNA-seq platforms are capable of analyzing up to many thousands of cells in each run. Then, combined with massive high-throughput sequencing producing billions of reads, scRNA-seq allows the assessment of fundamental biological properties of cell populations and biological systems at unprecedented resolution.},
keywords = {streamflow},
pubstate = {published},
tppubtype = {inbook}
}
Amirmasoud Ghiassi, Robert Birke, Lydia Chen
Robust Learning via Golden Symmetric Loss of (un)Trusted Labels Proceedings Article
In: SDM '23: SIAM International Conference on Data Mining, pp. 568–576, 2023.
Abstract | Links | BibTeX | Tags: textarossa
@inproceedings{sdm-ghiassi23,
title = {Robust Learning via Golden Symmetric Loss of (un)Trusted Labels},
author = {Amirmasoud Ghiassi and Robert Birke and Lydia Chen},
url = {https://datacloud.di.unito.it/index.php/s/b6z3moNLxnNiCxz},
doi = {10.1137/1.9781611977653.ch64},
year = {2023},
date = {2023-01-01},
booktitle = {SDM '23: SIAM International Conference on Data Mining},
pages = {568--576},
abstract = {Learning robust deep models against noisy labels becomes ever critical when today's data is commonly collected from open platforms and subject to adversarial corruption. The information on the label corruption process, i.e., corruption matrix, can greatly enhance the robustness of deep models but still fall behind in combating hard classes. In this paper, we propose to construct a golden symmetric loss (GSL) based on the estimated corruption matrix as to avoid overfitting to noisy labels and learn effectively from hard classes. GSL is the weighted sum of the corrected regular cross entropy and reverse cross entropy. By leveraging a small fraction of trusted clean data, we estimate the corruption matrix and use it to correct the loss as well as to determine the weights of GSL. We theoretically prove the robustness of the proposed loss function in the presence of dirty labels. We provide a heuristics to adaptively tune the loss weights of GSL according to the noise rate and diversity measured from the dataset. We evaluate our proposed golden symmetric loss on both vision and natural language deep models subject to different types of label noise patterns. Empirical results show that GSL can significantly outperform the existing robust training methods on different noise patterns, showing accuracy improvement up to 18% on CIFAR-100 and 1% on real world noisy dataset of Clothing1M.},
keywords = {textarossa},
pubstate = {published},
tppubtype = {inproceedings}
}
Adriano Marques Garcia, Dalvan Griebler, Claudio Schepke, Luiz Gustavo Fernandes
Micro-batch and data frequency for stream processing on multi-cores Journal Article
In: The Journal of Supercomputing, vol. 79, no. 8, pp. 9206-9244, 2023, ISSN: 1573-0484.
Abstract | Links | BibTeX | Tags: parallel
@article{GARCIA:JSuper:23,
title = {Micro-batch and data frequency for stream processing on multi-cores},
author = {Adriano Marques Garcia and Dalvan Griebler and Claudio Schepke and Luiz Gustavo Fernandes},
url = {https://iris.unito.it/retrieve/9328dbca-98ae-4ac5-b856-57c72db4444a/s11227-022-05024-y_preprint.pdf},
doi = {10.1007/s11227-022-05024-y},
issn = {1573-0484},
year = {2023},
date = {2023-01-01},
journal = {The Journal of Supercomputing},
volume = {79},
number = {8},
pages = {9206--9244},
publisher = {Springer},
abstract = {Latency or throughput is often critical performance metrics in stream processing. Applications’ performance can fluctuate depending on the input stream. This unpredictability is due to the variety in data arrival frequency and size, complexity, and other factors. Researchers are constantly investigating new ways to mitigate the impact of these variations on performance with self-adaptive techniques involving elasticity or micro-batching. However, there is a lack of benchmarks capable of creating test scenarios to further evaluate these techniques. This work extends and improves the SPBench benchmarking framework to support dynamic micro-batching and data stream frequency management. We also propose a set of algorithms that generates the most commonly used frequency patterns for benchmarking stream processing in related work. It allows the creation of a wide variety of test scenarios. To validate our solution, we use SPBench to create custom benchmarks and evaluate the impact of micro-batching and data stream frequency on the performance of Intel TBB and FastFlow. These are two libraries that leverage stream parallelism for multi-core architectures. Our results demonstrated that our test cases did not benefit from micro-batches on multi-cores. For different data stream frequency configurations, TBB ensured the lowest latency, while FastFlow assured higher throughput in shorter pipelines.},
keywords = {parallel},
pubstate = {published},
tppubtype = {article}
}
2022
Yujin Zhu, Zilong Zhao, Robert Birke, Lydia Y. Chen
Permutation-Invariant Tabular Data Synthesis Proceedings Article
In: Tsumoto, Shusaku, Ohsawa, Yukio, Chen, Lei, Poel, Dirk Van, Hu, Xiaohua, Motomura, Yoichi, Takagi, Takuya, Wu, Lingfei, Xie, Ying, Abe, Akihiro, Raghavan, Vijay (Ed.): IEEE International Conference on Big Data (Big Data), pp. 5855–5864, IEEE, 2022.
Abstract | Links | BibTeX | Tags: analytics
@inproceedings{bigdata-zhu22,
title = {Permutation-Invariant Tabular Data Synthesis},
author = {Yujin Zhu and Zilong Zhao and Robert Birke and Lydia Y. Chen},
editor = {Shusaku Tsumoto and Yukio Ohsawa and Lei Chen and Dirk Van Poel and Xiaohua Hu and Yoichi Motomura and Takuya Takagi and Lingfei Wu and Ying Xie and Akihiro Abe and Vijay Raghavan},
url = {https://datacloud.di.unito.it/index.php/s/b6z3moNLxnNiCxz},
doi = {10.1109/BigData55660.2022.10020639},
year = {2022},
date = {2022-12-01},
booktitle = {IEEE International Conference on Big Data (Big Data)},
pages = {5855--5864},
publisher = {IEEE},
abstract = {Tabular data synthesis is an emerging approach to circumvent strict regulations on data privacy while discovering knowledge through big data. Although state-of-the-art AI-based tabular data synthesizers, e.g., table-GAN, CTGAN, TVAE, and CTAB-GAN, are effective at generating synthetic tabular data, their training is sensitive to column permutations of input data. In this paper, we first conduct an extensive empirical study to disclose such a property of permutation invariance and an in-depth analysis of the existing synthesizers. We show that changing the input column order worsens the statistical difference between real and synthetic data by up to 38.67% due to the encoding of tabular data and the network architectures. To fully unleash the potential of big synthetic tabular data, we propose two solutions: (i) AE-GAN, a synthesizer that uses an autoencoder network to represent the tabular data and GAN networks to synthesize the latent representation, and (ii) a feature sorting algorithm to find the suitable column order of input data for CNN-based synthesizers. We evaluate the proposed solutions on five datasets in terms of the sensitivity to the column permutation, the quality of synthetic data, and the utility in downstream analyses. Our results show that we enhance the property of permutation-invariance when training synthesizers and further improve the quality and utility of synthetic data, up to 22%, compared to the existing synthesizers.},
keywords = {analytics},
pubstate = {published},
tppubtype = {inproceedings}
}
Emilio Sulis, Ilaria Angela Amantea, Marco Aldinucci, Guido Boella, Renata Marinello, Marco Grosso, Paolo Platter, Serena Ambrosini
An ambient assisted living architecture for hospital at home coupled with a process-oriented perspective Journal Article
In: Journal of Ambient Intelligence and Humanized Computing, 2022, ISSN: 1868-5145.
Abstract | Links | BibTeX | Tags: ai
@article{Sulis2022,
title = {An ambient assisted living architecture for hospital at home coupled with a process-oriented perspective},
author = {Emilio Sulis and Ilaria Angela Amantea and Marco Aldinucci and Guido Boella and Renata Marinello and Marco Grosso and Paolo Platter and Serena Ambrosini},
url = {https://iris.unito.it/retrieve/c7eaab0b-f78b-4af0-8c17-fa5479d776e6/jaihc2021-preprint.pdf},
doi = {10.1007/s12652-022-04388-6},
issn = {1868-5145},
year = {2022},
date = {2022-09-21},
journal = {Journal of Ambient Intelligence and Humanized Computing},
abstract = {The growing number of next-generation applications offers a relevant opportunity for healthcare services, generating an urgent need for architectures for systems integration. Moreover, the huge amount of stored information related to events can be explored by adopting a process-oriented perspective. This paper discusses an Ambient Assisted Living healthcare architecture to manage hospital home-care services. The proposed solution relies on adopting an event manager to integrate sources ranging from personal devices to web-based applications. Data are processed on a federated cloud platform offering computing infrastructure and storage resources to improve scientific research. In a second step, a business process analysis of telehealth and telemedicine applications is considered. An initial study explored the business process flow to capture the main sequences of tasks, activities, events. This step paves the way for the integration of process mining techniques to compliance monitoring in an AAL architecture framework.},
keywords = {ai},
pubstate = {published},
tppubtype = {article}
}
Iacopo Colonnelli, Marco Aldinucci
Hybrid Workflows For Large - Scale Scientific Applications Proceedings Article
In: Sixth EAGE High Performance Computing Workshop, pp. 1–5, European Association of Geoscientists & Engineers, Milano, Italy, 2022, ISSN: 2214-4609.
Abstract | Links | BibTeX | Tags: across, eupex
@inproceedings{22:eage-hpc-workshop,
title = {Hybrid Workflows For Large-Scale Scientific Applications},
author = {Iacopo Colonnelli and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/d79ddabb-f9d7-4a55-9f84-1528b1533ba3/Extended_Abstract.pdf},
doi = {10.3997/2214-4609.2022615029},
issn = {2214-4609},
year = {2022},
date = {2022-09-01},
booktitle = {Sixth EAGE High Performance Computing Workshop},
pages = {1--5},
publisher = {European Association of Geoscientists \& Engineers},
address = {Milano, Italy},
abstract = {Large-scale scientific applications are facing an irreversible transition from monolithic, high-performance oriented codes to modular and polyglot deployments of specialised (micro-)services. The reasons behind this transition are many: coupling of standard solvers with Deep Learning techniques, offloading of data analysis and visualisation to Cloud, and the advent of specialised hardware accelerators. Topology-aware Workflow Management Systems (WMSs) play a crucial role. In particular, topology-awareness allows an explicit mapping of workflow steps onto heterogeneous locations, allowing automated executions on top of hybrid architectures (e.g., cloud+HPC or classical+quantum). Plus, topology-aware WMSs can offer nonfunctional requirements OOTB, e.g. components' life-cycle orchestration, secure and efficient data transfers, fault tolerance, and cross-cluster execution of urgent workloads. Augmenting interactive Jupyter Notebooks with distributed workflow capabilities allows domain experts to prototype and scale applications using the same technological stack, while relying on a feature-rich and user-friendly web interface. This abstract will showcase how these general methodologies can be applied to a typical geoscience simulation pipeline based on the Full Wavefront Inversion (FWI) technique. In particular, a prototypical Jupyter Notebook will be executed interactively on Cloud. Preliminary data analyses and post-processing will be executed locally, while the computationally demanding optimisation loop will be scheduled on a remote HPC cluster.},
keywords = {across, eupex},
pubstate = {published},
tppubtype = {inproceedings}
}
Christopher Stewart, Nathaniel Morris, Lydia Y. Chen, Robert Birke
Performance Modeling for Short-Term Cache Allocation Proceedings Article
In: Proceedings of the 51st International Conference on Parallel Processing (ICPP), pp. 31:1–31:11, ACM, 2022.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{icpp-stewart22,
title = {Performance Modeling for Short-Term Cache Allocation},
author = {Christopher Stewart and Nathaniel Morris and Lydia Y. Chen and Robert Birke},
url = {https://doi.org/10.1145/3545008.3545094},
doi = {10.1145/3545008.3545094},
year = {2022},
date = {2022-08-01},
booktitle = {Proceedings of the 51st International Conference on Parallel Processing (ICPP)},
pages = {31:1--31:11},
publisher = {ACM},
abstract = {Short-term cache allocation grants and then revokes access to processor cache lines dynamically. For online services, short-term allocation can speed up targeted query executions and free up cache lines reserved, but normally not needed, for performance. However, in collocated settings, short-term allocation can increase cache contention, slowing down collocated query executions. To offset slowdowns, collocated services may request short-term allocation more often, making the problem worse. Short-term allocation policies manage which queries receive cache allocations and when. In collocated settings, these policies should balance targeted query speedups against slowdowns caused by recurring cache contention. We present a model-driven approach that (1) predicts response time under a given policy, (2) explores competing policies and (3) chooses policies that yield low response time for all collocated services. Our approach profiles cache usage offline, characterizes the effects of cache allocation policies using deep learning techniques and devises novel performance models for short-term allocation with online services. We tested our approach using data processing, cloud, and high-performance computing benchmarks collocated on Intel processors equipped with Cache Allocation Technology. Our models predicted median response time with 11\% absolute percent error. Short-term allocation policies found using our approach outperformed state-of-the-art shared cache allocation policies by 1.2-2.3X.},
keywords = {parallel},
pubstate = {published},
tppubtype = {inproceedings}
}
Mirko Polato, Roberto Esposito, Marco Aldinucci
Boosting the Federation: Cross-Silo Federated Learning without Gradient Descent Proceedings Article
In: Intl. Joint Conference on Neural Networks (IJCNN), pp. 1–10, IEEE, Padua, Italy, 2022.
Abstract | Links | BibTeX | Tags: eupilot, hpc4ai
@inproceedings{22:fl:ijcnn,
title = {Boosting the Federation: Cross-Silo Federated Learning without Gradient Descent},
author = {Mirko Polato and Roberto Esposito and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/03a7b692-aecc-43db-a792-874c553d9ebe/ijcnn22-internal.pdf},
doi = {10.1109/IJCNN55064.2022.9892284},
year = {2022},
date = {2022-07-01},
booktitle = {Intl. Joint Conference on Neural Networks (IJCNN)},
pages = {1--10},
publisher = {IEEE},
address = {Padua, Italy},
abstract = {Federated Learning has been proposed to develop better AI systems without compromising the privacy of final users and the legitimate interests of private companies. Initially deployed by Google to predict text input on mobile devices, FL has been deployed in many other industries. Since its introduction, Federated Learning mainly exploited the inner working of neural networks and other gradient descent-based algorithms by either exchanging the weights of the model or the gradients computed during learning. While this approach has been very successful, it rules out applying FL in contexts where other models are preferred, e.g., easier to interpret or known to work better. This paper proposes FL algorithms that build federated models without relying on gradient descent-based methods. Specifically, we leverage distributed versions of the AdaBoost algorithm to acquire strong federated models. In contrast with previous approaches, our proposal does not put any constraint on the client-side learning models. We perform a large set of experiments on ten UCI datasets, comparing the algorithms in six non-iidness settings.},
keywords = {eupilot, hpc4ai},
pubstate = {published},
tppubtype = {inproceedings}
}
Adriano Marques Garcia, Dalvan Griebler, Claudio Schepke, Luiz Gustavo Fernandes
Evaluating Micro-batch and Data Frequency for Stream Processing Applications on Multi-cores Proceedings Article
In: 30th Euromicro International Conference on Parallel, Distributed and Network-Based Processing (PDP), pp. 10-17, IEEE, Valladolid, Spain, 2022.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{GARCIA:PDP:22,
title = {Evaluating Micro-batch and Data Frequency for Stream Processing Applications on Multi-cores},
author = {Adriano Marques Garcia and Dalvan Griebler and Claudio Schepke and Luiz Gustavo Fernandes},
url = {https://iris.unito.it/retrieve/f6d113e5-789b-4f8b-924d-8ca3d38e8d62/PDP_2022__SPBench_with_Batch_and_Data_Frequency_.pdf},
doi = {10.1109/PDP55904.2022.00011},
year = {2022},
date = {2022-04-01},
booktitle = {30th Euromicro International Conference on Parallel, Distributed and Network-Based Processing (PDP)},
pages = {10--17},
publisher = {IEEE},
address = {Valladolid, Spain},
series = {PDP'22},
abstract = {In stream processing, data arrives constantly and is often unpredictable. It can show large fluctuations in arrival frequency, size, complexity, and other factors. These fluctuations can strongly impact application latency and throughput, which are critical factors in this domain. Therefore, there is a significant amount of research on self-adaptive techniques involving elasticity or micro-batching as a way to mitigate this impact. However, there is a lack of benchmarks and tools for helping researchers to investigate micro-batching and data stream frequency implications. In this paper, we extend a benchmarking framework to support dynamic micro-batching and data stream frequency management. We used it to create custom benchmarks and compare latency and throughput aspects from two different parallel libraries. We validate our solution through an extensive analysis of the impact of micro-batching and data stream frequency on stream processing applications using Intel TBB and FastFlow, which are two libraries that leverage stream parallelism on multi-core architectures. Our results demonstrated up to 33\% throughput gain over latency using micro-batches. Additionally, while TBB ensures lower latency, FastFlow ensures higher throughput in the parallel applications for different data stream frequency configurations.},
keywords = {parallel},
pubstate = {published},
tppubtype = {inproceedings}
}
Amirmasoud Ghiassi, Robert Birke, Lydia Y. Chen
LABNET: A Collaborative Method for DNN Training and Label Aggregation Proceedings Article
In: Rocha, Ana Paula, Steels, Luc, van den Herik, H. Jaap (Ed.): 14th International Conference on Agents and Artificial Intelligence (ICAART), pp. 56–66, SCITEPRESS, 2022.
Abstract | Links | BibTeX | Tags:
@inproceedings{ghiassi/iccart22,
title = {{LABNET}: A Collaborative Method for {DNN} Training and Label Aggregation},
author = {Amirmasoud Ghiassi and Robert Birke and Lydia Y. Chen},
editor = {Ana Paula Rocha and Luc Steels and H. Jaap van den Herik},
url = {https://www.scitepress.org/Link.aspx?doi=10.5220/0010770400003116},
doi = {10.5220/0010770400003116},
year = {2022},
date = {2022-02-01},
booktitle = {14th International Conference on Agents and Artificial Intelligence (ICAART)},
pages = {56--66},
publisher = {SCITEPRESS},
abstract = {Today, to label the massive datasets needed to train Deep Neural Networks (DNNs), cheap and error-prone methods such as crowdsourcing are used. Label aggregation methods aim to infer the true labels from noisy labels annotated by crowdsourcing workers via labels statistics features. Aggregated labels are the main data source to train deep neural networks, and their accuracy directly affects the deep neural network performance. In this paper, we argue that training DNN and aggregating labels are not two separate tasks. Incorporation between DNN training and label aggregation connects data features, noisy labels, and aggregated labels. Since each image contains valuable knowledge about its label, the data features help aggregation methods enhance their performance. We propose LABNET an iterative two-step method. Step one: the label aggregation algorithm provides labels to train the DNN. Step two: the DNN shares a representation of the data features with the label aggregation algorithm. These steps are repeated until the converging label aggregation error rate. To evaluate LABNET we conduct an extensive empirical comparison on CIFAR-10 and CIFAR-100 under different noise and worker statistics. Our evaluation results show that LABNET achieves the highest mean accuracy with an increase of at least 8\% to 0.6\% and lowest error rate with a reduction of 7.5\% to 0.25\% against existing aggregation and training methods in most cases.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Federica Proietto Salanitri, Giovanni Bellitto, Simone Palazzo, Ismail Irmakci, Michael B. Wallace, Candice W. Bolan, Megan Engels, Sanne Hoogenboom, Marco Aldinucci, Ulas Bagci, Daniela Giordano, Concetto Spampinato
Neural Transformers for Intraductal Papillary Mucosal Neoplasms (IPMN) Classification in MRI images Proceedings Article
In: 44th Annual International Conference of the IEEE Engineering in Medicine & Biology Society, EMBC 2022, Glasgow, Scotland, United Kingdom, July 11-15, 2022, pp. 475–479, IEEE, 2022.
@inproceedings{DBLP:conf/embc/SalanitriBPIWBE22,
title = {Neural Transformers for Intraductal Papillary Mucosal Neoplasms ({IPMN}) Classification in {MRI} images},
author = {Federica Proietto Salanitri and Giovanni Bellitto and Simone Palazzo and Ismail Irmakci and Michael B. Wallace and Candice W. Bolan and Megan Engels and Sanne Hoogenboom and Marco Aldinucci and Ulas Bagci and Daniela Giordano and Concetto Spampinato},
url = {https://doi.org/10.1109/EMBC48229.2022.9871547},
doi = {10.1109/EMBC48229.2022.9871547},
year = {2022},
date = {2022-01-01},
booktitle = {44th Annual International Conference of the IEEE Engineering in Medicine \& Biology Society, EMBC 2022, Glasgow, Scotland, United Kingdom, July 11-15, 2022},
pages = {475--479},
publisher = {IEEE},
keywords = {hpc4ai},
pubstate = {published},
tppubtype = {inproceedings}
}
Valentina Cesare, Ugo Becciani, Alberto Vecchiato, Mario Gilberto Lattanzi, Fabio Pitari, Mario Raciti, Giuseppe Tudisco, Marco Aldinucci, Beatrice Bucciarelli
The Gaia AVU-GSR parallel solver: Preliminary studies of a LSQR-based application in perspective of exascale systems Journal Article
In: Astronomy and Computing, pp. 100660, 2022, ISSN: 2213-1337.
Abstract | Links | BibTeX | Tags: eupex
@article{CESARE2022100660,
title = {The {Gaia} {AVU-GSR} parallel solver: Preliminary studies of a {LSQR}-based application in perspective of exascale systems},
author = {Valentina Cesare and Ugo Becciani and Alberto Vecchiato and Mario Gilberto Lattanzi and Fabio Pitari and Mario Raciti and Giuseppe Tudisco and Marco Aldinucci and Beatrice Bucciarelli},
url = {https://openaccess.inaf.it/handle/20.500.12386/32451},
doi = {10.1016/j.ascom.2022.100660},
issn = {2213-1337},
year = {2022},
date = {2022-01-01},
journal = {Astronomy and Computing},
pages = {100660},
abstract = {The Gaia Astrometric Verification Unit–Global Sphere Reconstruction (AVU–GSR) Parallel Solver aims to find the astrometric parameters for circa $10^8$ stars in the Milky Way, the attitude and the instrumental specifications of the Gaia satellite, and the global parameter $\gamma$ of the post Newtonian formalism. The code iteratively solves a system of linear equations, $A\times x=b$, where the coefficient matrix A is large (circa $10^{11}\times 10^{8}$ elements) and sparse. To solve this system of equations, the code exploits a hybrid implementation of the iterative PC-LSQR algorithm, where the computation related to different horizontal portions of the coefficient matrix is assigned to separate MPI processes. In the original code, each matrix portion is further parallelized over the OpenMP threads. To further improve the code performance, we ported the application to the GPU, replacing the OpenMP parallelization language with OpenACC. In this port, $\sim$95\% of the data is copied from the host to the device at the beginning of the entire cycle of iterations, making the code compute bound rather than data-transfer bound. The OpenACC code presents a speedup of circa 1.5 over the OpenMP version but further optimizations are in progress to obtain higher gains. The code runs on multiple GPUs and it was tested on the CINECA supercomputer Marconi100, in anticipation of a port to the pre-exascale system Leonardo, that will be installed at CINECA in 2022.},
keywords = {eupex},
pubstate = {published},
tppubtype = {article}
}
Giovanni Agosta, Marco Aldinucci, Carlos Alvarez, Roberto Ammendola, Yasir Arfat, Olivier Beaumont, Massimo Bernaschi, Andrea Biagioni, Tommaso Boccali, Berenger Bramas, Carlo Brandolese, Barbara Cantalupo, Mauro Carrozzo, Daniele Cattaneo, Alessandro Celestini, Massimo Celino, Iacopo Colonnelli, Paolo Cretaro, Pasqua D'Ambra, Marco Danelutto, Roberto Esposito, Lionel Eyraud-Dubois, Antonio Filgueras, William Fornaciari, Ottorino Frezza, Andrea Galimberti, Francesco Giacomini, Brice Goglin, Daniele Gregori, Abdou Guermouche, Francesco Iannone, Michal Kulczewski, Francesca Lo Cicero, Alessandro Lonardo, Alberto R. Martinelli, Michele Martinelli, Xavier Martorell, Giuseppe Massari, Simone Montangero, Gianluca Mittone, Raymond Namyst, Ariel Oleksiak, Paolo Palazzari, Pier Stanislao Paolucci, Federico Reghenzani, Cristian Rossi, Sergio Saponara, Francesco Simula, Federico Terraneo, Samuel Thibault, Massimo Torquati, Matteo Turisini, Piero Vicini, Miquel Vidal, Davide Zoni, Giuseppe Zummo
Towards EXtreme scale technologies and accelerators for euROhpc hw/Sw supercomputing applications for exascale: The TEXTAROSSA approach Journal Article
In: Microprocessors and Microsystems, vol. 95, pp. 104679, 2022, ISSN: 0141-9331.
Abstract | Links | BibTeX | Tags: textarossa
@article{textarossa2022micpro:,
title = {Towards {EXtreme} scale technologies and accelerators for {euROhpc} {hw/Sw} supercomputing applications for exascale: The {TEXTAROSSA} approach},
author = {Giovanni Agosta and Marco Aldinucci and Carlos Alvarez and Roberto Ammendola and Yasir Arfat and Olivier Beaumont and Massimo Bernaschi and Andrea Biagioni and Tommaso Boccali and Berenger Bramas and Carlo Brandolese and Barbara Cantalupo and Mauro Carrozzo and Daniele Cattaneo and Alessandro Celestini and Massimo Celino and Iacopo Colonnelli and Paolo Cretaro and Pasqua D'Ambra and Marco Danelutto and Roberto Esposito and Lionel Eyraud-Dubois and Antonio Filgueras and William Fornaciari and Ottorino Frezza and Andrea Galimberti and Francesco Giacomini and Brice Goglin and Daniele Gregori and Abdou Guermouche and Francesco Iannone and Michal Kulczewski and Francesca Lo Cicero and Alessandro Lonardo and Alberto R. Martinelli and Michele Martinelli and Xavier Martorell and Giuseppe Massari and Simone Montangero and Gianluca Mittone and Raymond Namyst and Ariel Oleksiak and Paolo Palazzari and Pier Stanislao Paolucci and Federico Reghenzani and Cristian Rossi and Sergio Saponara and Francesco Simula and Federico Terraneo and Samuel Thibault and Massimo Torquati and Matteo Turisini and Piero Vicini and Miquel Vidal and Davide Zoni and Giuseppe Zummo},
doi = {10.1016/j.micpro.2022.104679},
issn = {0141-9331},
year = {2022},
date = {2022-01-01},
journal = {Microprocessors and Microsystems},
volume = {95},
pages = {104679},
abstract = {In the near future, Exascale systems will need to bridge three technology gaps to achieve high performance while remaining under tight power constraints: energy efficiency and thermal control; extreme computation efficiency via HW acceleration and new arithmetic; methods and tools for seamless integration of reconfigurable accelerators in heterogeneous HPC multi-node platforms. TEXTAROSSA addresses these gaps through a co-design approach to heterogeneous HPC solutions, supported by the integration and extension of HW and SW IPs, programming models, and tools derived from European research.},
keywords = {textarossa},
pubstate = {published},
tppubtype = {article}
}
Bruno Casella, Roberto Esposito, Carlo Cavazzoni, Marco Aldinucci
Benchmarking FedAvg and FedCurv for Image Classification Tasks Proceedings Article
In: Anisetti, Marco, Bonifati, Angela, Bena, Nicola, Ardagna, Claudio, Malerba, Donato (Ed.): Proceedings of the 1st Italian Conference on Big Data and Data Science, ITADATA 2022, September 20-21, 2022, CEUR-WS.org, 2022.
Abstract | Links | BibTeX | Tags: eupilot
@inproceedings{casella2022benchmarking,
title = {Benchmarking {FedAvg} and {FedCurv} for Image Classification Tasks},
author = {Bruno Casella and Roberto Esposito and Carlo Cavazzoni and Marco Aldinucci},
editor = {Marco Anisetti and Angela Bonifati and Nicola Bena and Claudio Ardagna and Donato Malerba},
url = {https://ceur-ws.org/Vol-3340/paper40.pdf},
year = {2022},
date = {2022-01-01},
booktitle = {Proceedings of the 1st Italian Conference on Big Data and Data Science, ITADATA 2022, September 20-21, 2022},
volume = {3340},
publisher = {CEUR-WS.org},
series = {CEUR Workshop Proceedings},
abstract = {Classic Machine Learning (ML) techniques require training on data available in a single data lake (either centralized or distributed). However, aggregating data from different owners is not always convenient for different reasons, including security, privacy and secrecy. Data carry a value that might vanish when shared with others; the ability to avoid sharing the data enables industrial applications where security and privacy are of paramount importance, making it possible to train global models by implementing only local policies which can be run independently and even on air-gapped data centres. Federated Learning (FL) is a distributed machine learning approach which has emerged as an effective way to address privacy concerns by only sharing local AI models while keeping the data decentralized. Two critical challenges of Federated Learning are managing the heterogeneous systems in the same federated network and dealing with real data, which are often not independently and identically distributed (non-IID) among the clients. In this paper, we focus on the second problem, i.e., the problem of statistical heterogeneity of the data in the same federated network. In this setting, local models might be strayed far from the local optimum of the complete dataset, thus possibly hindering the convergence of the federated model. Several Federated Learning algorithms, such as FedAvg, FedProx and Federated Curvature (FedCurv), aiming at tackling the non-IID setting, have already been proposed. This work provides an empirical assessment of the behaviour of FedAvg and FedCurv in common non-IID scenarios. Results show that the number of epochs per round is an important hyper-parameter that, when tuned appropriately, can lead to significant performance gains while reducing the communication cost. As a side product of this work, we release the non-IID version of the datasets we used so to facilitate further comparisons from the FL community.},
keywords = {eupilot},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, David Atienza, Federico Bolelli, Mónica Caballero, Iacopo Colonnelli, José Flich, Jon Ander Gómez, David González, Costantino Grana, Marco Grangetto, Simone Leo, Pedro López, Dana Oniga, Roberto Paredes, Luca Pireddu, Eduardo Quiñones, Tatiana Silva, Enzo Tartaglione, Marina Zapater
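The DeepHealth Toolkit: A Key European Free and Open-Source Software for Deep Learning and Computer Vision Ready to Exploit Heterogeneous HPC and Cloud Architectures Book Section
In: Curry, Edward, Auer, Sören, Berre, Arne J., Metzger, Andreas, Perez, Maria S., Zillner, Sonja (Ed.): Technologies and Applications for Big Data Value, pp. 183–202, Springer International Publishing, Cham, 2022, ISBN: 978-3-030-78307-5.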
Abstract | Links | BibTeX | Tags: deephealth, streamflow
@incollection{22:TABDV,
title = {The {DeepHealth} Toolkit: A Key {European} Free and Open-Source Software for Deep Learning and Computer Vision Ready to Exploit Heterogeneous {HPC} and Cloud Architectures},
author = {Marco Aldinucci and David Atienza and Federico Bolelli and Mónica Caballero and Iacopo Colonnelli and José Flich and Jon Ander Gómez and David González and Costantino Grana and Marco Grangetto and Simone Leo and Pedro López and Dana Oniga and Roberto Paredes and Luca Pireddu and Eduardo Quiñones and Tatiana Silva and Enzo Tartaglione and Marina Zapater},
editor = {Edward Curry and Sören Auer and Arne J. Berre and Andreas Metzger and Maria S. Perez and Sonja Zillner},
url = {https://link.springer.com/content/pdf/10.1007/978-3-030-78307-5_9.pdf},
doi = {10.1007/978-3-030-78307-5_9},
isbn = {978-3-030-78307-5},
year = {2022},
date = {2022-01-01},
booktitle = {Technologies and Applications for Big Data Value},
pages = {183--202},
publisher = {Springer International Publishing},
address = {Cham},
chapter = {9},
abstract = {At the present time, we are immersed in the convergence between Big Data, High-Performance Computing and Artificial Intelligence. Technological progress in these three areas has accelerated in recent years, forcing different players like software companies and stakeholders to move quickly. The European Union is dedicating a lot of resources to maintain its relevant position in this scenario, funding projects to implement large-scale pilot testbeds that combine the latest advances in Artificial Intelligence, High-Performance Computing, Cloud and Big Data technologies. The DeepHealth project is an example focused on the health sector whose main outcome is the DeepHealth toolkit, a European unified framework that offers deep learning and computer vision capabilities, completely adapted to exploit underlying heterogeneous High-Performance Computing, Big Data and cloud architectures, and ready to be integrated into any software platform to facilitate the development and deployment of new applications for specific problems in any sector. This toolkit is intended to be one of the European contributions to the field of AI. This chapter introduces the toolkit with its main components and complementary tools, providing a clear view to facilitate and encourage its adoption and wide use by the European community of developers of AI-based solutions and data scientists working in the healthcare sector and others.},
keywords = {deephealth, streamflow},
pubstate = {published},
tppubtype = {incollection}
}
Bruno Casella, Alessio Chisari, Sebastiano Battiato, Mario Giuffrida
Transfer Learning via Test-time Neural Networks Aggregation Proceedings Article
In: Farinella, Giovanni Maria, Radeva, Petia, Bouatouch, Kadi (Ed.): Proceedings of the 17th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications, VISIGRAPP 2022, Volume 5: VISAPP, Online Streaming, February 6-8, 2022, pp. 642–649, INSTICC SciTePress, 2022, ISBN: 978-989-758-555-5.
Abstract | Links | BibTeX | Tags: ai
@inproceedings{22:VISAPP:transferlearning,
title = {Transfer Learning via Test-time Neural Networks Aggregation},
author = {Bruno Casella and Alessio Chisari and Sebastiano Battiato and Mario Giuffrida},
editor = {Giovanni Maria Farinella and Petia Radeva and Kadi Bouatouch},
url = {https://iris.unito.it/retrieve/handle/2318/1844159/947123/TRANSFER_LEARNING_VIA_TEST_TIME_NEURAL_NETWORKS_AGGREGATION.pdf},
doi = {10.5220/0010907900003124},
isbn = {978-989-758-555-5},
year = {2022},
date = {2022-01-01},
booktitle = {Proceedings of the 17th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications, VISIGRAPP 2022, Volume 5: VISAPP, Online Streaming, February 6-8, 2022},
pages = {642--649},
publisher = {SciTePress},
organization = {INSTICC},
abstract = {It has been demonstrated that deep neural networks outperform traditional machine learning. However, deep networks lack generalisability, that is, they will not perform as good as in a new (testing) set drawn from a different distribution due to the domain shift. In order to tackle this known issue, several transfer learning approaches have been proposed, where the knowledge of a trained model is transferred into another to improve performance with different data. However, most of these approaches require additional training steps, or they suffer from catastrophic forgetting that occurs when a trained model has overwritten previously learnt knowledge. We address both problems with a novel transfer learning approach that uses network aggregation. We train dataset-specific networks together with an aggregation network in a unified framework. The loss function includes two main components: a task-specific loss (such as cross-entropy) and an aggregation loss. The proposed aggregation loss allows our model to learn how trained deep network parameters can be aggregated with an aggregation operator. We demonstrate that the proposed approach learns model aggregation at test time without any further training step, reducing the burden of transfer learning to a simple arithmetical operation. The proposed approach achieves comparable performance w.r.t. the baseline. Besides, if the aggregation operator has an inverse, we will show that our model also inherently allows for selective forgetting, i.e., the aggregated model can forget one of the datasets it was trained on, retaining information on the others.},
keywords = {ai},
pubstate = {published},
tppubtype = {inproceedings}
}
Eduardo Quiñones, Jesus Perales, Jorge Ejarque, Asaf Badouh, Santiago Marco, Fabrice Auzanneau, François Galea, David González, José Ramón Hervás, Tatiana Silva, Iacopo Colonnelli, Barbara Cantalupo, Marco Aldinucci, Enzo Tartaglione, Rafael Tornero, José Flich, Jose Maria Martinez, David Rodriguez, Izan Catalán, Jorge Garcia, Carles Hernández
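The DeepHealth HPC Infrastructure: Leveraging Heterogenous HPC and Cloud Computing Infrastructures for IA-based Medical Solutions Book Section
In: Terzo, Olivier, Martinovič, Jan (Ed.): HPC, Big Data, and AI Convergence Towards Exascale: Challenge and Vision, pp. 191–216, CRC Press, Boca Raton, Florida, 2022, ISBN: 978-1-0320-0984-1.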
Abstract | Links | BibTeX | Tags: deephealth, streamflow
@incollection{22:deephealth:HPCbook,
title = {The {DeepHealth} {HPC} Infrastructure: Leveraging Heterogenous {HPC} and Cloud Computing Infrastructures for {IA}-based Medical Solutions},
author = {Eduardo Quiñones and Jesus Perales and Jorge Ejarque and Asaf Badouh and Santiago Marco and Fabrice Auzanneau and François Galea and David González and José Ramón Hervás and Tatiana Silva and Iacopo Colonnelli and Barbara Cantalupo and Marco Aldinucci and Enzo Tartaglione and Rafael Tornero and José Flich and Jose Maria Martinez and David Rodriguez and Izan Catalán and Jorge Garcia and Carles Hernández},
editor = {Olivier Terzo and Jan Martinovič},
url = {https://iris.unito.it/retrieve/handle/2318/1832050/912413/Preprint.pdf},
doi = {10.1201/9781003176664},
isbn = {978-1-0320-0984-1},
year = {2022},
date = {2022-01-01},
booktitle = {HPC, Big Data, and AI Convergence Towards Exascale: Challenge and Vision},
pages = {191--216},
publisher = {CRC Press},
address = {Boca Raton, Florida},
chapter = {10},
abstract = {This chapter presents the DeepHealth HPC toolkit for an efficient execution of deep learning (DL) medical application into HPC and cloud-computing infrastructures, featuring many-core, GPU, and FPGA acceleration devices. The toolkit offers to the European Computer Vision Library and the European Distributed Deep Learning Library (EDDL), developed in the DeepHealth project as well, the mechanisms to distribute and parallelize DL operations on HPC and cloud infrastructures in a fully transparent way. The toolkit implements workflow managers used to orchestrate HPC workloads for an efficient parallelization of EDDL training operations on HPC and cloud infrastructures, and includes the parallel programming models for an efficient execution EDDL inference and training operations on many-core, GPUs and FPGAs acceleration devices.},
keywords = {deephealth, streamflow},
pubstate = {published},
tppubtype = {incollection}
}
Martin Golasowski, Jan Martinovič, Marc Levrier, Stephan Hachinger, Sophia Karagiorgou, Aikaterini Papapostolou, Spiros Mouzakitis, Ioannis Tsapelas, Monica Caballero, Marco Aldinucci, Jon Ander Gómez, Antony Chazapis, Jean-Thomas Acquaviva
Toward the Convergence of High-Performance Computing, Cloud, and Big Data Domains Book Section
In: Terzo, Olivier, Martinovič, Jan (Ed.): HPC, Big Data, and AI Convergence Towards Exascale: Challenge and Vision, pp. 1–16, CRC Press, Boca Raton, Florida, 2022, ISBN: 978-1-0320-0984-1.
Abstract | Links | BibTeX | Tags: deephealth, streamflow
@incollection{22:intro:HPCbook,
title = {Toward the Convergence of High-Performance Computing, Cloud, and Big Data Domains},
author = {Martin Golasowski and Jan Martinovič and Marc Levrier and Stephan Hachinger and Sophia Karagiorgou and Aikaterini Papapostolou and Spiros Mouzakitis and Ioannis Tsapelas and Monica Caballero and Marco Aldinucci and Jon Ander Gómez and Antony Chazapis and Jean-Thomas Acquaviva},
editor = {Olivier Terzo and Jan Martinovič},
doi = {10.1201/9781003176664},
isbn = {978-1-0320-0984-1},
year = {2022},
date = {2022-01-01},
booktitle = {HPC, Big Data, and AI Convergence Towards Exascale: Challenge and Vision},
pages = {1--16},
publisher = {CRC Press},
address = {Boca Raton, Florida},
chapter = {1},
abstract = {Convergence between big data, high-performance computing, and the cloud is the key driving factor for sustainable economic growth in the future. Technological advances in many fields are determined by competence to gain precise information from the large amounts of data collected, which in turn requires powerful computing resources. This chapter provides an overview on the evolution of the three fields and four different points of view on their convergence provided by the CYBELE, DeepHealth, Evolve, and LEXIS projects funded by the European Union under the Horizon 2020 Programme.},
keywords = {deephealth, streamflow},
pubstate = {published},
tppubtype = {incollection}
}
Dana Oniga, Barbara Cantalupo, Enzo Tartaglione, Daniele Perlo, Marco Grangetto, Marco Aldinucci, Federico Bolelli, Federico Pollastri, Michele Cancilla, Laura Canalini, Costantino Grana, Cristina Muñoz Alcalde, Franco Alberto Cardillo, Monica Florea
Applications of AI and HPC in the Health Domain Book Section
In: Terzo, Olivier, Martinovič, Jan (Ed.): HPC, Big Data, and AI Convergence Towards Exascale: Challenge and Vision, pp. 217–239, CRC Press, Boca Raton, Florida, 2022, ISBN: 978-1-0320-0984-1.
Abstract | Links | BibTeX | Tags: deephealth, streamflow
@incollection{22:applications:HPCbook,
title = {Applications of AI and HPC in the Health Domain},
author = {Dana Oniga and Barbara Cantalupo and Enzo Tartaglione and Daniele Perlo and Marco Grangetto and Marco Aldinucci and Federico Bolelli and Federico Pollastri and Michele Cancilla and Laura Canalini and Costantino Grana and Cristina Muñoz Alcalde and Franco Alberto Cardillo and Monica Florea},
editor = {Olivier Terzo and Jan Martinovič},
doi = {10.1201/9781003176664},
isbn = {978-1-0320-0984-1},
year = {2022},
date = {2022-01-01},
booktitle = {HPC, Big Data, and AI Convergence Towards Exascale: Challenge and Vision},
pages = {217--239},
publisher = {CRC Press},
address = {Boca Raton, Florida},
chapter = {11},
abstract = {This chapter presents the applications of artificial intelligence (AI) and high-computing performance (HPC) in the health domain, illustrated by the description of five of the use cases that are developed in the DeepHealth project. In the context of the European Commission supporting the use of AI and HPC in the health sector, DeepHealth Project is helping health experts process large quantities of images, putting at their disposal DeepLearning and computer vision techniques, combined in the DeepHealth toolkit and HPC infrastructures. The DeepHealth toolkit is tested and validated through 15 use cases, each of them representing a biomedical application. The most promising use cases are described in the chapter, which concludes with the value proposition and the benefits that DeepHealth toolkit offers to future end users.},
keywords = {deephealth, streamflow},
pubstate = {published},
tppubtype = {incollection}
}
Iacopo Colonnelli, Marco Aldinucci, Barbara Cantalupo, Luca Padovani, Sergio Rabellino, Concetto Spampinato, Roberto Morelli, Rosario Di Carlo, Nicolò Magini, Carlo Cavazzoni
Distributed workflows with Jupyter Journal Article
In: Future Generation Computer Systems, vol. 128, pp. 282–298, 2022, ISSN: 0167-739X.
Abstract | Links | BibTeX | Tags: across, deephealth, jupyter-workflow, streamflow
@article{21:FGCS:jupyflow,
title = {Distributed workflows with Jupyter},
author = {Iacopo Colonnelli and Marco Aldinucci and Barbara Cantalupo and Luca Padovani and Sergio Rabellino and Concetto Spampinato and Roberto Morelli and Rosario Di Carlo and Nicolò Magini and Carlo Cavazzoni},
url = {https://www.sciencedirect.com/science/article/pii/S0167739X21003976},
doi = {10.1016/j.future.2021.10.007},
issn = {0167-739X},
year = {2022},
date = {2022-01-01},
journal = {Future Generation Computer Systems},
volume = {128},
pages = {282--298},
abstract = {The designers of a new coordination interface enacting complex workflows have to tackle a dichotomy: choosing a language-independent or language-dependent approach. Language-independent approaches decouple workflow models from the host code's business logic and advocate portability. Language-dependent approaches foster flexibility and performance by adopting the same host language for business and coordination code. Jupyter Notebooks, with their capability to describe both imperative and declarative code in a unique format, allow taking the best of the two approaches, maintaining a clear separation between application and coordination layers but still providing a unified interface to both aspects. We advocate the Jupyter Notebooks' potential to express complex distributed workflows, identifying the general requirements for a Jupyter-based Workflow Management System (WMS) and introducing a proof-of-concept portable implementation working on hybrid Cloud-HPC infrastructures. As a byproduct, we extended the vanilla IPython kernel with workflow-based parallel and distributed execution capabilities. The proposed Jupyter-workflow (Jw) system is evaluated on common scenarios for High Performance Computing (HPC) and Cloud, showing its potential in lowering the barriers between prototypical Notebooks and production-ready implementations.},
keywords = {across, deephealth, jupyter-workflow, streamflow},
pubstate = {published},
tppubtype = {article}
}
Bart Cox, Robert Birke, Lydia Y. Chen
Memory-aware and context-aware multi-DNN inference on the edge Journal Article
In: Pervasive and Mobile Computing, vol. 83, pp. 1–16, 2022, ISSN: 1574-1192.
Abstract | Links | BibTeX | Tags: ai
@article{COX2022101594,
title = {Memory-aware and context-aware multi-DNN inference on the edge},
author = {Bart Cox and Robert Birke and Lydia Y. Chen},
url = {https://www.sciencedirect.com/science/article/pii/S1574119222000372},
doi = {10.1016/j.pmcj.2022.101594},
issn = {1574-1192},
year = {2022},
date = {2022-01-01},
journal = {Pervasive and Mobile Computing},
volume = {83},
pages = {1--16},
abstract = {Deep neural networks (DNNs) are becoming the core components of many applications running on edge devices, especially for real time image-based analysis. Increasingly, multi-faced knowledge is extracted by executing multiple DNNs inference models, e.g., identifying objects, faces, and genders from images. It is of paramount importance to guarantee low response times of such multi-DNN executions as it affects not only users quality of experience but also safety. The challenge, largely unaddressed by the state of the art, is how to overcome the memory limitation of edge devices without altering the DNN models. In this paper, we design and implement Masa, a responsive memory-aware multi-DNN execution and scheduling framework, which requires no modification of DNN models. The aim of Masa is to consistently ensure the average response time when deterministically and stochastically executing multiple DNN-based image analyses. The enabling features of Masa are (i) modeling inter- and intra-network dependency, (ii) leveraging complimentary memory usage of each layer, and (iii) exploring the context dependency of DNNs. We verify the correctness and scheduling optimality via mixed integer programming. We extensively evaluate two versions of Masa, context-oblivious and context-aware, on three configurations of Raspberry Pi and a large set of popular DNN models triggered by different generation patterns of images. Our evaluation results show that Masa can achieve lower average response times by up to 90% on devices with small memory, i.e., 512 MB to 1 GB, compared to the state of the art multi-DNN scheduling solutions.},
keywords = {ai},
pubstate = {published},
tppubtype = {article}
}
Guglielmo Gallone, Jeehoon Kang, Francesco Bruno, Jung-Kyu Han, Ovidio De Filippo, Han-Mo Yang, Mattia Doronzo, Kyung-Woo Park, Gianluca Mittone, Hyun-Jae Kang, Radoslaw Parma, Hyeon-Cheol Gwon, Enrico Cerrato, Woo Jung Chun, Grzegorz Smolka, Seung-Ho Hur, Gerard Helft, Seung Hwan Han, Saverio Muscoli, Young Bin Song, Filippo Figini, Ki Hong Choi, Giacomo Boccuzzi, Soon-Jun Hong, Daniela Trabattoni, Chang-Wook Nam, Massimo Giammaria, Hyo-Soo Kim, Federico Conrotto, Javier Escaned, Carlo Di Mario, Fabrizio D'Ascenzo, Bon-Kwon Koo, Gaetano Maria Ferrari
Impact of Left Ventricular Ejection Fraction on Procedural and Long-Term Outcomes of Bifurcation Percutaneous Coronary Intervention Journal Article
In: The American Journal of Cardiology, vol. 172, pp. 18–25, 2022, ISSN: 0002-9149.
Abstract | Links | BibTeX | Tags: ai, cardio
@article{GALLONE202218,
title = {Impact of Left Ventricular Ejection Fraction on Procedural and Long-Term Outcomes of Bifurcation Percutaneous Coronary Intervention},
author = {Guglielmo Gallone and Jeehoon Kang and Francesco Bruno and Jung-Kyu Han and Ovidio De Filippo and Han-Mo Yang and Mattia Doronzo and Kyung-Woo Park and Gianluca Mittone and Hyun-Jae Kang and Radoslaw Parma and Hyeon-Cheol Gwon and Enrico Cerrato and Woo Jung Chun and Grzegorz Smolka and Seung-Ho Hur and Gerard Helft and Seung Hwan Han and Saverio Muscoli and Young Bin Song and Filippo Figini and Ki Hong Choi and Giacomo Boccuzzi and Soon-Jun Hong and Daniela Trabattoni and Chang-Wook Nam and Massimo Giammaria and Hyo-Soo Kim and Federico Conrotto and Javier Escaned and Carlo Di Mario and Fabrizio D'Ascenzo and Bon-Kwon Koo and Gaetano Maria Ferrari},
url = {https://www.sciencedirect.com/science/article/pii/S0002914922001692},
doi = {10.1016/j.amjcard.2022.02.015},
issn = {0002-9149},
year = {2022},
date = {2022-01-01},
journal = {The American Journal of Cardiology},
volume = {172},
pages = {18--25},
abstract = {The association of left ventricular ejection fraction (LVEF) with procedural and long-term outcomes after state-of-the-art percutaneous coronary intervention (PCI) of bifurcation lesions remains unsettled. A total of 5,333 patients who underwent contemporary coronary bifurcation PCI were included in the intercontinental retrospective combined insights from the unified RAIN (veRy thin stents for patients with left mAIn or bifurcatioN in real life) and COBIS (COronary BIfurcation Stenting) III bifurcation registries. Of 5,003 patients (93.8%) with known baseline LVEF, 244 (4.9%) had LVEF <40% (bifurcation with reduced ejection fraction [BIFrEF] group), 430 (8.6%) had LVEF 40% to 49% (bifurcation with mildly reduced ejection fraction [BIFmEF] group) and 4,329 (86.5%) had ejection fraction (EF) ≥50% (bifurcation with preserved ejection fraction [BIFpEF] group). The primary end point was the Kaplan-Meier estimate of major adverse cardiac events (MACEs) (a composite of all-cause death, myocardial infarction, and target vessel revascularization). Patients with BIFrEF had a more complex clinical profile and coronary anatomy. No difference in procedural (30 days) MACE was observed across EF categories, also after adjustment for in-study outcome predictors (BIFrEF vs BIFmEF: adjusted hazard ratio [adj-HR] 1.39, 95% confidence interval [CI] 0.37 to 5.21},
keywords = {ai, cardio},
pubstate = {published},
tppubtype = {article}
}
Adriano Marques Garcia, Dalvan Griebler, Claudio Schepke, Luiz Gustavo Fernandes
SPBench: a framework for creating benchmarks of stream processing applications Journal Article
In: Computing, vol. 105, no. 5, pp. 1077–1099, 2022, ISSN: 1436-5057.
Abstract | Links | BibTeX | Tags: parallel
@article{GARCIA:Computing:22,
title = {SPBench: a framework for creating benchmarks of stream processing applications},
author = {Adriano Marques Garcia and Dalvan Griebler and Claudio Schepke and Luiz Gustavo Fernandes},
url = {https://iris.unito.it/retrieve/f17ea8c2-ddd8-425b-b4e7-8315218a6969/s00607-021-01025-6_preprint.pdf},
doi = {10.1007/s00607-021-01025-6},
issn = {1436-5057},
year = {2022},
date = {2022-01-01},
journal = {Computing},
volume = {105},
number = {5},
pages = {1077--1099},
publisher = {Springer},
abstract = {In a fast-changing data-driven world, real-time data processing systems are becoming ubiquitous in everyday applications. The increasing data we produce, such as audio, video, image, and, text are demanding quickly and efficiently computation. Stream Parallelism allows accelerating this computation for real-time processing. But it is still a challenging task and most reserved for experts. In this paper, we present SPBench, a framework for benchmarking stream processing applications. It aims to support users with a set of real-world stream processing applications, which are made accessible through an Application Programming Interface (API) and executable via Command Line Interface (CLI) to create custom benchmarks. We tested SPBench by implementing parallel benchmarks with Intel Threading Building Blocks (TBB), FastFlow, and SPar. This evaluation provided useful insights and revealed the feasibility of the proposed framework in terms of usage, customization, and performance analysis. SPBench demonstrated to be a high-level, reusable, extensible, and easy of use abstraction to build parallel stream processing benchmarks on multi-core architectures.},
keywords = {parallel},
pubstate = {published},
tppubtype = {article}
}
2021
Amirmasoud Ghiassi, Robert Birke, Lydia Y. Chen
TrustNet: Learning from Trusted Data Against (A)symmetric Label Noise Proceedings Article
In: 8th IEEE/ACM International Conference on Big Data Computing, Applications and Technologies (BDCAT), pp. 52–62, ACM, 2021.
Abstract | Links | BibTeX | Tags:
@inproceedings{bdcat-ghiassi21,
title = {TrustNet: Learning from Trusted Data Against (A)symmetric Label Noise},
author = {Amirmasoud Ghiassi and Robert Birke and Lydia Y. Chen},
url = {https://doi.org/10.1145/3492324.3494166},
doi = {10.1145/3492324.3494166},
year = {2021},
date = {2021-12-01},
booktitle = {8th IEEE/ACM International Conference on Big Data Computing, Applications and Technologies (BDCAT)},
pages = {52--62},
publisher = {ACM},
abstract = {Big Data systems allow collecting massive datasets to feed the data hungry deep learning. Labelling these ever-bigger datasets is increasingly challenging and label errors affect even highly curated sets. This makes robustness to label noise a critical property for weakly-supervised classifiers. The related works on resilient deep networks tend to focus on a limited set of synthetic noise patterns, and with disparate views on their impacts, e.g., robustness against symmetric v.s. asymmetric noise patterns. In this paper, we first extend the theoretical analysis of test accuracy for any given noise patterns. Based on the insights, we design TrustNet that first learns the pattern of noise corruption, being it both symmetric or asymmetric, from a small set of trusted data. Then, TrustNet is trained via a robust loss function, which weights the given labels against the inferred labels from the learned noise pattern. The weight is adjusted based on model uncertainty across training epochs. We evaluate TrustNet on synthetic label noise for CIFAR-10, CIFAR-100 and big real-world data with label noise, i.e., Clothing1M. We compare against state-of-the-art methods demonstrating the strong robustness of TrustNet under a diverse set of noise patterns.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Zilong Zhao, Aditya Kunar, Robert Birke, Lydia Y. Chen
CTAB-GAN: Effective Table Data Synthesizing Proceedings Article
In: Balasubramanian, Vineeth N., Tsang, Ivor (Ed.): Proceedings of The 13th Asian Conference on Machine Learning, pp. 97–112, PMLR, 2021.
Abstract | Links | BibTeX | Tags:
@inproceedings{pmlr-v157-zhao21a,
title = {CTAB-GAN: Effective Table Data Synthesizing},
author = {Zilong Zhao and Aditya Kunar and Robert Birke and Lydia Y. Chen},
editor = {Vineeth N. Balasubramanian and Ivor Tsang},
url = {https://proceedings.mlr.press/v157/zhao21a.html},
year = {2021},
date = {2021-11-01},
booktitle = {Proceedings of The 13th Asian Conference on Machine Learning},
volume = {157},
pages = {97--112},
publisher = {PMLR},
series = {Proceedings of Machine Learning Research},
abstract = {While data sharing is crucial for knowledge development, privacy concerns and strict regulation (e.g., European General Data Protection Regulation (GDPR)) unfortunately limit its full effectiveness. Synthetic tabular data emerges as an alternative to enable data sharing while fulfilling regulatory and privacy constraints. The state-of-the-art tabular data synthesizers draw methodologies from Generative Adversarial Networks (GAN) and address two main data types in industry, i.e., continuous and categorical. In this paper, we develop CTAB-GAN, a novel conditional table GAN architecture that can effectively model diverse data types, including a mix of continuous and categorical variables. Moreover, we address data imbalance and long tail issues, i.e., certain variables have drastic frequency differences across large values. To achieve those aims, we first introduce the information loss, classification loss and generator loss to the conditional GAN. Secondly, we design a novel conditional vector, which efficiently encodes the mixed data type and skewed distribution of data variable. We extensively evaluate CTAB-GAN with the state of the art GANs that generate synthetic tables, in terms of data similarity and analysis utility. The results on five datasets show that the synthetic data of CTAB-GAN remarkably resembles the real data for all three types of variables and results into higher accuracy for five machine learning algorithms, by up to 17%.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Taraneh Younesian, Zilong Zhao, Amirmasoud Ghiassi, Robert Birke, Lydia Y Chen
QActor: Active Learning on Noisy Labels Proceedings Article
In: Balasubramanian, Vineeth N., Tsang, Ivor (Ed.): Proceedings of The 13th Asian Conference on Machine Learning, pp. 548–563, PMLR, 2021.
Abstract | Links | BibTeX | Tags:
@inproceedings{pmlr-v157-younesian21a,
title = {QActor: Active Learning on Noisy Labels},
author = {Taraneh Younesian and Zilong Zhao and Amirmasoud Ghiassi and Robert Birke and Lydia Y Chen},
editor = {Vineeth N. Balasubramanian and Ivor Tsang},
url = {https://proceedings.mlr.press/v157/younesian21a.html},
year = {2021},
date = {2021-11-01},
booktitle = {Proceedings of The 13th Asian Conference on Machine Learning},
volume = {157},
pages = {548--563},
publisher = {PMLR},
series = {Proceedings of Machine Learning Research},
abstract = {Noisy labeled data is more a norm than a rarity for self-generated content that is continuously published on the web and social media from non-experts. Active querying experts are conventionally adopted to provide labels for the informative samples which don't have labels, instead of possibly incorrect labels. The new challenge that arises here is how to discern the informative and noisy labels which benefit from expert cleaning. In this paper, we aim to leverage the stringent oracle budget to robustly maximize learning accuracy. We propose a noise-aware active learning framework, QActor, and a novel measure CENT, which considers both cross-entropy and entropy to select informative and noisy labels for an expert cleansing. QActor iteratively cleans samples via quality models and actively querying an expert on those noisy yet informative samples. To adapt to learning capacity per iteration, QActor dynamically adjusts the query limit according to the learning loss for each learning iteration. We extensively evaluate different image datasets with noise label ratios ranging between 30% and 60%. Our results show that QActor can nearly match the optimal accuracy achieved using only clean data at the cost of only an additional 10% of ground truth data from the oracle.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Giuliano Albanese, Robert Birke, Georgia Giannopoulou, Sandro Schönborn, Thanikesavan Sivanthi
Evaluation of Networking Options for Containerized Deployment of Real-Time Applications Proceedings Article
In: 26th IEEE International Conference on Emerging Technologies and Factory Automation (ETFA), pp. 1–8, IEEE, 2021.
Abstract | Links | BibTeX | Tags:
@inproceedings{etfa-albanese21,
title = {Evaluation of Networking Options for Containerized Deployment of Real-Time Applications},
author = {Giuliano Albanese and Robert Birke and Georgia Giannopoulou and Sandro Schönborn and Thanikesavan Sivanthi},
url = {https://doi.org/10.1109/ETFA45728.2021.9613320},
doi = {10.1109/ETFA45728.2021.9613320},
year = {2021},
date = {2021-09-01},
booktitle = {26th IEEE International Conference on Emerging Technologies and Factory Automation (ETFA)},
pages = {1--8},
publisher = {IEEE},
abstract = {Enterprises in the field of industrial automation experience an increasing demand for providing virtualized software solutions. Inspired by the recent trends in serverless and cloud computing, software virtualization is considered even for safety-critical applications with hard real-time requirements, as a means of avoiding hardware vendor lock-in and reducing volume and maintenance cost of devices. In this work, we evaluate the applicability of OS-level virtualization to an industrial automation use case. Our application runs in Docker containers on top of Linux patched with PREEMPT_RT. We investigate the ability of Docker coupled with diverse networking technologies to fulfill the latency requirements of the application under normal or heavy system load. We empirically compare four networking technologies with respect to communication latency and frequency of missing packets. The results indicate that Docker with certain technologies, such as the Single Root I/O Virtualization interface, performs robustly even under heavy load, enabling sufficient performance isolation and low overhead that does not jeopardise the real-time performance of our application.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Giovanni Agosta, William Fornaciari, Andrea Galimberti, Giuseppe Massari, Federico Reghenzani, Federico Terraneo, Davide Zoni, Carlo Brandolese, Massimo Celino, Francesco Iannone, Paolo Palazzari, Giuseppe Zummo, Massimo Bernaschi, Pasqua D'Ambra, Sergio Saponara, Marco Danelutto, Massimo Torquati, Marco Aldinucci, Yasir Arfat, Barbara Cantalupo, Iacopo Colonnelli, Roberto Esposito, Alberto Riccardo Martinelli, Gianluca Mittone, Olivier Beaumont, Berenger Bramas, Lionel Eyraud-Dubois, Brice Goglin, Abdou Guermouche, Raymond Namyst, Samuel Thibault, Antonio Filgueras, Miquel Vidal, Carlos Alvarez, Xavier Martorell, Ariel Oleksiak, Michal Kulczewski, Alessandro Lonardo, Piero Vicini, Francesco Lo Cicero, Francesco Simula, Andrea Biagioni, Paolo Cretaro, Ottorino Frezza, Pier Stanislao Paolucci, Matteo Turisini, Francesco Giacomini, Tommaso Boccali, Simone Montangero, Roberto Ammendola
TEXTAROSSA: Towards EXtreme scale Technologies and Accelerators for euROhpc hw/Sw Supercomputing Applications for exascale Proceedings Article
In: Proc. of the 24th Euromicro Conference on Digital System Design (DSD), IEEE, Palermo, Italy, 2021.
Abstract | Links | BibTeX | Tags: streamflow, textarossa
@inproceedings{21:DSD:textarossa,
title = {TEXTAROSSA: Towards EXtreme scale Technologies and Accelerators for euROhpc hw/Sw Supercomputing Applications for exascale},
author = {Giovanni Agosta and William Fornaciari and Andrea Galimberti and Giuseppe Massari and Federico Reghenzani and Federico Terraneo and Davide Zoni and Carlo Brandolese and Massimo Celino and Francesco Iannone and Paolo Palazzari and Giuseppe Zummo and Massimo Bernaschi and Pasqua D'Ambra and Sergio Saponara and Marco Danelutto and Massimo Torquati and Marco Aldinucci and Yasir Arfat and Barbara Cantalupo and Iacopo Colonnelli and Roberto Esposito and Alberto Riccardo Martinelli and Gianluca Mittone and Olivier Beaumont and Berenger Bramas and Lionel Eyraud-Dubois and Brice Goglin and Abdou Guermouche and Raymond Namyst and Samuel Thibault and Antonio Filgueras and Miquel Vidal and Carlos Alvarez and Xavier Martorell and Ariel Oleksiak and Michal Kulczewski and Alessandro Lonardo and Piero Vicini and Francesco Lo Cicero and Francesco Simula and Andrea Biagioni and Paolo Cretaro and Ottorino Frezza and Pier Stanislao Paolucci and Matteo Turisini and Francesco Giacomini and Tommaso Boccali and Simone Montangero and Roberto Ammendola},
doi = {10.1109/DSD53832.2021.00051},
year = {2021},
date = {2021-08-01},
booktitle = {Proc. of the 24th Euromicro Conference on Digital System Design (DSD)},
publisher = {IEEE},
address = {Palermo, Italy},
abstract = {To achieve high performance and high energy efficiency on near-future exascale computing systems, three key technology gaps needs to be bridged. These gaps include: energy efficiency and thermal control; extreme computation efficiency via HW acceleration and new arithmetics; methods and tools for seamless integration of reconfigurable accelerators in heterogeneous HPC multi-node platforms. TEXTAROSSA aims at tackling this gap through a co-design approach to heterogeneous HPC solutions, supported by the integration and extension of HW and SW IPs, programming models and tools derived from European research.},
keywords = {streamflow, textarossa},
pubstate = {published},
tppubtype = {inproceedings}
}
Amirmasoud Ghiassi, Robert Birke, Rui Han, Lydia Y. Chen
LABELNET: Recovering Noisy Labels Proceedings Article
In: International Joint Conference on Neural Networks (IJCNN), pp. 1–8, IEEE, 2021.
Abstract | Links | BibTeX | Tags:
@inproceedings{ijcnn-ghiassi21,
title = {LABELNET: Recovering Noisy Labels},
author = {Amirmasoud Ghiassi and Robert Birke and Rui Han and Lydia Y. Chen},
url = {https://doi.org/10.1109/IJCNN52387.2021.9533562},
doi = {10.1109/IJCNN52387.2021.9533562},
year = {2021},
date = {2021-07-01},
booktitle = {International Joint Conference on Neural Networks (IJCNN)},
pages = {1--8},
publisher = {IEEE},
abstract = {Today's available datasets in the wild, e.g., from social media and open platforms, present tremendous opportunities and challenges for deep learning, as there is a significant portion of tagged images, but often with noisy, i.e. erroneous, labels. Recent studies improve the robustness of deep models against noisy labels without the knowledge of true labels. In this paper, we advocate to derive a stronger classifier which proactively makes use of the noisy labels in addition to the original images - turning noisy labels into learning features. To such an end, we propose a novel framework, LABELNET, composed of Amateur and Expert, which iteratively learn from each other. Amateur is a regular image classifier trained by the feedback of Expert, which imitates how human experts would correct the predicted labels from Amateur using the noise pattern learnt from the knowledge of both the noisy and ground truth labels. The trained Amateur and Expert proactively leverage the images and their noisy labels to infer image classes. Our empirical evaluations on noisy versions of MNIST, CIFAR-10, CIFAR-100 and real-world data of Clothing1M show that the proposed model can achieve robust classification against a wide range of noise ratios and with as little as 20-50% training data, compared to state-of-the-art deep models that solely focus on distilling the impact of noisy labels.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Giovanni Agosta, Antonio Andreini, Claudio A. Ardagna, Andrea Bartolini, Alessandro Cilardo, Biagio Cosenza, Marco Danelutto, Roberto Esposito, William Fornaciari, Roberto Giorgi, Davide Lengani, Raffaele Montella, Mauro Olivieri, Sergio Saponara, Daniele Simoni, Massimo Torquati
The Italian research on HPC key technologies across EuroHPC Proceedings Article
In: ACM Computing Frontiers, pp. 279–286, ACM, Virtual Conference, Italy, 2021.
Abstract | Links | BibTeX | Tags: admire, eupex, eupilot, textarossa
@inproceedings{21:CINI_acm_CF,
title = {The Italian research on HPC key technologies across EuroHPC},
author = {Marco Aldinucci and Giovanni Agosta and Antonio Andreini and Claudio A. Ardagna and Andrea Bartolini and Alessandro Cilardo and Biagio Cosenza and Marco Danelutto and Roberto Esposito and William Fornaciari and Roberto Giorgi and Davide Lengani and Raffaele Montella and Mauro Olivieri and Sergio Saponara and Daniele Simoni and Massimo Torquati},
url = {https://iris.unito.it/retrieve/handle/2318/1783118/744641/preprint.pdf},
doi = {10.1145/3457388.3458508},
year = {2021},
date = {2021-05-01},
booktitle = {ACM Computing Frontiers},
pages = {279--286},
publisher = {ACM},
address = {Virtual Conference, Italy},
abstract = {High-Performance Computing (HPC) is one of the strategic priorities for research and innovation worldwide due to its relevance for industrial and scientific applications. We envision HPC as composed of three pillars: infrastructures, applications, and key technologies and tools. While infrastructures are by construction centralized in large-scale HPC centers, and applications are generally within the purview of domain-specific organizations, key technologies fall in an intermediate case where coordination is needed, but design and development are often decentralized. A large group of Italian researchers has started a dedicated laboratory within the National Interuniversity Consortium for Informatics (CINI) to address this challenge. The laboratory, albeit young, has managed to succeed in its first attempts to propose a coordinated approach to HPC research within the EuroHPC Joint Undertaking, participating in the calls 2019-20 to five successful proposals for an aggregate total cost of 95M Euro. In this paper, we outline the working group's scope and goals and provide an overview of the five funded projects, which become fully operational in March 2021, and cover a selection of key technologies provided by the working group partners, highlighting their usage development within the projects.},
keywords = {admire, eupex, eupilot, textarossa},
pubstate = {published},
tppubtype = {inproceedings}
}
Carmelo Pino, Simone Palazzo, Francesca Trenta, Francesca Cordero, Ulas Bagci, Francesco Rundo, Sebastiano Battiato, Daniela Giordano, Marco Aldinucci, Concetto Spampinato
Interpretable Deep Model for Predicting Gene-Addicted Non-Small-Cell Lung Cancer in CT Scans Proceedings Article
In: 18th IEEE Intl. Symposium on Biomedical Imaging (ISBI), IEEE, Nice, France, 2021.
Abstract | Links | BibTeX | Tags: deephealth
@inproceedings{21:ct:isbi,
  author     = {Pino, Carmelo and Palazzo, Simone and Trenta, Francesca and Cordero, Francesca and Bagci, Ulas and Rundo, Francesco and Battiato, Sebastiano and Giordano, Daniela and Aldinucci, Marco and Spampinato, Concetto},
  title      = {Interpretable Deep Model for Predicting Gene-Addicted Non-Small-Cell Lung Cancer in CT Scans},
  booktitle  = {18th IEEE Intl. Symposium on Biomedical Imaging (ISBI)},
  publisher  = {IEEE},
  address    = {Nice, France},
  year       = {2021},
  date       = {2021-04-01},
  doi        = {10.1109/ISBI48211.2021.9433832},
  url        = {https://iris.unito.it/retrieve/handle/2318/1790376/764762/21_ISBI_smallcell.pdf},
  abstract   = {Genetic profiling and characterization of lung cancers have recently emerged as a new technique for targeted therapeutic treatment based on immunotherapy or molecular drugs. However, the most effective way to discover specific gene mutations through tissue biopsy has several limitations, from invasiveness to being a risky procedure. Recently, quantitative assessment of visual features from CT data has been demonstrated to be a valid alternative to biopsy for the diagnosis of gene-addicted tumors. In this paper, we present a deep model for automated lesion segmentation and classification as gene-addicted or not. The segmentation approach extends the 2D Tiramisu architecture for 3D segmentation through dense blocks and squeeze-and-excitation layers, while a multi-scale 3D CNN is used for lesion classification. We also train our model with adversarial samples, and show that this approach acts as a gradient regularizer and enhances model interpretability. We also built a dataset, the first of its nature, consisting of 73 CT scans annotated with the presence of a specific genomics profile. We test our approach on this dataset achieving a segmentation accuracy of 93.11% (Dice score) and a classification accuracy in identifying oncogene-addicted lung tumors of 82.00%.},
  keywords   = {deephealth},
  pubstate   = {published},
  tppubtype  = {inproceedings}
}
Chi Hong, Amirmasoud Ghiassi, Yichi Zhou, Robert Birke, Lydia Y. Chen
Online Label Aggregation: A Variational Bayesian Approach Proceedings Article
In: Leskovec, Jure, Grobelnik, Marko, Najork, Marc, Tang, Jie, Zia, Leila (Ed.): WWW '21: The Web Conference 2021, pp. 1904–1915, ACM / IW3C2, 2021.
Abstract | Links | BibTeX | Tags: ai
@inproceedings{www-hong21,
title = {Online Label Aggregation: A Variational Bayesian Approach},
author = {Chi Hong and Amirmasoud Ghiassi and Yichi Zhou and Robert Birke and Lydia Y. Chen},
editor = {Jure Leskovec and Marko Grobelnik and Marc Najork and Jie Tang and Leila Zia},
url = {https://doi.org/10.1145/3442381.3449933},
doi = {10.1145/3442381.3449933},
year = {2021},
date = {2021-04-01},
booktitle = {WWW '21: The Web Conference 2021},
pages = {1904--1915},
publisher = {ACM / IW3C2},
abstract = {Noisy labeled data is more a norm than a rarity for crowd sourced contents. It is effective to distill noise and infer correct labels through aggregating results from crowd workers. To ensure the time relevance and overcome slow responses of workers, online label aggregation is increasingly requested, calling for solutions that can incrementally infer true label distribution via subsets of data items. In this paper, we propose a novel online label aggregation framework, BiLA, which employs variational Bayesian inference method and designs a novel stochastic optimization scheme for incremental training. BiLA is flexible to accommodate any generating distribution of labels by the exact computation of its posterior distribution. We also derive the convergence bound of the proposed optimizer. We compare BiLA with the state of the art based on minimax entropy, neural networks and expectation maximization algorithms, on synthetic and real-world data sets. Our evaluation results on various online scenarios show that BiLA can effectively infer the true labels, with an error rate reduction of at least 10 to 1.5 percent points for synthetic and real-world datasets, respectively.},
keywords = {ai},
pubstate = {published},
tppubtype = {inproceedings}
}
Adriano Marques Garcia, Dalvan Griebler, Claudio Schepke, Luiz Gustavo Fernandes
Introducing a Stream Processing Framework for Assessing Parallel Programming Interfaces Proceedings Article
In: 29th Euromicro International Conference on Parallel, Distributed and Network-Based Processing (PDP), pp. 84–88, IEEE, Valladolid, Spain, 2021.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{GARCIA:PDP:21,
title = {Introducing a Stream Processing Framework for Assessing Parallel Programming Interfaces},
author = {Adriano Marques Garcia and Dalvan Griebler and Claudio Schepke and Luiz Gustavo Fernandes},
url = {https://iris.unito.it/retrieve/8aa73a3f-0b1f-41e4-9440-a87bbaf6e9c4/PDP_2021__Stream_bench_Framework_.pdf},
doi = {10.1109/PDP52278.2021.00021},
year = {2021},
date = {2021-03-01},
booktitle = {29th Euromicro International Conference on Parallel, Distributed and Network-Based Processing (PDP)},
pages = {84--88},
publisher = {IEEE},
address = {Valladolid, Spain},
series = {PDP'21},
abstract = {Stream Processing applications are spread across different sectors of industry and people's daily lives. The increasing data we produce, such as audio, video, image, and text are demanding quickly and efficiently computation. It can be done through Stream Parallelism, which is still a challenging task and most reserved for experts. We introduce a Stream Processing framework for assessing Parallel Programming Interfaces (PPIs). Our framework targets multi-core architectures and C++ stream processing applications, providing an API that abstracts the details of the stream operators of these applications. Therefore, users can easily identify all the basic operators and implement parallelism through different PPIs. In this paper, we present the proposed framework, implement three applications using its API, and show how it works, by using it to parallelize and evaluate the applications with the PPIs Intel TBB, FastFlow, and SPar. The performance results were consistent with the literature.},
keywords = {parallel},
pubstate = {published},
tppubtype = {inproceedings}
}
Bart Cox, Jeroen Galjaard, Amirmasoud Ghiassi, Robert Birke, Lydia Y. Chen
Masa: Responsive Multi-DNN Inference on the Edge Proceedings Article
In: 19th IEEE International Conference on Pervasive Computing and Communications (PerCom), pp. 1–10, IEEE, 2021.
Abstract | Links | BibTeX | Tags:
@inproceedings{percom-cox21a,
title = {{Masa}: Responsive {Multi-DNN} Inference on the Edge},
author = {Bart Cox and Jeroen Galjaard and Amirmasoud Ghiassi and Robert Birke and Lydia Y. Chen},
url = {https://doi.org/10.1109/PERCOM50583.2021.9439111},
doi = {10.1109/PERCOM50583.2021.9439111},
year = {2021},
date = {2021-03-01},
booktitle = {19th IEEE International Conference on Pervasive Computing and Communications (PerCom)},
pages = {1--10},
publisher = {IEEE},
abstract = {Deep neural networks (DNNs) are becoming the core components of many applications running on edge devices, especially for real time image-based analysis. Increasingly, multi-faced knowledge is extracted via executing multiple DNNs inference models, e.g., identifying objects, faces, and genders from images. The response times of multi-DNN highly affect users' quality of experience and safety as well. Different DNNs exhibit diversified resource requirements and execution patterns across layers and networks, which may easily exceed the available device memory and riskily degrade the responsiveness. In this paper, we design and implement Masa, a responsive memory-aware multi-DNN execution framework, an on-device middleware featuring on modeling inter- and intra-network dependency and leveraging complimentary memory usage of each layer. Masa can consistently ensure the average response time when deterministically and stochastically executing multiple DNN-based image analyses. We extensively evaluate Masa on three configurations of Raspberry Pi and a large set of popular DNN models triggered by different generation patterns of images. Our evaluation results show that Masa can achieve lower average response times by up to 90% on devices with small memory, i.e., 512 MB to 1 GB, compared to the state of the art multi-DNN scheduling solutions.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Jeroen Galjaard, Bart Cox, Amirmasoud Ghiassi, Lydia Y. Chen, Robert Birke
MemA: Fast Inference of Multiple Deep Models Proceedings Article
In: 19th IEEE International Conference on Pervasive Computing and Communications Workshops and other Affiliated Events, pp. 281–286, IEEE, 2021.
Abstract | Links | BibTeX | Tags:
@inproceedings{percom-galjaard21,
title = {{MemA}: Fast Inference of Multiple Deep Models},
author = {Jeroen Galjaard and Bart Cox and Amirmasoud Ghiassi and Lydia Y. Chen and Robert Birke},
url = {https://doi.org/10.1109/PerComWorkshops51409.2021.9430952},
doi = {10.1109/PerComWorkshops51409.2021.9430952},
year = {2021},
date = {2021-03-01},
booktitle = {19th IEEE International Conference on Pervasive Computing and Communications Workshops and other Affiliated Events},
pages = {281--286},
publisher = {IEEE},
abstract = {The execution of deep neural network (DNN) inference jobs on edge devices has become increasingly popular. Multiple of such inference models can concurrently analyse the on-device data, e.g. images, to extract valuable insights. Prior art focuses on low-power accelerators, compressed neural network architectures, and specialized frameworks to reduce execution time of single inference jobs on edge devices which are resource constrained. However, it is little known how different scheduling policies can further improve the runtime performance of multi-inference jobs without additional edge resources. To enable the exploration of scheduling policies, we first develop an execution framework, EdgeCaffe, which splits the DNN inference jobs by loading and execution of each network layer. We empirically characterize the impact of loading and scheduling policies on the execution time of multi-inference jobs and point out their dependency on the available memory space. We propose a novel memory-aware scheduling policy, MemA, which opportunistically interleaves the executions of different types of DNN layers based on their estimated run-time memory demands. Our evaluation on exhaustive combinations of five networks, data inputs, and memory configurations show that MemA can alleviate the degradation of execution times of multi-inference (up to 5×) under severely constrained memory compared to standard scheduling policies without affecting accuracy.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Gianluca Bontempi, Ricardo Chavarriaga, Hans De Canck, Emanuela Girardi, Holger Hoos, Iarla Kilbane‐Dawe, Tonio Ball, Ann Nowé, Jose Sousa, Davide Bacciu, Marco Aldinucci, Manlio De Domenico, Alessandro Saffiotti, Marco Maratea
The CLAIRE COVID-19 initiative: approach, experiences and recommendations Journal Article
In: Ethics and Information Technology, 2021.
Abstract | Links | BibTeX | Tags: deephealth
@article{21:eit:covidclaire,
title = {The {CLAIRE} {COVID-19} initiative: approach, experiences and recommendations},
author = {Gianluca Bontempi and Ricardo Chavarriaga and Hans {De Canck} and Emanuela Girardi and Holger Hoos and Iarla Kilbane-Dawe and Tonio Ball and Ann Nowé and Jose Sousa and Davide Bacciu and Marco Aldinucci and Manlio {De Domenico} and Alessandro Saffiotti and Marco Maratea},
url = {https://iris.unito.it/retrieve/handle/2318/1784271/747923/Bontempi2021_Article_TheCLAIRECOVID-19InitiativeApp-3.pdf},
doi = {10.1007/s10676-020-09567-7},
year = {2021},
date = {2021-02-01},
journal = {Ethics and Information Technology},
publisher = {Springer},
abstract = {A volunteer effort by Artificial Intelligence (AI) researchers has shown it can deliver significant research outcomes rapidly to help tackle COVID-19. Within two months, CLAIRE's self-organising volunteers delivered the World's first comprehensive curated repository of COVID-19-related datasets useful for drug-repurposing, drafted review papers on the role CT/X-ray scan analysis and robotics could play, and progressed research in other areas. Given the pace required and nature of voluntary efforts, the teams faced a number of challenges. These offer insights in how better to prepare for future volunteer scientific efforts and large scale, data-dependent AI collaborations in general. We offer seven recommendations on how to best leverage such efforts and collaborations in the context of managing future crises.},
keywords = {deephealth},
pubstate = {published},
tppubtype = {article}
}
Ivan Lanese, Doriana Medić, Claudio Antares Mezzina
Static versus dynamic reversibility in CCS Journal Article
In: Acta Informatica, vol. 58, pp. 1–34, 2021.
Abstract | Links | BibTeX | Tags: semantics
@article{21:journals:LaneseMM21,
title = {Static versus dynamic reversibility in {CCS}},
author = {Ivan Lanese and Doriana Medić and Claudio Antares Mezzina},
url = {https://doi.org/10.1007/s00236-019-00346-6},
doi = {10.1007/s00236-019-00346-6},
year = {2021},
date = {2021-01-01},
journal = {Acta Informatica},
volume = {58},
pages = {1--34},
abstract = {The notion of reversible computing is attracting interest because of its applications in diverse fields, in particular the study of programming abstractions for fault tolerant systems. Most computational models are not naturally reversible since computation causes loss of information, and history information must be stored to enable reversibility. In the literature, two approaches to reverse the CCS process calculus exist, differing on how history information is kept. Reversible CCS (RCCS), proposed by Danos and Krivine, exploits dedicated stacks of memories attached to each thread. CCS with Keys (CCSK), proposed by Phillips and Ulidowski, makes CCS operators static so that computation does not cause information loss. In this paper we show that RCCS and CCSK are equivalent in terms of LTS isomorphism.},
keywords = {semantics},
pubstate = {published},
tppubtype = {article}
}
Clément Aubert, Doriana Medić
Explicit Identifiers and Contexts in Reversible Concurrent Calculus Proceedings Article
In: Reversible Computation - 13th International Conference, RC 2021, Virtual Event, July 7-8, 2021, Proceedings, Springer, 2021.
Abstract | Links | BibTeX | Tags: semantics
@inproceedings{21:RC:AubertM21,
title = {Explicit Identifiers and Contexts in Reversible Concurrent Calculus},
author = {Clément Aubert and Doriana Medić},
url = {https://doi.org/10.1007/978-3-030-79837-6_9},
doi = {10.1007/978-3-030-79837-6_9},
year = {2021},
date = {2021-01-01},
booktitle = {Reversible Computation - 13th International Conference, RC 2021, Virtual Event, July 7-8, 2021, Proceedings},
publisher = {Springer},
abstract = {Existing formalisms for the algebraic specification and representation of networks of reversible agents suffer some shortcomings. Despite multiple attempts, reversible declensions of the Calculus of Communicating Systems (CCS) do not offer satisfactory adaptation of notions usual in ``forward-only'' process algebras, such as replication or context. Existing formalisms disallow the ``hot-plugging'' of processes during their execution in contexts with their own past. They also assume the existence of ``eternally fresh'' keys or identifiers that, if implemented poorly, could result in unnecessary bottlenecks and look-ups involving all the threads. In this paper, we begin investigating those issues, by first designing a process algebra endowed with a mechanism to generate identifiers without the need to consult with the other threads. We use this calculus to recast the possible representations of non-determinism in CCS, and as a by-product establish a simple and straightforward definition of concurrency. Our reversible calculus is then proven to satisfy expected properties. We also observe that none of the reversible bisimulations defined thus far are congruences under our notion of ``reversible'' contexts.},
keywords = {semantics},
pubstate = {published},
tppubtype = {inproceedings}
}
C. Pino, G. Vecchio, Marco Fronda, Marco Calandri, Marco Aldinucci, Concetto Spampinato
TwinLiverNet: Predicting TACE Treatment Outcome from CT scans for Hepatocellular Carcinoma using Deep Capsule Networks Proceedings Article
In: 43rd Annual International Conference of the IEEE Engineering in Medicine & Biology Society, EMBC 2021, Mexico, November 1-5, 2021, pp. 3039–3043, IEEE, 2021.
Abstract | Links | BibTeX | Tags: ai
@inproceedings{21:DBLP:conf/embc/PinoVFCAS21,
title = {{TwinLiverNet}: Predicting {TACE} Treatment Outcome from {CT} scans for Hepatocellular Carcinoma using Deep Capsule Networks},
author = {C. Pino and G. Vecchio and Marco Fronda and Marco Calandri and Marco Aldinucci and Concetto Spampinato},
url = {https://doi.org/10.1109/EMBC46164.2021.9630913},
doi = {10.1109/EMBC46164.2021.9630913},
year = {2021},
date = {2021-01-01},
booktitle = {43rd Annual International Conference of the IEEE Engineering in Medicine \& Biology Society, EMBC 2021, Mexico, November 1-5, 2021},
pages = {3039--3043},
publisher = {IEEE},
abstract = {Predicting response to treatment plays a key role to assist radiologists in hepato-cellular carcinoma (HCC) therapy planning. The most widely used treatment for unresectable HCC is the trans-arterial chemoembolization (TACE). A complete radiological response after the first TACE is a reliable predictor of treatment favourable outcome. However, visual inspection of contrast-enhanced CT scans is time-consuming, error prone and too operator-dependent. Thus, in this paper we propose TwinLiverNet: a deep neural network that is able to predict TACE treatment outcome through learning visual cue from CT scans. TwinLiverNet, specifically, integrates 3D convolutions and capsule networks and is designed to process simultaneously late arterial and delayed phases from contrast-enhanced CTs. Experimental results carried out on a dataset consisting of 126 HCC lesions show that TwinLiverNet reaches an average accuracy of 82% in predicting complete response to TACE treatment. Furthermore, combining multiple CT phases (specifically, late arterial and delayed ones) yields a performance increase of over 12 percent points. Finally, the introduction of capsule layers into the model avoids the model to overfit, while enhancing accuracy. Clinical relevance— TwinLiverNet supports radiologists in visual inspection of CT scans to assess TACE treatment outcome, while reducing inter-operator variability.},
keywords = {ai},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Valentina Cesare, Iacopo Colonnelli, Alberto Riccardo Martinelli, Gianluca Mittone, Barbara Cantalupo
Practical Parallelization of a Laplace Solver with MPI Proceedings Article
In: Iannone, Francesco (Ed.): ENEA CRESCO in the fight against COVID-19, pp. 21–24, ENEA, 2021.
Abstract | BibTeX | Tags: hpc4ai
@inproceedings{21:laplace:enea,
title = {Practical Parallelization of a {Laplace} Solver with {MPI}},
author = {Marco Aldinucci and Valentina Cesare and Iacopo Colonnelli and Alberto Riccardo Martinelli and Gianluca Mittone and Barbara Cantalupo},
editor = {Francesco Iannone},
year = {2021},
date = {2021-01-01},
booktitle = {ENEA CRESCO in the fight against COVID-19},
pages = {21--24},
publisher = {ENEA},
abstract = {This work exposes a practical methodology for the semi-automatic parallelization of existing code. We show how a scientific sequential code can be parallelized through our approach. The obtained parallel code is only slightly different from the starting sequential one, providing an example of how little re-designing our methodology involves. The performance of the parallelized code, executed on the CRESCO6 cluster, is then exposed and discussed. We also believe in the educational value of this approach and suggest its use as a teaching device for students.},
keywords = {hpc4ai},
pubstate = {published},
tppubtype = {inproceedings}
}
Iacopo Colonnelli, Barbara Cantalupo, Concetto Spampinato, Matteo Pennisi, Marco Aldinucci
Bringing AI pipelines onto cloud-HPC: setting a baseline for accuracy of COVID-19 diagnosis Proceedings Article
In: Iannone, Francesco (Ed.): ENEA CRESCO in the fight against COVID-19, ENEA, 2021.
Abstract | Links | BibTeX | Tags: streamflow
@inproceedings{21:covi:enea,
title = {Bringing {AI} pipelines onto {cloud-HPC}: setting a baseline for accuracy of {COVID-19} diagnosis},
author = {Iacopo Colonnelli and Barbara Cantalupo and Concetto Spampinato and Matteo Pennisi and Marco Aldinucci},
editor = {Francesco Iannone},
url = {https://iris.unito.it/retrieve/handle/2318/1796029/779853/21_AI-pipelines_ENEA-COVID19.pdf},
doi = {10.5281/zenodo.5151511},
year = {2021},
date = {2021-01-01},
booktitle = {ENEA CRESCO in the fight against COVID-19},
publisher = {ENEA},
abstract = {HPC is an enabling platform for AI. The introduction of AI workloads in the HPC applications basket has non-trivial consequences both on the way of designing AI applications and on the way of providing HPC computing. This is the leitmotif of the convergence between HPC and AI. The formalized definition of AI pipelines is one of the milestones of HPC-AI convergence. If well conducted, it allows, on the one hand, to obtain portable and scalable applications. On the other hand, it is crucial for the reproducibility of scientific pipelines. In this work, we advocate the StreamFlow Workflow Management System as a crucial ingredient to define a parametric pipeline, called ``CLAIRE COVID-19 Universal Pipeline'', which is able to explore the optimization space of methods to classify COVID-19 lung lesions from CT scans, compare them for accuracy, and therefore set a performance baseline. The universal pipeline automatizes the training of many different Deep Neural Networks (DNNs) and many different hyperparameters. It, therefore, requires a massive computing power, which is found in traditional HPC infrastructure thanks to the portability-by-design of pipelines designed with StreamFlow. Using the universal pipeline, we identified a DNN reaching over 90% accuracy in detecting COVID-19 lesions in CT scans.},
keywords = {streamflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Ovidio De Filippo, Jeehoon Kang, Francesco Bruno, Jung-Kyu Han, Andrea Saglietto, Han-Mo Yang, Giuseppe Patti, Kyung-Woo Park, Radoslaw Parma, Hyo-Soo Kim, Leonardo De Luca, Hyeon-Cheol Gwon, Mario Iannaccone, Woo Jung Chun, Grzegorz Smolka, Seung-Ho Hur, Enrico Cerrato, Seung Hwan Han, Carlo Mario, Young Bin Song, Javier Escaned, Ki Hong Choi, Gerard Helft, Joon-Hyung Doh, Alessandra Truffa Giachet, Soon-Jun Hong, Saverio Muscoli, Chang-Wook Nam, Guglielmo Gallone, Davide Capodanno, Daniela Trabattoni, Yoichi Imori, Veronica Dusi, Bernardo Cortese, Antonio Montefusco, Federico Conrotto, Iacopo Colonnelli, Imad Sheiban, Gaetano Maria Ferrari, Bon-Kwon Koo, Fabrizio D'Ascenzo
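Benefit of Extended Dual Antiplatelet Therapy Duration in Acute Coronary Syndrome Patients Treated with Drug Eluting Stents for Coronary Bifurcation Lesions (from the BIFURCAT Registry) Journal Article
In: The American Journal of Cardiology, 2021, ISSN: 0002-9149.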
Abstract | Links | BibTeX | Tags: ai, cardio
@article{21:ajc:bifurcat,
title = {Benefit of Extended Dual Antiplatelet Therapy Duration in Acute Coronary Syndrome Patients Treated with Drug Eluting Stents for Coronary Bifurcation Lesions (from the {BIFURCAT} Registry)},
author = {Ovidio {De Filippo} and Jeehoon Kang and Francesco Bruno and Jung-Kyu Han and Andrea Saglietto and Han-Mo Yang and Giuseppe Patti and Kyung-Woo Park and Radoslaw Parma and Hyo-Soo Kim and Leonardo {De Luca} and Hyeon-Cheol Gwon and Mario Iannaccone and Woo Jung Chun and Grzegorz Smolka and Seung-Ho Hur and Enrico Cerrato and Seung Hwan Han and Carlo Mario and Young Bin Song and Javier Escaned and Ki Hong Choi and Gerard Helft and Joon-Hyung Doh and Alessandra Truffa Giachet and Soon-Jun Hong and Saverio Muscoli and Chang-Wook Nam and Guglielmo Gallone and Davide Capodanno and Daniela Trabattoni and Yoichi Imori and Veronica Dusi and Bernardo Cortese and Antonio Montefusco and Federico Conrotto and Iacopo Colonnelli and Imad Sheiban and Gaetano Maria {De Ferrari} and Bon-Kwon Koo and Fabrizio D'Ascenzo},
url = {https://www.sciencedirect.com/science/article/pii/S0002914921006354},
doi = {10.1016/j.amjcard.2021.07.005},
issn = {0002-9149},
year = {2021},
date = {2021-01-01},
journal = {The American Journal of Cardiology},
abstract = {Optimal dual antiplatelet therapy (DAPT) duration for patients undergoing percutaneous coronary intervention (PCI) for coronary bifurcations is an unmet issue. The BIFURCAT registry was obtained by merging two registries on coronary bifurcations. Three groups were compared in a two-by-two fashion: short-term DAPT (≤ 6 months), intermediate-term DAPT (6-12 months) and extended DAPT (>12 months). Major adverse cardiac events (MACE) (a composite of all-cause death, myocardial infarction (MI), target-lesion revascularization and stent thrombosis) were the primary endpoint. Single components of MACE were the secondary endpoints. Events were appraised according to the clinical presentation: chronic coronary syndrome (CCS) versus acute coronary syndrome (ACS). 5537 patients (3231 ACS, 2306 CCS) were included. After a median follow-up of 2.1 years (IQR 0.9-2.2), extended DAPT was associated with a lower incidence of MACE compared with intermediate-term DAPT (2.8% versus 3.4%, adjusted HR 0.23 [0.1-0.54], p <0.001), driven by a reduction of all-cause death in the ACS cohort. In the CCS cohort, an extended DAPT strategy was not associated with a reduced risk of MACE. In conclusion, among real-world patients receiving PCI for coronary bifurcation, an extended DAPT strategy was associated with a reduction of MACE in ACS but not in CCS patients.},
keywords = {ai, cardio},
pubstate = {published},
tppubtype = {article}
}
Yasir Arfat, Gianluca Mittone, Roberto Esposito, Barbara Cantalupo, Gaetano Maria De Ferrari, Marco Aldinucci
A Review of Machine Learning for Cardiology Journal Article
In: Minerva cardiology and angiology, 2021.
Abstract | Links | BibTeX | Tags: deephealth, hpc4ai
@article{21:ai4numbers:minerva,
title = {A Review of Machine Learning for Cardiology},
author = {Yasir Arfat and Gianluca Mittone and Roberto Esposito and Barbara Cantalupo and Gaetano Maria {De Ferrari} and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/handle/2318/1796298/780512/21_AI4numbers-preprint.pdf},
doi = {10.23736/s2724-5683.21.05709-4},
year = {2021},
date = {2021-01-01},
journal = {Minerva cardiology and angiology},
abstract = {This paper reviews recent cardiology literature and reports how Artificial Intelligence Tools (specifically, Machine Learning techniques) are being used by physicians in the field. Each technique is introduced with enough details to allow the understanding of how it works and its intent, but without delving into details that do not add immediate benefits and require expertise in the field. We specifically focus on the principal Machine Learning based risk scores used in cardiovascular research. After introducing them and summarizing their assumptions and biases, we discuss their merits and shortcomings. We report on how frequently they are adopted in the field and suggest why this is the case based on our expertise in Machine Learning. We complete the analysis by reviewing how corresponding statistical approaches compare with them. Finally, we discuss the main open issues in applying Machine Learning tools to cardiology tasks, also drafting possible future directions. Despite the growing interest in these tools, we argue that there are many still underutilized techniques: while Neural Networks are slowly being incorporated in cardiovascular research, other important techniques such as Semi-Supervised Learning and Federated Learning are still underutilized. The former would allow practitioners to harness the information contained in large datasets that are only partially labeled, while the latter would foster collaboration between institutions allowing building larger and better models.},
keywords = {deephealth, hpc4ai},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Valentina Cesare, Iacopo Colonnelli, Alberto Riccardo Martinelli, Gianluca Mittone, Barbara Cantalupo, Carlo Cavazzoni, Maurizio Drocco
Practical Parallelization of Scientific Applications with OpenMP, OpenACC and MPI Journal Article
In: Journal of Parallel and Distributed Computing, vol. 157, pp. 13–29, 2021.
Abstract | Links | BibTeX | Tags: HPC
@article{21:jpdc:loop,
title = {Practical Parallelization of Scientific Applications with {OpenMP}, {OpenACC} and {MPI}},
author = {Marco Aldinucci and Valentina Cesare and Iacopo Colonnelli and Alberto Riccardo Martinelli and Gianluca Mittone and Barbara Cantalupo and Carlo Cavazzoni and Maurizio Drocco},
url = {https://iris.unito.it/retrieve/handle/2318/1792557/770851/Practical_Parallelization_JPDC_preprint.pdf},
doi = {10.1016/j.jpdc.2021.05.017},
year = {2021},
date = {2021-01-01},
journal = {Journal of Parallel and Distributed Computing},
volume = {157},
pages = {13--29},
abstract = {This work aims at distilling a systematic methodology to modernize existing sequential scientific codes with a little re-designing effort, turning an old codebase into modern code, i.e., parallel and robust code. We propose a semi-automatic methodology to parallelize scientific applications designed with a purely sequential programming mindset, possibly using global variables, aliasing, random number generators, and stateful functions. We demonstrate that the same methodology works for the parallelization in the shared memory model (via OpenMP), message passing model (via MPI), and General Purpose Computing on GPU model (via OpenACC). The method is demonstrated parallelizing four real-world sequential codes in the domain of physics and material science. The methodology itself has been distilled in collaboration with MSc students of the Parallel Computing course at the University of Torino, that applied it for the first time to the project works that they presented for the final exam of the course. Every year the course hosts some special lectures from industry representatives, who present how they use parallel computing and offer codes to be parallelized.},
keywords = {HPC},
pubstate = {published},
tppubtype = {article}
}
Daniele D'Agostino, Ivan Merelli, Marco Aldinucci, Daniele Cesini
Hardware and Software Solutions for Energy-Efficient Computing in Scientific Programming Journal Article
In: Scientific Programming, vol. 2021, pp. 5514284, 2021, ISSN: 1058-9244.
Abstract | Links | BibTeX | Tags: HPC
@article{21:dagostino:lowpower,
title = {Hardware and Software Solutions for Energy-Efficient Computing in Scientific Programming},
author = {Daniele D'Agostino and Ivan Merelli and Marco Aldinucci and Daniele Cesini},
url = {https://downloads.hindawi.com/journals/sp/2021/5514284.pdf},
doi = {10.1155/2021/5514284},
issn = {1058-9244},
year = {2021},
date = {2021-01-01},
journal = {Scientific Programming},
volume = {2021},
pages = {5514284},
publisher = {Hindawi},
abstract = {Energy consumption is one of the major issues in today’s computer science, and an increasing number of scientific communities are interested in evaluating the tradeoff between time-to-solution and energy-to-solution. Despite, in the last two decades, computing which revolved around centralized computing infrastructures, such as supercomputing and data centers, the wide adoption of the Internet of Things (IoT) paradigm is currently inverting this trend due to the huge amount of data it generates, pushing computing power back to places where the data are generated—the so-called fog/edge computing. This shift towards a decentralized model requires an equivalent change in the software engineering paradigms, development environments, hardware tools, languages, and computation models for scientific programming because the local computational capabilities are typically limited and require a careful evaluation of power consumption. This paper aims to present how these concepts can be actually implemented in scientific software by presenting the state of the art of powerful, less power-hungry processors from one side and energy-aware tools and techniques from the other one.},
keywords = {HPC},
pubstate = {published},
tppubtype = {article}
}
Daniele D'Agostino, Pietro Liò, Marco Aldinucci, Ivan Merelli
Advantages of using graph databases to explore chromatin conformation capture experiments Journal Article
In: BMC Bioinformatics, vol. 22, no. 2, pp. 43–58, 2021, ISSN: 1471-2105.
Abstract | Links | BibTeX | Tags: deephealth, hpc4ai
@article{21:neohic:bmc,
title = {Advantages of using graph databases to explore chromatin conformation capture experiments},
author = {Daniele D'Agostino and Pietro Liò and Marco Aldinucci and Ivan Merelli},
url = {https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/s12859-020-03937-0.pdf},
doi = {10.1186/s12859-020-03937-0},
issn = {1471-2105},
year = {2021},
date = {2021-01-01},
journal = {BMC Bioinformatics},
volume = {22},
number = {2},
pages = {43--58},
abstract = {High-throughput sequencing Chromosome Conformation Capture (Hi-C) allows the study of DNA interactions and 3D chromosome folding at the genome-wide scale. Usually, these data are represented as matrices describing the binary contacts among the different chromosome regions. On the other hand, a graph-based representation can be advantageous to describe the complex topology achieved by the DNA in the nucleus of eukaryotic cells.},
keywords = {deephealth, hpc4ai},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci
L'infrastruttura necessaria per creare interoperabilità tra pubbliche amministrazioni Book Section
In: Cavallo Perin, Roberto (Ed.): L'amministrazione pubblica con i big data: da Torino un dibattito sull'intelligenza artificiale, pp. 225–232, 2021, ISBN: 9788875901806.
Abstract | Links | BibTeX | Tags:
@incollection{21:bigdata:ius,
title = {L'infrastruttura necessaria per creare interoperabilità tra pubbliche amministrazioni},
author = {Marco Aldinucci},
editor = {Roberto {Cavallo Perin}},
url = {https://iris.unito.it/retrieve/handle/2318/1784335/748058/15.Aldinucci.pdf},
isbn = {9788875901806},
year = {2021},
date = {2021-01-01},
booktitle = {L'amministrazione pubblica con i big data: da Torino un dibattito sull'intelligenza artificiale},
pages = {225--232},
chapter = {15},
abstract = {L'articolo affronta il tema dell'interoperabilità dal punto di vista informatico, ponendo l'accento sulle infrastrutture necessarie affinché la comunicazione tra sistemi informatici pubblici sia possibile. La struttura a silos su cui si basa il sistema informativo della pubblica amministrazione italiana risulta inadeguato all'approccio della big data analysis che, a contrario, richiede la piena comunicabilità tra sistemi informativi affinché il reperimento dei dati su cui condurre sperimentazioni sia quanto più facile e mirato.},
keywords = {},
pubstate = {published},
tppubtype = {incollection}
}
Matteo Pennisi, Isaak Kavasidis, Concetto Spampinato, Vincenzo Schinina, Simone Palazzo, Federica Proietto Salanitri, Giovanni Bellitto, Francesco Rundo, Marco Aldinucci, Massimo Cristofaro, others
An Explainable AI System for Automated COVID-19 Assessment and Lesion Categorization from CT-scans Journal Article
In: Artificial Intelligence in Medicine, pp. 102114, 2021.
Abstract | Links | BibTeX | Tags: ai
@article{pennisi2021explainable,
title = {An Explainable {AI} System for Automated {COVID-19} Assessment and Lesion Categorization from {CT-scans}},
author = {Matteo Pennisi and Isaak Kavasidis and Concetto Spampinato and Vincenzo Schinina and Simone Palazzo and Federica Proietto Salanitri and Giovanni Bellitto and Francesco Rundo and Marco Aldinucci and Massimo Cristofaro and others},
url = {https://iris.unito.it/retrieve/handle/2318/1792619/770952/2021_COVID_AIM_preprint.pdf},
doi = {10.1016/j.artmed.2021.102114},
year = {2021},
date = {2021-01-01},
journal = {Artificial Intelligence in Medicine},
pages = {102114},
publisher = {Elsevier},
abstract = {COVID-19 infection caused by SARS-CoV-2 pathogen has been a catastrophic pandemic outbreak all over the world, with exponential increasing of confirmed cases and, unfortunately, deaths. In this work we propose an AI-powered pipeline, based on the deep-learning paradigm, for automated COVID-19 detection and lesion categorization from CT scans. We first propose a new segmentation module aimed at automatically identifying lung parenchyma and lobes. Next, we combine the segmentation network with classification networks for COVID-19 identification and lesion categorization. We compare the model's classification results with those obtained by three expert radiologists on a dataset of 166 CT scans. Results showed a sensitivity of 90.3% and a specificity of 93.5% for COVID-19 detection, at least on par with those yielded by the expert radiologists, and an average lesion categorization accuracy of about 84%. Moreover, a significant role is played by prior lung and lobe segmentation, that allowed us to enhance classification performance by over 6 percent points. The interpretation of the trained AI models reveals that the most significant areas for supporting the decision on COVID-19 identification are consistent with the lesions clinically associated to the virus, i.e., crazy paving, consolidation and ground glass. This means that the artificial models are able to discriminate a positive patient from a negative one (both controls and patients with interstitial pneumonia tested negative to COVID) by evaluating the presence of those lesions into CT scans. Finally, the AI models are integrated into a user-friendly GUI to support AI explainability for radiologists, which is publicly available at http://perceivelab.com/covid-ai. 
The whole AI system is unique since, to the best of our knowledge, it is the first AI-based software, publicly available, that attempts to explain to radiologists what information is used by AI methods for making decisions and that proactively involves them in the decision loop to further improve the COVID-19 understanding.},
keywords = {ai},
pubstate = {published},
tppubtype = {article}
}
Zilong Zhao, Robert Birke, Rui Han, Bogdan Robu, Sara Bouchenak, Sonia Ben Mokhtar, Lydia Y. Chen
Enhancing Robustness of On-Line Learning Models on Highly Noisy Data Journal Article
In: IEEE Trans. Dependable Secur. Comput., vol. 18, no. 5, pp. 2177–2192, 2021.
Abstract | Links | BibTeX | Tags: ai
@article{ZhaoBHRBMC21,
title = {Enhancing Robustness of On-Line Learning Models on Highly Noisy Data},
author = {Zilong Zhao and Robert Birke and Rui Han and Bogdan Robu and Sara Bouchenak and Sonia Ben Mokhtar and Lydia Y. Chen},
url = {https://doi.org/10.1109/TDSC.2021.3063947},
doi = {10.1109/TDSC.2021.3063947},
year = {2021},
date = {2021-01-01},
journal = {IEEE Transactions on Dependable and Secure Computing},
volume = {18},
number = {5},
pages = {2177--2192},
abstract = {Classification algorithms have been widely adopted to detect anomalies for various systems, e.g., IoT, cloud and face recognition, under the common assumption that the data source is clean, i.e., features and labels are correctly set. However, data collected from the wild can be unreliable due to careless annotations or malicious data transformation for incorrect anomaly detection. In this article, we extend a two-layer on-line data selection framework: Robust Anomaly Detector (RAD) with a newly designed ensemble prediction where both layers contribute to the final anomaly detection decision. To adapt to the on-line nature of anomaly detection, we consider additional features of conflicting opinions of classifiers, repetitive cleaning, and oracle knowledge. We on-line learn from incoming data streams and continuously cleanse the data, so as to adapt to the increasing learning capacity from the larger accumulated data set. Moreover, we explore the concept of oracle learning that provides additional information of true labels for difficult data points. We specifically focus on three use cases, (i) detecting 10 classes of IoT attacks, (ii) predicting 4 classes of task failures of big data jobs, and (iii) recognising 100 celebrities faces. Our evaluation results show that RAD can robustly improve the accuracy of anomaly detection, to reach up to 98.95 percent for IoT device attacks (i.e., +7\%), up to 85.03 percent for cloud task failures (i.e., +14\%) under 40 percent label noise, and for its extension, it can reach up to 77.51 percent for face recognition (i.e., +39\%) under 30 percent label noise. The proposed RAD and its extensions are general and can be applied to different anomaly detection algorithms.},
keywords = {ai},
pubstate = {published},
tppubtype = {article}
}
Robert Birke, Juan F. Pérez, Zhan Qiu, Mathias Björkqvist, Lydia Y. Chen
sPARE: Partial Replication for Multi-Tier Applications in the Cloud Journal Article
In: IEEE Trans. Serv. Comput., vol. 14, no. 2, pp. 574–588, 2021.
Abstract | Links | BibTeX | Tags: parallel
@article{BirkePQBC21,
title = {{sPARE}: Partial Replication for Multi-Tier Applications in the Cloud},
author = {Robert Birke and Juan F. Pérez and Zhan Qiu and Mathias Björkqvist and Lydia Y. Chen},
url = {https://doi.org/10.1109/TSC.2017.2780845},
doi = {10.1109/TSC.2017.2780845},
year = {2021},
date = {2021-01-01},
journal = {IEEE Transactions on Services Computing},
volume = {14},
number = {2},
pages = {574--588},
abstract = {Offering consistent low latency remains a key challenge for distributed applications, especially when deployed on the cloud where virtual machines (VMs) suffer from capacity variability caused by co-located tenants. Replicating redundant requests was shown to be an effective mechanism to defend application performance from high capacity variability. While the prior art centers on single-tier systems, it still remains an open question how to design replication strategies for distributed multi-tier systems. In this paper, we design a first of its kind PArtial REplication system, sPARE, that replicates and dispatches read-only workloads for distributed multi-tier web applications. The two key components of sPARE are (i) the variability-aware replicator that coordinates the replication levels on all tiers via an iterative searching algorithm, and (ii) the replication-aware arbiter that uses a novel token-based arbitration algorithm (TAD) to dispatch requests in each tier. We evaluate sPARE on web serving and searching applications, i.e., MediaWiki and Solr, the former deployed on our private cloud and the latter on Amazon EC2. Our results based on various interference patterns and traffic loads show that sPARE is able to improve the tail latency of MediaWiki and Solr by a factor of almost 2.7x and 2.9x, respectively.},
keywords = {parallel},
pubstate = {published},
tppubtype = {article}
}
Iacopo Colonnelli, Barbara Cantalupo, Roberto Esposito, Matteo Pennisi, Concetto Spampinato, Marco Aldinucci
HPC Application Cloudification: The StreamFlow Toolkit Proceedings Article
In: Bispo, João, Cherubin, Stefano, Flich, José (Ed.): 12th Workshop on Parallel Programming and Run-Time Management Techniques for Many-core Architectures and 10th Workshop on Design Tools and Architectures for Multicore Embedded Computing Platforms (PARMA-DITAM 2021), pp. 5:1–5:13, Schloss Dagstuhl – Leibniz-Zentrum für Informatik, Dagstuhl, Germany, 2021, ISSN: 2190-6807.
Abstract | Links | BibTeX | Tags: deephealth, hpc4ai, streamflow
@inproceedings{colonnelli_et_al:OASIcs.PARMA-DITAM.2021.5,
title = {{HPC} Application Cloudification: The {StreamFlow} Toolkit},
author = {Iacopo Colonnelli and Barbara Cantalupo and Roberto Esposito and Matteo Pennisi and Concetto Spampinato and Marco Aldinucci},
editor = {João Bispo and Stefano Cherubin and José Flich},
url = {https://drops.dagstuhl.de/opus/volltexte/2021/13641/pdf/OASIcs-PARMA-DITAM-2021-5.pdf},
doi = {10.4230/OASIcs.PARMA-DITAM.2021.5},
issn = {2190-6807},
year = {2021},
date = {2021-01-01},
booktitle = {12th Workshop on Parallel Programming and Run-Time Management Techniques for Many-core Architectures and 10th Workshop on Design Tools and Architectures for Multicore Embedded Computing Platforms (PARMA-DITAM 2021)},
volume = {88},
pages = {5:1--5:13},
publisher = {Schloss Dagstuhl – Leibniz-Zentrum für Informatik},
address = {Dagstuhl, Germany},
series = {Open Access Series in Informatics (OASIcs)},
abstract = {Finding an effective way to improve accessibility to High-Performance Computing facilities, still anchored to SSH-based remote shells and queue-based job submission mechanisms, is an open problem in computer science. This work advocates a cloudification of HPC applications through a cluster-as-accelerator pattern, where computationally demanding portions of the main execution flow hosted on a Cloud infrastructure can be offloaded to HPC environments to speed them up. We introduce StreamFlow, a novel Workflow Management System that supports such a design pattern and makes it possible to run the steps of a standard workflow model on independent processing elements with no shared storage. We validated the proposed approach's effectiveness on the CLAIRE COVID-19 universal pipeline, i.e. a reproducible workflow capable of automating the comparison of (possibly all) state-of-the-art pipelines for the diagnosis of COVID-19 interstitial pneumonia from CT scans images based on Deep Neural Networks (DNNs).},
keywords = {deephealth, hpc4ai, streamflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Fabrizio D'Ascenzo, Ovidio De Filippo, Guglielmo Gallone, Gianluca Mittone, Marco Agostino Deriu, Mario Iannaccone, Albert Ariza-Solé, Christoph Liebetrau, Sergio Manzano-Fernández, Giorgio Quadri, Tim Kinnaird, Gianluca Campo, Jose Paulo Simao Henriques, James M Hughes, Alberto Dominguez-Rodriguez, Marco Aldinucci, Umberto Morbiducci, Giuseppe Patti, Sergio Raposeiras-Roubin, Emad Abu-Assi, Gaetano Maria De Ferrari, Francesco Piroli, Andrea Saglietto, Federico Conrotto, Pierluigi Omedé, Antonio Montefusco, Mauro Pennone, Francesco Bruno, Pier Paolo Bocchino, Giacomo Boccuzzi, Enrico Cerrato, Ferdinando Varbella, Michela Sperti, Stephen B. Wilton, Lazar Velicki, Ioanna Xanthopoulou, Angel Cequier, Andres Iniguez-Romo, Isabel Munoz Pousa, Maria Cespon Fernandez, Berenice Caneiro Queija, Rafael Cobas-Paz, Angel Lopez-Cuenca, Alberto Garay, Pedro Flores Blanco, Andrea Rognoni, Giuseppe Biondi Zoccai, Simone Biscaglia, Ivan Nunez-Gil, Toshiharu Fujii, Alessandro Durante, Xiantao Song, Tetsuma Kawaji, Dimitrios Alexopoulos, Zenon Huczek, Jose Ramon Gonzalez Juanatey, Shao-Ping Nie, Masa-aki Kawashiri, Iacopo Colonnelli, Barbara Cantalupo, Roberto Esposito, Sergio Leonardi, Walter Grosso Marra, Alaide Chieffo, Umberto Michelucci, Dario Piga, Marta Malavolta, Sebastiano Gili, Marco Mennuni, Claudio Montalto, Luigi Oltrona Visconti, Yasir Arfat
Machine learning-based prediction of adverse events following an acute coronary syndrome (PRAISE): a modelling study of pooled datasets Journal Article
In: The Lancet, vol. 397, no. 10270, pp. 199–207, 2021, ISSN: 0140-6736.
Abstract | Links | BibTeX | Tags: ai, cardio, deephealth, hpc4ai
@article{21:lancet,
title = {Machine learning-based prediction of adverse events following an acute coronary syndrome ({PRAISE}): a modelling study of pooled datasets},
author = {Fabrizio D'Ascenzo and Ovidio De Filippo and Guglielmo Gallone and Gianluca Mittone and Marco Agostino Deriu and Mario Iannaccone and Albert Ariza-Solé and Christoph Liebetrau and Sergio Manzano-Fernández and Giorgio Quadri and Tim Kinnaird and Gianluca Campo and Jose Paulo Simao Henriques and James M Hughes and Alberto Dominguez-Rodriguez and Marco Aldinucci and Umberto Morbiducci and Giuseppe Patti and Sergio Raposeiras-Roubin and Emad Abu-Assi and Gaetano Maria De Ferrari and Francesco Piroli and Andrea Saglietto and Federico Conrotto and Pierluigi Omedé and Antonio Montefusco and Mauro Pennone and Francesco Bruno and Pier Paolo Bocchino and Giacomo Boccuzzi and Enrico Cerrato and Ferdinando Varbella and Michela Sperti and Stephen B. Wilton and Lazar Velicki and Ioanna Xanthopoulou and Angel Cequier and Andres Iniguez-Romo and Isabel Munoz Pousa and Maria Cespon Fernandez and Berenice Caneiro Queija and Rafael Cobas-Paz and Angel Lopez-Cuenca and Alberto Garay and Pedro Flores Blanco and Andrea Rognoni and Giuseppe Biondi Zoccai and Simone Biscaglia and Ivan Nunez-Gil and Toshiharu Fujii and Alessandro Durante and Xiantao Song and Tetsuma Kawaji and Dimitrios Alexopoulos and Zenon Huczek and Jose Ramon Gonzalez Juanatey and Shao-Ping Nie and Masa-aki Kawashiri and Iacopo Colonnelli and Barbara Cantalupo and Roberto Esposito and Sergio Leonardi and Walter Grosso Marra and Alaide Chieffo and Umberto Michelucci and Dario Piga and Marta Malavolta and Sebastiano Gili and Marco Mennuni and Claudio Montalto and Luigi Oltrona Visconti and Yasir Arfat},
url = {https://www.researchgate.net/profile/James_Hughes3/publication/348501148_Machine_learning-based_prediction_of_adverse_events_following_an_acute_coronary_syndrome_PRAISE_a_modelling_study_of_pooled_datasets/links/6002a81ba6fdccdcb858b6c2/Machine-learning-based-prediction-of-adverse-events-following-an-acute-coronary-syndrome-PRAISE-a-modelling-study-of-pooled-datasets.pdf},
doi = {10.1016/S0140-6736(20)32519-8},
issn = {0140-6736},
year = {2021},
date = {2021-01-01},
journal = {The Lancet},
volume = {397},
number = {10270},
pages = {199--207},
abstract = {Background The accuracy of current prediction tools for ischaemic and bleeding events after an acute coronary syndrome (ACS) remains insufficient for individualised patient management strategies. We developed a machine learning-based risk stratification model to predict all-cause death, recurrent acute myocardial infarction, and major bleeding after ACS. Methods Different machine learning models for the prediction of 1-year post-discharge all-cause death, myocardial infarction, and major bleeding (defined as Bleeding Academic Research Consortium type 3 or 5) were trained on a cohort of 19826 adult patients with ACS (split into a training cohort [80\%] and internal validation cohort [20\%]) from the BleeMACS and RENAMI registries, which included patients across several continents. 25 clinical features routinely assessed at discharge were used to inform the models. The best-performing model for each study outcome (the PRAISE score) was tested in an external validation cohort of 3444 patients with ACS pooled from a randomised controlled trial and three prospective registries. Model performance was assessed according to a range of learning metrics including area under the receiver operating characteristic curve (AUC). Findings The PRAISE score showed an AUC of 0.82 (95\% CI 0.78-0.85) in the internal validation cohort and 0.92 (0.90-0.93) in the external validation cohort for 1-year all-cause death; an AUC of 0.74 (0.70-0.78) in the internal validation cohort and 0.81 (0.76-0.85) in the external validation cohort for 1-year myocardial infarction; and an AUC of 0.70 (0.66-0.75) in the internal validation cohort and 0.86 (0.82-0.89) in the external validation cohort for 1-year major bleeding. Interpretation A machine learning-based approach for the identification of predictors of events after an ACS is feasible and effective.
The PRAISE score showed accurate discriminative capabilities for the prediction of all-cause death, myocardial infarction, and major bleeding, and might be useful to guide clinical decision making.},
keywords = {ai, cardio, deephealth, hpc4ai},
pubstate = {published},
tppubtype = {article}
}
Iacopo Colonnelli, Barbara Cantalupo, Ivan Merelli, Marco Aldinucci
StreamFlow: cross-breeding cloud with HPC Journal Article
In: IEEE Transactions on Emerging Topics in Computing, vol. 9, no. 4, pp. 1723–1737, 2021.
Abstract | Links | BibTeX | Tags: deephealth, hpc4ai, streamflow
@article{20Lstreamflow:tetc,
title = {{StreamFlow}: cross-breeding cloud with {HPC}},
author = {Iacopo Colonnelli and Barbara Cantalupo and Ivan Merelli and Marco Aldinucci},
url = {https://arxiv.org/pdf/2002.01558},
doi = {10.1109/TETC.2020.3019202},
year = {2021},
date = {2021-01-01},
journal = {IEEE Transactions on Emerging Topics in Computing},
volume = {9},
number = {4},
pages = {1723--1737},
abstract = {Workflows are among the most commonly used tools in a variety of execution environments. Many of them target a specific environment; few of them make it possible to execute an entire workflow in different environments, e.g. Kubernetes and batch clusters. We present a novel approach to workflow execution, called StreamFlow, that complements the workflow graph with the declarative description of potentially complex execution environments, and that makes it possible the execution onto multiple sites not sharing a common data space. StreamFlow is then exemplified on a novel bioinformatics pipeline for single cell transcriptomic data analysis workflow.},
keywords = {deephealth, hpc4ai, streamflow},
pubstate = {published},
tppubtype = {article}
}
2020
Adriano Marques Garcia, Matheus Serpa, Dalvan Griebler, Claudio Schepke, Luiz Gustavo Fernandes, Philippe O. A. Navaux
The Impact of CPU Frequency Scaling on Power Consumption of Computing Infrastructures Proceedings Article
In: International Conference on Computational Science and its Applications (ICCSA), pp. 142–157, Springer, Cagliari, Italy, 2020.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{GARCIA:ICCSA:20,
title = {The Impact of {CPU} Frequency Scaling on Power Consumption of Computing Infrastructures},
author = {Adriano Marques Garcia and Matheus Serpa and Dalvan Griebler and Claudio Schepke and Luiz Gustavo Fernandes and Philippe O. A. Navaux},
url = {https://iris.unito.it/retrieve/3b8f3dc0-cd4d-4f36-801d-9e8c613ea2e8/ICCSA_Energy_governors_preprint.pdf},
doi = {10.1007/978-3-030-58817-5_12},
year = {2020},
date = {2020-07-01},
booktitle = {International Conference on Computational Science and its Applications (ICCSA)},
volume = {12254},
pages = {142--157},
publisher = {Springer},
address = {Cagliari, Italy},
series = {ICCSA'20},
abstract = {Since the demand for computing power increases, new architectures emerged to obtain better performance. Reducing the power and energy consumption of these architectures is one of the main challenges to achieving high-performance computing. Current research trends aim at developing new software and hardware techniques to achieve the best performance and energy trade-offs. In this work, we investigate the impact of different CPU frequency scaling techniques such as ondemand, performance, and powersave on the power and energy consumption of multi-core based computer infrastructure. We apply these techniques in PAMPAR, a parallel benchmark suite implemented in PThreads, OpenMP, MPI-1, and MPI-2 (spawn). We measure the energy and execution time of 10 benchmarks, varying the number of threads. Our results show that although powersave consumes up to 43.1\% less power than performance and ondemand governors, it consumes the triple of energy due to the high execution time. Our experiments also show that the performance governor consumes up to 9.8\% more energy than ondemand for CPU-bound benchmarks. Finally, our results show that PThreads has the lowest power consumption, consuming less than the sequential version for memory-bound benchmarks. Regarding performance, the performance governor achieved 3\% of performance over the ondemand.},
keywords = {parallel},
pubstate = {published},
tppubtype = {inproceedings}
}
Doriana Medić, Claudio Antares Mezzina, Iain Phillips, Nobuko Yoshida
A parametric framework for reversible π-calculi Journal Article
In: Information and Computation, vol. 275, pp. 104644, 2020.
Abstract | Links | BibTeX | Tags: semantics
@article{20:journals:MedicMPY20,
title = {A parametric framework for reversible {$\pi$}-calculi},
author = {Doriana Medić and Claudio Antares Mezzina and Iain Phillips and Nobuko Yoshida},
url = {https://doi.org/10.1016/j.ic.2020.104644},
doi = {10.1016/j.ic.2020.104644},
year = {2020},
date = {2020-01-01},
journal = {Information and Computation},
volume = {275},
pages = {104644},
abstract = {This paper presents a study of causality in a reversible, concurrent setting. There exist various notions of causality in Pi-calculus, which differ in the treatment of parallel extrusions of the same name. Hence, by using a parametric way of bookkeeping the order and the dependencies among extruders it is possible to map different causal semantics into the same framework. Starting from this simple observation, we present a uniform framework for reversible $\pi$-calculi that is parametric with respect to a data structure that stores information about the extrusion of a name. Different data structures yield different approaches to the parallel extrusion problem. We map three well-known causal semantics into our framework. We prove causal-consistency for the three instances of our framework. Furthermore, we prove a causal correspondence between the appropriate instances of the framework and the Boreale-Sangiorgi semantics and an operational correspondence with the reversible $\pi$-calculus causal semantics.},
keywords = {semantics},
pubstate = {published},
tppubtype = {article}
}
Ivan Lanese, Doriana Medić
A General Approach to Derive Uncontrolled Reversible Semantics Proceedings Article
In: 31st International Conference on Concurrency Theory, CONCUR 2020, September 1-4, 2020, Vienna, Austria (Virtual Conference), pp. 33:1–33:24, Schloss Dagstuhl - Leibniz-Zentrum für Informatik, 2020.
Abstract | Links | BibTeX | Tags: semantics
@inproceedings{20:concur:LaneseM20,
title = {A General Approach to Derive Uncontrolled Reversible Semantics},
author = {Ivan Lanese and Doriana Medić},
url = {https://doi.org/10.4230/LIPIcs.CONCUR.2020.33},
doi = {10.4230/LIPIcs.CONCUR.2020.33},
year = {2020},
date = {2020-01-01},
booktitle = {31st International Conference on Concurrency Theory, CONCUR 2020, September 1-4, 2020, Vienna, Austria (Virtual Conference)},
volume = {171},
pages = {33:1--33:24},
publisher = {Schloss Dagstuhl - Leibniz-Zentrum für Informatik},
series = {LIPIcs},
abstract = {Reversible computing is a paradigm where programs can execute backward as well as in the usual forward direction. Reversible computing is attracting interest due to its applications in areas as different as biochemical modelling, simulation, robotics and debugging, among others. In concurrent systems the main notion of reversible computing is called causal-consistent reversibility, and it allows one to undo an action if and only if its consequences, if any, have already been undone. This paper presents a general and automatic technique to define a causal-consistent reversible extension for given forward models. We support models defined using a reduction semantics in a specific format and consider a causality relation based on resources consumed and produced. The considered format is general enough to fit many formalisms studied in the literature on causal-consistent reversibility, notably Higher-Order $\pi$-calculus and Core Erlang, an intermediate language in the Erlang compilation. Reversible extensions of these models in the literature are ad hoc, while we build them using the same general technique. This also allows us to show in a uniform way that a number of relevant properties, causal-consistency in particular, hold in the reversible extensions we build. Our technique also allows us to go beyond the reversible models in the literature: we cover a larger fragment of Core Erlang, including remote error handling based on links, which has never been considered in the reversibility literature.},
keywords = {semantics},
pubstate = {published},
tppubtype = {inproceedings}
}
Doriana Medić, Claudio Antares Mezzina, Iain Phillips, Nobuko Yoshida
Towards a Formal Account for Software Transactional Memory Proceedings Article
In: Reversible Computation - 12th International Conference, RC 2020, Oslo, Norway, July 9-10, 2020, Proceedings, pp. 255–263, Springer, 2020.
Abstract | Links | BibTeX | Tags: semantics
@inproceedings{20:RC:MedicM0Y20,
title = {Towards a Formal Account for Software Transactional Memory},
author = {Doriana Medić and Claudio Antares Mezzina and Iain Phillips and Nobuko Yoshida},
url = {https://doi.org/10.1007/978-3-030-52482-1_16},
doi = {10.1007/978-3-030-52482-1_16},
year = {2020},
date = {2020-01-01},
booktitle = {Reversible Computation - 12th International Conference, RC 2020, Oslo, Norway, July 9-10, 2020, Proceedings},
volume = {12227},
pages = {255--263},
publisher = {Springer},
series = {Lecture Notes in Computer Science},
abstract = {Software transactional memory (STM) is a concurrency control mechanism for shared memory systems. It is opposite to the lock based mechanism, as it allows multiple processes to access the same set of variables in a concurrent way. Then according to the used policy, the effect of accessing to shared variables can be committed (hence, made permanent) or undone. In this paper, we define a formal framework for describing STMs and show how with a minor variation of the rules it is possible to model two common policies for STM: reader preference and writer preference.},
keywords = {semantics},
pubstate = {published},
tppubtype = {inproceedings}
}
Vasco Amaral, Beatriz Norberto, Miguel Goulão, Marco Aldinucci, Siegfried Benkner, Andrea Bracciali, Paulo Carreira, Edgars Celms, Luís Correia, Clemens Grelck, Helen Karatza, Christoph Kessler, Peter Kilpatrick, Hugo Martiniano, Ilias Mavridis, Sabri Pllana, Ana Respício, José Simão, Luís Veiga, Ari Visa
Programming languages for data-Intensive HPC applications: A systematic mapping study Journal Article
In: Parallel Computing, pp. 102584, 2020, ISSN: 0167-8191.
Abstract | Links | BibTeX | Tags: HPC
@article{20:sms:chipset,
title = {Programming languages for data-Intensive {HPC} applications: A systematic mapping study},
author = {Vasco Amaral and Beatriz Norberto and Miguel Goulão and Marco Aldinucci and Siegfried Benkner and Andrea Bracciali and Paulo Carreira and Edgars Celms and Luís Correia and Clemens Grelck and Helen Karatza and Christoph Kessler and Peter Kilpatrick and Hugo Martiniano and Ilias Mavridis and Sabri Pllana and Ana Respício and José Simão and Luís Veiga and Ari Visa},
url = {https://iris.unito.it/retrieve/689605/1-s2.0-S0167819119301759-main.pdf},
doi = {10.1016/j.parco.2019.102584},
issn = {0167-8191},
year = {2020},
date = {2020-01-01},
journal = {Parallel Computing},
pages = {102584},
abstract = {A major challenge in modelling and simulation is the need to combine expertise in both software technologies and a given scientific domain. When High-Performance Computing (HPC) is required to solve a scientific problem, software development becomes a problematic issue. Considering the complexity of the software for HPC, it is useful to identify programming languages that can be used to alleviate this issue. Because the existing literature on the topic of HPC is very dispersed, we performed a Systematic Mapping Study (SMS) in the context of the European COST Action cHiPSet. This literature study maps characteristics of various programming languages for data-intensive HPC applications, including category, typical user profiles, effectiveness, and type of articles. We organised the SMS in two phases. In the first phase, relevant articles are identified employing an automated keyword-based search in eight digital libraries. This lead to an initial sample of 420 papers, which was then narrowed down in a second phase by human inspection of article abstracts, titles and projects to 152 relevant articles published in the period 2006–2018. The analysis of these articles enabled us to identify 26 programming languages referred to in 33 of relevant articles. We compared the outcome of the mapping study with results of our questionnaire-based survey that involved 57 HPC experts. The mapping study and the survey revealed that the desired features of programming languages for data-intensive HPC applications are portability, performance and usability. Furthermore, we observed that the majority of the programming languages used in the context of data-intensive HPC applications are text-based general-purpose programming languages. Typically these have a steep learning curve, which makes them difficult to adopt. We believe that the outcome of this study will inspire future research and development in programming languages for data-intensive HPC applications.},
keywords = {HPC},
pubstate = {published},
tppubtype = {article}
}
Daniele D'Agostino, Pietro Liò, Marco Aldinucci, Ivan Merelli
NeoHiC: A web application for the analysis of Hi-C data Proceedings Article
In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), pp. 98–107, 2020, ISBN: 978-3-030-63061-4.
Abstract | Links | BibTeX | Tags:
@inproceedings{20:neohic:cibb,
title = {{NeoHiC}: A web application for the analysis of {Hi-C} data},
author = {Daniele D'Agostino and Pietro Liò and Marco Aldinucci and Ivan Merelli},
url = {https://iris.unito.it/retrieve/handle/2318/1766001/690791/20_neohic_cibb.pdf},
doi = {10.1007/978-3-030-63061-4_10},
isbn = {978-3-030-63061-4},
year = {2020},
date = {2020-01-01},
booktitle = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
volume = {12313},
pages = {98--107},
abstract = {High-throughput sequencing Chromosome Conformation Capture (Hi-C) allows the study of chromatin interactions and 3D chromosome folding on a larger scale. A graph-based multi-level representation of Hi-C data is essential for proper visualisation of the spatial pattern they represent, in particular for comparing different experiments or for re-mapping omics-data in a space-aware context. The size of the HiC data hampers the straightforward use of currently available graph visualisation tools and libraries. In this paper, we present the first version of NeoHiC, a user-friendly web application for the progressive graph visualisation of Hi-C data based on the use of the Neo4j graph database. The user could select the richness of the environment of the query gene by choosing among a large number of proximity and distance metrics.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Paul Metzger, Murray Cole, Christian Fensch, Marco Aldinucci, Enrico Bini
Enforcing Deadlines for Skeleton-based Parallel Programming Proceedings Article
In: 26th IEEE Real-Time and Embedded Technology and Applications Symposium (RTAS), Sydney, Australia, 2020.
Abstract | Links | BibTeX | Tags:
@inproceedings{20:farm:rtas,
title = {Enforcing Deadlines for Skeleton-based Parallel Programming},
author = {Paul Metzger and Murray Cole and Christian Fensch and Marco Aldinucci and Enrico Bini},
url = {https://iris.unito.it/retrieve/handle/2318/1741320/616056/20_ske_RTAS.pdf},
doi = {10.1109/RTAS48715.2020.000-7},
year = {2020},
date = {2020-01-01},
booktitle = {26th IEEE Real-Time and Embedded Technology and Applications Symposium (RTAS)},
address = {Sydney, Australia},
abstract = {High throughput applications with real-time guarantees are increasingly relevant. For these applications, parallelism must be exposed to meet deadlines. Directed Acyclic Graphs (DAGs) are a popular and very general application model that can capture any possible interaction among threads. However, we argue that by constraining the application structure to a set of composable ``skeletons'', at the price of losing some generality w.r.t. DAGs, the following advantages are gained: (i) a finer model of the application enables tighter analysis, (ii) specialised scheduling policies are applicable, (iii) programming is simplified, (iv) specialised implementation techniques can be exploited transparently, and (v) the program can be automatically tuned to minimise resource usage while still meeting its hard deadlines. As a first step towards a set of real-time skeletons we conduct a case study with the job farm skeleton and the hard real-time XMOS xCore-200 microcontroller. We present an analytical framework for job farms that reduces the number of required cores by scheduling jobs in batches, while ensuring that deadlines are still met. Our experimental results demonstrate that batching reduces the minimum sustainable period by up to 22\%, leading to a reduced number of required cores. The framework chooses the best parameters in 83\% of cases and never selects parameters that cause deadline misses. Finally, we show that the overheads introduced by the skeleton abstraction layer are negligible.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Vincent Reniers, Yuan Gao, Ren Zhang, Paolo Viviani, Akash Madhusudan, Bert Lagaisse, Svetla Nikova, Dimitri Van Landuyt, Riccardo Lombardi, Bart Preneel, Wouter Joosen
Authenticated and Auditable Data Sharing via Smart Contract Proceedings Article
In: Proceedings of the 35th ACM/SIGAPP Symposium on Applied Computing, pp. 1–8, ACM, Brno, Czech Republic, 2020.
@inproceedings{20:sac:blockchain,
title = {Authenticated and Auditable Data Sharing via Smart Contract},
author = {Vincent Reniers and Yuan Gao and Ren Zhang and Paolo Viviani and Akash Madhusudan and Bert Lagaisse and Svetla Nikova and Dimitri Van Landuyt and Riccardo Lombardi and Bart Preneel and Wouter Joosen},
year = {2020},
date = {2020-01-01},
booktitle = {Proceedings of the 35th ACM/SIGAPP Symposium on Applied Computing},
pages = {1--8},
publisher = {ACM},
address = {Brno, Czech Republic},
series = {SAC '20},
abstract = {Our main use case features multiple companies that iteratively optimize on the architectural properties of aircraft components in a decentralized manner. In each optimization step of the so-called multi-disciplinary optimization (MDO) process, sensitive data is exchanged, and we require auditability and traceability of actions taken to assure compliance with signed legal agreements. In this paper, we present a distributed protocol that coordinates authenticated and auditable exchanges of files, leveraging a smart contract. The entire life cycle of a file exchange, including file registration, access request and key distribution, is recorded and traceable via the smart contract. Moreover, when one party raises a dispute, the smart contract can identify the dishonest party without compromising the file's confidentiality. The proposed protocol provides a simple, novel, yet efficient approach to exchange files with support for data access auditability between companies involved in a private consortium with no incentive to share files outside of the protocol. We implemented the protocol in Solidity, deployed it on a private Ethereum blockchain, and validated it within the use case of a decentralized workflow.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Valentina Cesare, Iacopo Colonnelli, Marco Aldinucci
Practical Parallelization of Scientific Applications Proceedings Article
In: Proc. of 28th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP), pp. 376–384, IEEE, Västerås, Sweden, 2020.
Abstract | Links | BibTeX | Tags: c3s, hpc4ai
@inproceedings{20:looppar:pdp,
title = {Practical Parallelization of Scientific Applications},
author = {Valentina Cesare and Iacopo Colonnelli and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/handle/2318/1735377/601141/2020_looppar_PDP.pdf},
doi = {10.1109/PDP50117.2020.00064},
year = {2020},
date = {2020-01-01},
booktitle = {Proc. of 28th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP)},
pages = {376--384},
publisher = {IEEE},
address = {Västerås, Sweden},
abstract = {This work aims at distilling a systematic methodology to modernize existing sequential scientific codes with a limited re-designing effort, turning an old codebase into modern code, i.e., parallel and robust code. We propose an automatable methodology to parallelize scientific applications designed with a purely sequential programming mindset, thus possibly using global variables, aliasing, random number generators, and stateful functions. We demonstrate the methodology by way of an astrophysical application, where we model at the same time the kinematic profiles of 30 disk galaxies with a Monte Carlo Markov Chain (MCMC), which is sequential by definition. The parallel code exhibits a 12 times speedup on a 48-core platform.},
keywords = {c3s, hpc4ai},
pubstate = {published},
tppubtype = {inproceedings}
}
Jose Daniel Garcia, Jose Daniel Rio, Marco Aldinucci, Fabio Tordini, Marco Danelutto, Gabriele Mencagli, Massimo Torquati
Challenging the abstraction penalty in parallel patterns libraries: Adding FastFlow support to GrPPI Journal Article
In: The Journal of Supercomputing, vol. 76, no. 7, pp. 5139–5159, 2020.
Abstract | Links | BibTeX | Tags: fastflow, rephrase
@article{19:jsupe:grppi,
title = {Challenging the abstraction penalty in parallel patterns libraries: Adding FastFlow support to GrPPI},
author = {Jose Daniel Garcia and Jose Daniel Rio and Marco Aldinucci and Fabio Tordini and Marco Danelutto and Gabriele Mencagli and Massimo Torquati},
url = {https://iris.unito.it/retrieve/handle/2318/1762686/744894/2020-js-grppi-postprint.pdf},
doi = {10.1007/s11227-019-02826-5},
year = {2020},
date = {2020-01-01},
journal = {The Journal of Supercomputing},
volume = {76},
number = {7},
pages = {5139--5159},
abstract = {In the last years, pattern-based programming has been recognized as a good practice for efficiently exploiting parallel hardware resources. Following this approach, multiple libraries have been designed for providing such high-level abstractions to ease the parallel programming. However, those libraries do not share a common interface. To pave the way, GrPPI has been designed for providing an intermediate abstraction layer between application developers and existing parallel programming frameworks like OpenMP, Intel TBB or ISO C++ threads. On the other hand, FastFlow has been adopted as an efficient object-based programming framework that may benefit from being supported as an additional GrPPI backend. However, the object-based approach presents some major challenges to be incorporated under the GrPPI type safe functional programming style. In this paper, we present the integration of FastFlow as a new GrPPI backend to demonstrate that structured parallel programming frameworks perfectly fit the GrPPI design. Additionally, we also demonstrate that GrPPI does not incur in additional overheads for providing its abstraction layer, and we study the programmability in terms of lines of code and cyclomatic complexity. In general, the presented work acts as reciprocal validation of both FastFlow (as an efficient, native structured parallel programming framework) and GrPPI (as an efficient abstraction layer on top of existing parallel programming frameworks).},
keywords = {fastflow, rephrase},
pubstate = {published},
tppubtype = {article}
}
2019
Adriano Marques Garcia, Claudio Schepke, Alessandro Gonçalves Girardi
PAMPAR: A new parallel benchmark for performance and energy consumption evaluation Journal Article
In: Concurrency and Computation: Practice and Experience, vol. 32, no. 20, pp. 1–21, 2019.
Abstract | Links | BibTeX | Tags: parallel
@article{GARCIA:CCPE:19,
title = {PAMPAR: A new parallel benchmark for performance and energy consumption evaluation},
author = {Adriano Marques Garcia and Claudio Schepke and Alessandro Gonçalves Girardi},
url = {https://iris.unito.it/retrieve/d514c682-a567-4a02-93b7-9e27b6d3da03/Concurrency___Computation__Practice___Experience__Final_Version_.pdf},
doi = {10.1002/cpe.5504},
year = {2019},
date = {2019-10-01},
journal = {Concurrency and Computation: Practice and Experience},
volume = {32},
number = {20},
pages = {1--21},
abstract = {This paper presents PAMPAR, a new benchmark to evaluate the performance and energy consumption of different Parallel Programming Interfaces (PPIs). The benchmark is composed of 11 algorithms implemented in PThreads, OpenMP, MPI-1, and MPI-2 (spawn) PPIs. Previous studies have used some of these pseudo-applications to perform this type of evaluation in different architectures since there is no benchmark that offers this variety of PPIs and communication models. In this work, we measure the energy and performance of each pseudo-application in a single architecture, varying the number of threads/processes. We also organize the pseudo-applications according to their memory accesses, floating-point operations, and branches. The goal is to show that this set of pseudo-applications has enough features to build a parallel benchmark. The results show that there is no single best case that provides both better performance and low energy consumption in the presented scenarios. Moreover, the pseudo-applications usage of the system resources are different enough to represent different scenarios and be efficient as a benchmark.},
keywords = {parallel},
pubstate = {published},
tppubtype = {article}
}
Paolo Viviani
Deep Learning at Scale with Nearest Neighbours Communications PhD Thesis
Computer Science Department, University of Torino, 2019.
Abstract | Links | BibTeX | Tags:
@phdthesis{19:dl:viviani:thesis,
  author    = {Paolo Viviani},
  title     = {Deep Learning at Scale with Nearest Neighbours Communications},
  school    = {Computer Science Department, University of Torino},
  year      = {2019},
  date      = {2019-09-01},
  doi       = {10.5281/zenodo.3516093},
  url       = {https://zenodo.org/record/3516093/files/20190910_final_pdf.pdf},
  abstract  = {As deep learning techniques become more and more popular, there is the need to move these applications from the data scientist's Jupyter notebook to efficient and reliable enterprise solutions. Moreover, distributed training of deep learning models will happen more and more outside the well-known borders of cloud and HPC infrastructure and will move to edge and mobile platforms. Current techniques for distributed deep learning have drawbacks in both these scenarios, limiting their long-term applicability. After a critical review of the established techniques for Data Parallel training from both a distributed computing and deep learning perspective, a novel approach based on nearest-neighbour communications is presented in order to overcome some of the issues related to mainstream approaches, such as global communication patterns. Moreover, in order to validate the proposed strategy, the Flexible Asynchronous Scalable Training (FAST) framework is introduced, which allows to apply the nearest-neighbours communications approach to a deep learning framework of choice. Finally, a relevant use-case is deployed on a medium-scale infrastructure to demonstrate both the framework and the methodology presented. Training convergence and scalability results are presented and discussed in comparison to a baseline defined by using state-of-the-art distributed training tools provided by a well-known deep learning framework.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {phdthesis}
}
Marco Aldinucci, Stefano Bagnasco, Matteo Concas, Stefano Lusso, Sergio Rabellino, Danilo Demarchi, Sara Vallero
Managing a heterogeneous scientific computing cluster with cloud-like tools: ideas and experience Proceedings Article
In: European Physical Journal Web of Conferences, pp. 07030, 2019.
Abstract | Links | BibTeX | Tags:
@inproceedings{2019EPJWC.21407030A,
  author    = {Marco Aldinucci and Stefano Bagnasco and Matteo Concas and Stefano Lusso and Sergio Rabellino and Danilo Demarchi and Sara Vallero},
  title     = {Managing a heterogeneous scientific computing cluster with cloud-like tools: ideas and experience},
  booktitle = {European Physical Journal Web of Conferences},
  series    = {European Physical Journal Web of Conferences},
  volume    = {214},
  pages     = {07030},
  year      = {2019},
  date      = {2019-07-01},
  doi       = {10.1051/epjconf/201921407030},
  url       = {https://iris.unito.it/retrieve/533279/epjconf_chep2018_07030.pdf},
  abstract  = {Obtaining CPU cycles on an HPC cluster is nowadays relatively simple and sometimes even cheap for academic institutions. However, in most of the cases providers of HPC services would not allow changes on the configuration, implementation of special features or a lower-level control on the computing infrastructure, for example for testing experimental configurations. The variety of use cases proposed by several departments of the University of Torino, including ones from solid-state chemistry, computational biology, genomics and many others, called for different and sometimes conflicting configurations; furthermore, several R&D activities in the field of scientific computing, with topics ranging from GPU acceleration to Cloud Computing technologies, needed a platform to be carried out on. The Open Computing Cluster for Advanced data Manipulation (OCCAM) is a multi-purpose flexible HPC cluster designed and operated by a collaboration between the University of Torino and the Torino branch of the Istituto Nazionale di Fisica Nucleare. It is aimed at providing a flexible and reconfigurable infrastructure to cater to a wide range of different scientific computing needs, as well as a platform for R&D activities on computational technologies themselves. We describe some of the use cases that prompted the design and construction of the system, its architecture and a first characterisation of its performance by some synthetic benchmark tools and a few realistic use-case tests.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Adriano Marques Garcia, Claudio Schepke, Alessandro Gonçalves Girardi, Sherlon Almeida Silva
A New Parallel Benchmark for Performance Evaluation and Energy Consumption Proceedings Article
In: High Performance Computing for Computational Science – VECPAR 2018, pp. 188–201, Springer International Publishing, Cham, 2019, ISBN: 978-3-030-15996-2.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{GARCIA:VECPAR:19,
title = {A New Parallel Benchmark for Performance Evaluation and Energy Consumption},
author = {Adriano Marques Garcia and Claudio Schepke and Alessandro Gonçalves Girardi and Sherlon Almeida Silva},
url = {https://iris.unito.it/retrieve/1272dea3-b1ea-4356-af0d-d180cef341b9/VECPAR_2018_paper_preprint.pdf},
doi = {10.1007/978-3-030-15996-2_14},
isbn = {978-3-030-15996-2},
year = {2019},
date = {2019-03-01},
booktitle = {High Performance Computing for Computational Science – VECPAR 2018},
pages = {188--201},
publisher = {Springer International Publishing},
address = {Cham},
abstract = {This paper presents a new benchmark to evaluate performance and energy consumption of different Parallel Programming Interfaces (PPIs). The benchmark is composed of 11 algorithms implemented in PThreads, OpenMP, MPI-1 and MPI-2 (spawn) PPIs. Previous studies have used some of these applications to perform this type of evaluation in different architectures, since there is no benchmark that offers this variety of PPIs and communication models. In this work we measure the energy and performance of each application in a single architecture, varying the number of threads/processes. The goal is to show that this set of applications has enough features to form a parallel benchmark. The results show that there is no single best case that provides both better performance and low energy consumption in the presented scenarios. However, PThreads and OpenMP achieve the best trade-offs between performance and energy in most cases.},
keywords = {parallel},
pubstate = {published},
tppubtype = {inproceedings}
}
Massimo Torquati, Daniele De Sensi, Gabriele Mencagli, Marco Aldinucci, Marco Danelutto
Power-Aware Pipelining with Automatic Concurrency Control Journal Article
In: Concurrency and Computation: Practice and Experience, vol. 31, no. 5, 2019.
Abstract | Links | BibTeX | Tags: rephrase
@article{18:dynqueue:ccpe,
title = {Power-Aware Pipelining with Automatic Concurrency Control},
author = {Massimo Torquati and Daniele De Sensi and Gabriele Mencagli and Marco Aldinucci and Marco Danelutto},
url = {https://iris.unito.it/retrieve/handle/2318/1668445/414282/2018_CCPE.pdf},
doi = {10.1002/cpe.4652},
year = {2019},
date = {2019-01-01},
journal = {Concurrency and Computation: Practice and Experience},
volume = {31},
number = {5},
abstract = {Continuous streaming computations are usually composed of different modules, exchanging data through shared message queues. The selection of the algorithm used to access such queues (i.e. the concurrency control) is a critical aspect both for performance and power consumption. In this paper we describe the design of automatic concurrency control algorithm for implementing power-efficient communications on shared-memory multicores. The algorithm automatically switches between nonblocking and blocking concurrency protocols, getting the best from the two worlds, i.e. obtaining the same throughput offered by the nonblocking implementation and the same power efficiency of the blocking concurrency protocol. We demonstrate the effectiveness of our approach using two micro-benchmarks and two real streaming applications.},
keywords = {rephrase},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Maurizio Drocco, Claudia Misale, Guy Tremblay
Languages for Big Data analysis Book Chapter
In: Sakr, Sherif, Zomaya, Albert (Ed.): Encyclopedia of Big Data Technologies, Springer International Publishing, Cham, 2019, ISBN: 978-3-319-63962-8.
Abstract | Links | BibTeX | Tags: parallel
@inbook{bigdata:encyclopedia:18,
  author    = {Marco Aldinucci and Maurizio Drocco and Claudia Misale and Guy Tremblay},
  title     = {Languages for Big Data analysis},
  editor    = {Sherif Sakr and Albert Zomaya},
  booktitle = {Encyclopedia of Big Data Technologies},
  publisher = {Springer International Publishing},
  address   = {Cham},
  year      = {2019},
  date      = {2019-01-01},
  isbn      = {978-3-319-63962-8},
  doi       = {10.1007/978-3-319-63962-8_142-1},
  url       = {https://iris.unito.it/retrieve/handle/2318/1668051/413363/2019_bigdataframeworks_enc.pdf},
  abstract  = {In this chapter, some of the most common tools for Big Data analytics are surveyed, inter-alia, Apache Spark, Flink, Storm, and Beam. They are compared against well-defined features concerning programming model (language expressivity and semantics), and execution model (parallel behaviour and run-time support). The implementation of a running example is provided for all of them.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {inbook}
}
Marco Danelutto, Tiziano De Matteis, Daniele De Sensi, Gabriele Mencagli, Massimo Torquati, Marco Aldinucci, Peter Kilpatrick
The RePhrase Extended Pattern Set for Data Intensive Parallel Computing Journal Article
In: International Journal of Parallel Programming, vol. 47, no. 1, pp. 74–93, 2019.
Abstract | Links | BibTeX | Tags: fastflow, rephrase
@article{17:rephrasepatterns:ijpp,
title = {The RePhrase Extended Pattern Set for Data Intensive Parallel Computing},
author = {Marco Danelutto and Tiziano De Matteis and Daniele De Sensi and Gabriele Mencagli and Massimo Torquati and Marco Aldinucci and Peter Kilpatrick},
url = {https://iris.unito.it/retrieve/handle/2318/1659336/387667/2017_ijpp_rephrase.pdf},
doi = {10.1007/s10766-017-0540-z},
year = {2019},
date = {2019-01-01},
journal = {International Journal of Parallel Programming},
volume = {47},
number = {1},
pages = {74--93},
abstract = {We discuss the extended parallel pattern set identified within the EU-funded project RePhrase as a candidate pattern set to support data intensive applications targeting heterogeneous architectures. The set has been designed to include three classes of pattern, namely i) core patterns, modelling common, not necessarily data intensive parallelism exploitation patterns, usually to be used in composition; ii) high level patterns, modelling common, complex and complete parallelism exploitation patterns; and iii) building block patterns, modelling the single components of data intensive applications, suitable for use–in composition–to implement patterns not covered by the core and high level patterns. We discuss the expressive power of the RePhrase extended pattern set and results illustrating the performances that may be achieved with the FastFlow implementation of the high level patterns.},
keywords = {fastflow, rephrase},
pubstate = {published},
tppubtype = {article}
}
Massimo Torquati, Gabriele Mencagli, Maurizio Drocco, Marco Aldinucci, Tiziano De Matteis, Marco Danelutto
On Dynamic Memory Allocation in Sliding-Window Parallel Patterns for Streaming Analytics Journal Article
In: The Journal of Supercomputing, vol. 75, no. 8, pp. 4114–4131, 2019.
Abstract | Links | BibTeX | Tags: fastflow, rephrase
@article{17:dmadasp:jsupe,
title = {On Dynamic Memory Allocation in Sliding-Window Parallel Patterns for Streaming Analytics},
author = {Massimo Torquati and Gabriele Mencagli and Maurizio Drocco and Marco Aldinucci and Tiziano De Matteis and Marco Danelutto},
url = {https://iris.unito.it/retrieve/handle/2318/1648626/362381/17_torquati_jsc.pdf},
doi = {10.1007/s11227-017-2152-1},
year = {2019},
date = {2019-01-01},
journal = {The Journal of Supercomputing},
volume = {75},
number = {8},
pages = {4114--4131},
abstract = {This work studies the issues related to dynamic memory management in Data Stream Processing, an emerging paradigm enabling the real-time processing of live data streams. In this paper we consider two streaming parallel patterns and we discuss different implementation variants related on how dynamic memory is managed. The results show that the standard mechanisms provided by modern C++ are not entirely adequate for maximizing the performance. Instead, the combined use of an efficient general-purpose memory allocator, a custom allocator optimized for the pattern considered and a custom variant of the C++ shared pointer mechanism, provides a performance improvement up to 16% on the best case.},
keywords = {fastflow, rephrase},
pubstate = {published},
tppubtype = {article}
}
Doriana Medić
Relative expressiveness of calculi for reversible concurrency Journal Article
In: Bull. EATCS, vol. 129, 2019.
Abstract | Links | BibTeX | Tags: semantics
@article{19:eatcs:Medic19,
title = {Relative expressiveness of calculi for reversible concurrency},
author = {Doriana Medić},
url = {http://bulletin.eatcs.org/index.php/beatcs/article/view/590/601},
year = {2019},
date = {2019-01-01},
journal = {Bull. EATCS},
volume = {129},
abstract = {A number of formalisms have been proposed to model various approaches to reversibility and to better understand its properties and characteristics. However, the relation between these formalisms has hardly been studied. This paper examines the expressiveness of the causal-consistent reversibility in process algebras CCS and π-calculus. In particular, we show, by means of encodings, that LTSs of two reversible extensions of CCS, Reversible CCS [1] and CCS with Keys [2], are isomorphic up to some structural transformations of processes. To study different causal semantics for π-calculus, we devise a uniform framework for reversible π-calculi that is parametric with respect to a data structure that stores information about the extrusion of a name. Depending on the used data structure, different causal semantics can be obtained. We show that reversibility induced by our framework when instantiated with three different data structures is causally-consistent and prove a causal correspondence between certain causal semantics and matching instance of the framework.},
keywords = {semantics},
pubstate = {published},
tppubtype = {article}
}
Paolo Viviani, Maurizio Drocco, Daniele Baccega, Iacopo Colonnelli, Marco Aldinucci
Deep Learning at Scale Proceedings Article
In: Proc. of 27th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP), pp. 124–131, IEEE, Pavia, Italy, 2019.
Abstract | Links | BibTeX | Tags: ai
@inproceedings{19:deeplearn:pdp,
title = {Deep Learning at Scale},
author = {Paolo Viviani and Maurizio Drocco and Daniele Baccega and Iacopo Colonnelli and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/handle/2318/1695211/487778/19_deeplearning_PDP.pdf},
doi = {10.1109/EMPDP.2019.8671552},
year = {2019},
date = {2019-01-01},
booktitle = {Proc. of 27th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP)},
pages = {124--131},
publisher = {IEEE},
address = {Pavia, Italy},
abstract = {This work presents a novel approach to distributed training of deep neural networks (DNNs) that aims to overcome the issues related to mainstream approaches to data parallel training. Established techniques for data parallel training are discussed from both a parallel computing and deep learning perspective, then a different approach is presented that is meant to allow DNN training to scale while retaining good convergence properties. Moreover, an experimental implementation is presented as well as some preliminary results.},
keywords = {ai},
pubstate = {published},
tppubtype = {inproceedings}
}
Ivan Merelli, Federico Fornari, Fabio Tordini, Daniele D'Agostino, Marco Aldinucci, Daniele Cesini
Exploiting Docker containers over Grid computing for a comprehensive study of chromatin conformation in different cell types Journal Article
In: Journal of Parallel and Distributed Computing, vol. 134, pp. 116–127, 2019, ISSN: 0743-7315.
Abstract | Links | BibTeX | Tags: bioinformatics
@article{19:merelli:jpdc,
title = {Exploiting Docker containers over Grid computing for a comprehensive study of chromatin conformation in different cell types},
author = {Ivan Merelli and Federico Fornari and Fabio Tordini and Daniele D'Agostino and Marco Aldinucci and Daniele Cesini},
url = {https://iris.unito.it/retrieve/handle/2318/1711684/532767/2019_Nuchart_JPDC_open.pdf},
doi = {10.1016/j.jpdc.2019.08.002},
issn = {0743-7315},
year = {2019},
date = {2019-01-01},
journal = {Journal of Parallel and Distributed Computing},
volume = {134},
pages = {116--127},
abstract = {Many bioinformatic applications require to exploit the capabilities of several computational resources to effectively access and process large and distributed datasets. In this context, Grid computing has been largely used to face unprecedented challenges in Computational Biology, at the cost of complex workarounds needed to make applications successfully running. The Grid computing paradigm, in fact, has always suffered from a lack of flexibility. Although this has been partially solved by Cloud computing, the on-demand approach is way distant from the original idea of volunteering computing that boosted the Grid paradigm. A solution to outpace the impossibility of creating custom environments for running applications in Grid is represented by the containerization technology. In this paper, we describe our experience in exploiting a Docker-based approach to run in a Grid environment a novel, computationally intensive, bioinformatic application, which models the DNA spatial conformation inside the nucleus of eukaryotic cells. Results assess the feasibility of this approach in terms of performance and efforts to run large experiments.},
keywords = {bioinformatics},
pubstate = {published},
tppubtype = {article}
}
Clemens Grelck, Ewa Niewiadomska-Szynkiewicz, Marco Aldinucci, Andrea Bracciali, Elisabeth Larsson
Why High-Performance Modelling and Simulation for Big Data Applications Matters Book Chapter
In: Kołodziej, Joanna, González-Vélez, Horacio (Ed.): High-Performance Modelling and Simulation for Big Data Applications: Selected Results of the COST Action IC1406 cHiPSet, no. 11400, pp. 1–35, Springer International Publishing, Cham, 2019, ISBN: 978-3-030-16272-6.
Abstract | Links | BibTeX | Tags: HPC
@inbook{Grelck2019,
title = {Why High-Performance Modelling and Simulation for Big Data Applications Matters},
author = {Clemens Grelck and Ewa Niewiadomska-Szynkiewicz and Marco Aldinucci and Andrea Bracciali and Elisabeth Larsson},
editor = {Joanna Kołodziej and Horacio González-Vélez},
url = {https://link.springer.com/content/pdf/10.1007%2F978-3-030-16272-6_1.pdf},
doi = {10.1007/978-3-030-16272-6_1},
isbn = {978-3-030-16272-6},
year = {2019},
date = {2019-01-01},
booktitle = {High-Performance Modelling and Simulation for Big Data Applications: Selected Results of the COST Action IC1406 cHiPSet},
number = {11400},
pages = {1--35},
publisher = {Springer International Publishing},
address = {Cham},
series = {LNCS},
abstract = {Modelling and Simulation (M&S) offer adequate abstractions to manage the complexity of analysing big data in scientific and engineering domains. Unfortunately, big data problems are often not easily amenable to efficient and effective use of High Performance Computing (HPC) facilities and technologies. Furthermore, M&S communities typically lack the detailed expertise required to exploit the full potential of HPC solutions while HPC specialists may not be fully aware of specific modelling and simulation requirements and applications.},
keywords = {HPC},
pubstate = {published},
tppubtype = {inbook}
}
Maurizio Drocco, Paolo Viviani, Iacopo Colonnelli, Marco Aldinucci, Marco Grangetto
Accelerating spectral graph analysis through wavefronts of linear algebra operations Proceedings Article
In: Proc. of 27th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP), pp. 9–16, IEEE, Pavia, Italy, 2019.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{19:gsp:pdp,
title = {Accelerating spectral graph analysis through wavefronts of linear algebra operations},
author = {Maurizio Drocco and Paolo Viviani and Iacopo Colonnelli and Marco Aldinucci and Marco Grangetto},
url = {https://iris.unito.it/retrieve/handle/2318/1695315/488105/19_wavefront_PDP.pdf},
doi = {10.1109/EMPDP.2019.8671640},
year = {2019},
date = {2019-01-01},
booktitle = {Proc. of 27th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP)},
pages = {9--16},
publisher = {IEEE},
address = {Pavia, Italy},
abstract = {The wavefront pattern captures the unfolding of a parallel computation in which data elements are laid out as a logical multidimensional grid and the dependency graph favours a diagonal sweep across the grid. In the emerging area of spectral graph analysis, the computing often consists in a wavefront running over a tiled matrix, involving expensive linear algebra kernels. While these applications might benefit from parallel heterogeneous platforms (multi-core with GPUs), programming wavefront applications directly with high-performance linear algebra libraries yields code that is complex to write and optimize for the specific application. We advocate a methodology based on two abstractions (linear algebra and parallel pattern-based run-time), that allows to develop portable, self-configuring, and easy-to-profile code on hybrid platforms.},
keywords = {grid},
pubstate = {published},
tppubtype = {inproceedings}
}
Vincent Reniers, Dimitri Van Landuyt, Paolo Viviani, Bert Lagaisse, Riccardo Lombardi, Wouter Joosen
Analysis of Architectural Variants for Auditable Blockchain-based Private Data Sharing Proceedings Article
In: Proceedings of the 34th ACM/SIGAPP Symposium on Applied Computing, pp. 346–354, ACM, Limassol, Cyprus, 2019, ISBN: 978-1-4503-5933-7.
Abstract | Links | BibTeX | Tags:
@inproceedings{19:sac:blockchain,
title = {Analysis of Architectural Variants for Auditable Blockchain-based Private Data Sharing},
author = {Vincent Reniers and Dimitri Van Landuyt and Paolo Viviani and Bert Lagaisse and Riccardo Lombardi and Wouter Joosen},
url = {https://doi.acm.org/10.1145/3297280.3297316},
doi = {10.1145/3297280.3297316},
isbn = {978-1-4503-5933-7},
year = {2019},
date = {2019-01-01},
booktitle = {Proceedings of the 34th ACM/SIGAPP Symposium on Applied Computing},
pages = {346--354},
publisher = {ACM},
address = {Limassol, Cyprus},
series = {SAC '19},
abstract = {Many applications by design depend on costly trusted third-party auditors. One such example is the industrial application case of federated multi-disciplinary optimization (MDO), in which different organizations contribute to a complex engineering design effort. Although blockchain and distributed ledger technology (DLT) has strong potential in reducing the dependence on such intermediaries, the architectural complexity involved in designing a solution is daunting. In this paper, we analyze the architectural variants for decentralized private data sharing while guaranteeing auditability in terms of data access operations. Non-repudiation of actions taken by each party is a key requirement, as is availability of the shared data. The architectural variants analyzed focus on attaining:~(i)~confidential data exchange, (ii)~maintaining and governing access to the shared data, (iii)~providing data access auditability, (iv)~data validation or conflict resolution, and to a lesser degree (v)~transaction and identity privacy. We systematically enumerate architectural decisions at the levels of:~storage, policy-based file access control, data encryption methods, and auditability mechanisms for private data. This analysis is based on extensive assessment of the state of the art on decentralized private data access management using static or dynamic policies, and private data validation without exposing confidential information. The main contribution of this work is a comprehensive overview of architectural variants for decentralized control of private, encrypted data, and the involved trade-offs in terms of performance, auditable trust and security. These findings are validated in the context on the aforementioned industry case that involves federated multi-disciplinary optimization (MDO).},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
2018
Adriano Marques Garcia, Claudio Schepke, Alessandro Gonçalves Girardi, Sherlon Almeida Silva
Power Consumption of Parallel Programming Interfaces in Multicore Architectures: A Case Study Proceedings Article
In: 2018 Symposium on High Performance Computing Systems (WSCAD), pp. 77–83, 2018.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{GARCIA:WSCAD:18,
title = {Power Consumption of Parallel Programming Interfaces in Multicore Architectures: A Case Study},
author = {Adriano Marques Garcia and Claudio Schepke and Alessandro Gonçalves Girardi and Sherlon Almeida Silva},
url = {https://iris.unito.it/retrieve/cab823a1-a6f7-483f-929a-607a166e0e78/A_Case_Study___Adriano___IEEE.pdf},
doi = {10.1109/WSCAD.2018.00021},
year = {2018},
date = {2018-10-01},
booktitle = {2018 Symposium on High Performance Computing Systems (WSCAD)},
pages = {77--83},
abstract = {This paper presents a case study on the power consumption of different Parallel Programming Interfaces (PPIs) in multicore architectures. The study is based on the PAMPAR benchmark, which is composed of 11 algorithms implemented in PThreads, OpenMP, MPI-1 and MPI-2 (spawn) PPIs. The results show that there is no single best case that provides both better performance and low power consumption in the presented scenarios. However, PThreads and OpenMP achieve the best trade-offs between performance and power in most cases.},
keywords = {parallel},
pubstate = {published},
tppubtype = {inproceedings}
}
Claudia Misale, Maurizio Drocco, Guy Tremblay, Marco Aldinucci
PiCo: a Novel Approach to Stream Data Analytics Proceedings Article
In: Proc. of Euro-Par Workshops: 1st Intl. Workshop on Autonomic Solutions for Parallel and Distributed Data Stream Processing (Auto-DaSP 2017), Springer, Santiago de Compostela, Spain, 2018.
Abstract | Links | BibTeX | Tags: rephrase, toreador
@inproceedings{pico:autodasp:17,
title = {PiCo: a Novel Approach to Stream Data Analytics},
author = {Claudia Misale and Maurizio Drocco and Guy Tremblay and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/handle/2318/1659344/409520/autodasp.pdf},
doi = {10.1007/978-3-319-75178-8_10},
year = {2018},
date = {2018-08-01},
booktitle = {Proc. of Euro-Par Workshops: 1st Intl. Workshop on Autonomic Solutions for Parallel and Distributed Data Stream Processing (Auto-DaSP 2017)},
volume = {10659},
publisher = {Springer},
address = {Santiago de Compostela, Spain},
series = {LNCS},
abstract = {In this paper, we present a new C++ API with a fluent interface called PiCo (Pipeline Composition). PiCo's programming model aims at making easier the programming of data analytics applications while preserving or enhancing their performance. This is attained through three key design choices: 1) unifying batch and stream data access models, 2) decoupling processing from data layout, and 3) exploiting a stream-oriented, scalable, efficient C++11 runtime system. PiCo proposes a programming model based on pipelines and operators that are polymorphic with respect to data types in the sense that it is possible to re-use the same algorithms and pipelines on different data models (e.g., streams, lists, sets, etc.). Preliminary results show that PiCo can attain better performances in terms of execution times and hugely improve memory utilization when compared to Spark and Flink in both batch and stream processing.},
keywords = {rephrase, toreador},
pubstate = {published},
tppubtype = {inproceedings}
}
Gabriele Mencagli, Massimo Torquati, Fabio Lucattini, Salvatore Cuomo, Marco Aldinucci
Harnessing sliding-window execution semantics for parallel stream processing Journal Article
In: Journal of Parallel and Distributed Computing, vol. 116, pp. 74–88, 2018, ISSN: 0743-7315.
Abstract | Links | BibTeX | Tags: fastflow, rephrase
@article{17:slidingwindows:jpdc,
title = {Harnessing sliding-window execution semantics for parallel stream processing},
author = {Gabriele Mencagli and Massimo Torquati and Fabio Lucattini and Salvatore Cuomo and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/e27ce42c-1381-2581-e053-d805fe0acbaa/preprint-jpdc-2017.pdf},
doi = {10.1016/j.jpdc.2017.10.021},
issn = {0743-7315},
year = {2018},
date = {2018-06-01},
journal = {Journal of Parallel and Distributed Computing},
volume = {116},
pages = {74--88},
abstract = {According to the recent trend in data acquisition and processing technology, big data are increasingly available in the form of unbounded streams of elementary data items to be processed in real-time. In this paper we study in detail the paradigm of sliding windows, a well-known technique for approximated queries that update their results continuously as new fresh data arrive from the stream. In this work we focus on the relationship between the various existing sliding window semantics and the way the query processing is performed from the parallelism perspective. From this study two alternative parallel models are identified, each covering semantics with very precise properties. Each model is described in terms of its pros and cons, and parallel implementations in the FastFlow framework are analyzed by discussing the layout of the concurrent data structures used for the efficient windows representation in each model.},
keywords = {fastflow, rephrase},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Sergio Rabellino, Marco Pironti, Filippo Spiga, Paolo Viviani, Maurizio Drocco, Marco Guerzoni, Guido Boella, Marco Mellia, Paolo Margara, Idillio Drago, Roberto Marturano, Guido Marchetto, Elio Piccolo, Stefano Bagnasco, Stefano Lusso, Sara Vallero, Giuseppe Attardi, Alex Barchiesi, Alberto Colla, Fulvio Galeazzi
HPC4AI, an AI-on-demand federated platform endeavour Proceedings Article
In: ACM Computing Frontiers, Ischia, Italy, 2018.
Abstract | Links | BibTeX | Tags: hpc4ai, rephrase, toreador
@inproceedings{18:hpc4ai_acm_CF,
title = {HPC4AI, an AI-on-demand federated platform endeavour},
author = {Marco Aldinucci and Sergio Rabellino and Marco Pironti and Filippo Spiga and Paolo Viviani and Maurizio Drocco and Marco Guerzoni and Guido Boella and Marco Mellia and Paolo Margara and Idillio Drago and Roberto Marturano and Guido Marchetto and Elio Piccolo and Stefano Bagnasco and Stefano Lusso and Sara Vallero and Giuseppe Attardi and Alex Barchiesi and Alberto Colla and Fulvio Galeazzi},
url = {https://iris.unito.it/retrieve/handle/2318/1765596/689772/2018_hpc4ai_ACM_CF.pdf},
doi = {10.1145/3203217.3205340},
year = {2018},
date = {2018-05-01},
booktitle = {ACM Computing Frontiers},
address = {Ischia, Italy},
abstract = {In April 2018, under the auspices of the POR-FESR 2014-2020 program of Italian Piedmont Region, the Turin's Centre on High-Performance Computing for Artificial Intelligence (HPC4AI) was funded with a capital investment of 4.5M€ and it began its deployment. HPC4AI aims to facilitate scientific research and engineering in the areas of Artificial Intelligence and Big Data Analytics. HPC4AI will specifically focus on methods for the on-demand provisioning of AI and BDA Cloud services to the regional and national industrial community, which includes the large regional ecosystem of Small-Medium Enterprises (SMEs) active in many different sectors such as automotive, aerospace, mechatronics, manufacturing, health and agrifood.},
keywords = {hpc4ai, rephrase, toreador},
pubstate = {published},
tppubtype = {inproceedings}
}
Paolo Viviani, Maurizio Drocco, Marco Aldinucci
Scaling Dense Linear Algebra on Multicore and Beyond: a Survey Proceedings Article
In: Proc. of 26th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP), IEEE, Cambridge, United Kingdom, 2018.
Abstract | Links | BibTeX | Tags:
@inproceedings{svd:pdp:18,
  author    = {Paolo Viviani and Maurizio Drocco and Marco Aldinucci},
  title     = {Scaling Dense Linear Algebra on Multicore and Beyond: a Survey},
  booktitle = {Proc. of 26th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP)},
  publisher = {IEEE},
  address   = {Cambridge, United Kingdom},
  year      = {2018},
  date      = {2018-01-01},
  doi       = {10.1109/PDP2018.2018.00122},
  url       = {https://iris.unito.it/retrieve/handle/2318/1659340/387685/preprint_aperto.pdf},
  abstract  = {The present trend in big-data analytics is to exploit algorithms with (sub-)linear time complexity, in this sense it is usually worth to investigate if the available techniques can be approximated to reach an affordable complexity. However, there are still problems in data science and engineering that involve algorithms with higher time complexity, like matrix inversion or Singular Value Decomposition (SVD). This work presents the results of a survey that reviews a number of tools meant to perform dense linear algebra at ``Big Data'' scale: namely, the proposed approach aims first to define a feasibility boundary for the problem size of shared-memory matrix factorizations, then to understand whether it is convenient to employ specific tools meant to scale out such dense linear algebra tasks on distributed platforms. The survey will eventually discuss the presented tools from the point of view of domain experts (data scientist, engineers), hence focusing on the trade-off between usability and performance.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Fabio Tordini, Marco Aldinucci, Paolo Viviani, Ivan Merelli, Pietro Liò
Scientific Workflows on Clouds with Heterogeneous and Preemptible Instances Proceedings Article
In: Proc. of the Intl. Conference on Parallel Computing, ParCo 2017, 12-15 September 2017, Bologna, Italy, IOS Press, 2018.
Abstract | Links | BibTeX | Tags: rephrase
@inproceedings{18:parco:workflow,
  author    = {Fabio Tordini and Marco Aldinucci and Paolo Viviani and Ivan Merelli and Pietro Liò},
  title     = {Scientific Workflows on Clouds with Heterogeneous and Preemptible Instances},
  booktitle = {Proc. of the Intl. Conference on Parallel Computing, ParCo 2017, 12-15 September 2017, Bologna, Italy},
  series    = {Advances in Parallel Computing},
  publisher = {IOS Press},
  year      = {2018},
  date      = {2018-01-01},
  doi       = {10.3233/978-1-61499-843-3-605},
  url       = {https://iris.unito.it/retrieve/handle/2318/1658510/385411/main.pdf},
  abstract  = {The cloud environment is increasingly appealing for the HPC community, which has always dealt with scientific applications. However, there is still some skepticism about moving from traditional physical infrastructures to virtual HPC clusters. This mistrusting probably originates from some well known factors, including the effective economy of using cloud services, data and software availability, and the longstanding matter of data stewardship. In this work we discuss the design of a framework (based on Mesos) aimed at achieving a cost-effective and efficient usage of heterogeneous Processing Elements (PEs) for workflow execution, which supports hybrid cloud bursting over preemptible cloud Virtual Machines.},
  keywords  = {rephrase},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Paolo Viviani, Marco Aldinucci, Roberto d'Ippolito, Jan Lemeire, Dean Vucinic
A Flexible Numerical Framework for Engineering—A Response Surface Modelling Application Book Chapter
In: Improved Performance of Materials: Design and Experimental Approaches, pp. 93–106, Springer International Publishing, Cham, 2018, ISBN: 978-3-319-59590-0.
Abstract | Links | BibTeX | Tags: repara, rephrase
@inbook{17:viviani:advstruct,
title = {A Flexible Numerical Framework for Engineering—A Response Surface Modelling Application},
author = {Paolo Viviani and Marco Aldinucci and Roberto d'Ippolito and Jan Lemeire and Dean Vucinic},
doi = {10.1007/978-3-319-59590-0_9},
isbn = {978-3-319-59590-0},
year = {2018},
date = {2018-01-01},
booktitle = {Improved Performance of Materials: Design and Experimental Approaches},
pages = {93--106},
publisher = {Springer International Publishing},
address = {Cham},
abstract = {This work presents an innovative approach adopted for the development of a new numerical software framework for accelerating dense linear algebra calculations and its application within an engineering context. In particular, response surface models (RSM) are a key tool to reduce the computational effort involved in engineering design processes like design optimization. However, RSMs may prove to be too expensive to be computed when the dimensionality of the system and/or the size of the dataset to be synthesized is significantly high or when a large number of different response surfaces has to be calculated in order to improve the overall accuracy (e.g. like when using ensemble modelling techniques). On the other hand, the potential of modern hybrid hardware (e.g. multicore, GPUs) is not exploited by current engineering tools, while they can lead to a significant performance improvement. To fill this gap, a software framework is being developed that enables the hybrid and scalable acceleration of the linear algebra core for engineering applications and especially of RSMs calculations with a user-friendly syntax that allows good portability between different hardware architectures, with no need of specific expertise in parallel programming and accelerator technology. The effectiveness of this framework is shown by comparing an accelerated code to a single-core calculation of a radial basis function RSM on some benchmark datasets. This approach is then validated within a real-life engineering application and the achievements are presented and discussed.},
keywords = {repara, rephrase},
pubstate = {published},
tppubtype = {inbook}
}
Marco Aldinucci, Marco Danelutto, Maurizio Drocco, Peter Kilpatrick, Claudia Misale, Guilherme Peretti Pezzi, Massimo Torquati
A Parallel Pattern for Iterative Stencil + Reduce Journal Article
In: Journal of Supercomputing, vol. 74, no. 11, pp. 5690–5705, 2018.
Abstract | Links | BibTeX | Tags: HPC, repara, rephrase
@article{16:stencilreduce:jsupe,
title = {A Parallel Pattern for Iterative Stencil + Reduce},
author = {Marco Aldinucci and Marco Danelutto and Maurizio Drocco and Peter Kilpatrick and Claudia Misale and Guilherme Peretti Pezzi and Massimo Torquati},
url = {https://iris.unito.it/retrieve/0716fc42-53d7-48c0-9469-697aabfe7759/jspaper.pdf},
doi = {10.1007/s11227-016-1871-z},
year = {2018},
date = {2018-01-01},
journal = {Journal of Supercomputing},
volume = {74},
number = {11},
pages = {5690--5705},
abstract = {We advocate the Loop-of-stencil-reduce pattern as a means of simplifying the implementation of data-parallel programs on heterogeneous multi-core platforms. Loop-of-stencil-reduce is general enough to subsume map, reduce, map-reduce, stencil, stencil-reduce, and, crucially, their usage in a loop in both data-parallel and streaming applications, or a combination of both. The pattern makes it possible to deploy a single stencil computation kernel on different GPUs. We discuss the implementation of Loop-of-stencil-reduce in FastFlow, a framework for the implementation of applications based on the parallel patterns. Experiments are presented to illustrate the use of Loop-of-stencil-reduce in developing data-parallel kernels running on heterogeneous systems.},
keywords = {HPC, repara, rephrase},
pubstate = {published},
tppubtype = {article}
}
Paolo Viviani, Maurizio Drocco, Marco Aldinucci
Pushing the boundaries of parallel Deep Learning - A practical approach Journal Article
In: CoRR, vol. abs/1806.09528, 2018.
Abstract | Links | BibTeX | Tags:
@article{18:arxiv:deeplearning,
title = {Pushing the boundaries of parallel Deep Learning - A practical approach},
author = {Paolo Viviani and Maurizio Drocco and Marco Aldinucci},
url = {https://arxiv.org/pdf/1806.09528},
eprint = {1806.09528},
eprinttype = {arXiv},
year = {2018},
date = {2018-01-01},
journal = {CoRR},
volume = {abs/1806.09528},
abstract = {This work aims to assess the state of the art of data parallel deep neural network training, trying to identify potential research tracks to be exploited for performance improvement. Beside, it presents a design for a practical C++ library dedicated at implementing and unifying the current state of the art methodologies for parallel training in a performance-conscious framework, allowing the user to explore novel strategies without departing significantly from its usual work-flow.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Claudia Misale, Maurizio Drocco, Guy Tremblay, Alberto R. Martinelli, Marco Aldinucci
PiCo: High-performance data analytics pipelines in modern C++ Journal Article
In: Future Generation Computer Systems, vol. 87, pp. 392–403, 2018.
Abstract | Links | BibTeX | Tags: fastflow, HPC, toreador
@article{18:fgcs:pico,
title = {PiCo: High-performance data analytics pipelines in modern C++},
author = {Claudia Misale and Maurizio Drocco and Guy Tremblay and Alberto R. Martinelli and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/handle/2318/1668444/414280/fgcs_pico.pdf},
doi = {10.1016/j.future.2018.05.030},
year = {2018},
date = {2018-01-01},
journal = {Future Generation Computer Systems},
volume = {87},
pages = {392--403},
abstract = {In this paper, we present a new C++ API with a fluent interface called PiCo (Pipeline Composition). PiCo's programming model aims at making easier the programming of data analytics applications while preserving or enhancing their performance. This is attained through three key design choices: (1) unifying batch and stream data access models, (2) decoupling processing from data layout, and (3) exploiting a stream-oriented, scalable, efficient C++11 runtime system. PiCo proposes a programming model based on pipelines and operators that are polymorphic with respect to data types in the sense that it is possible to reuse the same algorithms and pipelines on different data models (e.g., streams, lists, sets, etc.). Preliminary results show that PiCo, when compared to Spark and Flink, can attain better performances in terms of execution times and can hugely improve memory utilization, both for batch and stream processing.},
keywords = {fastflow, HPC, toreador},
pubstate = {published},
tppubtype = {article}
}
2017
Salvatore Cuomo, Marco Aldinucci, Massimo Torquati
Guest Editorial for Programming Models and Algorithms for Data Analysis in HPC Systems Journal Article
In: International Journal of Parallel Programming, pp. 1–3, 2017, ISSN: 0885-7458, (Editorial).
Abstract | Links | BibTeX | Tags: HPC
@article{17:ijpp:cuomo:editorial,
title = {Guest Editorial for Programming Models and Algorithms for Data Analysis in HPC Systems},
author = {Salvatore Cuomo and Marco Aldinucci and Massimo Torquati},
url = {https://doi.org/10.1007/s10766-017-0531-0},
doi = {10.1007/s10766-017-0531-0},
issn = {0885-7458},
year = {2017},
date = {2017-10-01},
journal = {International Journal of Parallel Programming},
pages = {1--3},
abstract = {Performance is still the hottest keyword in parallel and distributed systems: performance evaluation, design for performance, performance portability and scalability are just a few of the many possible declinations that nowadays are of paramount scientific importance. To tackle these challenges, system architects, applications programmers and data center managers need methodological tools to fit at best the overall workload and the available architecture, maximizing the overall performances and minimizing overheads, energy consumption or idle time while application developers mainly aim at algorithmic and software oriented performances. Proper methodologies for modeling and analysis are the way to turn complexity into opportunities.
This Special Issue of the International Journal of Parallel Programming welcomes papers that present practical and methodological approaches to analytical and simulative performance evaluation for architecturally complex systems and high-performance parallel and computing algorithm. Successful contributions have been done on specific technologies, applications and innovative solutions to system specifications and algorithmic schemes both.},
note = {Editorial},
keywords = {HPC},
pubstate = {published},
tppubtype = {article}
}
This Special Issue of the International Journal of Parallel Programming welcomes papers that present practical and methodological approaches to analytical and simulative performance evaluation for architecturally complex systems and high-performance parallel and computing algorithm. Successful contributions have been done on specific technologies, applications and innovative solutions to system specifications and algorithmic schemes both.
Maurizio Drocco
Parallel Programming with Global Asynchronous Memory: Models, C++ APIs and Implementations PhD Thesis
Computer Science Department, University of Torino, 2017.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase, repara, rephrase, toreador
@phdthesis{17:gam:drocco:thesis,
title = {Parallel Programming with Global Asynchronous Memory: Models, C++ APIs and Implementations},
author = {Maurizio Drocco},
url = {https://zenodo.org/record/1037585/files/Drocco_phd_thesis.pdf},
doi = {10.5281/zenodo.1037585},
year = {2017},
date = {2017-10-01},
school = {Computer Science Department, University of Torino},
abstract = {In the realm of High Performance Computing (HPC), message passing has been the programming paradigm of choice for over twenty years. The durable MPI (Message Passing Interface) standard, with send/receive communication, broadcast, gather/scatter, and reduction collectives is still used to construct parallel programs where each communication is orchestrated by the developer-based precise knowledge of data distribution and overheads; collective communications simplify the orchestration but might induce excessive synchronization. Early attempts to bring shared-memory programming model—with its programming advantages—to distributed computing, referred as the Distributed Shared Memory (DSM) model, faded away; one of the main issue was to combine performance and programmability with the memory consistency model. The recently proposed Partitioned Global Address Space (PGAS) model is a modern revamp of DSM that exposes data placement to enable optimizations based on locality, but it still addresses (simple) data-parallelism only and it relies on expensive sharing protocols. We advocate an alternative programming model for distributed computing based on a Global Asynchronous Memory (GAM), aiming to avoid coherency and consistency problems rather than solving them. We materialize GAM by designing and implementing a distributed smart pointers library, inspired by C++ smart pointers. In this model, public and private pointers (resembling C++ shared and unique pointers, respectively) are moved around instead of messages (i.e., data), thus alleviating the user from the burden of minimizing transfers. On top of smart pointers, we propose a high-level C++ template library for writing applications in terms of dataflow-like networks, namely GAM nets, consisting of stateful processors exchanging pointers in fully asynchronous fashion.
We demonstrate the validity of the proposed approach, from the expressiveness perspective, by showing how GAM nets can be exploited to implement higher-level parallel programming models, such as data and task parallelism. As for the performance perspective, the execution of two non-toy benchmarks on a number of different small-scale HPC clusters exhibits both close-to-ideal scalability and negligible overhead with respect to state-of-the-art benchmark implementations. For instance, the GAM implementation of a high-quality video restoration filter sustains a 100 fps throughput over 70%-noisy high-quality video streams on a 4-node cluster of Graphics Processing Units (GPUs), with minimal programming effort.},
keywords = {fastflow, paraphrase, repara, rephrase, toreador},
pubstate = {published},
tppubtype = {phdthesis}
}
Paula Severi, Luca Padovani, Emilio Tuosto, Mariangiola Dezani-Ciancaglini
On Sessions and Infinite Data Journal Article
In: Logical Methods in Computer Science, vol. 13, no. 2, 2017.
Links | BibTeX | Tags: rephrase, semantics
@article{lmcs:3725,
title = {On Sessions and Infinite Data},
author = {Paula Severi and Luca Padovani and Emilio Tuosto and Mariangiola Dezani-Ciancaglini},
url = {http://lmcs.episciences.org/3725},
doi = {10.23638/LMCS-13(2:9)2017},
year = {2017},
date = {2017-06-01},
journal = {Logical Methods in Computer Science},
volume = {13},
number = {2},
keywords = {rephrase, semantics},
pubstate = {published},
tppubtype = {article}
}
Maurizio Drocco, Claudia Misale, Guy Tremblay, Marco Aldinucci
A Formal Semantics for Data Analytics Pipelines Technical Report
Computer Science Department, University of Torino 2017, (https://arxiv.org/abs/1705.01629).
Links | BibTeX | Tags: rephrase, toreador
@techreport{17:drocco:techreport,
  author      = {Maurizio Drocco and Claudia Misale and Guy Tremblay and Marco Aldinucci},
  title       = {A Formal Semantics for Data Analytics Pipelines},
  institution = {Computer Science Department, University of Torino},
  year        = {2017},
  date        = {2017-05-01},
  doi         = {10.5281/zenodo.571802},
  url         = {https://doi.org/10.5281/zenodo.571802},
  note        = {https://arxiv.org/abs/1705.01629},
  keywords    = {rephrase, toreador},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Claudia Misale
PiCo: A Domain-Specific Language for Data Analytics Pipelines PhD Thesis
Computer Science Department, University of Torino, 2017.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase, repara, rephrase, toreador
@phdthesis{17:pico:misale:thesis,
title = {PiCo: A Domain-Specific Language for Data Analytics Pipelines},
author = {Claudia Misale},
url = {https://iris.unito.it/retrieve/handle/2318/1633743/320170/Misale_thesis.pdf},
doi = {10.5281/zenodo.579753},
year = {2017},
date = {2017-05-01},
school = {Computer Science Department, University of Torino},
abstract = {In the world of Big Data analytics, there is a series of tools aiming at simplifying programming applications to be executed on clusters. Although each tool claims to provide better programming, data and execution models—for which only informal (and often confusing) semantics is generally provided—all share a common underlying model, namely, the Dataflow model. Using this model as a starting point, it is possible to categorize and analyze almost all aspects about Big Data analytics tools from a high level perspective. This analysis can be considered as a first step toward a formal model to be exploited in the design of a (new) framework for Big Data analytics. By putting clear separations between all levels of abstraction (i.e., from the runtime to the user API), it is easier for a programmer or software designer to avoid mixing low level with high level aspects, as we are often used to see in state-of-the-art Big Data analytics frameworks.
From the user-level perspective, we think that a clearer and simple semantics is preferable, together with a strong separation of concerns. For this reason, we use the Dataflow model as a starting point to build a programming environment with a simplified programming model implemented as a Domain-Specific Language, that is on top of a stack of layers that build a prototypical framework for Big Data analytics.
The contribution of this thesis is twofold: first, we show that the proposed model is (at least) as general as existing batch and streaming frameworks (e.g., Spark, Flink, Storm, Google Dataflow), thus making it easier to understand high-level data-processing applications written in such frameworks. As result of this analysis, we provide a layered model that can represent tools and applications following the Dataflow paradigm and we show how the analyzed tools fit in each level.
Second, we propose a programming environment based on such layered model in the form of a Domain-Specific Language (DSL) for processing data collections, called PiCo (Pipeline Composition). The main entity of this programming model is the Pipeline, basically a DAG-composition of processing elements. This model is intended to give the user an unique interface for both stream and batch processing, hiding completely data management and focusing only on operations, which are represented by Pipeline stages. Our DSL will be built on top of the FastFlow library, exploiting both shared and distributed parallelism, and implemented in C++11/14 with the aim of porting C++ into the Big Data world.},
keywords = {fastflow, paraphrase, repara, rephrase, toreador},
pubstate = {published},
tppubtype = {phdthesis}
}
From the user-level perspective, we think that a clearer and simple semantics is preferable, together with a strong separation of concerns. For this reason, we use the Dataflow model as a starting point to build a programming environment with a simplified programming model implemented as a Domain-Specific Language, that is on top of a stack of layers that build a prototypical framework for Big Data analytics.
The contribution of this thesis is twofold: first, we show that the proposed model is (at least) as general as existing batch and streaming frameworks (e.g., Spark, Flink, Storm, Google Dataflow), thus making it easier to understand high-level data-processing applications written in such frameworks. As result of this analysis, we provide a layered model that can represent tools and applications following the Dataflow paradigm and we show how the analyzed tools fit in each level.
Second, we propose a programming environment based on such layered model in the form of a Domain-Specific Language (DSL) for processing data collections, called PiCo (Pipeline Composition). The main entity of this programming model is the Pipeline, basically a DAG-composition of processing elements. This model is intended to give the user an unique interface for both stream and batch processing, hiding completely data management and focusing only on operations, which are represented by Pipeline stages. Our DSL will be built on top of the FastFlow library, exploiting both shared and distributed parallelism, and implemented in C++11/14 with the aim of porting C++ into the Big Data world.
Paolo Viviani, Massimo Torquati, Marco Aldinucci, Roberto d'Ippolito
Multiple back-end support for the Armadillo linear algebra interface Proceedings Article
In: Proc. of the 32nd ACM Symposium on Applied Computing (SAC), pp. 1566–1573, Marrakesh, Morocco, 2017.
Abstract | Links | BibTeX | Tags: HPC, repara, rephrase
@inproceedings{17:sac:armadillo,
title = {Multiple back-end support for the Armadillo linear algebra interface},
author = {Paolo Viviani and Massimo Torquati and Marco Aldinucci and Roberto d'Ippolito},
url = {https://iris.unito.it/retrieve/handle/2318/1626229/299089/armadillo_4aperto.pdf},
year = {2017},
date = {2017-04-01},
booktitle = {Proc. of the 32nd ACM Symposium on Applied Computing (SAC)},
pages = {1566--1573},
address = {Marrakesh, Morocco},
abstract = {The Armadillo C++ library provides programmers with a high-level Matlab-like syntax for linear algebra. Its design aims at providing a good balance between speed and ease of use. It can be linked with different back-ends, i.e. different LAPACK-compliant libraries. In this work we present a novel run-time support of Armadillo, which gracefully extends mainstream implementation to enable back-end switching without recompilation and multiple back-end support. The extension is specifically designed to not affect Armadillo class template prototypes, thus to be easily interoperable with future evolutions of the Armadillo library itself. The proposed software stack is then tested for functionality and performance against a kernel code extracted from an industrial application.},
keywords = {HPC, repara, rephrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Daniele De Sensi, Gabriele Mencagli, Massimo Torquati
Towards Power-Aware Data Pipelining on Multicores Proceedings Article
In: Proceedings of the 10th International Symposium on High-Level Parallel Programming and Applications, Valladolid, Spain, 2017.
Abstract | Links | BibTeX | Tags: fastflow, rephrase
@inproceedings{17:hlpp:powerstream,
title = {Towards Power-Aware Data Pipelining on Multicores},
author = {Marco Aldinucci and Marco Danelutto and Daniele De Sensi and Gabriele Mencagli and Massimo Torquati},
url = {https://iris.unito.it/retrieve/handle/2318/1644982/351415/17_HLPP_powerstream.pdf},
year = {2017},
date = {2017-01-01},
booktitle = {Proceedings of the 10th International Symposium on High-Level Parallel Programming and Applications},
address = {Valladolid, Spain},
abstract = {Power consumption management has become a major concern in software development. Continuous streaming computations are usually composed by different modules, exchanging data through shared message queues. The selection of the algorithm used to access such queues (i.e., the concurrency control) is a critical aspect for both performance and power consumption. In this paper, we describe the design of an adaptive concurrency control algorithm for implementing power-efficient communications on shared memory multicores. The algorithm provides the throughput offered by a nonblocking implementation and the power efficiency of a blocking protocol. We demonstrate that our algorithm reduces the power consumption of data streaming computations without decreasing their throughput.},
keywords = {fastflow, rephrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Claudia Misale, Maurizio Drocco, Marco Aldinucci, Guy Tremblay
A Comparison of Big Data Frameworks on a Layered Dataflow Model Journal Article
In: Parallel Processing Letters, vol. 27, no. 01, pp. 1–20, 2017.
Abstract | Links | BibTeX | Tags: rephrase, toreador
@article{17:bigdatasurvey:PPL,
title = {A Comparison of Big Data Frameworks on a Layered Dataflow Model},
author = {Claudia Misale and Maurizio Drocco and Marco Aldinucci and Guy Tremblay},
url = {https://iris.unito.it/retrieve/handle/2318/1626287/303421/preprintPPL_4aperto.pdf},
doi = {10.1142/S0129626417400035},
year = {2017},
date = {2017-01-01},
journal = {Parallel Processing Letters},
volume = {27},
number = {01},
pages = {1--20},
abstract = {In the world of Big Data analytics, there is a series of tools aiming at simplifying programming applications to be executed on clusters. Although each tool claims to provide better programming, data and execution models, for which only informal (and often confusing) semantics is generally provided, all share a common underlying model, namely, the Dataflow model. The Dataflow model we propose shows how various tools share the same expressiveness at different levels of abstraction. The contribution of this work is twofold: first, we show that the proposed model is (at least) as general as existing batch and streaming frameworks (e.g., Spark, Flink, Storm), thus making it easier to understand high-level data-processing applications written in such frameworks. Second, we provide a layered model that can represent tools and applications following the Dataflow paradigm and we show how the analyzed tools fit in each level.},
keywords = {rephrase, toreador},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick, Massimo Torquati
FastFlow: high-level and efficient streaming on multi-core Book Chapter
In: Pllana, Sabri, Xhafa, Fatos (Ed.): Programming Multi-core and Many-core Computing Systems, Chapter 13, pp. 261–280, John Wiley & Sons, Ltd, 2017, ISBN: 9781119332015.
Abstract | Links | BibTeX | Tags: fastflow
@inbook{ff:wileybook:17,
title = {FastFlow: high-level and efficient streaming on multi-core},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick and Massimo Torquati},
editor = {Sabri Pllana and Fatos Xhafa},
url = {http://calvados.di.unipi.it/storage/paper_files/2011_FF_tutorial-draft.pdf},
doi = {10.1002/9781119332015.ch13},
isbn = {9781119332015},
year = {2017},
date = {2017-01-01},
booktitle = {Programming Multi-core and Many-core Computing Systems},
pages = {261--280},
publisher = {John Wiley \& Sons, Ltd},
chapter = {13},
series = {Parallel and Distributed Computing},
abstract = {This chapter first outlines FastFlow design and then shows sample use of the FastFlow programming environment together with performance results achieved on various state-of-the-art multicore architectures. The FastFlow framework has been designed according to four foundational principles: layered design; efficiency in base mechanisms; support for stream parallelism; and a programming model based on design pattern/algorithmic skeleton concepts. The core of the FastFlow framework provides an efficient implementation of single-producer-single-consumer (SPSC) first in-first out (FIFO) queues. The next tier up extends from one-to-one queues to one-to-many, many-to-one, and many-to-many synchronizations and data flows, which are implemented using only SPSC queues and arbiter threads, thus providing lock-free and wait-free arbitrary dataflow graphs. When designing and implementing new parallel applications using FastFlow, programmers instantiate patterns provided by FastFlow to adapt them to the specific needs of the application at hand. The chapter demonstrates how the principal FastFlow patterns may be used in a parallel application.},
keywords = {fastflow},
pubstate = {published},
tppubtype = {inbook}
}
Fabio Tordini, Maurizio Drocco, Claudia Misale, Luciano Milanesi, Pietro Liò, Ivan Merelli, Massimo Torquati, Marco Aldinucci
NuChart-II: the road to a fast and scalable tool for Hi-C data analysis Journal Article
In: International Journal of High Performance Computing Applications, vol. 31, no. 3, pp. 196–211, 2017.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow, repara, rephrase
@article{16:ijhpca:nuchart,
title = {NuChart-II: the road to a fast and scalable tool for Hi-C data analysis},
author = {Fabio Tordini and Maurizio Drocco and Claudia Misale and Luciano Milanesi and Pietro Liò and Ivan Merelli and Massimo Torquati and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/handle/2318/1607126/238747/main.pdf},
doi = {10.1177/1094342016668567},
year = {2017},
date = {2017-01-01},
journal = {International Journal of High Performance Computing Applications},
volume = {31},
number = {3},
pages = {196--211},
abstract = {Recent advances in molecular biology and bioinformatics techniques brought to an explosion of the information about the spatial organisation of the DNA in the nucleus of a cell. High-throughput molecular biology techniques provide a genome-wide capture of the spatial organization of chromosomes at unprecedented scales, which permit to identify physical interactions between genetic elements located throughout a genome. Recent results have shown that there is a large correlation between co-localization and co-regulation of genes, but these important information are hampered by the lack of biologists-friendly analysis and visualisation software. In this work we present NuChart-II, an efficient and highly optimized tool for genomic data analysis that provides a gene-centric, graph-based representation of genomic information. While designing NuChart-II we addressed several common issues in the parallelisation of memory bound algorithms for shared-memory systems. With performance and usability in mind, NuChart-II is a R package that embeds a C++ engine: computing capabilities and memory hierarchy of multi-core architectures are fully exploited, while the versatile R environment for statistical analysis and data visualisation rises the level of abstraction and permits to orchestrate analysis and visualisation of genomic data.},
keywords = {bioinformatics, fastflow, repara, rephrase},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Stefano Bagnasco, Stefano Lusso, Paolo Pasteris, Sergio Rabellino
OCCAM: a flexible, multi-purpose and extendable HPC cluster Proceedings Article
In: Journal of Physics: Conf. Series (CHEP 2016), pp. 082039, San Francisco, USA, 2017.
Abstract | Links | BibTeX | Tags: c3s, HPC
@inproceedings{16:occam:chep,
title = {OCCAM: a flexible, multi-purpose and extendable HPC cluster},
author = {Marco Aldinucci and Stefano Bagnasco and Stefano Lusso and Paolo Pasteris and Sergio Rabellino},
url = {http://iopscience.iop.org/article/10.1088/1742-6596/898/8/082039/meta},
doi = {10.1088/1742-6596/898/8/082039},
year = {2017},
date = {2017-01-01},
booktitle = {Journal of Physics: Conf. Series (CHEP 2016)},
volume = {898},
number = {8},
pages = {082039},
address = {San Francisco, USA},
abstract = {Obtaining CPU cycles on an HPC cluster is nowadays relatively simple and sometimes even cheap for academic institutions. However, in most of the cases providers of HPC services would not allow changes on the configuration, implementation of special features or a lower-level control on the computing infrastructure and networks, for example for testing new computing patterns or conducting research on HPC itself. The variety of use cases proposed by several departments of the University of Torino, including ones from solid-state chemistry, high-energy physics, computer science, big data analytics, computational biology, genomics and many others, called for different and sometimes conflicting configurations; furthermore, several R\&D activities in the field of scientific computing, with topics ranging from GPU acceleration to Cloud Computing technologies, needed a platform to be carried out on. The Open Computing Cluster for Advanced data Manipulation (OCCAM) is a multi-purpose flexible HPC cluster designed and operated by a collaboration between the University of Torino and the Torino branch of the Istituto Nazionale di Fisica Nucleare. It is aimed at providing a flexible, reconfigurable and extendable infrastructure to cater to a wide range of different scientific computing needs, as well as a platform for R\&D activities on computational technologies themselves. Extending it with novel architecture CPU, accelerator or hybrid microarchitecture (such as forthcoming Intel Xeon Phi Knights Landing) should be as simple as plugging a node in a rack.
The initial system counts slightly more than 1100 cpu cores and includes different types of computing nodes (standard dual-socket nodes, large quad-sockets nodes with 768 GB RAM, and multi-GPU nodes) and two separate disk storage subsystems: a smaller high-performance scratch area, based on the Lustre file system, intended for direct computational I/O and a larger one, of the order of 1PB, to archive near-line data for archival purposes. All the components of the system are interconnected through a 10Gb/s Ethernet layer with one-level topology and an InfiniBand FDR 56Gbps layer in fat-tree topology. A system of this kind, heterogeneous and reconfigurable by design, poses a number of challenges related to the frequency at which heterogeneous hardware resources might change their availability and shareability status, which in turn affect methods and means to allocate, manage, optimize, bill, monitor VMs, virtual farms, jobs, interactive bare-metal sessions, etc. This poster describes some of the use cases that prompted the design and construction of the HPC cluster, its architecture and a first characterization of its performance by some synthetic benchmark tools and a few realistic use-case tests.},
keywords = {c3s, HPC},
pubstate = {published},
tppubtype = {inproceedings}
}
Concetto Spampinato, Simone Palazzo, Daniela Giordano, Marco Aldinucci, Rosalia Leonardi
Deep learning for automated skeletal bone age assessment in X-ray images Journal Article
In: Medical Image Analysis, vol. 36, pp. 41–51, 2017.
Abstract | Links | BibTeX | Tags: HPC
@article{17:deepx:conce,
title = {Deep learning for automated skeletal bone age assessment in X-ray images},
author = {Concetto Spampinato and Simone Palazzo and Daniela Giordano and Marco Aldinucci and Rosalia Leonardi},
url = {https://iris.unito.it/retrieve/e27ce42b-5743-2581-e053-d805fe0acbaa/main.pdf},
doi = {10.1016/j.media.2016.10.010},
year = {2017},
date = {2017-01-01},
journal = {Medical Image Analysis},
volume = {36},
pages = {41--51},
abstract = {Skeletal bone age assessment is a common clinical practice to investigate endocrinology, genetic and growth disorders in children. It is generally performed by radiological examination of the left hand by using either the Greulich and Pyle (G\&P) method or the Tanner–Whitehouse (TW) one. However, both clinical procedures show several limitations, from the examination effort of radiologists to (most importantly) significant intra- and inter-operator variability. To address these problems, several automated approaches (especially relying on the TW method) have been proposed; nevertheless, none of them has been proved able to generalize to different races, age ranges and genders. In this paper, we propose and test several deep learning approaches to assess skeletal bone age automatically; the results showed an average discrepancy between manual and automatic evaluation of about 0.8 years, which is state-of-the-art performance. Furthermore, this is the first automated skeletal bone age assessment work tested on a public dataset and for all age ranges, races and genders, for which the source code is available, thus representing an exhaustive baseline for future research in the field. Beside the specific application scenario, this paper aims at providing answers to more general questions about deep learning on medical images: from the comparison between deep-learned features and manually-crafted ones, to the usage of deep-learning methods trained on general imagery for medical problems, to how to train a CNN with few images.},
keywords = {HPC},
pubstate = {published},
tppubtype = {article}
}
Mario Coppo, Mariangiola Dezani-Ciancaglini, Alejandro Díaz-Caro, Ines Margaria, Maddalena Zacchi
Retractions in Intersection Types Proceedings Article
In: Kobayashi, Naoki (Ed.): ITRS'16, pp. 31–47, 2017.
Links | BibTeX | Tags: rephrase, semantics
@inproceedings{CDMZ16,
title = {Retractions in Intersection Types},
author = {Mario Coppo and Mariangiola Dezani-Ciancaglini and Alejandro Díaz-Caro and Ines Margaria and Maddalena Zacchi},
editor = {Naoki Kobayashi},
url = {http://www.di.unito.it/~dezani/papers/cddmz.pdf},
doi = {10.4204/EPTCS.242.5},
year = {2017},
date = {2017-01-01},
booktitle = {ITRS'16},
volume = {242},
pages = {31--47},
series = {EPTCS},
keywords = {rephrase, semantics},
pubstate = {published},
tppubtype = {inproceedings}
}
Joshua Romero, Everett H. Phillips, Gregory Ruetsch, Massimiliano Fatica, Filippo Spiga, Paolo Giannozzi
A Performance Study of Quantum ESPRESSO's PWscf Code on Multi-core and GPU Systems Proceedings Article
In: High Performance Computing Systems. Performance Modeling, Benchmarking, and Simulation - 8th International Workshop, PMBS 2017, Denver, CO, USA, November 13, 2017, Proceedings, pp. 67–87, 2017.
@inproceedings{DBLP:conf/sc/RomeroPRFSG17,
title = {A Performance Study of Quantum ESPRESSO's PWscf Code on Multi-core and GPU Systems},
author = {Joshua Romero and Everett H. Phillips and Gregory Ruetsch and Massimiliano Fatica and Filippo Spiga and Paolo Giannozzi},
url = {https://doi.org/10.1007/978-3-319-72971-8_4},
doi = {10.1007/978-3-319-72971-8_4},
year = {2017},
date = {2017-01-01},
booktitle = {High Performance Computing Systems. Performance Modeling, Benchmarking, and Simulation - 8th International Workshop, PMBS 2017, Denver, CO, USA, November 13, 2017, Proceedings},
pages = {67--87},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Wissam Abu Ahmad, Andrea Bartolini, Francesco Beneventi, Luca Benini, Andrea Borghesi, Marco Cicala, Privato Forestieri, Cosimo Gianfreda, Daniele Gregori, Antonio Libri, Filippo Spiga, Simone Tinti
Design of an Energy Aware Petaflops Class High Performance Cluster Based on Power Architecture Proceedings Article
In: 2017 IEEE International Parallel and Distributed Processing Symposium Workshops, IPDPS Workshops 2017, Orlando / Buena Vista, FL, USA, May 29 - June 2, 2017, pp. 964–973, 2017.
@inproceedings{DBLP:conf/ipps/AhmadBBBBCFGGLS17,
title = {Design of an Energy Aware Petaflops Class High Performance Cluster Based on Power Architecture},
author = {Wissam Abu Ahmad and Andrea Bartolini and Francesco Beneventi and Luca Benini and Andrea Borghesi and Marco Cicala and Privato Forestieri and Cosimo Gianfreda and Daniele Gregori and Antonio Libri and Filippo Spiga and Simone Tinti},
url = {https://doi.org/10.1109/IPDPSW.2017.22},
doi = {10.1109/IPDPSW.2017.22},
year = {2017},
date = {2017-01-01},
booktitle = {2017 IEEE International Parallel and Distributed Processing Symposium Workshops, IPDPS Workshops 2017, Orlando / Buena Vista, FL, USA, May 29 - June 2, 2017},
pages = {964--973},
keywords = {HPC},
pubstate = {published},
tppubtype = {inproceedings}
}
2016
Paolo Viviani, Marco Aldinucci, Roberto d'Ippolito
An hybrid linear algebra framework for engineering Proceedings Article
In: Advanced Computer Architecture and Compilation for High-Performance and Embedded Systems (ACACES) – Poster Abstracts, Fiuggi, Italy, 2016.
Abstract | Links | BibTeX | Tags: HPC, repara
@inproceedings{16:acaces:armadillo,
title = {An hybrid linear algebra framework for engineering},
author = {Paolo Viviani and Marco Aldinucci and Roberto d'Ippolito},
url = {https://iris.unito.it/retrieve/handle/2318/1622382/300198/armadillo.pdf},
year = {2016},
date = {2016-07-01},
booktitle = {Advanced Computer Architecture and Compilation for High-Performance and Embedded Systems (ACACES) – Poster Abstracts},
address = {Fiuggi, Italy},
abstract = {The aim of this work is to provide developers and domain experts with a simple (Matlab-like) interface for performing linear algebra tasks while retaining state-of-the-art computational speed. To achieve this goal, the Armadillo C++ library is extended in order to support multiple LAPACK-compliant back-ends targeting different architectures including CUDA GPUs; moreover our approach involves the possibility of dynamically switching between such back-ends in order to select the one which is most convenient based on the specific problem and hardware configuration. This approach is eventually validated within an industrial environment.},
keywords = {HPC, repara},
pubstate = {published},
tppubtype = {inproceedings}
}
Claudia Misale, Maurizio Drocco, Marco Aldinucci, Guy Tremblay
A Comparison of Big Data Frameworks on a Layered Dataflow Model Proceedings Article
In: Proc. of Intl. Workshop on High-Level Parallel Programming (HLPP), pp. 1–19, arXiv.org, Muenster, Germany, 2016.
Abstract | Links | BibTeX | Tags: rephrase, toreador
@inproceedings{16:bigdatasurvey:hlpp,
title = {A Comparison of Big Data Frameworks on a Layered Dataflow Model},
author = {Claudia Misale and Maurizio Drocco and Marco Aldinucci and Guy Tremblay},
url = {http://arxiv.org/pdf/1606.05293v1.pdf},
doi = {10.5281/zenodo.321866},
year = {2016},
date = {2016-07-01},
booktitle = {Proc. of Intl. Workshop on High-Level Parallel Programming (HLPP)},
pages = {1--19},
publisher = {arXiv.org},
address = {Muenster, Germany},
abstract = {In the world of Big Data analytics, there is a series of tools aiming at simplifying programming applications to be executed on clusters. Although each tool claims to provide better programming, data and execution models, for which only informal (and often confusing) semantics is generally provided, all share a common underlying model, namely, the Dataflow model. The Dataflow model we propose shows how various tools share the same expressiveness at different levels of abstraction. The contribution of this work is twofold: first, we show that the proposed model is (at least) as general as existing batch and streaming frameworks (e.g., Spark, Flink, Storm), thus making it easier to understand high-level data-processing applications written in such frameworks. Second, we provide a layered model that can represent tools and applications following the Dataflow paradigm and we show how the analyzed tools fit in each level.},
keywords = {rephrase, toreador},
pubstate = {published},
tppubtype = {inproceedings}
}
Fabio Tordini
The road towards a Cloud-based High-Performance solution for genomic data analysis PhD Thesis
Computer Science Department, University of Torino, Italy, 2016.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow
@phdthesis{tordiniThesis16,
  author     = {Fabio Tordini},
  title      = {The road towards a Cloud-based High-Performance solution for genomic data analysis},
  school     = {Computer Science Department, University of Torino, Italy},
  year       = {2016},
  date       = {2016-04-01},
  url        = {http://calvados.di.unipi.it/storage/paper_files/2016_tordini_phdthesis.pdf},
  abstract   = {Nowadays, molecular biology laboratories are delivering more and more data about DNA organisation, at increasing resolution and in a large number of samples. So much that genomic research is now facing many of the scale-out issues that high-performance computing has been addressing for years: they require powerful infrastructures with fast computing and storage capabilities, with substantial challenges in terms of data processing, statistical analysis and data representation. With this thesis we propose a high-performance pipeline for the analysis and interpretation of heterogeneous genomic information: beside performance, usability and availability are two essential requirements that novel Bioinformatics tools should satisfy. In this perspective, we propose and discuss our efforts towards a solid infrastructure for data processing and storage, where software that operates over data is exposed as a service, and is accessible by users through the Internet. We begin by presenting NuChart-II, a tool for the analysis and interpretation of spatial genomic information. With NuChart-II we propose a graph-based representation of genomic data, which can provide insights on the disposition of genomic elements in the DNA. We also discuss our approach for the normalisation of biases that affect raw sequenced data. We believe that many currently available tools for genomic data analysis are perceived as tricky and troublesome applications, that require highly specialised skills to obtain the desired outcomes. Concerning usability, we want to rise the level of abstraction perceived by the user, but maintain high performance and correctness while providing an exhaustive solution for data visualisation. We also intend to foster the availability of novel tools: in this work we also discuss a cloud solution that delivers computation and storage as dynamically allocated virtual resources via the Internet, while needed software is provided as a service. 
In this way, the computational demand of genomic research can be satisfied more economically by using lab-scale and enterprise-oriented technologies. Here we discuss our idea of a task farm for the integration of heterogeneous data resulting from different sequencing experiments: we believe that the integration of multi-omic features on a nuclear map can be a valuable mean for studying the interactions among genetic elements. This can reveal insights on biological mechanisms, such as genes regulation, translocations and epigenetic patterns.},
  keywords   = {bioinformatics, fastflow},
  pubstate   = {published},
  tppubtype  = {phdthesis},
}
Bogdan Nicolae, Carlos H. A. Costa, Claudia Misale, Kostas Katrinis, Yoonho Park
Towards Memory-Optimized Data Shuffling Patterns for Big Data Analytics Proceedings Article
In: IEEE/ACM 16th Intl. Symposium on Cluster, Cloud and Grid Computing, CCGrid 2016, IEEE, Cartagena, Colombia, 2016.
Abstract | Links | BibTeX | Tags: HPC
@inproceedings{16:ccgrid:misale,
  author     = {Bogdan Nicolae and Carlos H. A. Costa and Claudia Misale and Kostas Katrinis and Yoonho Park},
  title      = {Towards Memory-Optimized Data Shuffling Patterns for Big Data Analytics},
  booktitle  = {IEEE/ACM 16th Intl. Symposium on Cluster, Cloud and Grid Computing, CCGrid 2016},
  publisher  = {IEEE},
  address    = {Cartagena, Colombia},
  year       = {2016},
  date       = {2016-01-01},
  doi        = {10.1109/CCGrid.2016.85},
  url        = {http://ieeexplore.ieee.org/document/7515716/},
  abstract   = {Big data analytics is an indispensable tool in transforming science, engineering, medicine, healthcare, finance and ultimately business itself. With the explosion of data sizes and need for shorter time-to-solution, in-memory platforms such as Apache Spark gain increasing popularity. However, this introduces important challenges, among which data shuffling is particularly difficult: on one hand it is a key part of the computation that has a major impact on the overall performance and scalability so its efficiency is paramount, while on the other hand it needs to operate with scarce memory in order to leave as much memory available for data caching. In this context, efficient scheduling of data transfers such that it addresses both dimensions of the problem simultaneously is non-trivial. State-of-the-art solutions often rely on simple approaches that yield sub optimal performance and resource usage. This paper contributes a novel shuffle data transfer strategy that dynamically adapts to the computation with minimal memory utilization, which we briefly underline as a series of design principles.},
  keywords   = {HPC},
  pubstate   = {published},
  tppubtype  = {inproceedings},
}
Paolo Viviani, Marco Aldinucci, Roberto d'Ippolito, Jean Lemeire, Dean Vucinic
A flexible numerical framework for engineering - a Response Surface Modelling application Unpublished
2016.
Abstract | BibTeX | Tags: HPC, repara, rephrase
@unpublished{16:acex:armadillo,
title = {A flexible numerical framework for engineering - a Response Surface Modelling application},
author = {Paolo Viviani and Marco Aldinucci and Roberto d'Ippolito and Jean Lemeire and Dean Vucinic},
year = {2016},
date = {2016-01-01},
booktitle = {10th Intl. Conference on Advanced Computational Engineering and Experimenting (ACE-X)},
note = {10th Intl. Conference on Advanced Computational Engineering and Experimenting (ACE-X)},
abstract = {This work presents the innovative approach adopted for the development of a new numerical software framework for accelerating Dense Linear Algebra calculations and its application within an engineering context. In particular, Response Surface Models (RSM) are a key tool to reduce the computational effort involved in engineering design processes like design optimization. However, RSMs may prove to be too expensive to be computed when the dimensionality of the system and/or the size of the dataset to be synthesized is significantly high or when a large number of different Response Surfaces has to be calculated in order to improve the overall accuracy (e.g. like when using Ensemble Modelling techniques). On the other hand, it is a known challenge that the potential of modern hybrid hardware (e.g. multicore, GPUs) is not exploited by current engineering tools, while they can lead to a significant performance improvement. To fill this gap, a software framework is being developed that enables the hybrid and scalable acceleration of the linear algebra core for engineering applications and especially of RSMs calculations with a user-friendly syntax that allows good portability between different hardware architectures, with no need of specific expertise in parallel programming and accelerator technology. The effectiveness of this framework is shown by comparing an accelerated code to a single-core calculation of a Radial Basis Function RSM on some benchmark datasets. This approach is then validated within a real-life engineering application and the achievements are presented and discussed.},
keywords = {HPC, repara, rephrase},
pubstate = {published},
tppubtype = {unpublished}
}
Maurizio Drocco, Claudia Misale, Marco Aldinucci
A Cluster-As-Accelerator approach for SPMD-free Data Parallelism Proceedings Article
In: Proc. of 24th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP), pp. 350–353, IEEE, Crete, Greece, 2016.
Abstract | Links | BibTeX | Tags: fastflow, rephrase
@inproceedings{skedato:pdp:16,
title = {A Cluster-As-Accelerator approach for SPMD-free Data Parallelism},
author = {Maurizio Drocco and Claudia Misale and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/handle/2318/1611858/262689/2016_pdp_skedato.pdf},
doi = {10.1109/PDP.2016.97},
year = {2016},
date = {2016-01-01},
booktitle = {Proc. of 24th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP)},
pages = {350--353},
publisher = {IEEE},
address = {Crete, Greece},
abstract = {In this paper we present a novel approach for functional-style programming of distributed-memory clusters, targeting data-centric applications. The programming model proposed is purely sequential, SPMD-free and based on high-level functional features introduced since C++11 specification. Additionally, we propose a novel cluster-as-accelerator design principle. In this scheme, cluster nodes act as general interpreters of user-defined functional tasks over node-local portions of distributed data structures. We envision coupling a simple yet powerful programming model with a lightweight, locality-aware distributed runtime as a promising step along the road towards high-performance data analytics, in particular under the perspective of the upcoming exascale era. We implemented the proposed approach in SkeDaTo, a prototyping C++ library of data-parallel skeletons exploiting cluster-as-accelerator at the bottom layer of the runtime software stack.},
keywords = {fastflow, rephrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Vladimir Janjic, Christopher Brown, Kenneth MacKenzie, Kevin Hammond, Marco Danelutto, Marco Aldinucci, Jose Daniel Garcia
RPL: A Domain-Specific Language for Designing and Implementing Parallel C++ Applications Proceedings Article
In: Proc. of Intl. Euromicro PDP 2016: Parallel Distributed and network-based Processing, IEEE, Crete, Greece, 2016.
Abstract | Links | BibTeX | Tags: fastflow, rephrase
@inproceedings{rpl:pdp:16,
title = {RPL: A Domain-Specific Language for Designing and Implementing Parallel C++ Applications},
author = {Vladimir Janjic and Christopher Brown and Kenneth MacKenzie and Kevin Hammond and Marco Danelutto and Marco Aldinucci and Jose Daniel Garcia},
url = {https://iris.unito.it/retrieve/handle/2318/1597172/299237/2016_jsupe_stencil_pp_4aperto.pdf},
doi = {10.1109/PDP.2016.122},
year = {2016},
date = {2016-01-01},
booktitle = {Proc. of Intl. Euromicro PDP 2016: Parallel Distributed and network-based Processing},
publisher = {IEEE},
address = {Crete, Greece},
abstract = {Parallelising sequential applications is usually a very hard job, due to many different ways in which an application can be parallelised and a large number of programming models (each with its own advantages and disadvantages) that can be used. In this paper, we describe a method to semi-automatically generate and evaluate different parallelisations of the same application, allowing programmers to find the best parallelisation without significant manual reengineering of the code. We describe a novel, high-level domain-specific language, Refactoring Pattern Language (RPL), that is used to represent the parallel structure of an application and to capture its extra-functional properties (such as service time). We then describe a set of RPL rewrite rules that can be used to generate alternative, but semantically equivalent, parallel structures (parallelisations) of the same application. We also describe the RPL Shell that can be used to evaluate these parallelisations, in terms of the desired extra-functional properties. Finally, we describe a set of C++ refactorings, targeting OpenMP, Intel TBB and FastFlow parallel programming models, that semi-automatically apply the desired parallelisation to the application's source code, therefore giving a parallel version of the code. We demonstrate how the RPL and the refactoring rules can be used to derive efficient parallelisations of two realistic C++ use cases (Image Convolution and Ant Colony Optimisation).},
keywords = {fastflow, rephrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Sonia Campa, Marco Danelutto, Peter Kilpatrick, Massimo Torquati
Pool Evolution: A Parallel Pattern for Evolutionary and Symbolic Computing Journal Article
In: International Journal of Parallel Programming, vol. 44, no. 3, pp. 531–551, 2016, ISSN: 0885-7458.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase, repara
@article{pool:ijpp:15,
title = {Pool Evolution: A Parallel Pattern for Evolutionary and Symbolic Computing},
author = {Marco Aldinucci and Sonia Campa and Marco Danelutto and Peter Kilpatrick and Massimo Torquati},
url = {https://iris.unito.it/retrieve/handle/2318/1522392/42139/2015_ff_pool_ijpp.pdf},
doi = {10.1007/s10766-015-0358-5},
issn = {0885-7458},
year = {2016},
date = {2016-01-01},
journal = {International Journal of Parallel Programming},
volume = {44},
number = {3},
pages = {531--551},
publisher = {Springer US},
abstract = {We introduce a new parallel pattern derived from a specific application domain and show how it turns out to have application beyond its domain of origin. The pool evolution pattern models the parallel evolution of a population subject to mutations and evolving in such a way that a given fitness function is optimized. The pattern has been demonstrated to be suitable for capturing and modeling the parallel patterns underpinning various evolutionary algorithms, as well as other parallel patterns typical of symbolic computation. In this paper we introduce the pattern, we discuss its implementation on modern multi/many core architectures and finally present experimental results obtained with FastFlow and Erlang implementations to assess its feasibility and scalability.},
keywords = {fastflow, paraphrase, repara},
pubstate = {published},
tppubtype = {article}
}
Fabio Tordini, Ivan Merelli, Pietro Liò, Luciano Milanesi, Marco Aldinucci
NuchaRt: embedding high-level parallel computing in R for augmented Hi-C data analysis Book Section
In: Springer International Publishing (Ed.): Computational Intelligence Methods for Bioinformatics and Biostatistics, vol. 9874, pp. 259–272, Springer International Publishing, Cham (ZG), 2016, ISBN: 978-3-319-44331-7.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow, repara
@incollection{15:lnbi:nuchaRt,
title = {NuchaRt: embedding high-level parallel computing in R for augmented Hi-C data analysis},
author = {Fabio Tordini and Ivan Merelli and Pietro Liò and Luciano Milanesi and Marco Aldinucci},
editor = {{Springer International Publishing}},
url = {https://iris.unito.it/retrieve/handle/2318/1608281/253372/rnuchart.pdf},
doi = {10.1007/978-3-319-44332-4},
isbn = {978-3-319-44331-7},
year = {2016},
date = {2016-01-01},
booktitle = {Computational Intelligence Methods for Bioinformatics and Biostatistics},
volume = {9874},
pages = {259–272},
publisher = {Springer International Publishing},
address = {Cham (ZG)},
series = {Lecture Notes in Computer Science},
abstract = {Recent advances in molecular biology and Bioinformatics techniques brought to an explosion of the information about the spatial organisation of the DNA in the nucleus. High-throughput chromosome conformation capture techniques provide a genome-wide capture of chromatin contacts at unprecedented scales, which permit to identify physical interactions between genetic elements located throughout the human genome. These important studies are hampered by the lack of biologists-friendly software. In this work we present NuchaRt, an R package that wraps NuChart-II, an efficient and highly optimized C++ tool for the exploration of Hi-C data. By rising the level of abstraction, NuchaRt proposes a high-performance pipeline that allows users to orchestrate analysis and visualisation of multi-omics data, making optimal use of the computing capabilities offered by modern multi-core architectures, combined with the versatile and well known R environment for statistical analysis and data visualisation.},
keywords = {bioinformatics, fastflow, repara},
pubstate = {published},
tppubtype = {incollection}
}
Fabio Tordini
A cloud solution for multi-omics data integration Proceedings Article
In: Proceedings of the 16th IEEE International Conference on Scalable Computing and Communication, pp. 559–566, IEEE Computer Society, 2016, (Best paper award).
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow, rephrase
@inproceedings{16:scalcom:cloud,
title = {A cloud solution for multi-omics data integration},
author = {Fabio Tordini},
url = {http://calvados.di.unipi.it/storage/paper_files/2016_cloudpipeline_scalcom.pdf},
doi = {10.1109/UIC-ATC-ScalCom-CBDCom-IoP-SmartWorld.2016.131},
year = {2016},
date = {2016-01-01},
booktitle = {Proceedings of the 16th IEEE International Conference on Scalable Computing and Communication},
pages = {559–566},
publisher = {IEEE Computer Society},
abstract = {Recent advances in molecular biology and Bioinformatics techniques have brought to an explosion of the information about the spatial organisation of the DNA inside the nucleus. In particular, 3C-based techniques are revealing the genome folding for many different cell types, and permit to create a more effective representation of the disposition of genes in the three-dimensional space. This information can be used to re-interpret heterogeneous genomic data (multi-omic) relying on 3D maps of the chromosome. The storage and computational requirements needed to accomplish such operations on raw sequenced data have to be fulfilled using HPC solutions, and the Cloud paradigm is a valuable and convenient mean for delivering HPC to Bioinformatics. In this work we describe a data analysis work-flow that allows the integration and the interpretation of multi-omic data on a sort of ``topographical'' nuclear map, capable of representing the effective disposition of genes in a graph-based representation. We propose a cloud-based task farm pattern to orchestrate the services needed to accomplish genomic data analysis, where each service represents a special-purpose tool, playing a part in well known data analysis pipelines.},
note = {Best paper award},
keywords = {bioinformatics, fastflow, rephrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Manuel F. Dolz, David Rio Astorga, Javier Fernández, J. Daniel García, Félix García-Carballeira, Marco Danelutto, Massimo Torquati
Embedding Semantics of the Single-Producer/Single-Consumer Lock-Free Queue into a Race Detection Tool Proceedings Article
In: Proceedings of the 7th International Workshop on Programming Models and Applications for Multicores and Manycores, pp. 20–29, ACM, Barcelona, Spain, 2016, ISBN: 978-1-4503-4196-7.
Links | BibTeX | Tags: fastflow, repara
@inproceedings{16:PMAM:SPSC,
title = {Embedding Semantics of the Single-Producer/Single-Consumer Lock-Free Queue into a Race Detection Tool},
author = {Manuel F. Dolz and David Rio Astorga and Javier Fernández and J. Daniel García and Félix García-Carballeira and Marco Danelutto and Massimo Torquati},
url = {https://doi.acm.org/10.1145/2883404.2883406},
doi = {10.1145/2883404.2883406},
isbn = {978-1-4503-4196-7},
year = {2016},
date = {2016-01-01},
booktitle = {Proceedings of the 7th International Workshop on Programming Models and Applications for Multicores and Manycores},
pages = {20–29},
publisher = {ACM},
address = {Barcelona, Spain},
series = {PMAM'16},
keywords = {fastflow, repara},
pubstate = {published},
tppubtype = {inproceedings}
}
Andrea Bracciali, Marco Aldinucci, Murray Patterson, Tobias Marschall, Nadia Pisanti, Ivan Merelli, Massimo Torquati
pWhatsHap: efficient haplotyping for future generation sequencing Journal Article
In: BMC Bioinformatics, vol. 17, no. Suppl 11, pp. 342, 2016.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase, rephrase
@article{16:pwhatshap:bmc,
title = {pWhatsHap: efficient haplotyping for future generation sequencing},
author = {Andrea Bracciali and Marco Aldinucci and Murray Patterson and Tobias Marschall and Nadia Pisanti and Ivan Merelli and Massimo Torquati},
url = {http://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/s12859-016-1170-y?site=bmcbioinformatics.biomedcentral.com},
doi = {10.1186/s12859-016-1170-y},
year = {2016},
date = {2016-01-01},
journal = {BMC Bioinformatics},
volume = {17},
number = {Suppl 11},
pages = {342},
abstract = {Background: Haplotype phasing is an important problem in the analysis of genomics information. Given a set of DNA fragments of an individual, it consists of determining which one of the possible alleles (alternative forms of a gene) each fragment comes from. Haplotype information is relevant to gene regulation, epigenetics, genome-wide association studies, evolutionary and population studies, and the study of mutations. Haplotyping is currently addressed as an optimisation problem aiming at solutions that minimise, for instance, error correction costs, where costs are a measure of the confidence in the accuracy of the information acquired from DNA sequencing. Solutions have typically an exponential computational complexity. WhatsHap is a recent optimal approach which moves computational complexity from DNA fragment length to fragment overlap, i.e., coverage, and is hence of particular interest when considering sequencing technology's current trends that are producing longer fragments. Results: Given the potential relevance of efficient haplotyping in several analysis pipelines, we have designed and engineered pWhatsHap, a parallel, high-performance version of WhatsHap. pWhatsHap is embedded in a toolkit developed in Python and supports genomics datasets in standard file formats. Building on WhatsHap, pWhatsHap exhibits the same complexity exploring a number of possible solutions which is exponential in the coverage of the dataset. The parallel implementation on multi-core architectures allows for a relevant reduction of the execution time for haplotyping, while the provided results enjoy the same high accuracy as that provided by WhatsHap, which increases with coverage. Conclusions: Due to its structure and management of the large datasets, the parallelisation of WhatsHap posed demanding technical challenges, which have been addressed exploiting a high-level parallel programming framework. The result, pWhatsHap, is a freely available toolkit that improves the efficiency of the analysis of genomics information.},
keywords = {fastflow, paraphrase, rephrase},
pubstate = {published},
tppubtype = {article}
}
Fabio Tordini, Marco Aldinucci, Luciano Milanesi, Pietro Liò, Ivan Merelli
The Genome Conformation as an Integrator of Multi-Omic Data: The Example of Damage Spreading in Cancer Journal Article
In: Frontiers in Genetics, vol. 7, no. 194, pp. 1–17, 2016.
Abstract | Links | BibTeX | Tags:
@article{2016_omics_fgenetics,
  author    = {Fabio Tordini and Marco Aldinucci and Luciano Milanesi and Pietro Liò and Ivan Merelli},
  title     = {The Genome Conformation as an Integrator of Multi-Omic Data: The Example of Damage Spreading in Cancer},
  journal   = {Frontiers in Genetics},
  volume    = {7},
  number    = {194},
  pages     = {1–17},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.3389/fgene.2016.00194},
  url       = {http://journal.frontiersin.org/article/10.3389/fgene.2016.00194},
  abstract  = {Publicly available multi-omic databases, in particular if associated with medical annotations, are rich resources with the potential to lead a rapid transition from high-throughput molecular biology experiments to better clinical outcomes for patients. In this work, we propose a model for multi-omic data integration (i.e. genetic variations, gene expression, genome conformation and epigenetic patterns), which exploits a multi-layer network approach to analyse, visualize and obtain insights from such biological information, in order to use achieved results at a macroscopic level. Using this representation, we can describe how driver and passenger mutations accumulate during the development of diseases providing, for example, a tool able to characterise the evolution of cancer. Indeed, our test case concerns the MCF-7 breast cancer cell line, before and after the stimulation with estrogen, since many datasets are available for this case study. In particular, the integration of data about cancer mutations, gene functional annotations, genome conformation, epigenetic patterns, gene expression and metabolic pathways in our multi-layer representation will allow a better interpretation of the mechanisms behind a complex disease such as cancer. Thanks to this multi-layer approach, we focus on the interplay of chromatin conformation and cancer mutations in different pathways, such as metabolic processes, that are very important for tumour development. Working on this model, a variance analysis can be implemented to identify normal variations within each omics and to characterize, by contrast, variations that can be accounted to pathological samples compared to normal ones. This integrative model can be used to identify novel biomarkers and to provide innovative omic-based guidelines for treating many diseases, improving the efficacy of decision trees currently used in clinic.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Bogdan Nicolae, Carlos H. A. Costa, Claudia Misale, Kostas Katrinis, Yoonho Park
Leveraging Adaptive I/O to Optimize Collective Data Shuffling Patterns for Big Data Analytics Journal Article
In: IEEE Transactions on Parallel and Distributed Systems, vol. PP, no. 99, 2016.
Abstract | Links | BibTeX | Tags:
@article{16:shuffle:tpds:misale,
  author    = {Bogdan Nicolae and Carlos H. A. Costa and Claudia Misale and Kostas Katrinis and Yoonho Park},
  title     = {Leveraging Adaptive I/O to Optimize Collective Data Shuffling Patterns for Big Data Analytics},
  journal   = {IEEE Transactions on Parallel and Distributed Systems},
  volume    = {PP},
  number    = {99},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1109/TPDS.2016.2627558},
  url       = {https://iris.unito.it/retrieve/handle/2318/1624908/295954/tpds_4aperto.pdf},
  abstract  = {Big data analytics is an indispensable tool in transforming science, engineering, medicine, health-care, finance and ultimately business itself. With the explosion of data sizes and need for shorter time-to-solution, in-memory platforms such as Apache Spark gain increasing popularity. In this context, data shuffling, a particularly difficult transformation pattern, introduces important challenges. Specifically, data shuffling is a key component of complex computations that has a major impact on the overall performance and scalability. Thus, speeding up data shuffling is a critical goal. To this end, state-of-the-art solutions often rely on overlapping the data transfers with the shuffling phase. However, they employ simple mechanisms to decide how much data and where to fetch it from, which leads to sub-optimal performance and excessive auxiliary memory utilization for the purpose of prefetching. The latter aspect is a growing concern, given evidence that memory per computation unit is continuously decreasing while interconnect bandwidth is increasing. This paper contributes a novel shuffle data transfer strategy that addresses the two aforementioned dimensions by dynamically adapting the prefetching to the computation. We implemented this novel strategy in Spark, a popular in-memory data analytics framework. To demonstrate the benefits of our proposal, we run extensive experiments on an HPC cluster with large core count per node. Compared with the default Spark shuffle strategy, our proposal shows: up to 40% better performance with 50% less memory utilization for buffering and excellent weak scalability.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Ilaria Castellani, Mariangiola Dezani-Ciancaglini, Ugo Liguoro
Secure Multiparty Sessions with Topics Proceedings Article
In: PLACES'16, pp. 1–12, 2016.
Links | BibTeX | Tags: rephrase, semantics
@inproceedings{CDL16,
  author    = {Ilaria Castellani and Mariangiola Dezani-Ciancaglini and Ugo Liguoro},
  title     = {Secure Multiparty Sessions with Topics},
  booktitle = {PLACES'16},
  series    = {EPTCS},
  volume    = {211},
  pages     = {1–12},
  year      = {2016},
  date      = {2016-01-01},
  url       = {http://www.di.unito.it/~dezani/papers/cdl16.pdf},
  keywords  = {rephrase, semantics},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Ilaria Castellani, Mariangiola Dezani-Ciancaglini, Jorge A. Pérez
Self-Adaptation and Secure Information Flow in Multiparty Communications Journal Article
In: Formal Aspects of Computing, vol. 28, no. 4, pp. 669–696, 2016.
Links | BibTeX | Tags: rephrase, semantics
@article{CDP16,
  author    = {Ilaria Castellani and Mariangiola Dezani-Ciancaglini and Jorge A. Pérez},
  title     = {Self-Adaptation and Secure Information Flow in Multiparty Communications},
  journal   = {Formal Aspects of Computing},
  volume    = {28},
  number    = {4},
  pages     = {669–696},
  publisher = {Springer},
  year      = {2016},
  date      = {2016-01-01},
  url       = {http://www.di.unito.it/~dezani/papers/cdp16.pdf},
  keywords  = {rephrase, semantics},
  pubstate  = {published},
  tppubtype = {article}
}
Mario Coppo, Mariangiola Dezani-Ciancaglini, Betti Venneri
Parallel Monitors for Self-adaptive Sessions Proceedings Article
In: PLACES'16, pp. 25–36, 2016.
Links | BibTeX | Tags: rephrase, semantics
@inproceedings{CDV16,
  author    = {Mario Coppo and Mariangiola Dezani-Ciancaglini and Betti Venneri},
  title     = {Parallel Monitors for Self-adaptive Sessions},
  booktitle = {PLACES'16},
  series    = {EPTCS},
  volume    = {211},
  pages     = {25–36},
  year      = {2016},
  date      = {2016-01-01},
  url       = {http://www.di.unito.it/~dezani/papers/cdv16.pdf},
  keywords  = {rephrase, semantics},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Mariangiola Dezani-Ciancaglini, Silvia Ghilezan, Svetlana Jaksic, Jovanka Pantovic, Nobuko Yoshida
Denotational and Operational Preciseness of Subtyping: A Roadmap Proceedings Article
In: Theory and Practice of Formal Methods, pp. 155–172, 2016.
Links | BibTeX | Tags: rephrase, semantics
@inproceedings{DGJPY16,
  author    = {Mariangiola Dezani-Ciancaglini and Silvia Ghilezan and Svetlana Jaksic and Jovanka Pantovic and Nobuko Yoshida},
  title     = {Denotational and Operational Preciseness of Subtyping: A Roadmap},
  booktitle = {Theory and Practice of Formal Methods},
  series    = {LNCS},
  volume    = {9660},
  pages     = {155–172},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1007/978-3-319-30734-3_12},
  url       = {http://www.di.unito.it/~dezani/papers/dgjpy16.pdf},
  keywords  = {rephrase, semantics},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Mariangiola Dezani-Ciancaglini, Paola Giannini
Reversible Multiparty Sessions with Checkpoints Proceedings Article
In: EXPRESS/SOS'16, pp. 60–74, 2016.
Links | BibTeX | Tags: rephrase, semantics
@inproceedings{DG16,
  author    = {Mariangiola Dezani-Ciancaglini and Paola Giannini},
  title     = {Reversible Multiparty Sessions with Checkpoints},
  booktitle = {EXPRESS/SOS'16},
  series    = {EPTCS},
  volume    = {222},
  pages     = {60–74},
  year      = {2016},
  date      = {2016-01-01},
  url       = {http://www.di.unito.it/~dezani/papers/dg16.pdf},
  keywords  = {rephrase, semantics},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
2015
Paolo Inaudi
Progettazione e sviluppo di un provider libfabric per la rete ad alte prestazioni Ronniee/A3Cube Masters Thesis
Computer Science Department, University of Torino, 2015.
@mastersthesis{tesi:inaudi:15,
  author    = {Paolo Inaudi},
  title     = {Progettazione e sviluppo di un provider libfabric per la rete ad alte prestazioni Ronniee/A3Cube},
  school    = {Computer Science Department, University of Torino},
  year      = {2015},
  date      = {2015-10-01},
  keywords  = {fastflow},
  pubstate  = {published},
  tppubtype = {mastersthesis}
}
Marco Aldinucci, Marco Danelutto, Maurizio Drocco, Peter Kilpatrick, Guilherme Peretti Pezzi, Massimo Torquati
The Loop-of-Stencil-Reduce paradigm Proceedings Article
In: Proc. of Intl. Workshop on Reengineering for Parallelism in Heterogeneous Parallel Platforms (RePara), pp. 172–177, IEEE, Helsinki, Finland, 2015.
Abstract | Links | BibTeX | Tags: fastflow, HPC, repara
@inproceedings{opencl:ff:ispa:15,
  author    = {Marco Aldinucci and Marco Danelutto and Maurizio Drocco and Peter Kilpatrick and Guilherme Peretti Pezzi and Massimo Torquati},
  title     = {The Loop-of-Stencil-Reduce paradigm},
  booktitle = {Proc. of Intl. Workshop on Reengineering for Parallelism in Heterogeneous Parallel Platforms (RePara)},
  pages     = {172–177},
  publisher = {IEEE},
  address   = {Helsinki, Finland},
  year      = {2015},
  date      = {2015-08-01},
  doi       = {10.1109/Trustcom.2015.628},
  url       = {https://iris.unito.it/retrieve/handle/2318/1523738/52857/15_RePara_ISPA.pdf},
  abstract  = {In this paper we advocate the Loop-of-stencil-reduce pattern as a way to simplify the parallel programming of heterogeneous platforms (multicore+GPUs). Loop-of-Stencil-reduce is general enough to subsume map, reduce, map-reduce, stencil, stencil-reduce, and, crucially, their usage in a loop. It transparently targets (by using OpenCL) combinations of CPU cores and GPUs, and it makes it possible to simplify the deployment of a single stencil computation kernel on different GPUs. The paper discusses the implementation of Loop-of-stencil-reduce within the FastFlow parallel framework, considering a simple iterative data-parallel application as running example (Game of Life) and a highly effective parallel filter for visual data restoration to assess performance. Thanks to the high-level design of the Loop-of-stencil-reduce, it was possible to run the filter seamlessly on a multicore machine, on multi-GPUs, and on both.},
  keywords  = {fastflow, HPC, repara},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Fabio Tordini, Maurizio Drocco, Ivan Merelli, Luciano Milanesi, Pietro Liò, Marco Aldinucci
NuChart-II: a graph-based approach for the analysis and interpretation of Hi-C data Proceedings Article
In: Di Serio, Clelia, Liò, Pietro, Nonis, Alessandro, Tagliaferri, Roberto (Ed.): Proc. of 11th Intl. Meeting on Computational Intelligence Methods for Bioinformatics and Biostatistics (CIBB), pp. 298–311, Springer, Cambridge, UK, 2015, ISBN: 978-3-319-24461-7.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow, paraphrase, repara
@inproceedings{14:ff:nuchart:cibb,
title = {NuChart-II: a graph-based approach for the analysis and interpretation of Hi-C data},
author = {Fabio Tordini and Maurizio Drocco and Ivan Merelli and Luciano Milanesi and Pietro Liò and Marco Aldinucci},
editor = {Di Serio, Clelia and Pietro Liò and Alessandro Nonis and Roberto Tagliaferri},
url = {http://calvados.di.unipi.it/storage/paper_files/2014_nuchart_cibb.pdf},
doi = {10.1007/978-3-319-24462-4_25},
isbn = {978-3-319-24461-7},
year = {2015},
date = {2015-06-01},
booktitle = {Proc. of 11th Intl. Meeting on Computational Intelligence Methods for Bioinformatics and Biostatistics (CIBB)},
volume = {8623},
pages = {298–311},
publisher = {Springer},
address = {Cambridge, UK},
series = {LNCS},
abstract = {Long-range chromosomal associations between genomic regions, and their repositioning in the 3D space of the nucleus, are now considered to be key contributors to the regulation of gene expressions, and important links have been highlighted with other genomic features involved in DNA rearrangements. Recent Chromosome Conformation Capture (3C) measurements performed with high throughput sequencing (Hi-C) and molecular dynamics studies show that there is a large correlation between co-localization and co-regulation of genes, but these important researches are hampered by the lack of biologists-friendly analysis and visualisation software. In this work we present NuChart-II, a software that allows the user to annotate and visualize a list of input genes with information relying on Hi-C data, integrating knowledge data about genomic features that are involved in the chromosome spatial organization. This software works directly with sequenced reads to identify related Hi-C fragments, with the aim of creating gene-centric neighbourhood graphs on which multi-omics features can be mapped. NuChart-II is a highly optimized implementation of a previous prototype package developed in R, in which the graph-based representation of Hi-C data was tested. The prototype showed inevitable problems of scalability while working genome-wide on large datasets: particular attention has been paid in optimizing the data structures employed while constructing the neighbourhood graph, so as to foster an efficient parallel implementation of the software. The normalization of Hi-C data has been modified and improved, in order to provide a reliable estimation of proximity likelihood for the genes.},
keywords = {bioinformatics, fastflow, paraphrase, repara},
pubstate = {published},
tppubtype = {inproceedings}
}
Maurizio Drocco, Claudia Misale, Guilherme Peretti Pezzi, Fabio Tordini, Marco Aldinucci
Memory-Optimised Parallel Processing of Hi-C Data Proceedings Article
In: Proc. of 23rd Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP), pp. 1–8, IEEE, 2015.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow, impact, paraphrase, repara
@inproceedings{nuchart:speedup:15,
  author    = {Maurizio Drocco and Claudia Misale and Guilherme Peretti Pezzi and Fabio Tordini and Marco Aldinucci},
  title     = {Memory-Optimised Parallel Processing of Hi-C Data},
  booktitle = {Proc. of 23rd Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP)},
  pages     = {1–8},
  publisher = {IEEE},
  year      = {2015},
  date      = {2015-03-01},
  doi       = {10.1109/PDP.2015.63},
  url       = {https://iris.unito.it/retrieve/handle/2318/1521910/40615/2015_pdp_memopt.pdf},
  abstract  = {This paper presents the optimisation efforts on the creation of a graph-based mapping representation of gene adjacency. The method is based on the Hi-C process, starting from Next Generation Sequencing data, and it analyses a huge amount of static data in order to produce maps for one or more genes. Straightforward parallelisation of this scheme does not yield acceptable performance on multicore architectures since the scalability is rather limited due to the memory bound nature of the problem. This work focuses on the memory optimisations that can be applied to the graph construction algorithm and its (complex) data structures to derive a cache-oblivious algorithm and eventually to improve the memory bandwidth utilisation. We used as running example NuChart-II, a tool for annotation and statistic analysis of Hi-C data that creates a gene-centric neighborhood graph. The proposed approach, which is exemplified for Hi-C, addresses several common issue in the parallelisation of memory bound algorithms for multicore. Results show that the proposed approach is able to increase the parallel speedup from 7x to 22x (on a 32-core platform). Finally, the proposed C++ implementation outperforms the first R NuChart prototype, by which it was not possible to complete the graph generation because of strong memory-saturation problems.},
  keywords  = {bioinformatics, fastflow, impact, paraphrase, repara},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Fabio Tordini, Maurizio Drocco, Claudia Misale, Luciano Milanesi, Pietro Liò, Ivan Merelli, Marco Aldinucci
Parallel Exploration of the Nuclear Chromosome Conformation with NuChart-II Proceedings Article
In: Proc. of 23rd Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP), IEEE, 2015.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow, impact, paraphrase, repara
@inproceedings{nuchar:tool:15,
title = {Parallel Exploration of the Nuclear Chromosome Conformation with NuChart-II},
author = {Fabio Tordini and Maurizio Drocco and Claudia Misale and Luciano Milanesi and Pietro Liò and Ivan Merelli and Marco Aldinucci},
url = {https://iris.unito.it/retrieve/handle/2318/1522038/40619/2015_pdp_nuchartff.pdf},
doi = {10.1109/PDP.2015.104},
year = {2015},
date = {2015-03-01},
booktitle = {Proc. of 23rd Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP)},
publisher = {IEEE},
abstract = {High-throughput molecular biology techniques are widely used to identify physical interactions between genetic elements located throughout the human genome. Chromosome Conformation Capture (3C) and other related techniques allow to investigate the spatial organisation of chromosomes in the cell's natural state. Recent results have shown that there is a large correlation between co-localization and co-regulation of genes, but these important information are hampered by the lack of biologists-friendly analysis and visualisation software. In this work we introduce NuChart-II, a tool for Hi-C data analysis that provides a gene-centric view of the chromosomal neighbourhood in a graph-based manner. NuChart-II is an efficient and highly optimized C++ re-implementation of a previous prototype package developed in R. Representing Hi-C data using a graph-based approach overcomes the common view relying on genomic coordinates and permits the use of graph analysis techniques to explore the spatial conformation of a gene neighbourhood.},
keywords = {bioinformatics, fastflow, impact, paraphrase, repara},
pubstate = {published},
tppubtype = {inproceedings}
}
Paolo Viviani
Parallel Computing Techniques for High Energy Physics Masters Thesis
Physics Department, University of Torino, 2015.
Abstract | BibTeX | Tags: fastflow, impact
@mastersthesis{tesi:viviani:15,
title = {Parallel Computing Techniques for High Energy Physics},
author = {Paolo Viviani},
year = {2015},
date = {2015-01-01},
school = {Physics Department, University of Torino},
abstract = {Modern experimental achievements, with LHC results as a prominent but not exclusive representative, have undisclosed a new range of challenges concerning theoretical computations. Tree level QED calculation are no more satisfactory due to the very small experimental uncertainty of precision e+ e- measurements, so Next To Leading and Next to Next to Leading Order calculations are required. At the same time many-legs, high-order QCD processes needed to simulate LHC events are raising even more the bar of computational complexity. The drive for the present work has been the interest in calculating high multiplicity Higgs boson processes with a dedicated software library (RECOLA) currently under development at the University of Torino, as well as the related technological challenges. This thesis undertakes the task of exploring the possibilities offered by present and upcoming computing technologies in order to face these challenges properly. The first two chapters outlines the theoretical context and the available technologies. In chapter 3 a case study is examined in full detail, in order to explore the suitability of different parallel computing solutions. In the chapter 4, some of those solutions are implemented in the context of the RECOLA library, allowing it to handle processes at a previously unexplored scale of complexity. Alongside, the potential of new, cost-effective parallel architectures is tested.},
keywords = {fastflow, impact},
pubstate = {published},
tppubtype = {mastersthesis}
}
Ivan Merelli, Fabio Tordini, Maurizio Drocco, Marco Aldinucci, Pietro Liò, Luciano Milanesi
Integrating Multi-omic features exploiting Chromosome Conformation Capture data Journal Article
In: Frontiers in Genetics, vol. 6, no. 40, 2015, ISSN: 1664-8021.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow
@article{nuchart:frontiers:15,
  author    = {Ivan Merelli and Fabio Tordini and Maurizio Drocco and Marco Aldinucci and Pietro Liò and Luciano Milanesi},
  title     = {Integrating Multi-omic features exploiting Chromosome Conformation Capture data},
  journal   = {Frontiers in Genetics},
  volume    = {6},
  number    = {40},
  year      = {2015},
  date      = {2015-01-01},
  issn      = {1664-8021},
  doi       = {10.3389/fgene.2015.00040},
  url       = {http://journal.frontiersin.org/Journal/10.3389/fgene.2015.00040/pdf},
  abstract  = {The representation, integration and interpretation of omic data is a complex task, in particular considering the huge amount of information that is daily produced in molecular biology laboratories all around the world. The reason is that sequencing data regarding expression profiles, methylation patterns, and chromatin domains is difficult to harmonize in a systems biology view, since genome browsers only allow coordinate-based representations, discarding functional clusters created by the spatial conformation of the DNA in the nucleus. In this context, recent progresses in high throughput molecular biology techniques and bioinformatics have provided insights into chromatin interactions on a larger scale and offer a formidable support for the interpretation of multi-omic data. In particular, a novel sequencing technique called Chromosome Conformation Capture (3C) allows the analysis of the chromosome organization in the cell's natural state. While performed genome wide, this technique is usually called Hi-C. Inspired by service applications such as Google Maps, we developed NuChart, an R package that integrates Hi-C data to describe the chromosomal neighbourhood starting from the information about gene positions, with the possibility of mapping on the achieved graphs genomic features such as methylation patterns and histone modifications, along with expression profiles. In this paper we show the importance of the NuChart application for the integration of multi-omic data in a systems biology fashion, with particular interest in cytogenetic applications of these techniques. Moreover, we demonstrate how the integration of multi-omic data can provide useful information in understanding why genes are in certain specific positions inside the nucleus and how epigenetic patterns correlate with their expression.},
  keywords  = {bioinformatics, fastflow},
  pubstate  = {published},
  tppubtype = {article}
}
Marco Aldinucci, Andrea Bracciali, Tobias Marschall, Murray Patterson, Nadia Pisanti, Massimo Torquati
High-Performance Haplotype Assembly Proceedings Article
In: Di Serio, Clelia, Liò, Pietro, Nonis, Alessandro, Tagliaferri, Roberto (Ed.): Computational Intelligence Methods for Bioinformatics and Biostatistics - 11th International Meeting, CIBB 2014, Cambridge, UK, June 26-28, 2014, Revised Selected Papers, pp. 245–258, Springer, Cambridge, UK, 2015.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow
@inproceedings{14:ff:whatsapp:cibb,
title = {High-Performance Haplotype Assembly},
author = {Marco Aldinucci and Andrea Bracciali and Tobias Marschall and Murray Patterson and Nadia Pisanti and Massimo Torquati},
editor = {Di Serio, Clelia and Pietro Liò and Alessandro Nonis and Roberto Tagliaferri},
url = {https://iris.unito.it/retrieve/handle/2318/1523292/46714/2014_pHaplo_cibb.pdf},
doi = {10.1007/978-3-319-24462-4_21},
year = {2015},
date = {2015-01-01},
booktitle = {Computational Intelligence Methods for Bioinformatics and Biostatistics - 11th International Meeting, CIBB 2014, Cambridge, UK, June 26-28, 2014, Revised Selected Papers},
volume = {8623},
pages = {245--258},
publisher = {Springer},
address = {Cambridge, UK},
series = {LNCS},
abstract = {The problem of Haplotype Assembly is an essential step in human genome analysis. It is typically formalised as the Minimum Error Correction (MEC) problem which is NP-hard. MEC has been approached using heuristics, integer linear programming, and fixed-parameter tractability (FPT), including approaches whose runtime is exponential in the length of the DNA fragments obtained by the sequencing process. Technological improvements are currently increasing fragment length, which drastically elevates computational costs for such methods. We present pWhatsHap, a multi-core parallelisation of WhatsHap, a recent FPT optimal approach to MEC. WhatsHap moves complexity from fragment length to fragment overlap and is hence of particular interest when considering sequencing technology's current trends. pWhatsHap further improves the efficiency in solving the MEC problem, as shown by experiments performed on datasets with high coverage.},
keywords = {bioinformatics, fastflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Guilherme Peretti Pezzi, Maurizio Drocco, Concetto Spampinato, Massimo Torquati
Parallel Visual Data Restoration on Multi-GPGPUs using Stencil-Reduce Pattern Journal Article
In: International Journal of High Performance Computing Applications, vol. 29, no. 4, pp. 461–472, 2015.
Abstract | Links | BibTeX | Tags: fastflow, HPC, impact, paraphrase
@article{ff:denoiser:ijhpca:15,
title = {Parallel Visual Data Restoration on Multi-GPGPUs using Stencil-Reduce Pattern},
author = {Marco Aldinucci and Peretti Pezzi, Guilherme and Maurizio Drocco and Concetto Spampinato and Massimo Torquati},
url = {https://iris.unito.it/retrieve/handle/2318/1522073/299200/ijhpca_4aperto.pdf},
doi = {10.1177/1094342014567907},
year = {2015},
date = {2015-01-01},
journal = {International Journal of High Performance Computing Applications},
volume = {29},
number = {4},
pages = {461--472},
abstract = {In this paper, a highly effective parallel filter for visual data restoration is presented. The filter is designed following a skeletal approach, using a newly proposed stencil-reduce, and has been implemented by way of the FastFlow parallel programming library. As a result of its high-level design, it is possible to run the filter seamlessly on a multicore machine, on multi-GPGPUs, or on both. The design and implementation of the filter are discussed, and an experimental evaluation is presented.},
keywords = {fastflow, HPC, impact, paraphrase},
pubstate = {published},
tppubtype = {article}
}
Guilherme Peretti Pezzi, Evelyne Vaissié, Yann Viala, Denis Caromel, Philippe Gourbesville
Parallel profiling of water distribution networks using the Clément formula Journal Article
In: Applied Mathematics and Computation, vol. 267, pp. 83–95, 2015, ISSN: 0096-3003, (The Fourth European Seminar on Computing (ESCO 2014)).
Abstract | Links | BibTeX | Tags: impact
@article{PerettiPezzi201583,
title = {Parallel profiling of water distribution networks using the Clément formula},
author = {Peretti Pezzi, Guilherme and Evelyne Vaissié and Yann Viala and Denis Caromel and Philippe Gourbesville},
url = {http://www.sciencedirect.com/science/article/pii/S0096300315007080},
doi = {10.1016/j.amc.2015.05.084},
issn = {0096-3003},
year = {2015},
date = {2015-01-01},
journal = {Applied Mathematics and Computation},
volume = {267},
pages = {83--95},
abstract = {Optimization of water distribution is a crucial issue which has been targeted by many modeling tools. Useful models, implemented several decades ago, need to be updated and implemented in more powerful computing environments. This paper presents the distributed and redesigned version of a legacy hydraulic simulation software written in Fortran (IRMA) that has been used for over 30 years by the Société du Canal de Provence in order to design and to maintain water distribution networks. IRMA was developed aiming mainly at the treatment of irrigation networks – by using the Clément demand model and is now used to manage more than 6000 km of piped networks. The complexity and size of networks have been growing since the creation of IRMA and the legacy software could not handle the simulation of very large networks in terms of performance. This limitation has finally imposed to redesign the code by using modern tools and language (Java), and also to run distributed simulations by using the ProActive Parallel Suite.},
note = {The Fourth European Seminar on Computing (ESCO 2014)},
keywords = {impact},
pubstate = {published},
tppubtype = {article}
}
Mohammed Sourouri, Johannes Langguth, Filippo Spiga, Scott B. Baden, Xing Cai
CPU+GPU Programming of Stencil Computations for Resource-Efficient Use of GPU Clusters Proceedings Article
In: 18th IEEE International Conference on Computational Science and Engineering, CSE 2015, Porto, Portugal, October 21-23, 2015, pp. 17–26, 2015.
@inproceedings{DBLP:conf/cse/SourouriLSBC15,
title = {CPU+GPU Programming of Stencil Computations for Resource-Efficient Use of GPU Clusters},
author = {Mohammed Sourouri and Johannes Langguth and Filippo Spiga and Scott B. Baden and Xing Cai},
url = {https://doi.org/10.1109/CSE.2015.33},
doi = {10.1109/CSE.2015.33},
year = {2015},
date = {2015-01-01},
booktitle = {18th IEEE International Conference on Computational Science and Engineering, CSE 2015, Porto, Portugal, October 21-23, 2015},
pages = {17--26},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Jens Glaser, Trung Dac Nguyen, Joshua A. Anderson, Pak Lui, Filippo Spiga, Jaime A. Millan, David C. Morse, Sharon C. Glotzer
Strong scaling of general-purpose molecular dynamics simulations on GPUs Journal Article
In: Computer Physics Communications, vol. 192, pp. 97–107, 2015.
@article{DBLP:journals/cphysics/GlaserNALSMMG15,
title = {Strong scaling of general-purpose molecular dynamics simulations on GPUs},
author = {Jens Glaser and Trung Dac Nguyen and Joshua A. Anderson and Pak Lui and Filippo Spiga and Jaime A. Millan and David C. Morse and Sharon C. Glotzer},
url = {https://doi.org/10.1016/j.cpc.2015.02.028},
doi = {10.1016/j.cpc.2015.02.028},
year = {2015},
date = {2015-01-01},
journal = {Computer Physics Communications},
volume = {192},
pages = {97--107},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
2014
Michael G. Epitropakis, Andrea Bracciali, Marco Aldinucci, Emily Potts, Edmund K. Burke
Predictive scheduling for optimal cloud configuration Proceedings Article
In: Özcan, Ender, Burke, Edmund K., McCollum, Barry (Ed.): Proc. of 10th Intl. Conference on the Practice and Theory of Automated Timetabling, PATAT, York, United Kingdom, 2014.
@inproceedings{cloud:patat:14,
title = {Predictive scheduling for optimal cloud configuration},
author = {Michael G. Epitropakis and Andrea Bracciali and Marco Aldinucci and Emily Potts and Edmund K. Burke},
editor = {Ender Özcan and Edmund K. Burke and Barry McCollum},
url = {http://www.patatconference.org/patat2014/proceedings/3_12.pdf},
isbn = {978-0-9929984-0-0},
year = {2014},
date = {2014-08-01},
booktitle = {Proc. of 10th Intl. Conference on the Practice and Theory of Automated Timetabling},
publisher = {PATAT},
address = {York, United Kingdom},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Sonia Campa, Marco Danelutto, Peter Kilpatrick, Massimo Torquati
Pool evolution: a domain specific parallel pattern Proceedings Article
In: Proc. of the 7th Intl. Symposium on High-level Parallel Programming and Applications (HLPP), Amsterdam, The Netherlands, 2014.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase, repara
@inproceedings{2014:ff:pool:hlpp,
title = {Pool evolution: a domain specific parallel pattern},
author = {Marco Aldinucci and Sonia Campa and Marco Danelutto and Peter Kilpatrick and Massimo Torquati},
url = {http://calvados.di.unipi.it/storage/paper_files/2014_hlpp_pool.pdf},
year = {2014},
date = {2014-07-01},
booktitle = {Proc. of the 7th Intl. Symposium on High-level Parallel Programming and Applications (HLPP)},
address = {Amsterdam, The Netherlands},
abstract = {We introduce a new parallel pattern derived from a specific application domain and show how it turns out to have application beyond its domain of origin. The pool evolution pattern models the parallel evolution of a population subject to mutations and evolving in such a way that a given fitness function is optimized. The pattern has been demonstrated to be suitable for capturing and modeling the parallel patterns underpinning various evolutionary algorithms, as well as other parallel patterns typical of symbolic computation. In this paper we introduce the pattern, developed in the framework of the ParaPhrase EU-funded FP7 project, we discuss its implementation on modern multi/many core architectures and finally present experimental results obtained with FastFlow and Erlang implementations to assess its feasibility and scalability.},
keywords = {fastflow, paraphrase, repara},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Massimo Torquati, Maurizio Drocco, Guilherme Peretti Pezzi, Concetto Spampinato
FastFlow: Combining Pattern-Level Abstraction and Efficiency in GPGPUs Proceedings Article
In: GPU Technology Conference (GTC), San Jose, CA, USA, 2014.
Abstract | Links | BibTeX | Tags: fastflow, HPC, impact, paraphrase
@inproceedings{ff:gtc:2014,
title = {FastFlow: Combining Pattern-Level Abstraction and Efficiency in GPGPUs},
author = {Marco Aldinucci and Massimo Torquati and Maurizio Drocco and Peretti Pezzi, Guilherme and Concetto Spampinato},
url = {http://calvados.di.unipi.it/storage/talks/2014_S4729-Marco-Aldinucci.pdf},
year = {2014},
date = {2014-03-01},
booktitle = {GPU Technology Conference (GTC)},
address = {San Jose, CA, USA},
abstract = {Learn how FastFlow's parallel patterns can be used to design parallel applications for execution on both CPUs and GPGPUs while avoiding most of the complex low-level detail needed to make them efficient, portable and rapid to prototype. As use case, we will show the design and effectiveness of a novel universal image filtering template based on the variational approach.},
keywords = {fastflow, HPC, impact, paraphrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Massimo Torquati, Maurizio Drocco, Guilherme Peretti Pezzi, Concetto Spampinato
An Overview of FastFlow: Combining Pattern-Level Abstraction and Efficiency in GPGPUs Proceedings Article
In: GPU Technology Conference (GTC), San Jose, CA, USA, 2014.
Abstract | Links | BibTeX | Tags: fastflow, HPC, impact, paraphrase
@inproceedings{ff:gtc:2014:short,
title = {An Overview of FastFlow: Combining Pattern-Level Abstraction and Efficiency in GPGPUs},
author = {Marco Aldinucci and Massimo Torquati and Maurizio Drocco and Peretti Pezzi, Guilherme and Concetto Spampinato},
url = {http://calvados.di.unipi.it/storage/talks/2014_S4585-Marco-Aldinucci.pdf},
year = {2014},
date = {2014-03-01},
booktitle = {GPU Technology Conference (GTC)},
address = {San Jose, CA, USA},
abstract = {Get an overview of FastFlow's parallel patterns can be used to design parallel applications for execution on both CPUs and GPGPUs while avoiding most of the complex low-level detail needed to make them efficient, portable and rapid to prototype. For a more detailed and technical review of FastFlow's parallel patterns as well as a use case where we will show the design and effectiveness of a novel universal image filtering template based on the variational approach.},
keywords = {fastflow, HPC, impact, paraphrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Daniele Buono, Marco Danelutto, Tiziano De Matteis, Gabriele Mencagli, Massimo Torquati
A Lightweight Run-Time Support For Fast Dense Linear Algebra on Multi-Core Proceedings Article
In: Proc. of the 12th International Conference on Parallel and Distributed Computing and Networks (PDCN 2014), IASTED, ACTA press, 2014.
@inproceedings{ff:ffmdf:pdcn:14,
title = {A Lightweight Run-Time Support For Fast Dense Linear Algebra on Multi-Core},
author = {Daniele Buono and Marco Danelutto and De Matteis, Tiziano and Gabriele Mencagli and Massimo Torquati},
year = {2014},
date = {2014-02-01},
booktitle = {Proc. of the 12th International Conference on Parallel and Distributed Computing and Networks (PDCN 2014)},
publisher = {IASTED, ACTA press},
keywords = {fastflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Massimo Torquati, Concetto Spampinato, Maurizio Drocco, Claudia Misale, Cristina Calcagno, Mario Coppo
Parallel stochastic systems biology in the cloud Journal Article
In: Briefings in Bioinformatics, vol. 15, no. 5, pp. 798–813, 2014, ISSN: 1467-5463.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow, impact, paraphrase
@article{cwc:cloud:bib:13,
title = {Parallel stochastic systems biology in the cloud},
author = {Marco Aldinucci and Massimo Torquati and Concetto Spampinato and Maurizio Drocco and Claudia Misale and Cristina Calcagno and Mario Coppo},
url = {https://iris.unito.it/retrieve/handle/2318/140080/22528/FF_Cloud_briefings_final_submitted_copy.pdf},
doi = {10.1093/bib/bbt040},
issn = {1467-5463},
year = {2014},
date = {2014-01-01},
journal = {Briefings in Bioinformatics},
volume = {15},
number = {5},
pages = {798--813},
abstract = {The stochastic modelling of biological systems, coupled with Monte Carlo simulation of models, is an increasingly popular technique in bioinformatics. The simulation-analysis workflow may result computationally expensive reducing the interactivity required in the model tuning. In this work, we advocate the high-level software design as a vehicle for building efficient and portable parallel simulators for the cloud. In particular, the Calculus of Wrapped Components (CWC) simulator for systems biology, which is designed according to the FastFlow pattern-based approach, is presented and discussed. Thanks to the FastFlow framework, the CWC simulator is designed as a high-level workflow that can simulate CWC models, merge simulation results and statistically analyse them in a single parallel workflow in the cloud. To improve interactivity, successive phases are pipelined in such a way that the workflow begins to output a stream of analysis results immediately after simulation is started. Performance and effectiveness of the CWC simulator are validated on the Amazon Elastic Compute Cloud.},
keywords = {bioinformatics, fastflow, impact, paraphrase},
pubstate = {published},
tppubtype = {article}
}
Concetto Spampinato, Isaak Kavasidis, Marco Aldinucci, Carmelo Pino, Daniela Giordano, Alberto Faro
Discovering Biological Knowledge by Integrating High Throughput Data and Scientific Literature on the Cloud Journal Article
In: Concurrency and Computation: Practice and Experience, vol. 26, no. 10, pp. 1771–1786, 2014.
Abstract | Links | BibTeX | Tags:
@article{biocloud:ccpe:13,
title = {Discovering Biological Knowledge by Integrating High Throughput Data and Scientific Literature on the Cloud},
author = {Concetto Spampinato and Isaak Kavasidis and Marco Aldinucci and Carmelo Pino and Daniela Giordano and Alberto Faro},
url = {https://iris.unito.it/retrieve/handle/2318/139542/22526/2013_biocloud_ccpe.pdf},
doi = {10.1002/cpe.3130},
year = {2014},
date = {2014-01-01},
journal = {Concurrency and Computation: Practice and Experience},
volume = {26},
number = {10},
pages = {1771--1786},
abstract = {In this paper, we present a bioinformatics knowledge discovery tool for extracting and validating associations between biological entities. By mining specialised scientific literature, the tool not only generates biological hypotheses in the form of associations between genes, proteins, miRNA and diseases, but also validates the plausibility of such associations against high-throughput biological data (e.g. microarray) and annotated databases (e.g. Gene Ontology). Both the knowledge discovery system and its validation are carried out by exploiting the advantages and the potentialities of the Cloud, which allowed us to derive and check the validity of thousands of biological associations in a reasonable amount of time. The system was tested on a dataset containing more than 1000 gene-disease associations achieving an average recall of about 71\%, outperforming existing approaches. The results also showed that porting a data-intensive application in an IaaS cloud environment boosts significantly the application's efficiency.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Sonia Campa, Marco Danelutto, Peter Kilpatrick, Massimo Torquati
Design patterns percolating to parallel programming framework implementation Journal Article
In: International Journal of Parallel Programming, vol. 42, no. 6, pp. 1012–1031, 2014, ISSN: 0885-7458.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase
@article{ijpp:patterns:13,
title = {Design patterns percolating to parallel programming framework implementation},
author = {Marco Aldinucci and Sonia Campa and Marco Danelutto and Peter Kilpatrick and Massimo Torquati},
url = {https://iris.unito.it/retrieve/handle/2318/140069/22527/2013_ijpp_patterns-web_4aperto_1238811.pdf},
doi = {10.1007/s10766-013-0273-6},
issn = {0885-7458},
year = {2014},
date = {2014-01-01},
journal = {International Journal of Parallel Programming},
volume = {42},
number = {6},
pages = {1012--1031},
abstract = {Structured parallel programming is recognised as a viable and effective means of tackling parallel programming problems. Recently, a set of simple and powerful parallel building blocks (RISC-pb2l) has been proposed to support modelling and implementation of parallel frameworks. In this work we demonstrate how that same parallel building block set may be used to model both general purpose parallel programming abstractions, not usually listed in classical skeleton sets, and more specialized domain specific parallel patterns. We show how an implementation of RISC-pb2l can be realised via the FastFlow framework and present experimental evidence of the feasibility and efficiency of the approach.},
keywords = {fastflow, paraphrase},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Salvatore Ruggieri, Massimo Torquati
Decision Tree Building on Multi-Core using FastFlow Journal Article
In: Concurrency and Computation: Practice and Experience, vol. 26, no. 3, pp. 800–820, 2014.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase
@article{yadtff:ccpe:13,
title = {Decision Tree Building on Multi-Core using FastFlow},
author = {Marco Aldinucci and Salvatore Ruggieri and Massimo Torquati},
url = {https://iris.unito.it/retrieve/handle/2318/139522/118602/yadtff-j.pdf},
doi = {10.1002/cpe.3063},
year = {2014},
date = {2014-01-01},
journal = {Concurrency and Computation: Practice and Experience},
volume = {26},
number = {3},
pages = {800--820},
abstract = {The whole computer hardware industry embraced multi-core. The extreme optimisation of sequential algorithms is then no longer sufficient to squeeze the real machine power, which can be only exploited via thread-level parallelism. Decision tree algorithms exhibit natural concurrency that makes them suitable to be parallelised. This paper presents an in-depth study of the parallelisation of an implementation of the C4.5 algorithm for multi-core architectures. We characterise elapsed time lower bounds for the forms of parallelisations adopted, and achieve close to optimal performances. Our implementation is based on the FastFlow parallel programming environment and it requires minimal changes to the original sequential code.},
keywords = {fastflow, paraphrase},
pubstate = {published},
tppubtype = {article}
}
Guilherme Peretti Pezzi, Evelyne Vaissié, Yann Viala, Denis Caromel, Philippe Gourbesville
Parallel Profiling of Water Distribution Networks Using the Clément Formula Proceedings Article
In: 4th European Seminar on Computing, 2014.
Abstract | BibTeX | Tags: impact
@inproceedings{pezzi-clement:14,
title = {Parallel Profiling of Water Distribution Networks Using the Clément Formula},
author = {Peretti Pezzi, Guilherme and Evelyne Vaissié and Yann Viala and Denis Caromel and Philippe Gourbesville},
year = {2014},
date = {2014-01-01},
booktitle = {4th European Seminar on Computing},
abstract = {Optimization of water distribution is a crucial issue which has been targeted by many modelling tools. Useful models, implemented several decades ago, need to be updated and implemented in more powerful computing environments. This paper presents the distributed and redesigned version of a legacy hydraulic simulation software written in Fortran (IRMA) that has been used for over 30 years by the Société du Canal de Provence in order to design and to maintain water distribution networks. IRMA was developed aiming mainly the treatment of irrigation networks – by using the Clément demand model and is now used to manage more than 6.000 km of piped networks. The growing complexity and size of networks requested to redesign the code by using modern tools and language (Java) and also to run distributed simulations by using the ProActive Parallel Suite.},
keywords = {impact},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Cristina Calcagno, Mario Coppo, Ferruccio Damiani, Maurizio Drocco, Eva Sciacca, Salvatore Spinella, Massimo Torquati, Angelo Troina
On designing multicore-aware simulators for systems biology endowed with on-line statistics Journal Article
In: BioMed Research International, 2014.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow, paraphrase
@article{cwcsim:ff:multicore:biomed:14,
title = {On designing multicore-aware simulators for systems biology endowed with on-line statistics},
author = {Marco Aldinucci and Cristina Calcagno and Mario Coppo and Ferruccio Damiani and Maurizio Drocco and Eva Sciacca and Salvatore Spinella and Massimo Torquati and Angelo Troina},
url = {http://downloads.hindawi.com/journals/bmri/2014/207041.pdf},
doi = {10.1155/2014/207041},
year = {2014},
date = {2014-01-01},
journal = {BioMed Research International},
abstract = {The paper arguments are on enabling methodologies for the design of a fully parallel, online, interactive tool aiming to support the bioinformatics scientists. In particular, the features of these methodologies, supported by the FastFlow parallel programming framework, are shown on a simulation tool to perform the modeling, the tuning, and the sensitivity analysis of stochastic biological models. A stochastic simulation needs thousands of independent simulation trajectories turning into big data that should be analysed by statistic and data mining tools. In the considered approach the two stages are pipelined in such a way that the simulation stage streams out the partial results of all simulation trajectories to the analysis stage that immediately produces a partial result. The simulation-analysis workflow is validated for performance and effectiveness of the online analysis in capturing biological systems behavior on a multicore platform and representative proof-of-concept biological systems. The exploited methodologies include pattern-based parallel programming and data streaming that provide key features to the software designers such as performance portability and efficient in-memory (big) data management and movement. Two paradigmatic classes of biological systems exhibiting multistable and oscillatory behavior are used as a testbed.},
keywords = {bioinformatics, fastflow, paraphrase},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Maurizio Drocco, Guilherme Peretti Pezzi, Claudia Misale, Fabio Tordini, Massimo Torquati
Exercising high-level parallel programming on streams: a systems biology use case Proceedings Article
In: Proc. of 34th IEEE Intl. Conference on Distributed Computing Systems Workshops (ICDCSW), IEEE, Madrid, Spain, 2014.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow, impact, paraphrase
@inproceedings{cwc:gpu:dcperf:14,
title = {Exercising high-level parallel programming on streams: a systems biology use case},
author = {Marco Aldinucci and Maurizio Drocco and Peretti Pezzi, Guilherme and Claudia Misale and Fabio Tordini and Massimo Torquati},
url = {https://iris.unito.it/retrieve/handle/2318/154516/26657/2014_dcperf_cwc_gpu.pdf},
doi = {10.1109/ICDCSW.2014.38},
year = {2014},
date = {2014-01-01},
booktitle = {Proc. of 34th IEEE Intl. Conference on Distributed Computing Systems Workshops (ICDCSW)},
publisher = {IEEE},
address = {Madrid, Spain},
abstract = {The stochastic modelling of biological systems, coupled with Monte Carlo simulation of models, is an increasingly popular technique in Bioinformatics. The simulation-analysis workflow may result into a computationally expensive task reducing the interactivity required in the model tuning. In this work, we advocate high-level software design as a vehicle for building efficient and portable parallel simulators for a variety of platforms, ranging from multi-core platforms to GPGPUs to cloud. In particular, the Calculus of Wrapped Compartments (CWC) parallel simulator for systems biology equipped with on-line mining of results, which is designed according to the FastFlow pattern-based approach, is discussed as a running example. In this work, the CWC simulator is used as a paradigmatic example of a complex C++ application where the quality of results is correlated with both computation and I/O bounds, and where high-quality results might turn into big data. The FastFlow parallel programming framework, which advocates C++ pattern-based parallel programming makes it possible to develop portable parallel code without relinquish neither run-time efficiency nor performance tuning opportunities. Performance and effectiveness of the approach are validated on a variety of platforms, inter-alia cache-coherent multi-cores, cluster of multi-core (Ethernet and Infiniband) and the Amazon Elastic Compute Cloud.},
keywords = {bioinformatics, fastflow, impact, paraphrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Guilherme Peretti Pezzi, Maurizio Drocco, Fabio Tordini, Peter Kilpatrick, Massimo Torquati
Parallel video denoising on heterogeneous platforms Proceedings Article
In: Proc. of Intl. Workshop on High-level Programming for Heterogeneous and Hierarchical Parallel Systems (HLPGPU), 2014.
Abstract | Links | BibTeX | Tags: fastflow, impact, paraphrase
@inproceedings{ff:video:hlpgpu:14,
title = {Parallel video denoising on heterogeneous platforms},
author = {Marco Aldinucci and Peretti Pezzi, Guilherme and Maurizio Drocco and Fabio Tordini and Peter Kilpatrick and Massimo Torquati},
url = {http://calvados.di.unipi.it/storage/paper_files/2014_ff_video_denoiser_hlpgpu.pdf},
year = {2014},
date = {2014-01-01},
booktitle = {Proc. of Intl. Workshop on High-level Programming for Heterogeneous and Hierarchical Parallel Systems (HLPGPU)},
abstract = {In this paper, a highly-effective parallel filter for video denoising is presented. The filter is designed using a skeletal approach, and has been implemented by way of the FastFlow parallel programming library. As a result of its high-level design, it is possible to run the filter seamlessly on a multi-core machine, on GPGPU(s), or on both. The design and the implementation of the filter are discussed, and an experimental evaluation is presented. Various mappings of the filtering stages are comparatively discussed.},
keywords = {fastflow, impact, paraphrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Claudia Misale
Accelerating Bowtie2 with a lock-less concurrency approach and memory affinity Proceedings Article
In: Aldinucci, Marco, D'Agostino, Daniele, Kilpatrick, Peter (Ed.): Proc. of Intl. Euromicro PDP 2014: Parallel Distributed and network-based Processing, IEEE, Torino, Italy, 2014, (Best paper award).
Abstract | Links | BibTeX | Tags: fastflow, paraphrase
@inproceedings{ff:bowtie2:pdp:14,
title = {Accelerating Bowtie2 with a lock-less concurrency approach and memory affinity},
author = {Claudia Misale},
editor = {Marco Aldinucci and Daniele D'Agostino and Peter Kilpatrick},
url = {http://calvados.di.unipi.it/storage/paper_files/2014_pdp_bowtieff.pdf},
doi = {10.1109/PDP.2014.50},
year = {2014},
date = {2014-01-01},
booktitle = {Proc. of Intl. Euromicro PDP 2014: Parallel Distributed and network-based Processing},
publisher = {IEEE},
address = {Torino, Italy},
abstract = {The implementation of DNA alignment tools for Bioinformatics lead to face different problems that dip into performances. A single alignment takes an amount of time that is not predictable and there are different factors that can affect performances, for instance the length of sequences can determine the computational grain of the task and mismatches or insertion/deletion (indels) increase time needed to complete an alignment. Moreover, an alignment is a strong memory-bound problem because of the irregular memory access patterns and limitations in memory-bandwidth. Over the years, many alignment tools were implemented. A concrete example is Bowtie2, one of the fastest (concurrent, Pthread-based) and state of the art not GPU-based alignment tool. Bowtie2 exploits concurrency by instantiating a pool of threads, which have access to a global input dataset, share the reference genome and have access to different objects for collecting alignment results. In this paper a modified implementation of Bowtie2 is presented, in which the concurrency structure has been changed. The proposed implementation exploits the task-farm skeleton pattern implemented as a Master-Worker. The Master-Worker pattern permits to delegate only to the Master thread dataset reading and to make private to each Worker data structures that are shared in the original version. Only the reference genome is left shared. As a further optimisation, the Master and each Worker were pinned on cores and the reference genome was allocated interleaved among memory nodes. The proposed implementation is able to gain up to 10 speedup points over the original implementation.},
note = {Best paper award},
keywords = {fastflow, paraphrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Alessandro Secco, Irfan Uddin, Guilherme Peretti Pezzi, Massimo Torquati
Message passing on InfiniBand RDMA for parallel run-time supports Proceedings Article
In: Aldinucci, Marco, D'Agostino, Daniele, Kilpatrick, Peter (Ed.): Proc. of Intl. Euromicro PDP 2014: Parallel Distributed and network-based Processing, IEEE, Torino, Italy, 2014.
Abstract | Links | BibTeX | Tags: fastflow, impact, paraphrase
@inproceedings{ff:infiniband:pdp:14,
title = {Message passing on InfiniBand RDMA for parallel run-time supports},
author = {Alessandro Secco and Irfan Uddin and Peretti Pezzi, Guilherme and Massimo Torquati},
editor = {Marco Aldinucci and Daniele D'Agostino and Peter Kilpatrick},
url = {https://iris.unito.it/retrieve/handle/2318/151178/690885/2014_ff_infiniband_pdp.pdf},
doi = {10.1109/PDP.2014.23},
year = {2014},
date = {2014-01-01},
booktitle = {Proc. of Intl. Euromicro PDP 2014: Parallel Distributed and network-based Processing},
publisher = {IEEE},
address = {Torino, Italy},
abstract = {InfiniBand networks are commonly used in the high performance computing area. They offer RDMA-based operations that help to improve the performance of communication subsystems. In this paper, we propose a minimal message-passing communication layer providing the programmer with a point-to-point communication channel implemented by way of InfiniBand RDMA features. Differently from other libraries exploiting the InfiniBand features, such as the well-known Message Passing Interface (MPI), the proposed library is a communication layer only rather than a programming model, and can be easily used as building block for high-level parallel programming frameworks. Evaluated on micro-benchmarks, the proposed RDMA-based communication channel implementation achieves a comparable performance with highly optimised MPI/InfiniBand implementations. Eventually, the flexibility of the communication layer is evaluated by integrating it within the FastFlow parallel framework, currently supporting TCP/IP networks (via the ZeroMQ communication library).},
keywords = {fastflow, impact, paraphrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Maurizio Drocco, Marco Aldinucci, Massimo Torquati
A Dynamic Memory Allocator for heterogeneous platforms Proceedings Article
In: Advanced Computer Architecture and Compilation for High-Performance and Embedded Systems (ACACES) – Poster Abstracts, HiPEAC, Fiuggi, Italy, 2014.
Abstract | Links | BibTeX | Tags: fastflow, HPC
@inproceedings{ff:acaces:14,
  author    = {Drocco, Maurizio and Aldinucci, Marco and Torquati, Massimo},
  title     = {A Dynamic Memory Allocator for heterogeneous platforms},
  booktitle = {Advanced Computer Architecture and Compilation for High-Performance and Embedded Systems (ACACES) – Poster Abstracts},
  publisher = {HiPEAC},
  address   = {Fiuggi, Italy},
  year      = {2014},
  date      = {2014-01-01},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2014_ACACES_ex-abstract.pdf},
  abstract  = {Modern computers are built upon heterogeneous multi-core/many cores architectures (e.g. GPGPU connected to multi-core CPU). Achieving peak performance on these architectures is hard and may require a substantial programming effort. High-level programming patterns, coupled with efficient low-level runtime supports, have been proposed to relieve the programmer from worrying about low-level details such as synchronisation of racing processes as well as those fine tunings needed to improve the overall performance. Among them are (parallel) dynamic memory allocation and effective exploitation of the memory hierarchy. The memory allocator is often a bottleneck that severely limits program scalability, robustness and portability on parallel systems. In this work we introduce a novel memory allocator, based on the FastFlow's allocator and the recently proposed CUDA Unified Memory, which aims to efficiently integrate host and device memories into a unique dynamic-allocable memory space, accessible transparently by both host and device code.},
  keywords  = {fastflow, HPC},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Claudia Misale, Giulio Ferrero, Massimo Torquati, Marco Aldinucci
Sequence alignment tools: one parallel pattern to rule them all? Journal Article
In: BioMed Research International, 2014.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow, paraphrase, repara
@article{bowtie-bwa:ff:multicore:biomed:14,
  author    = {Misale, Claudia and Ferrero, Giulio and Torquati, Massimo and Aldinucci, Marco},
  title     = {Sequence alignment tools: one parallel pattern to rule them all?},
  journal   = {BioMed Research International},
  year      = {2014},
  date      = {2014-01-01},
  doi       = {10.1155/2014/539410},
  url       = {http://downloads.hindawi.com/journals/bmri/2014/539410.pdf},
  abstract  = {In this paper we advocate high-level programming methodology for Next Generation Sequencers (NGS) alignment tools for both productivity and absolute performance. We analyse the problem of parallel alignment and review the parallelisation strategies of the most popular alignment tools, which can all be abstracted to a single parallel paradigm. We compare these tools against their porting onto the FastFlow pattern-based programming framework, which provides programmers with high-level parallel patterns. By using a high-level approach, programmers are liberated from all complex aspects of parallel programming, such as synchronisation protocols and task scheduling, gaining more possibility for seamless performance tuning. In this work we show some use case in which, by using a high-level approach for parallelising NGS tools, it is possible to obtain comparable or even better absolute performance for all used datasets.},
  keywords  = {bioinformatics, fastflow, paraphrase, repara},
  pubstate  = {published},
  tppubtype = {article}
}
2013
Maurizio Drocco
Parallel stochastic simulators in systems biology: the evolution of the species Masters Thesis
Computer Science Department, University of Torino, Italy, 2013.
Abstract | Links | BibTeX | Tags: fastflow
@mastersthesis{tesi:drocco:13,
  author    = {Drocco, Maurizio},
  title     = {Parallel stochastic simulators in systems biology: the evolution of the species},
  school    = {Computer Science Department, University of Torino, Italy},
  year      = {2013},
  date      = {2013-07-01},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2013_tesi_drocco.pdf},
  abstract  = {The stochastic simulation of biological systems is an increasingly popular technique in bioinformatics. It is often an enlightening technique, especially for multi-stable systems whose dynamics can be hardly captured with ordinary differential equations. To be effective, stochastic simulations should be supported by powerful statistical analysis tools. The simulation/analysis workflow may however result in being computationally expensive, thus compromising the interactivity required especially in model tuning. In this work we discuss the main opportunities to speed up the framework by parallelisation on modern multicore and hybrid multicore and distributed platforms, advocating the high-level design of simulators for stochastic systems as a vehicle for building efficient and portable parallel simulators endowed with on-line statistical analysis. In particular, the Calculus of Wrapped Compartments (CWC) Simulator, which is designed according to the FastFlow's pattern-based approach, is presented and discussed in this work.},
  keywords  = {fastflow},
  pubstate  = {published},
  tppubtype = {mastersthesis}
}
Marco Aldinucci, Fabio Tordini, Maurizio Drocco, Massimo Torquati, Mario Coppo
Parallel stochastic simulators in system biology: the evolution of the species Proceedings Article
In: Proc. of 21st Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP), IEEE, Belfast, Northern Ireland, U.K., 2013.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow
@inproceedings{ff_cwc_distr:pdp:13,
title = {Parallel stochastic simulators in system biology: the evolution of the species},
author = {Marco Aldinucci and Fabio Tordini and Maurizio Drocco and Massimo Torquati and Mario Coppo},
url = {http://calvados.di.unipi.it/storage/paper_files/2013_cwc_d_PDP.pdf},
doi = {10.1109/PDP.2013.66},
year = {2013},
date = {2013-02-01},
booktitle = {Proc. of 21st Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP)},
publisher = {IEEE},
address = {Belfast, Northern Ireland, U.K.},
abstract = {The stochastic simulation of biological systems is an increasingly popular technique in Bioinformatics. It is often an enlightening technique, especially for multi-stable systems whose dynamics can be hardly captured with ordinary differential equations. To be effective, stochastic simulations should be supported by powerful statistical analysis tools. The simulation-analysis workflow may however result in being computationally expensive, thus compromising the interactivity required in model tuning. In this work we advocate the high-level design of simulators for stochastic systems as a vehicle for building efficient and portable parallel simulators. In particular, the Calculus of Wrapped Compartments (CWC) simulator, which is designed according to the FastFlow's pattern-based approach, is presented and discussed in this work. FastFlow has been extended to support also clusters of multi-cores with minimal coding effort, assessing the portability of the approach.},
keywords = {bioinformatics, fastflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Claudia Misale, Marco Aldinucci, Massimo Torquati
Memory affinity in multi-threading: the Bowtie2 case study Proceedings Article
In: Advanced Computer Architecture and Compilation for High-Performance and Embedded Systems (ACACES) – Poster Abstracts, HiPEAC, Fiuggi, Italy, 2013, ISBN: 9789038221908.
Abstract | Links | BibTeX | Tags: fastflow
@inproceedings{ff:acaces:13,
title = {Memory affinity in multi-threading: the Bowtie2 case study},
author = {Claudia Misale and Marco Aldinucci and Massimo Torquati},
url = {https://iris.unito.it/retrieve/handle/2318/143005/23874/2013_ACACES_ex-abstract.pdf},
isbn = {9789038221908},
year = {2013},
date = {2013-01-01},
booktitle = {Advanced Computer Architecture and Compilation for High-Performance and Embedded Systems (ACACES) – Poster Abstracts},
publisher = {HiPEAC},
address = {Fiuggi, Italy},
abstract = {The diffusion of the Next Generation Sequencing (NGS) has increased the amount of data obtainable by genomic experiments. From a DNA sample a NGS run is able to produce millions of short sequences (called reads), which should be mapped into a reference genome. In this paper, we analyse the performance of Bowtie2, a fast and popular DNA mapping tool. Bowtie2 exhibits a multithreading implementation on top of pthreads, spin-locks and SSE2 SIMD extension. From a parallel computing viewpoint, it is a paradigmatic example of a software requiring to address three fundamental problems in shared-memory programming for cache-coherent multi-core platforms: synchronisation efficiency at very fine grain (due to short reads), load-balancing (due to long reads), and efficient usage of memory subsystem (due to SSE2 memory pressure). We compare the original implementation against an alternative implementation on top of the FastFlow pattern-based programming framework. The proposed design exploits the high-level farm pattern of FastFlow, which is implemented on top of nonblocking multi-threading and lock-less (CAS-free) queues, and provides the programmer with high-level mechanism to tune task scheduling to achieve both load-balancing and memory affinity. The proposed design, despite the high-level design, is always faster and more scalable with respect to the original one. The design of both original and alternative version will be presented along with their experimental evaluation on real-world data sets.},
keywords = {fastflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick, Carlo Montangero, Laura Semini
Managing Adaptivity in Parallel Systems Book Section
In: Beckert, Bernhard, Damiani, Ferruccio, de Boer, Frank S., Bonsangue, Marcello M. (Ed.): Formal Methods for Components and Objects: Intl. Symposium, FMCO 2011, Torino, Italy, October 3-5, 2011, Revised Invited Lectures, vol. 7542, pp. 199–217, Springer, 2013, ISBN: 978-3-642-35886-9.
Abstract | Links | BibTeX | Tags: paraphrase
@incollection{adaptivity:fmco:11,
title = {Managing Adaptivity in Parallel Systems},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick and Carlo Montangero and Laura Semini},
editor = {Bernhard Beckert and Ferruccio Damiani and Frank S. de Boer and Marcello M. Bonsangue},
url = {http://calvados.di.unipi.it/storage/paper_files/2013_fmco11_adaptivity.pdf},
doi = {10.1007/978-3-642-35887-6_11},
isbn = {978-3-642-35886-9},
year = {2013},
date = {2013-01-01},
booktitle = {Formal Methods for Components and Objects: Intl. Symposium, FMCO 2011, Torino, Italy, October 3-5, 2011, Revised Invited Lectures},
volume = {7542},
pages = {199--217},
publisher = {Springer},
series = {LNCS},
abstract = {The management of non-functional features (performance, security, power management, etc.) is traditionally a difficult, error prone task for programmers of parallel applications. To take care of these non-functional features, autonomic managers running policies represented as rules using sensors and actuators to monitor and transform a running parallel application may be used. We discuss an approach aimed at providing formal tool support to the integration of independently developed autonomic managers taking care of different non-functional concerns within the same parallel application. Our approach builds on the Behavioural Skeleton experience (autonomic management of non-functional features in structured parallel applications) and on previous results on conflict detection and resolution in rule-based systems.},
keywords = {paraphrase},
pubstate = {published},
tppubtype = {incollection}
}
Marco Aldinucci, Sonia Campa, Peter Kilpatrick, Massimo Torquati
Structured Data Access Annotations for Massively Parallel Computations Proceedings Article
In: Euro-Par 2012 Workshops, Proc. of the ParaPhrase Workshop on Parallel Processing, pp. 381–390, Springer, 2013.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase
@inproceedings{annotation:para:12,
title = {Structured Data Access Annotations for Massively Parallel Computations},
author = {Marco Aldinucci and Sonia Campa and Peter Kilpatrick and Massimo Torquati},
url = {http://calvados.di.unipi.it/storage/paper_files/2013_annot_europar_workshops.pdf},
doi = {10.1007/978-3-642-36949-0_42},
year = {2013},
date = {2013-01-01},
booktitle = {Euro-Par 2012 Workshops, Proc. of the ParaPhrase Workshop on Parallel Processing},
volume = {7640},
pages = {381--390},
publisher = {Springer},
series = {LNCS},
abstract = {We describe an approach aimed at addressing the issue of joint exploitation of control (stream) and data parallelism in a skeleton based parallel programming environment, based on annotations and refactoring. Annotations drive efficient implementation of a parallel computation. Refactoring is used to transform the associated skeleton tree into a more efficient, functionally equivalent skeleton tree. In most cases, cost models are used to drive the refactoring process. We show how sample use case applications/kernels may be optimized and discuss preliminary experiments with FastFlow assessing the theoretical results.},
keywords = {fastflow, paraphrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Sonia Campa, Marco Danelutto, Peter Kilpatrick, Massimo Torquati
Targeting Distributed Systems in FastFlow Proceedings Article
In: Euro-Par 2012 Workshops, Proc. of the CoreGrid Workshop on Grids, Clouds and P2P Computing, pp. 47–56, Springer, 2013.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase
@inproceedings{ff:distr:cgs:12,
title = {Targeting Distributed Systems in FastFlow},
author = {Marco Aldinucci and Sonia Campa and Marco Danelutto and Peter Kilpatrick and Massimo Torquati},
url = {http://calvados.di.unipi.it/storage/paper_files/2012_distr_ff_cgsymph.pdf},
doi = {10.1007/978-3-642-36949-0_7},
year = {2013},
date = {2013-01-01},
booktitle = {Euro-Par 2012 Workshops, Proc. of the CoreGrid Workshop on Grids, Clouds and P2P Computing},
volume = {7640},
pages = {47--56},
publisher = {Springer},
series = {LNCS},
abstract = {FastFlow is a structured parallel programming framework targeting shared memory multi-core architectures. In this paper we introduce a FastFlow extension aimed at supporting a network of multi-core workstation as well. The extension supports the execution of FastFlow programs by coordinating – in a structured way – the fine grain parallel activities running on a single workstation. We discuss the design and the implementation of this extension presenting preliminary experimental results validating it on state-of-the-art networked multi-core nodes.},
keywords = {fastflow, paraphrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Kevin Hammond, Marco Aldinucci, Chris Brown, Francesco Cesarini, Marco Danelutto, Horacio González-Vélez, Peter Kilpatrick, Rainer Keller, Michael Rossbory, Gilad Shainer
The ParaPhrase Project: Parallel Patterns for Adaptive Heterogeneous Multicore Systems Book Section
In: Beckert, Bernhard, Damiani, Ferruccio, de Boer, Frank S., Bonsangue, Marcello M. (Ed.): Formal Methods for Components and Objects: Intl. Symposium, FMCO 2011, Torino, Italy, October 3-5, 2011, Revised Invited Lectures, vol. 7542, pp. 218–236, Springer, 2013, ISBN: 978-3-642-35886-9.
Abstract | Links | BibTeX | Tags: paraphrase
@incollection{paraphrase:fmco:11,
title = {The ParaPhrase Project: Parallel Patterns for Adaptive Heterogeneous Multicore Systems},
author = {Kevin Hammond and Marco Aldinucci and Chris Brown and Francesco Cesarini and Marco Danelutto and Horacio González-Vélez and Peter Kilpatrick and Rainer Keller and Michael Rossbory and Gilad Shainer},
editor = {Bernhard Beckert and Ferruccio Damiani and Frank S. de Boer and Marcello M. Bonsangue},
url = {http://calvados.di.unipi.it/storage/paper_files/2013_fmco11_paraphrase.pdf},
doi = {10.1007/978-3-642-35887-6_12},
isbn = {978-3-642-35886-9},
year = {2013},
date = {2013-01-01},
booktitle = {Formal Methods for Components and Objects: Intl. Symposium, FMCO 2011, Torino, Italy, October 3-5, 2011, Revised Invited Lectures},
volume = {7542},
pages = {218--236},
publisher = {Springer},
series = {LNCS},
abstract = {This paper describes the ParaPhrase project, a new 3-year targeted research project funded under EU Framework 7 Objective 3.4 (Computer Systems), starting in October 2011. ParaPhrase aims to follow a new approach to introducing parallelism using advanced refactoring techniques coupled with high-level parallel design patterns. The refactoring approach will use these design patterns to restructure programs defined as networks of software components into other forms that are more suited to parallel execution. The programmer will be aided by high-level cost information that will be integrated into the refactoring tools. The implementation of these patterns will then use a well-understood algorithmic skeleton approach to achieve good parallelism. A key ParaPhrase design goal is that parallel components are intended to match heterogeneous architectures, defined in terms of CPU/GPU combinations, for example. In order to achieve this, the ParaPhrase approach will map components at link time to the available hardware, and will then re-map them during program execution, taking account of multiple applications, changes in hardware resource availability, the desire to reduce communication costs etc. In this way, we aim to develop a new approach to programming that will be able to produce software that can adapt to dynamic changes in the system environment. Moreover, by using a strong component basis for parallelism, we can achieve potentially significant gains in terms of reducing sharing at a high level of abstraction, and so in reducing or even eliminating the costs that are usually associated with cache management, locking, and synchronisation.},
keywords = {paraphrase},
pubstate = {published},
tppubtype = {incollection}
}
Marco Aldinucci, Sonia Campa, Fabio Tordini, Massimo Torquati, Peter Kilpatrick
An abstract annotation model for skeletons Book Section
In: Beckert, Bernhard, Damiani, Ferruccio, de Boer, Frank S., Bonsangue, Marcello M. (Ed.): Formal Methods for Components and Objects: Intl. Symposium, FMCO 2011, Torino, Italy, October 3-5, 2011, Revised Invited Lectures, vol. 7542, pp. 257–276, Springer, 2013, ISBN: 978-3-642-35886-9.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase
@incollection{toolchain:fmco:11,
title = {An abstract annotation model for skeletons},
author = {Marco Aldinucci and Sonia Campa and Fabio Tordini and Massimo Torquati and Peter Kilpatrick},
editor = {Bernhard Beckert and Ferruccio Damiani and Frank S. de Boer and Marcello M. Bonsangue},
url = {http://calvados.di.unipi.it/storage/paper_files/2013_fmco11_annotation.pdf},
doi = {10.1007/978-3-642-35887-6_14},
isbn = {978-3-642-35886-9},
year = {2013},
date = {2013-01-01},
booktitle = {Formal Methods for Components and Objects: Intl. Symposium, FMCO 2011, Torino, Italy, October 3-5, 2011, Revised Invited Lectures},
volume = {7542},
pages = {257--276},
publisher = {Springer},
series = {LNCS},
abstract = {Multi-core and many-core platforms are becoming increasingly heterogeneous and asymmetric. This significantly increases the porting and tuning effort required for parallel codes, which in turn often leads to a growing gap between peak machine power and actual application performance. In this work a first step toward the automated optimization of high level skeleton-based parallel code is discussed. The paper presents an abstract annotation model for skeleton programs aimed at formally describing suitable mapping of parallel activities on a high-level platform representation. The derived mapping and scheduling strategies are used to generate optimized run-time code.},
keywords = {fastflow, paraphrase},
pubstate = {published},
tppubtype = {incollection}
}
2012
Marco Aldinucci, Concetto Spampinato, Maurizio Drocco, Massimo Torquati, Simone Palazzo
A Parallel Edge Preserving Algorithm for Salt and Pepper Image Denoising Proceedings Article
In: Djemal, K., Deriche, M., Puech, W., Ucan, Osman N. (Ed.): Proc. of 2nd Intl. Conference on Image Processing Theory Tools and Applications (IPTA), pp. 97–102, IEEE, Istanbul, Turkey, 2012, ISBN: 978-1-4673-2582-0.
Abstract | Links | BibTeX | Tags: fastflow, impact
@inproceedings{denoiser:ff:ipta:12,
title = {A Parallel Edge Preserving Algorithm for Salt and Pepper Image Denoising},
author = {Marco Aldinucci and Concetto Spampinato and Maurizio Drocco and Massimo Torquati and Simone Palazzo},
editor = {K. Djemal and M. Deriche and W. Puech and Osman N. Ucan},
url = {http://calvados.di.unipi.it/storage/paper_files/2012_2phasedenoiser_ff_ipta.pdf},
doi = {10.1109/IPTA.2012.6469567},
isbn = {978-1-4673-2582-0},
year = {2012},
date = {2012-10-01},
booktitle = {Proc. of 2nd Intl. Conference on Image Processing Theory Tools and Applications (IPTA)},
pages = {97--102},
publisher = {IEEE},
address = {Istanbul, Turkey},
abstract = {In this paper a two-phase filter for removing ``salt and pepper'' noise is proposed. In the first phase, an adaptive median filter is used to identify the set of the noisy pixels; in the second phase, these pixels are restored according to a regularization method, which contains a data-fidelity term reflecting the impulse noise characteristics. The algorithm, which exhibits good performance both in denoising and in restoration, can be easily and effectively parallelized to exploit the full power of multi-core CPUs and GPGPUs; the proposed implementation based on the FastFlow library achieves both close-to-ideal speedup and very good wall-clock execution figures.},
keywords = {fastflow, impact},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick, Massimiliano Meneghin, Massimo Torquati
An Efficient Unbounded Lock-Free Queue for Multi-core Systems Proceedings Article
In: Proc. of 18th Intl. Euro-Par 2012 Parallel Processing, pp. 662–673, Springer, Rhodes Island, Greece, 2012.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase
@inproceedings{ff:spsc:europar:12,
title = {An Efficient Unbounded Lock-Free Queue for Multi-core Systems},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick and Massimiliano Meneghin and Massimo Torquati},
url = {http://calvados.di.unipi.it/storage/paper_files/2012_spsc_europar.pdf},
doi = {10.1007/978-3-642-32820-6_65},
year = {2012},
date = {2012-08-01},
booktitle = {Proc. of 18th Intl. Euro-Par 2012 Parallel Processing},
volume = {7484},
pages = {662--673},
publisher = {Springer},
address = {Rhodes Island, Greece},
series = {LNCS},
abstract = {The use of efficient synchronization mechanisms is crucial for implementing fine grained parallel programs on modern shared cache multi-core architectures. In this paper we study this problem by considering Single-Producer/Single-Consumer (SPSC) coordination using unbounded queues. A novel unbounded SPSC algorithm capable of reducing the row synchronization latency and speeding up Producer-Consumer coordination is presented. The algorithm has been extensively tested on a shared-cache multi-core platform and a sketch proof of correctness is presented. The queues proposed have been used as basic building blocks to implement the FastFlow parallel framework, which has been demonstrated to offer very good performance for fine-grain parallel applications.},
keywords = {fastflow, paraphrase},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick, Massimo Torquati
Targeting heterogeneous architectures via macro data flow Journal Article
In: Parallel Processing Letters, vol. 22, no. 2, 2012, ISSN: 0129-6264.
Abstract | Links | BibTeX | Tags: fastflow, paraphrase
@article{mdf:hplgpu:ppl:12,
  author    = {Aldinucci, Marco and Danelutto, Marco and Kilpatrick, Peter and Torquati, Massimo},
  title     = {Targeting heterogeneous architectures via macro data flow},
  journal   = {Parallel Processing Letters},
  volume    = {22},
  number    = {2},
  year      = {2012},
  date      = {2012-06-01},
  issn      = {0129-6264},
  doi       = {10.1142/S0129626412400063},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2012_mdf_PPL-hplgpu.pdf},
  abstract  = {We propose a data flow based run time system as an efficient tool for supporting execution of parallel code on heterogeneous architectures hosting both multicore CPUs and GPUs. We discuss how the proposed run time system may be the target of both structured parallel applications developed using algorithmic skeletons/parallel design patterns and also more ``domain specific'' programming models. Experimental results demonstrating the feasibility of the approach are presented.},
  keywords  = {fastflow, paraphrase},
  pubstate  = {published},
  tppubtype = {article}
}
Marco Aldinucci, Marco Danelutto, Massimo Torquati
FastFlow tutorial Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-12-04, 2012.
Links | BibTeX | Tags: fastflow
@techreport{fastflow_tutorial:TR-12-04:12,
  author      = {Aldinucci, Marco and Danelutto, Marco and Torquati, Massimo},
  title       = {FastFlow tutorial},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number      = {TR-12-04},
  year        = {2012},
  date        = {2012-03-01},
  url         = {http://compass2.di.unipi.it/TR/Files/TR-12-04.pdf.gz},
  keywords    = {fastflow},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Massimo Torquati, Marco Vanneschi, Mehdi Amini, S. Guelton, Ronan Keryell, Vincent Lanore, F.-X. Pasquier, Michel Barreteau, R. Barrere, T. Petrisor, Eric Lenormand, C. Cantini, F. De Stefani
An innovative compilation tool-chain for embedded multi-core architectures Proceedings Article
In: Embedded World Conference, Nuremberg, Germany, 2012.
BibTeX | Tags:
@inproceedings{artemis:toolchain:12,
title = {An innovative compilation tool-chain for embedded multi-core architectures},
author = {Massimo Torquati and Marco Vanneschi and Mehdi Amini and S. Guelton and Ronan Keryell and Vincent Lanore and F.-X. Pasquier and Michel Barreteau and R. Barrere and T. Petrisor and Eric Lenormand and C. Cantini and De Stefani, F.},
year = {2012},
date = {2012-02-01},
booktitle = {Embedded World Conference},
address = {Nuremberg, Germany},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Lorenzo Anardu, Massimo Torquati, Peter Kilpatrick
Parallel patterns + Macro Data Flow for multi-core programming Proceedings Article
In: Proc. of Intl. Euromicro PDP 2012: Parallel Distributed and network-based Processing, pp. 27–36, IEEE, Garching, Germany, 2012.
Abstract | Links | BibTeX | Tags: fastflow
@inproceedings{dataflow:pdp:12,
title = {Parallel patterns + Macro Data Flow for multi-core programming},
author = {Marco Aldinucci and Marco Danelutto and Lorenzo Anardu and Massimo Torquati and Peter Kilpatrick},
url = {http://calvados.di.unipi.it/storage/paper_files/2012_mdf_PDP.pdf},
doi = {10.1109/PDP.2012.44},
year = {2012},
date = {2012-02-01},
booktitle = {Proc. of Intl. Euromicro PDP 2012: Parallel Distributed and network-based Processing},
pages = {27--36},
publisher = {IEEE},
address = {Garching, Germany},
abstract = {Data flow techniques have been around since the early '70s when they were used in compilers for sequential languages. Shortly after their introduction they were also considered as a possible model for parallel computing, although the impact here was limited. Recently, however, data flow has been identified as a candidate for efficient implementation of various programming models on multi-core architectures. In most cases, however, the burden of determining data flow ``macro'' instructions is left to the programmer, while the compiler/run time system manages only the efficient scheduling of these instructions. We discuss a structured parallel programming approach supporting automatic compilation of programs to macro data flow and we show experimental results demonstrating the feasibility of the approach and the efficiency of the resulting ``object'' code on different classes of state-of-the-art multi-core architectures. The experimental results use different base mechanisms to implement the macro data flow run time support, from plain pthreads with condition variables to more modern and effective lock- and fence-free parallel frameworks. Experimental results comparing efficiency of the proposed approach with those achieved using other, more classical, parallel frameworks are also presented.},
keywords = {fastflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Mario Coppo, Ferruccio Damiani, Maurizio Drocco, Elena Grassi, Eva Sciacca, Salvatore Spinella, Angelo Troina
Simulation techniques for the calculus of wrapped compartments Journal Article
In: Theoretical Computer Science, vol. 431, pp. 75–95, 2012.
Abstract | Links | BibTeX | Tags: semantics
@article{DBLP:journals/tcs/CoppoDDGSST12,
title = {Simulation techniques for the calculus of wrapped compartments},
author = {Mario Coppo and Ferruccio Damiani and Maurizio Drocco and Elena Grassi and Eva Sciacca and Salvatore Spinella and Angelo Troina},
doi = {10.1016/j.tcs.2011.12.063},
year = {2012},
date = {2012-01-01},
journal = {Theoretical Computer Science},
volume = {431},
pages = {75--95},
abstract = {The modelling and analysis of biological systems has deep roots in Mathematics, specifically in the field of Ordinary Differential Equations (ODEs). Alternative approaches based on formal calculi, often derived from process algebras or term rewriting systems, provide a quite complementary way to analyse the behaviour of biological systems. These calculi allow to cope in a natural way with notions like compartments and membranes, which are not easy (sometimes impossible) to handle with purely numerical approaches, and are often based on stochastic simulation methods. Recently, it has also become evident that stochastic effects in regulatory networks play a crucial role in the analysis of such systems. Actually, in many situations it is necessary to use stochastic models. For example when the system to be described is based on the interaction of few molecules, when we are at the presence of a chemical instability, or when we want to simulate the functioning of a pool of entities whose compartmentalised structure evolves dynamically. In contrast, stable metabolic networks, involving a large number of reagents, for which the computational cost of a stochastic simulation becomes an insurmountable obstacle, are efficiently modelled with ODEs. In this paper we define a hybrid simulation method, combining the stochastic approach with ODEs, for systems described in the Calculus of Wrapped Compartments (CWC), a calculus on which we can express the compartmentalisation of a biological system whose evolution is defined by a set of rewrite rules.},
keywords = {semantics},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Mario Coppo, Ferruccio Damiani, Maurizio Drocco, Eva Sciacca, Salvatore Spinella, Massimo Torquati, Angelo Troina
On Parallelizing On-Line Statistics for Stochastic Biological Simulations Proceedings Article
In: Alexander, Michael, D'Ambra, Pasqua, Belloum, Adam, Bosilca, George, Cannataro, Mario, Danelutto, Marco, Di Martino, Beniamino, Gerndt, Michael, Jeannot, Emmanuel, Namyst, Raymond, Roman, Jean, Scott, Stephen L., Träff, Jesper Larsson, Vallée, Geoffroy, Weidendorfer, Josef (Ed.): Proc. of Euro-Par Workshops: 2nd Workshop on High Performance Bioinformatics and Biomedicine (HiBB), pp. 3–12, Springer, Bordeaux, France, 2012.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow
@inproceedings{cwcsim:onlinestats:ff:hibb:11,
title = {On Parallelizing On-Line Statistics for Stochastic Biological Simulations},
author = {Marco Aldinucci and Mario Coppo and Ferruccio Damiani and Maurizio Drocco and Eva Sciacca and Salvatore Spinella and Massimo Torquati and Angelo Troina},
editor = {Michael Alexander and Pasqua D'Ambra and Adam Belloum and George Bosilca and Mario Cannataro and Marco Danelutto and Di Martino, Beniamino and Michael Gerndt and Emmanuel Jeannot and Raymond Namyst and Jean Roman and Stephen L. Scott and Jesper Larsson Träff and Geoffroy Vallée and Josef Weidendorfer},
url = {http://calvados.di.unipi.it/storage/paper_files/2012_onlinestat_HiBB2011.pdf},
doi = {10.1007/978-3-642-29740-3_2},
year = {2012},
date = {2012-01-01},
booktitle = {Proc. of Euro-Par Workshops: 2nd Workshop on High Performance Bioinformatics and Biomedicine (HiBB)},
volume = {7156},
pages = {3--12},
publisher = {Springer},
address = {Bordeaux, France},
series = {LNCS},
abstract = {This work concerns a general technique to enrich parallel version of stochastic simulators for biological systems with tools for on-line statistical analysis of the results. In particular, within the FastFlow parallel programming framework, we describe the methodology and the implementation of a parallel Monte Carlo simulation infrastructure extended with user-defined on-line data filtering and mining functions. The simulator and the on-line analysis were validated on large multi-core platforms and representative proof-of-concept biological systems.},
keywords = {bioinformatics, fastflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Fabio Tordini, Marco Aldinucci, Massimo Torquati
High-level lock-less programming for multicore Proceedings Article
In: Advanced Computer Architecture and Compilation for High-Performance and Embedded Systems (ACACES) – Poster Abstracts, HiPEAC, Fiuggi, Italy, 2012, ISBN: 9789038219875.
Abstract | Links | BibTeX | Tags: fastflow
@inproceedings{ff:acaces:12,
  author    = {Fabio Tordini and Marco Aldinucci and Massimo Torquati},
  title     = {High-level lock-less programming for multicore},
  booktitle = {Advanced Computer Architecture and Compilation for High-Performance and Embedded Systems (ACACES) – Poster Abstracts},
  publisher = {HiPEAC},
  address   = {Fiuggi, Italy},
  year      = {2012},
  date      = {2012-01-01},
  isbn      = {9789038219875},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2012_ACACES_ex-abstract.pdf},
  abstract  = {Modern computers are built upon multi-core architectures. Achieving peak performance on these architectures is hard and may require a substantial programming effort. The synchronisation of many processes racing to access a common resource (the shared memory) has been a fundamental problem on parallel computing for years, and many solutions have been proposed to address this issue. Non-blocking synchronisation and transactional primitives have been envisioned as a way to reduce memory wall problem. Despite sometimes effective (and exhibiting a great momentum in the research community), they are only one facet of the problem, as their exploitation still requires non-trivial programming skills. With non-blocking philosophy in mind, we propose high-level programming patterns that will relieve the programmer from worrying about low-level details such as synchronisation of racing processes as well as those fine tunings needed to improve the overall performance, like proper (distributed) dynamic memory allocation and effective exploitation of the memory hierarchy.},
  keywords  = {fastflow},
  pubstate  = {published},
  tppubtype = {inproceedings},
}
Thomas Weigold, Marco Aldinucci, Marco Danelutto, Vladimir Getov
Process-Driven Biometric Identification by means of Autonomic Grid Components Journal Article
In: Int. J. of Autonomous and Adaptive Communications Systems, vol. 5, no. 3, pp. 274–291, 2012, ISSN: 1754-8632.
Abstract | Links | BibTeX | Tags: grid
@article{ibm:ijaacs:12,
title = {Process-Driven Biometric Identification by means of Autonomic Grid Components},
author = {Thomas Weigold and Marco Aldinucci and Marco Danelutto and Vladimir Getov},
url = {http://calvados.di.unipi.it/storage/paper_files/2012_JAACS_Weigold.pdf},
doi = {10.1504/IJAACS.2012.047659},
issn = {1754-8632},
year = {2012},
date = {2012-01-01},
journal = {Int. J. of Autonomous and Adaptive Communications Systems},
volume = {5},
number = {3},
pages = {274--291},
publisher = {Inderscience Enterprises Ltd.},
abstract = {Today's business applications are increasingly process driven, meaning that the main application logic is executed by a dedicate process engine. In addition, component-oriented software development has been attracting attention for building complex distributed applications. In this paper we present the experiences gained from building a process-driven biometric identification application that makes use of Grid infrastructures via the Grid Component Model (GCM). GCM, besides guaranteeing access to Grid resources, supports autonomic management of notable parallel composite components. This feature is exploited within our biometric identification application to ensure real time identification of fingerprints. Therefore, we briefly introduce the GCM framework and the process engine used, and we describe the implementation of the application by means of autonomic GCM components. Finally, we summarize the results, experiences, and lessons learned focusing on the integration of autonomic GCM components and the process-driven approach.},
keywords = {grid},
pubstate = {published},
tppubtype = {article}
}
Filippo Spiga, Ivan Girotto
phiGEMM: A CPU-GPU Library for Porting Quantum ESPRESSO on Hybrid Systems Proceedings Article
In: Proceedings of the 20th Euromicro International Conference on Parallel, Distributed and Network-Based Processing, PDP 2012, Munich, Germany, February 15-17, 2012, pp. 368–375, 2012.
@inproceedings{DBLP:conf/pdp/SpigaG12,
title = {phiGEMM: A CPU-GPU Library for Porting Quantum ESPRESSO on Hybrid Systems},
author = {Filippo Spiga and Ivan Girotto},
url = {https://doi.org/10.1109/PDP.2012.72},
doi = {10.1109/PDP.2012.72},
year = {2012},
date = {2012-01-01},
booktitle = {Proceedings of the 20th Euromicro International Conference on Parallel, Distributed and Network-Based Processing, PDP 2012, Munich, Germany, February 15-17, 2012},
pages = {368--375},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
2011
C Grandi, B Bockelman, D Bonacorsi, I Fisk, Isidro González Caballero, Fabio Farina, M Hernández, Sanjay Padhi, Sabyasachi Sarkar, Andrea Sciabà, I Sfiligoi, F Spiga, M Úbeda García, D C Van Der Ster, Marian Zvada
CMS Distributed Computing Integration in the LHC sustained operations era Journal Article
In: Journal of Physics: Conference Series, vol. 331, pp. 062032, 2011.
@article{11:cms,
title = {CMS Distributed Computing Integration in the LHC sustained operations era},
author = {C Grandi and B Bockelman and D Bonacorsi and I Fisk and Isidro González Caballero and Fabio Farina and M Hernández and Sanjay Padhi and Sabyasachi Sarkar and Andrea Sciabà and I Sfiligoi and F Spiga and M Úbeda García and D C Van Der Ster and Marian Zvada},
year = {2011},
date = {2011-12-01},
journal = {Journal of Physics: Conference Series},
volume = {331},
pages = {062032},
keywords = {parallel},
pubstate = {published},
tppubtype = {article}
}
Cristina Calcagno, Mario Coppo, Ferruccio Damiani, Maurizio Drocco, Eva Sciacca, Salvatore Spinella, Angelo Troina
Modelling Spatial Interactions in the Arbuscular Mycorrhizal Symbiosis using the Calculus of Wrapped Compartments Proceedings Article
In: Petre, Ion, Vink, Erik P. (Ed.): Proc. of 3rd Intl. Workshop on Computational Models for Cell Processes (CompMod), pp. 3–18, Aachen, Germany, 2011.
@inproceedings{DBLP:journals/corr/abs-1109-1363,
title = {Modelling Spatial Interactions in the Arbuscular Mycorrhizal Symbiosis using the Calculus of Wrapped Compartments},
author = {Cristina Calcagno and Mario Coppo and Ferruccio Damiani and Maurizio Drocco and Eva Sciacca and Salvatore Spinella and Angelo Troina},
editor = {Ion Petre and Erik P. Vink},
year = {2011},
date = {2011-09-01},
booktitle = {Proc. of 3rd Intl. Workshop on Computational Models for Cell Processes (CompMod)},
volume = {67},
pages = {3--18},
address = {Aachen, Germany},
series = {EPTCS},
abstract = {Arbuscular mycorrhiza (AM) is the most wide-spread plant-fungus symbiosis on earth. Investigating this kind of symbiosis is considered one of the most promising ways to develop methods to nurture plants in more natural manners, avoiding the complex chemical productions used nowadays to produce artificial fertilizers. In previous work we used the Calculus of Wrapped Compartments (CWC) to investigate different phases of the AM symbiosis. In this paper, we continue this line of research by modelling the colonisation of the plant root cells by the fungal hyphae spreading in the soil. This study requires the description of some spatial interaction. Although CWC has no explicit feature modelling a spatial geometry, the compartment labelling feature can be effectively exploited to define a discrete surface topology outlining the relevant sectors which determine the spatial properties of the system under consideration. Different situations and interesting spatial properties can be modelled and analysed in such a lightweight framework (which has not an explicit notion of geometry with coordinates and spatial metrics), thus exploiting the existing CWC simulation tool.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick, Vamir Xhagjika
LIBERO: a framework for autonomic management of multiple non-functional concerns Proceedings Article
In: Guarracino, M. R., Vivien, F., Träff, J. L., Cannataro, M., Danelutto, M., Hast, A., Perla, F., Knüpfer, A., Di Martino, B., Alexander, M. (Ed.): Euro-Par 2010 Workshops, Proc. of the CoreGrid Workshop on Grids, Clouds and P2P Computing, pp. 237–245, Springer, Ischia, Italy, 2011.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{libero:cgsymph:10,
title = {LIBERO: a framework for autonomic management of multiple non-functional concerns},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick and Vamir Xhagjika},
editor = {M. R. Guarracino and F. Vivien and J. L. Träff and M. Cannataro and M. Danelutto and A. Hast and F. Perla and A. Knüpfer and Di Martino, B. and M. Alexander},
url = {http://calvados.di.unipi.it/storage/paper_files/2011_libero_coregridworkshop2010.pdf},
doi = {10.1007/978-3-642-21878-1_30},
year = {2011},
date = {2011-09-01},
booktitle = {Euro-Par 2010 Workshops, Proc. of the CoreGrid Workshop on Grids, Clouds and P2P Computing},
volume = {6586},
pages = {237--245},
publisher = {Springer},
address = {Ischia, Italy},
series = {LNCS},
abstract = {We describe a lightweight prototype framework (LIBERO) designed for experimentation with behavioural skeletons-components implementing a well-known parallelism exploitation pattern and a rule-based autonomic manager taking care of some non-functional feature related to pattern computation. LIBERO supports multiple autonomic managers within the same behavioural skeleton, each taking care of a different non-functional concern. We introduce LIBERO – built on plain Java and JBoss – and discuss how multiple managers may be coordinated to achieve a common goal using a two-phase coordination protocol developed in earlier work. We present experimental results that demonstrate how the prototype may be used to investigate autonomic management of multiple, independent concerns.},
keywords = {grid},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Lorenzo Anardu, Marco Danelutto, Peter Kilpatrick, Massimo Torquati
Targeting multi cores by structured programming and data flow Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-11-13, 2011.
@techreport{TR-11-13,
  author      = {Marco Aldinucci and Lorenzo Anardu and Marco Danelutto and Peter Kilpatrick and Massimo Torquati},
  title       = {Targeting multi cores by structured programming and data flow},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number      = {TR-11-13},
  year        = {2011},
  date        = {2011-09-01},
  url         = {http://compass2.di.unipi.it/TR/Files/TR-11-13.pdf.gz},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick, Massimiliano Meneghin, Massimo Torquati
Accelerating code on multi-cores with FastFlow Proceedings Article
In: Jeannot, E., Namyst, R., Roman, J. (Ed.): Proc. of 17th Intl. Euro-Par 2011 Parallel Processing, pp. 170–181, Springer, Bordeaux, France, 2011.
Abstract | Links | BibTeX | Tags: fastflow
@inproceedings{ff:acc:europar:11,
title = {Accelerating code on multi-cores with FastFlow},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick and Massimiliano Meneghin and Massimo Torquati},
editor = {E. Jeannot and R. Namyst and J. Roman},
url = {http://calvados.di.unipi.it/storage/paper_files/2011_fastflow_acc_europar.pdf},
doi = {10.1007/978-3-642-23397-5_17},
year = {2011},
date = {2011-08-01},
booktitle = {Proc. of 17th Intl. Euro-Par 2011 Parallel Processing},
volume = {6853},
pages = {170--181},
publisher = {Springer},
address = {Bordeaux, France},
series = {LNCS},
abstract = {FastFlow is a programming framework specifically targeting cache-coherent shared-memory multicores. It is implemented as a stack of C++ template libraries built on top of lock-free (and memory fence free) synchronization mechanisms. Its philosophy is to combine programmability with performance. In this paper a new FastFlow programming methodology aimed at supporting parallelization of existing sequential code via offloading onto a dynamically created software accelerator is presented. The new methodology has been validated using a set of simple micro-benchmarks and some real applications.},
keywords = {fastflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Andrea Bracciali, Pietro Liò, Anil Sorathiya, Massimo Torquati
StochKit-FF: Efficient Systems Biology on Multicore Architectures Proceedings Article
In: Guarracino, M. R., Vivien, F., Träff, J. L., Cannataro, M., Danelutto, M., Hast, A., Perla, F., Knüpfer, A., Di Martino, B., Alexander, M. (Ed.): Euro-Par 2010 Workshops, Proc. of the 1st Workshop on High Performance Bioinformatics and Biomedicine (HiBB), pp. 167–175, Springer, Ischia, Italy, 2011.
Abstract | Links | BibTeX | Tags: bioinformatics
@inproceedings{stochkit-ff:hibb:10,
title = {StochKit-FF: Efficient Systems Biology on Multicore Architectures},
author = {Marco Aldinucci and Andrea Bracciali and Pietro Liò and Anil Sorathiya and Massimo Torquati},
editor = {M. R. Guarracino and F. Vivien and J. L. Träff and M. Cannataro and M. Danelutto and A. Hast and F. Perla and A. Knüpfer and Di Martino, B. and M. Alexander},
url = {http://calvados.di.unipi.it/storage/paper_files/2010_stochkit-ff_hibb.pdf},
doi = {10.1007/978-3-642-21878-1_21},
year = {2011},
date = {2011-08-01},
booktitle = {Euro-Par 2010 Workshops, Proc. of the 1st Workshop on High Performance Bioinformatics and Biomedicine (HiBB)},
volume = {6586},
pages = {167--175},
publisher = {Springer},
address = {Ischia, Italy},
series = {LNCS},
abstract = {The stochastic modelling of biological systems is an informative, and in some cases, very adequate technique, which may however result in being more expensive than other modelling approaches, such as differential equations. We present StochKit-FF, a parallel version of StochKit, a reference toolkit for stochastic simulations. StochKit-FF is based on the FastFlow programming toolkit for multicores and exploits the novel concept of selective memory. We experiment StochKit-FF on a model of HIV infection dynamics, with the aim of extracting information from efficiently run experiments, here in terms of average and variance and, on a longer term, of more structured data.},
keywords = {bioinformatics},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Maurizio Drocco, Daniela Giordano, Concetto Spampinato, Massimo Torquati
A Parallel Edge Preserving Algorithm for Salt and Pepper Image Denoising Technical Report
Università degli Studi di Torino, Dip. di Informatica, Italy no. 138/2011, 2011.
Links | BibTeX | Tags: fastflow
@techreport{ff:denoiser:tr138-2011,
  author      = {Marco Aldinucci and Maurizio Drocco and Daniela Giordano and Concetto Spampinato and Massimo Torquati},
  title       = {A Parallel Edge Preserving Algorithm for Salt and Pepper Image Denoising},
  institution = {Università degli Studi di Torino, Dip. di Informatica, Italy},
  number      = {138/2011},
  year        = {2011},
  date        = {2011-05-01},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2012_2phasedenoiser_ff_ipta.pdf},
  keywords    = {fastflow},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Marco Aldinucci, Salvatore Ruggieri, Massimo Torquati
Porting Decision Tree Building and Pruning Algorithms to Multicore using FastFlow Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-11-06, 2011.
Links | BibTeX | Tags: fastflow
@techreport{TR-11-06,
  author      = {Marco Aldinucci and Salvatore Ruggieri and Massimo Torquati},
  title       = {Porting Decision Tree Building and Pruning Algorithms to Multicore using FastFlow},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number      = {TR-11-06},
  year        = {2011},
  date        = {2011-03-01},
  url         = {http://compass2.di.unipi.it/TR/Files/TR-11-06.pdf.gz},
  keywords    = {fastflow},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Marco Aldinucci, Mario Coppo, Ferruccio Damiani, Maurizio Drocco, Massimo Torquati, Angelo Troina
On Designing Multicore-Aware Simulators for Biological Systems Proceedings Article
In: Cotronis, Yiannis, Danelutto, Marco, Papadopoulos, George Angelos (Ed.): Proc. of 19th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP), pp. 318–325, IEEE, Ayia Napa, Cyprus, 2011.
Abstract | Links | BibTeX | Tags: fastflow
@inproceedings{ff:cwc:pdp:11,
title = {On Designing Multicore-Aware Simulators for Biological Systems},
author = {Marco Aldinucci and Mario Coppo and Ferruccio Damiani and Maurizio Drocco and Massimo Torquati and Angelo Troina},
editor = {Yiannis Cotronis and Marco Danelutto and George Angelos Papadopoulos},
url = {http://calvados.di.unipi.it/storage/paper_files/2011_ff_cwc_sim_PDP.pdf},
doi = {10.1109/PDP.2011.81},
year = {2011},
date = {2011-02-01},
booktitle = {Proc. of 19th Euromicro Intl. Conference on Parallel Distributed and network-based Processing (PDP)},
pages = {318--325},
publisher = {IEEE},
address = {Ayia Napa, Cyprus},
abstract = {The stochastic simulation of biological systems is an increasingly popular technique in bioinformatics. It often is an enlightening technique, which may however result in being computational expensive. We discuss the main opportunities to speed it up on multi-core platforms, which pose new challenges for parallelisation techniques. These opportunities are developed in two general families of solutions involving both the single simulation and a bulk of independent simulations (either replicas of derived from parameter sweep). Proposed solutions are tested on the parallelisation of the CWC simulator (Calculus of Wrapped Compartments) that is carried out according to proposed solutions by way of the FastFlow programming framework making possible fast development and efficient execution on multi-cores.},
keywords = {fastflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Mario Coppo, Ferruccio Damiani, Maurizio Drocco, Elena Grassi, Mike Guether, Angelo Troina
Modelling Ammonium Transporters in Arbuscular Mycorrhiza Symbiosis Journal Article
In: Transactions on Computational Systems Biology, vol. 6575, no. 13, pp. 85–109, 2011.
Abstract | Links | BibTeX | Tags: semantics
@article{DBLP:journals/tcsb/Coppo/DDGGT11,
title = {Modelling Ammonium Transporters in Arbuscular Mycorrhiza Symbiosis},
author = {Mario Coppo and Ferruccio Damiani and Maurizio Drocco and Elena Grassi and Mike Guether and Angelo Troina},
doi = {10.1007/978-3-642-19748-2_5},
year = {2011},
date = {2011-01-01},
journal = {Transactions on Computational Systems Biology},
volume = {6575},
number = {13},
pages = {85--109},
abstract = {The Stochastic Calculus of Wrapped Compartments (SCWC) is a recently proposed variant of the Stochastic Calculus of Looping Sequences (SCLS), a language for the representation and simulation of biological systems. In this work we apply SCWC to model a newly discovered ammonium transporter. This transporter is believed to play a fundamental role for plant mineral acquisition, which takes place in the arbuscular mycorrhiza, the most wide-spread plant-fungus symbiosis on earth. Investigating this kind of symbiosis is considered one of the most promising ways to develop methods to nurture plants in more natural manners, avoiding the complex chemical productions used nowadays to produce artificial fertilizers. In our experiments the passage of NH3/NH4+ from the fungus to the plant has been dissected in known and hypothetical mechanisms; with the model so far we have been able to simulate the behavior of the system under different conditions. Our simulations confirmed some of the latest experimental results about the LjAMT2;2 transporter. Moreover, by comparing the behaviour of LjAMT2;2 with the behaviour of another ammonium transporter which exists in plants, viz. LjAMT1;1, our simulations support an hypothesis about why LjAMT2;2 is so selectively expressed in arbusculated cells.},
keywords = {semantics},
pubstate = {published},
tppubtype = {article}
}
2010
Marco Aldinucci, Mario Coppo, Ferruccio Damiani, Maurizio Drocco, Massimo Torquati, Angelo Troina
On Designing Multicore-Aware Simulators for Biological Systems Technical Report
Università degli Studi di Torino, Dipartimento di Informatica, Italy no. 131/2010, 2010.
@techreport{ff:cwc:pdp:11-tr,
  author      = {Marco Aldinucci and Mario Coppo and Ferruccio Damiani and Maurizio Drocco and Massimo Torquati and Angelo Troina},
  title       = {On Designing Multicore-Aware Simulators for Biological Systems},
  institution = {Università degli Studi di Torino, Dipartimento di Informatica, Italy},
  number      = {131/2010},
  year        = {2010},
  date        = {2010-10-01},
  keywords    = {fastflow},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Marco Aldinucci, Salvatore Ruggieri, Massimo Torquati
Porting Decision Tree Algorithms to Multicore using FastFlow Proceedings Article
In: Balcázar, José L., Bonchi, Francesco, Gionis, Aristides, Sebag, Michèle (Ed.): Proc. of European Conference in Machine Learning and Knowledge Discovery in Databases (ECML PKDD), pp. 7–23, Springer, Barcelona, Spain, 2010.
Abstract | Links | BibTeX | Tags: fastflow
@inproceedings{fastflow_c45:emclpkdd,
title = {Porting Decision Tree Algorithms to Multicore using FastFlow},
author = {Marco Aldinucci and Salvatore Ruggieri and Massimo Torquati},
editor = {José L. Balcázar and Francesco Bonchi and Aristides Gionis and Michèle Sebag},
url = {http://calvados.di.unipi.it/storage/paper_files/2010_c45FF_ECMLPKDD.pdf},
doi = {10.1007/978-3-642-15880-3_7},
year = {2010},
date = {2010-09-01},
booktitle = {Proc. of European Conference in Machine Learning and Knowledge Discovery in Databases (ECML PKDD)},
volume = {6321},
pages = {7--23},
publisher = {Springer},
address = {Barcelona, Spain},
series = {LNCS},
abstract = {The whole computer hardware industry embraced multicores. For these machines, the extreme optimisation of sequential algorithms is no longer sufficient to squeeze the real machine power, which can be only exploited via thread-level parallelism. Decision tree algorithms exhibit natural concurrency that makes them suitable to be parallelised. This paper presents an approach for easy-yet-efficient porting of an implementation of the C4.5 algorithm on multicores. The parallel porting requires minimal changes to the original sequential code, and it is able to exploit up to 7X speedup on an Intel dual-quad core machine.},
keywords = {fastflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Mario Coppo, Ferruccio Damiani, Maurizio Drocco, Elena Grassi, Eva Sciacca, Salvatore Spinella, Angelo Troina
Hybrid Calculus of Wrapped Compartments Proceedings Article
In: Ciobanu, Gabriel, Koutny, Maciej (Ed.): Proc. of 4th Workshop on Membrane Computing and Biologically Inspired Process Calculi (MeCBIC), pp. 102–120, Jena, Germany, 2010.
@inproceedings{DBLP:journals/corr/abs-1011-0494,
title = {Hybrid Calculus of Wrapped Compartments},
author = {Mario Coppo and Ferruccio Damiani and Maurizio Drocco and Elena Grassi and Eva Sciacca and Salvatore Spinella and Angelo Troina},
editor = {Gabriel Ciobanu and Maciej Koutny},
year = {2010},
date = {2010-08-01},
booktitle = {Proc. of 4th Workshop on Membrane Computing and Biologically Inspired Process Calculi (MeCBIC)},
volume = {40},
pages = {102--120},
address = {Jena, Germany},
series = {EPTCS},
abstract = {The modelling and analysis of biological systems has deep roots in Mathematics, specifically in the field of ordinary differential equations (ODEs). Alternative approaches based on formal calculi, often derived from process algebras or term rewriting systems, provide a quite complementary way to analyze the behaviour of biological systems. These calculi allow to cope in a natural way with notions like compartments and membranes, which are not easy (sometimes impossible) to handle with purely numerical approaches, and are often based on stochastic simulation methods. Recently, it has also become evident that stochastic effects in regulatory networks play a crucial role in the analysis of such systems. Actually, in many situations it is necessary to use stochastic models. For example when the system to be described is based on the interaction of few molecules, when we are at the presence of a chemical instability, or when we want to simulate the functioning of a pool of entities whose compartmentalised structure evolves dynamically. In contrast, stable metabolic networks, involving a large number of reagents, for which the computational cost of a stochastic simulation becomes an insurmountable obstacle, are efficiently modelled with ODEs. In this paper we define a hybrid simulation method, combining the stochastic approach with ODEs, for systems described in CWC, a calculus on which we can express the compartmentalisation of a biological system whose evolution is defined by a set of rewrite rules.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Autonomic Management of Multiple Non-Functional Concerns in Behavioural Skeletons Book Section
In: Desprez, Frédéric, Getov, Vladimir, Priol, Thierry, Yahyapour, Ramin (Ed.): Grids, P2P and Services Computing, pp. 89–103, Springer, 2010.
Abstract | Links | BibTeX | Tags: grid
@incollection{multiple-nf-concern:cgsymph:09:book,
title = {Autonomic Management of Multiple Non-Functional Concerns in Behavioural Skeletons},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
editor = {Frédéric Desprez and Vladimir Getov and Thierry Priol and Ramin Yahyapour},
url = {http://calvados.di.unipi.it/storage/paper_files/2009_CGSymph_Autonomic_BeSke.pdf},
doi = {10.1007/978-1-4419-6794-7_8},
year = {2010},
date = {2010-08-01},
booktitle = {Grids, P2P and Services Computing},
pages = {89--103},
publisher = {Springer},
series = {CoreGRID},
abstract = {We introduce and address the problem of concurrent autonomic management of different non-functional concerns in parallel applications build as a hierarchical composition of behavioural skeletons. We first define the problems arising when multiple concerns are dealt with by independent managers, then we propose a methodology supporting coordinated management, and finally we discuss how autonomic management of multiple concerns may be implemented in a typical use case. Being based on the behavioural skeleton concept proposed in the CoreGRID GCM, it is anticipated that the methodology will be readily integrated into the current reference implementation of GCM based on Java ProActive and running on top of major grid middleware systems.},
keywords = {grid},
pubstate = {published},
tppubtype = {incollection}
}
Marco Aldinucci, Andrea Bracciali, Pietro Liò, Anil Sorathiya, Massimo Torquati
StochKit-FF: Efficient Systems Biology on Multicore Architectures Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-10-12, 2010.
Abstract | Links | BibTeX | Tags: fastflow
@techreport{stochkit-ff:tr-10-12,
  author      = {Marco Aldinucci and Andrea Bracciali and Pietro Liò and Anil Sorathiya and Massimo Torquati},
  title       = {StochKit-FF: Efficient Systems Biology on Multicore Architectures},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number      = {TR-10-12},
  year        = {2010},
  date        = {2010-07-01},
  doi         = {10.1007/978-3-642-21878-1_21},
  url         = {http://calvados.di.unipi.it/storage/paper_files/TR-10-12.pdf},
  abstract    = {The stochastic modelling of biological systems is an informative, and in some cases, very adequate technique, which may however result in being more expensive than other modelling approaches, such as differential equations. We present StochKit-FF, a parallel version of StochKit, a reference toolkit for stochastic simulations. StochKit-FF is based on the FastFlow programming toolkit for multicores and exploits the novel concept of selective memory. We experiment StochKit-FF on a model of HIV infection dynamics, with the aim of extracting information from efficiently run experiments, here in terms of average and variance and, on a longer term, of more structured data.},
  keywords    = {fastflow},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Marco Aldinucci, Andrea Bracciali, Pietro Liò
Formal Synthetic Immunology Journal Article
In: ERCIM News, vol. 82, pp. 40–41, 2010, ISSN: 0926-4981.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow
@article{stochkitff:ercimnews:10,
title = {Formal Synthetic Immunology},
author = {Marco Aldinucci and Andrea Bracciali and Pietro Liò},
url = {http://ercim-news.ercim.eu/images/stories/EN82/EN82-web.pdf},
issn = {0926-4981},
year = {2010},
date = {2010-07-01},
journal = {ERCIM News},
volume = {82},
pages = {40--41},
abstract = {The human immune system fights pathogens using an articulated set of strategies whose function is to maintain in health the organism. A large effort to formally model such a complex system using a computational approach is currently underway, with the goal of developing a discipline for engineering "synthetic" immune responses. This requires the integration of a range of analysis techniques developed for formally reasoning about the behaviour of complex dynamical systems. Furthermore, a novel class of software tools has to be developed, capable of efficiently analysing these systems on widely accessible computing platforms, such as commodity multi-core architectures.},
keywords = {bioinformatics, fastflow},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Salvatore Ruggieri, Massimo Torquati
Porting Decision Tree Algorithms to Multicore using FastFlow Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-10-11, 2010.
Abstract | Links | BibTeX | Tags: fastflow
@techreport{fastflow_c45:tr-10-11,
  author      = {Marco Aldinucci and Salvatore Ruggieri and Massimo Torquati},
  title       = {Porting Decision Tree Algorithms to Multicore using FastFlow},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number      = {TR-10-11},
  year        = {2010},
  date        = {2010-05-01},
  url         = {http://calvados.di.unipi.it/storage/paper_files/TR-10-11.pdf},
  abstract    = {The whole computer hardware industry embraced multicores. For these machines, the extreme optimisation of sequential algorithms is no longer sufficient to squeeze the real machine power, which can be only exploited via thread-level parallelism. Decision tree algorithms exhibit natural concurrency that makes them suitable to be parallelised. This paper presents an approach for easy-yet-efficient porting of an implementation of the C4.5 algorithm on multicores. The parallel porting requires minimal changes to the original sequential code, and it is able to exploit up to 7X speedup on an Intel dual-quad core machine.},
  keywords    = {fastflow},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Mario Coppo, Ferruccio Damiani, Maurizio Drocco, Elena Grassi, Angelo Troina
Stochastic Calculus of Wrapped Compartments Proceedings Article
In: Di Pierro, Alessandra, Norman, Gethin (Ed.): Proc. of 8th Workshop on Quantitative Aspects of Programming Languages (QAPL), pp. 82–98, Paphos, Cyprus, 2010.
@inproceedings{DBLP:journals/corr/abs-1006-5099,
title = {Stochastic Calculus of Wrapped Compartments},
author = {Mario Coppo and Ferruccio Damiani and Maurizio Drocco and Elena Grassi and Angelo Troina},
editor = {Di Pierro, Alessandra and Gethin Norman},
year = {2010},
date = {2010-03-01},
booktitle = {Proc. of 8th Workshop on Quantitative Aspects of Programming Languages (QAPL)},
volume = {28},
pages = {82--98},
address = {Paphos, Cyprus},
series = {EPTCS},
abstract = {The Calculus of Wrapped Compartments (CWC) is a variant of the Calculus of Looping Sequences (CLS). While keeping the same expressiveness, CWC strongly simplifies the development of automatic tools for the analysis of biological systems. The main simplification consists in the removal of the sequencing operator, thus lightening the formal treatment of the patterns to be matched in a term (whose complexity in CLS is strongly affected by the variables matching in the sequences). We define a stochastic semantics for this new calculus. As an application we model the interaction between macrophages and apoptotic neutrophils and a mechanism of gene regulation in E.Coli.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Massimiliano Meneghin, Massimo Torquati
Efficient Smith-Waterman on multi-core with FastFlow Proceedings Article
In: Danelutto, Marco, Gross, Tom, Bourgeois, Julien (Ed.): Proc. of Intl. Euromicro PDP 2010: Parallel Distributed and network-based Processing, pp. 195–199, IEEE, Pisa, Italy, 2010.
Abstract | Links | BibTeX | Tags: fastflow
@inproceedings{fastflow:pdp:10,
title = {Efficient Smith-Waterman on multi-core with FastFlow},
author = {Marco Aldinucci and Massimiliano Meneghin and Massimo Torquati},
editor = {Marco Danelutto and Tom Gross and Julien Bourgeois},
url = {http://calvados.di.unipi.it/storage/paper_files/2010_fastflow_SW_PDP.pdf},
doi = {10.1109/PDP.2010.93},
year = {2010},
date = {2010-02-01},
booktitle = {Proc. of Intl. Euromicro PDP 2010: Parallel Distributed and network-based Processing},
pages = {195--199},
publisher = {IEEE},
address = {Pisa, Italy},
abstract = {Shared memory multiprocessors have returned to popularity thanks to rapid spreading of commodity multi-core architectures. However, little attention has been paid to supporting effective streaming applications on these architectures. In this paper we describe FastFlow, a low-level programming framework based on lock-free queues explicitly designed to support high-level languages for streaming applications. We compare FastFlow with state-of-the-art programming frameworks such as Cilk, OpenMP, and Intel TBB. We experimentally demonstrate that FastFlow is always more efficient than them on a given real world application: the speedup of FastFlow over other solutions may be substantial for fine grain tasks, for example +35\% over OpenMP, +226\% over Cilk, +96\% over TBB for the alignment of protein P01111 against UniProt DB using the Smith-Waterman algorithm.},
keywords = {fastflow},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick, Massimiliano Meneghin, Massimo Torquati
Accelerating sequential programs using FastFlow and self-offloading Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-10-03, 2010.
Abstract | BibTeX | Tags: fastflow
@techreport{fastflow_acc:tr-10-03,
title = {Accelerating sequential programs using FastFlow and self-offloading},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick and Massimiliano Meneghin and Massimo Torquati},
year = {2010},
date = {2010-02-01},
number = {TR-10-03},
institution = {Università di Pisa, Dipartimento di Informatica, Italy},
abstract = {Shared memory multiprocessors come back to popularity thanks to rapid spreading of commodity multi-core architectures. As ever, shared memory programs are fairly easy to write and quite hard to optimise; providing multi-core programmers with optimising tools and programming frameworks is a nowadays challenge. Few efforts have been done to support effective streaming applications on these architectures. In this paper we introduce FastFlow, a low-level programming framework based on lock-free queues explicitly designed to support high-level languages for streaming applications. We compare FastFlow with state-of-the-art programming frameworks such as Cilk, OpenMP, and Intel TBB. We experimentally demonstrate that FastFlow is always more efficient than all of them in a set of micro-benchmarks and on a real world application; the speedup edge of FastFlow over other solutions might be bold for fine grain tasks, as an example +35\% on OpenMP, +226\% on Cilk, +96\% on TBB for the alignment of protein P01111 against UniProt DB using Smith-Waterman algorithm.},
keywords = {fastflow},
pubstate = {published},
tppubtype = {techreport}
}
CWC Simulator project Technical Manual
Sourceforge website 2010, (http://sourceforge.net/projects/cwcsimulator/).
BibTeX | Tags:
@manual{cwc:web,
title = {CWC Simulator project},
url = {http://sourceforge.net/projects/cwcsimulator/},
year = {2010},
date = {2010-01-01},
organization = {Sourceforge website},
note = {\url{http://sourceforge.net/projects/cwcsimulator/}},
keywords = {},
pubstate = {published},
tppubtype = {manual}
}
Marco Aldinucci
Efficient Parallel MonteCarlo with FastFlow Book Section
In: HPC-Europa2: Science and Supercomputing in Europe, research highlights 2010, Cineca, 2010.
Abstract | Links | BibTeX | Tags: bioinformatics, fastflow
@incollection{ff:hpc-europa:10,
title = {Efficient Parallel MonteCarlo with FastFlow},
author = {Marco Aldinucci},
url = {http://calvados.di.unipi.it/storage/paper_files/2010-ff_hpceuropa2_092-inform-Aldinucci.pdf},
year = {2010},
date = {2010-01-01},
booktitle = {HPC-Europa2: Science and Supercomputing in Europe, research highlights 2010},
publisher = {Cineca},
abstract = {The stochastic simulation of natural systems is very informative but happens to be computationally expensive. We present StochKit-FF, a parallel version of StochKit, a reference toolkit for stochastic simulations that substantially improves StochKit performances on multi-core platforms.},
keywords = {bioinformatics, fastflow},
pubstate = {published},
tppubtype = {incollection}
}
Thomas Weigold, Marco Aldinucci, Marco Danelutto, Vladimir Getov
Integrating Autonomic Grid Components and Process-Driven Business Applications Proceedings Article
In: Vasilakos, Athanasios V., Beraldi, Roberto, Friedman, Roy, Mamei, Marco (Ed.): Autonomic Computing and Communications Systems Third International ICST Conference, Autonomics 2009, Limassol, Cyprus, September 9-11, 2009, Revised Selected Papers, pp. 98–113, Springer, Limassol, Cyprus, 2010, ISSN: 1867-8211.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{ibm:autonomics:09,
title = {Integrating Autonomic Grid Components and Process-Driven Business Applications},
author = {Thomas Weigold and Marco Aldinucci and Marco Danelutto and Vladimir Getov},
editor = {Athanasios V. Vasilakos and Roberto Beraldi and Roy Friedman and Marco Mamei},
url = {http://calvados.di.unipi.it/storage/paper_files/2010_BS_autonomics09.pdf},
doi = {10.1007/978-3-642-11482-3_7},
issn = {1867-8211},
year = {2010},
date = {2010-01-01},
booktitle = {Autonomic Computing and Communications Systems Third International ICST Conference, Autonomics 2009, Limassol, Cyprus, September 9-11, 2009, Revised Selected Papers},
volume = {23},
pages = {98--113},
publisher = {Springer},
address = {Limassol, Cyprus},
series = {Lecture Notes of the Institute for Computer Sciences, Social-Informatics and Telecommunications Engineering (LNICST)},
abstract = {Today's business applications are increasingly process driven, meaning that the main application logic is executed by a dedicated process engine. In addition, component-oriented software development has been attracting attention for building complex distributed applications. In this paper we present the experiences gained from building a process-driven biometric identification application which makes use of Grid infrastructures via the Grid Component Model (GCM). GCM, besides guaranteeing access to Grid resources, supports autonomic management of notable parallel composite components. This feature is exploited within our biometric identification application to ensure real time identification of fingerprints. Therefore, we briefly introduce the GCM framework and the process engine used, and we describe the implementation of the application using autonomic GCM components. Finally, we summarize the results, experiences, and lessons learned focusing on the integration of autonomic GCM components and the process-driven approach.},
keywords = {grid},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Skeletons for multi/many-core systems Proceedings Article
In: Chapman, Barbara, Desprez, Frédéric, Joubert, Gerhard R., Lichnewsky, Alain, Peters, Frans, Priol, Thierry (Ed.): Parallel Computing: From Multicores and GPU's to Petascale (Proc. of PARCO 2009, Lyon, France), pp. 265–272, IOS press, Lyon, France, 2010.
Abstract | Links | BibTeX | Tags:
@inproceedings{multicoreske:parco:09,
title = {Skeletons for multi/many-core systems},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
editor = {Barbara Chapman and Frédéric Desprez and Gerhard R. Joubert and Alain Lichnewsky and Frans Peters and Thierry Priol},
url = {http://calvados.di.unipi.it/storage/paper_files/2010_muskel_multicore_parco.pdf},
doi = {10.3233/978-1-60750-530-3-265},
year = {2010},
date = {2010-01-01},
booktitle = {Parallel Computing: From Multicores and GPU's to Petascale (Proc. of PARCO 2009, Lyon, France)},
volume = {19},
pages = {265--272},
publisher = {IOS press},
address = {Lyon, France},
series = {Advances in Parallel Computing},
abstract = {We discuss how algorithmic skeletons (and structured parallel programming models in general) can be used to efficiently and seamlessly program multi-core as well as many-core systems. We introduce a new version of the muskel skeleton library that can be used to target multi/many-core systems and we present experimental results that demonstrate the feasibility of the approach. The experimental results presented also give an idea of the computational grains that can be exploited on current, state-of-the-art multi-core systems.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Massimiliano Meneghin, Massimo Torquati, Peter Kilpatrick
Efficient streaming applications on multi-core with FastFlow: The biosequence alignment test-bed Book Chapter
In: vol. 19, pp. 273–280, Elsevier, 2010.
Abstract | Links | BibTeX | Tags: fastflow
@inbook{fastflow:parco:09,
title = {Efficient streaming applications on multi-core with FastFlow: The biosequence alignment test-bed},
author = {Marco Aldinucci and Marco Danelutto and Massimiliano Meneghin and Massimo Torquati and Peter Kilpatrick},
editor = {Barbara Chapman and Frédéric Desprez and Gerhard R. Joubert and Alain Lichnewsky and Frans Peters and Thierry Priol},
url = {https://iris.unito.it/retrieve/handle/2318/67254/690859/2009_fastflow_parco.pdf},
doi = {10.3233/978-1-60750-530-3-273},
year = {2010},
date = {2010-01-01},
booktitle = {Parallel Computing: From Multicores and GPU's to Petascale (Proc. of PARCO 2009, Lyon, France)},
volume = {19},
pages = {273--280},
publisher = {IOS press},
address = {Lyon, France},
series = {Advances in Parallel Computing},
abstract = {Shared-memory multi-core architectures are becoming increasingly popular. While their parallelism and peak performance is ever increasing, their efficiency is often disappointing due to memory fence overheads. In this paper we present FastFlow, a programming methodology based on lock-free queues explicitly designed for programming streaming applications on multi-cores. The potential of FastFlow is evaluated on micro-benchmarks and on the Smith-Waterman sequence alignment application, which exhibits a substantial speedup against the state-of-the-art multi-threaded implementation (SWPS3 x86/SSE2).},
keywords = {fastflow},
pubstate = {published},
tppubtype = {inbook}
}
2009
Marco Aldinucci, Massimo Torquati, Massimiliano Meneghin
FastFlow: Efficient Parallel Streaming Applications on Multi-core Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-09-12, 2009.
Abstract | Links | BibTeX | Tags: fastflow
@techreport{fastflow:tr-09-12,
title = {FastFlow: Efficient Parallel Streaming Applications on Multi-core},
author = {Marco Aldinucci and Massimo Torquati and Massimiliano Meneghin},
url = {http://arxiv.org/abs/0909.1187},
year = {2009},
date = {2009-09-01},
number = {TR-09-12},
institution = {Università di Pisa, Dipartimento di Informatica, Italy},
abstract = {Shared memory multiprocessors come back to popularity thanks to rapid spreading of commodity multi-core architectures. As ever, shared memory programs are fairly easy to write and quite hard to optimise; providing multi-core programmers with optimising tools and programming frameworks is a nowadays challenge. Few efforts have been done to support effective streaming applications on these architectures. In this paper we introduce FastFlow, a low-level programming framework based on lock-free queues explicitly designed to support high-level languages for streaming applications. We compare FastFlow with state-of-the-art programming frameworks such as Cilk, OpenMP, and Intel TBB. We experimentally demonstrate that FastFlow is always more efficient than all of them in a set of micro-benchmarks and on a real world application; the speedup edge of FastFlow over other solutions might be bold for fine grain tasks, as an example +35\% on OpenMP, +226\% on Cilk, +96\% on TBB for the alignment of protein P01111 against UniProt DB using Smith-Waterman algorithm.},
keywords = {fastflow},
pubstate = {published},
tppubtype = {techreport}
}
Marco Aldinucci, Hinde Lilia Bouziane, Marco Danelutto, Christian Pérez
STKM on SCA: a Unified Framework with Components, Workflows and Algorithmic Skeletons Proceedings Article
In: Proc. of 15th Intl. Euro-Par 2009 Parallel Processing, pp. 678–690, Springer, Delft, The Netherlands, 2009.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{stkm:europar:09,
title = {STKM on SCA: a Unified Framework with Components, Workflows and Algorithmic Skeletons},
author = {Marco Aldinucci and Hinde Lilia Bouziane and Marco Danelutto and Christian Pérez},
url = {http://calvados.di.unipi.it/storage/paper_files/2009_STKM_Europar.pdf},
doi = {10.1007/978-3-642-03869-3},
year = {2009},
date = {2009-08-01},
booktitle = {Proc. of 15th Intl. Euro-Par 2009 Parallel Processing},
volume = {5704},
pages = {678--690},
publisher = {Springer},
address = {Delft, The Netherlands},
series = {LNCS},
abstract = {This paper investigates an implementation of STKM, a Spatio-Temporal sKeleton Model. STKM expands the Grid Component Model (GCM) with an innovative programmable approach that allows programmers to compose an application by combining component, workflow and skeleton concepts. The paper deals with a projection of the STKM model on top of SCA and it evaluates its implementation using Tuscany Java SCA. Experimental results show the need and the benefits of the high level of abstraction offered by STKM.},
keywords = {grid},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Autonomic management of multiple non-functional concerns in behavioural skeletons Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-09-10, 2009.
@techreport{nf-concerns:tr-09-10,
  author      = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
  title       = {Autonomic management of multiple non-functional concerns in behavioural skeletons},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number      = {TR-09-10},
  year        = {2009},
  date        = {2009-07-01},
  url         = {http://arxiv.org/abs/0909.1517},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Autonomic management of non-functional concerns in distributed and parallel application programming Proceedings Article
In: Proc. of Intl. Parallel & Distributed Processing Symposium (IPDPS), pp. 1–12, IEEE, Rome, Italy, 2009.
Abstract | Links | BibTeX | Tags:
@inproceedings{beske:ipdps:09,
title = {Autonomic management of non-functional concerns in distributed and parallel application programming},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
url = {http://calvados.di.unipi.it/storage/paper_files/2009_f_nf_IPDPS.pdf},
doi = {10.1109/IPDPS.2009.5161034},
year = {2009},
date = {2009-05-01},
booktitle = {Proc. of Intl. Parallel \& Distributed Processing Symposium (IPDPS)},
pages = {1--12},
publisher = {IEEE},
address = {Rome, Italy},
abstract = {An approach to the management of non-functional concerns in massively parallel and/or distributed architectures that marries parallel programming patterns with autonomic computing is presented. The necessity and suitability of the adoption of autonomic techniques are evidenced. Issues arising in the implementation of autonomic managers taking care of multiple concerns and of coordination among hierarchies of such autonomic managers are discussed. Experimental results are presented that demonstrate the feasibility of the approach.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Co-design of distributed systems using skeletons and autonomic management abstractions Proceedings Article
In: César, E., Alexander, M., Streit, A., Träff, J. L., Cérin, C., Knüpfer, A., Kranzlmüller, D., Jha, S. (Ed.): Euro-Par 2008 Workshops - Parallel Processing, Selected Papers, pp. 403–414, Springer, Las Palmas, Spain, 2009, ISBN: 978-3-642-00954-9.
Abstract | Links | BibTeX | Tags:
@inproceedings{abstraction:europarworkshop:09,
title = {Co-design of distributed systems using skeletons and autonomic management abstractions},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
editor = {E. César and M. Alexander and A. Streit and J. L. Träff and C. Cérin and A. Knüpfer and D. Kranzlmüller and S. Jha},
url = {http://calvados.di.unipi.it/storage/paper_files/2009_abstraction_workshopeuropar.pdf},
doi = {10.1007/978-3-642-00955-6_46},
isbn = {978-3-642-00954-9},
year = {2009},
date = {2009-04-01},
booktitle = {Euro-Par 2008 Workshops - Parallel Processing, Selected Papers},
volume = {5415},
pages = {403--414},
publisher = {Springer},
address = {Las Palmas, Spain},
series = {LNCS},
abstract = {We discuss how common problems arising with multi/many-core distributed architectures can be effectively handled through co-design of parallel/distributed programming abstractions and of autonomic management of non-functional concerns. In particular, we demonstrate how restricted parallel/distributed patterns (or skeletons) may be efficiently managed by rule-based autonomic managers. We discuss the basic principles underlying pattern+manager co-design, current implementations inspired by this approach and some results achieved with a proof-of-concept prototype.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Towards hierarchical management of autonomic components: a case study Proceedings Article
In: El Baz, Didier, Gross, Tom, Spies, Francois (Ed.): Proc. of Intl. Euromicro PDP 2009: Parallel Distributed and network-based Processing, pp. 3–10, IEEE, Weimar, Germany, 2009.
Abstract | Links | BibTeX | Tags:
@inproceedings{beske:pdp:09,
title = {Towards hierarchical management of autonomic components: a case study},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
editor = {El Baz, Didier and Tom Gross and Francois Spies},
url = {http://calvados.di.unipi.it/storage/paper_files/2009_hier_man_PDP.pdf},
doi = {10.1109/PDP.2009.48},
year = {2009},
date = {2009-02-01},
booktitle = {Proc. of Intl. Euromicro PDP 2009: Parallel Distributed and network-based Processing},
pages = {3--10},
publisher = {IEEE},
address = {Weimar, Germany},
abstract = {We address the issue of autonomic management in hierarchical component-based distributed systems. The long term aim is to provide a modeling framework for autonomic management in which QoS goals can be defined, plans for system adaptation described and proofs of achievement of goals by (sequences of) adaptations furnished. Here we present an early step on this path. We restrict our focus to skeleton-based systems in order to exploit their well-defined structure. The autonomic cycle is described using the Orc system orchestration language while the plans are presented as structural modifications together with associated costs and benefits. A case study is presented to illustrate the interaction of managers to maintain QoS goals for throughput under varying conditions of resource availability.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Massimo Torquati
FastFlow website Technical Manual
2009, (http://mc-fastflow.sourceforge.net/).
BibTeX | Tags:
@manual{fastflow:web,
title = {FastFlow website},
author = {Marco Aldinucci and Massimo Torquati},
url = {http://mc-fastflow.sourceforge.net/},
year = {2009},
date = {2009-01-01},
note = {\url{http://mc-fastflow.sourceforge.net/}},
keywords = {},
pubstate = {published},
tppubtype = {manual}
}
Marco Aldinucci, Sonia Campa, Patrizio Dazzi, Nicola Tonellotto
GridComp website Technical Manual
2009, (http://gridcomp.ercim.org/).
@manual{gridcomp-web,
title = {GridComp website},
author = {Marco Aldinucci and Sonia Campa and Patrizio Dazzi and Nicola Tonellotto},
url = {http://gridcomp.ercim.org/},
year = {2009},
date = {2009-01-01},
note = {\url{http://gridcomp.ercim.org/}},
keywords = {},
pubstate = {published},
tppubtype = {manual}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Semi-formal models to support program development: autonomic management within component based parallel and distributed programming Proceedings Article
In: de Boer, Frank S., Bonsangue, Marcello M., Madelaine, Eric (Ed.): Formal Methods for Components and Objects: 7th Intl. Symposium, FMCO 2008, Sophia-Antipolis, France, October 20 - 24, 2008, Revised Lectures, pp. 204–225, Springer, 2009.
Abstract | Links | BibTeX | Tags:
@inproceedings{semi-formal:fmco:09,
title = {Semi-formal models to support program development: autonomic management within component based parallel and distributed programming},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
editor = {de Boer, Frank S. and Marcello M. Bonsangue and Eric Madelaine},
url = {http://calvados.di.unipi.it/storage/paper_files/2009_semiformal_FMCO08.pdf},
doi = {10.1007/978-3-642-04167-9},
year = {2009},
date = {2009-01-01},
booktitle = {Formal Methods for Components and Objects: 7th Intl. Symposium, FMCO 2008, Sophia-Antipolis, France, October 20 - 24, 2008, Revised Lectures},
volume = {5751},
pages = {204--225},
publisher = {Springer},
series = {LNCS},
abstract = {Functional and non-functional concerns require different programming effort, different techniques and different methodologies when attempting to program efficient parallel/distributed applications. In this work we present a ``programmer oriented'' methodology based on formal tools that permits reasoning about parallel/distributed program development and refinement. The proposed methodology is semi-formal in that it does not require the exploitation of highly formal tools and techniques, while providing a palatable and effective support to programmers developing parallel/distributed applications, in particular when handling non-functional concerns.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
2008
Marco Aldinucci, Gabriel Antoniu, Marco Danelutto, Mathieu Jan
Fault-Tolerant Data Sharing for High-level Grid Programming: A Hierarchical Storage Architecture Book Section
In: Bubak, Marian, Gorlatch, Sergei, Priol, Thierry (Ed.): Achievements in European Research on Grid Systems, pp. 67–81, Springer, Kraków, Poland, 2008, ISBN: 978-0-387-72811-7.
Abstract | Links | BibTeX | Tags: parallel
@incollection{assist:juxmem:IW_book:07,
title = {Fault-Tolerant Data Sharing for High-level Grid Programming: A Hierarchical Storage Architecture},
author = {Marco Aldinucci and Gabriel Antoniu and Marco Danelutto and Mathieu Jan},
editor = {Marian Bubak and Sergei Gorlatch and Thierry Priol},
url = {http://calvados.di.unipi.it/storage/paper_files/2007_IW06_book_juxadhocmem.pdf},
doi = {10.1007/978-0-387-72812-4_6},
isbn = {978-0-387-72811-7},
year = {2008},
date = {2008-11-01},
booktitle = {Achievements in European Research on Grid Systems},
pages = {67--81},
publisher = {Springer},
address = {Kraków, Poland},
series = {CoreGRID},
abstract = {Enabling high-level programming models on grids is today a major challenge. A way to achieve this goal relies on the use of environments able to transparently and automatically provide adequate support for low-level, grid-specific issues (fault-tolerance, scalability, etc.). This paper discusses the above approach when applied to grid data management. As a case study, we propose a 2-tier software architecture that supports transparent, fault-tolerant, grid-level data sharing in the ASSIST programming environment (University of Pisa), based on the JuxMem grid data sharing service (INRIA Rennes).},
keywords = {parallel},
pubstate = {published},
tppubtype = {incollection}
}
Marco Aldinucci, Marco Danelutto, Hinde Lilia Bouziane, Christian Pérez
Towards Software Component Assembly Language Enhanced with Workflows and Skeletons Proceedings Article
In: Proc. of the ACM SIGPLAN Component-Based High Performance Computing (CBHPC), pp. 1–11, ACM, Karlsruhe, Germany, 2008, ISBN: 978-1-60558-311-2.
Abstract | Links | BibTeX | Tags:
@inproceedings{stkm:CBHPC:08,
title = {Towards Software Component Assembly Language Enhanced with Workflows and Skeletons},
author = {Marco Aldinucci and Marco Danelutto and Hinde Lilia Bouziane and Christian Pérez},
url = {http://calvados.di.unipi.it/storage/paper_files/2008_CBHPC.pdf},
doi = {10.1145/1456190.1456194},
isbn = {978-1-60558-311-2},
year = {2008},
date = {2008-10-01},
booktitle = {Proc. of the ACM SIGPLAN Component-Based High Performance Computing (CBHPC)},
pages = {1--11},
publisher = {ACM},
address = {Karlsruhe, Germany},
abstract = {We explore the possibilities offered by a programming model supporting components, workflows and skeletons. In particular we describe how Stcm (Spatio-Temporal Component Model), an already existing programming model supporting components and workflows, can be extended to also provide algorithmic skeleton concepts. Programmers are therefore enabled to assembly applications specifying both temporal and spatial relations among components and instantiating predefined skeleton composite components to implement all those application parts that can be easily modeled with the available skeletons. We discuss preliminary results as well as the benefits deriving from Stkm (Spatio-Temporal sKeleton Model) adoption in a couple of real applications.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Hinde Lilia Bouziane, Christian Pérez
Towards a Spatio-Temporal sKeleton Model implementation on top of SCA Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0171, 2008.
@techreport{coregrid:tr0171,
  author      = {Marco Aldinucci and Marco Danelutto and Hinde Lilia Bouziane and Christian Pérez},
  title       = {Towards a Spatio-Temporal sKeleton Model implementation on top of SCA},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  number      = {TR-0171},
  year        = {2008},
  date        = {2008-09-01},
  url         = {http://calvados.di.unipi.it/storage/paper_files/tr-0171.pdf},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Marco Aldinucci, Marco Danelutto
Securing skeletal systems with limited performance penalty: the Muskel experience Journal Article
In: Journal of Systems Architecture, vol. 54, no. 9, pp. 868–876, 2008.
Abstract | Links | BibTeX | Tags: parallel
@article{security:jsa:07,
title = {Securing skeletal systems with limited performance penalty: the Muskel experience},
author = {Marco Aldinucci and Marco Danelutto},
url = {http://calvados.di.unipi.it/storage/paper_files/2008_security_JSA.pdf},
doi = {10.1016/j.sysarc.2008.02.008},
year = {2008},
date = {2008-09-01},
journal = {Journal of Systems Architecture},
volume = {54},
number = {9},
pages = {868--876},
publisher = {Elsevier},
abstract = {Algorithmic skeletons have been exploited to implement several parallel programming environments, targeting workstation clusters as well as workstation networks and computational grids. When targeting non-dedicated clusters, workstation networks and grids, security has to be taken adequately into account in order to guarantee both code and data confidentiality and integrity. However, introducing security is usually an expensive activity, both in terms of the effort required to manage security mechanisms and in terms of the time spent performing security related activities at run time. We discuss the cost of security introduction as well as how some features typical of skeleton technology can be exploited to improve the efficiency code and data securing in a typical skeleton based parallel programming environment and we evaluate the performance cost of security mechanisms implemented exploiting state of the art tools. In particular, we take into account the cost of security introduction in muskel, a Java based skeletal system exploiting macro data flow implementation technology. We consider the adoption of mechanisms that allow securing all the communications involving remote, unreliable nodes and we evaluate the cost of such mechanisms. Also, we consider the implications on the computational grains needed to scale secure and insecure skeletal computations.},
keywords = {parallel},
pubstate = {published},
tppubtype = {article}
}
Marco Aldinucci, Sonia Campa, Marco Danelutto, Patrizio Dazzi, Peter Kilpatrick, Domenico Laforenza, Nicola Tonellotto
Behavioural skeletons for component autonomic management on grids Book Section
In: Danelutto, Marco, Frangopoulou, Paraskevi, Getov, Vladimir (Ed.): Making Grids Work, pp. 3–16, Springer, 2008, ISBN: 978-0-387-78447-2.
Abstract | Links | BibTeX | Tags: parallel
@incollection{beske:cg_book:08,
title = {Behavioural skeletons for component autonomic management on grids},
author = {Marco Aldinucci and Sonia Campa and Marco Danelutto and Patrizio Dazzi and Peter Kilpatrick and Domenico Laforenza and Nicola Tonellotto},
editor = {Marco Danelutto and Paraskevi Frangopoulou and Vladimir Getov},
url = {http://calvados.di.unipi.it/storage/paper_files/2007_beske_cg_crete_book.pdf},
doi = {10.1007/978-0-387-78448-9_1},
isbn = {978-0-387-78447-2},
year = {2008},
date = {2008-08-01},
booktitle = {Making Grids Work},
pages = {3--16},
publisher = {Springer},
chapter = {Component Programming Models},
series = {CoreGRID},
abstract = {Autonomic management can improve the QoS provided by parallel/distributed applications. Within the CoreGRID Component Model, the autonomic management is tailored to the automatic – monitoring-driven – alteration of the component assembly and, therefore, is defined as the effect of (distributed) management code. This work yields a semantics based on hypergraph rewriting suitable to model the dynamic evolution and non-functional aspects of Service Oriented Architectures and component-based autonomic applications. In this regard, our main goal is to provide a formal description of adaptation operations that are typically only informally specified. We advocate that our approach makes easier to raise the level of abstraction of management code in autonomic and adaptive applications.},
keywords = {parallel},
pubstate = {published},
tppubtype = {incollection}
}
Marco Aldinucci, Marco Danelutto, Giorgio Zoppi, Peter Kilpatrick
Advances in Autonomic Components & Services Proceedings Article
In: Priol, Thierry, Vanneschi, Marco (Ed.): From Grids To Service and Pervasive Computing (Proc. of the CoreGRID Symposium 2008), pp. 3–18, Springer, Las Palmas, Spain, 2008, ISBN: 978-0-387-09454-0.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{sca:cgsymph:08,
  author      = {Marco Aldinucci and Marco Danelutto and Giorgio Zoppi and Peter Kilpatrick},
  editor      = {Thierry Priol and Marco Vanneschi},
  title       = {Advances in Autonomic Components \& Services},
  booktitle   = {From Grids To Service and Pervasive Computing (Proc. of the CoreGRID Symposium 2008)},
  series      = {CoreGRID},
  pages       = {3--18},
  publisher   = {Springer},
  address     = {Las Palmas, Spain},
  year        = {2008},
  date        = {2008-08-01},
  isbn        = {978-0-387-09454-0},
  doi         = {10.1007/978-0-387-09455-7_1},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2008_SCA_cgsymph.pdf},
  abstract    = {Hierarchical autonomic management of structured grid applications can be efficiently implemented using production rule engines. Rules of the form "precondition-to-action" can be used to model the behaviour of autonomic managers in such a way that the autonomic control and the application management strategy are kept separate. This simplifies the manager design as well as user customization of autonomic manager policies. We briefly introduce rule-based autonomic managers. Then we discuss an implementation of a GCM-like behavioural skeleton – a composite component modelling a standard parallelism exploitation pattern with its own autonomic controller – in SCA/Tuscany. The implementation uses the JBoss rules engine to provide an autonomic behavioural skeleton component and services to expose the component functionality to the standard service framework. Performance results are discussed and finally similarities and differences with respect to the ProActive-based reference GCM implementation are discussed briefly.},
  keywords    = {grid},
  pubstate    = {published},
  tppubtype   = {inproceedings},
}
Marco Aldinucci, Emilio Tuosto
Towards a Formal Semantics for Autonomic Components Proceedings Article
In: Priol, Thierry, Vanneschi, Marco (Ed.): From Grids To Service and Pervasive Computing (Proc. of the CoreGRID Symposium 2008), pp. 31–45, Springer, Las Palmas, Spain, 2008, ISBN: 978-0-387-09454-0.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{sem:cgsymph:08,
  author      = {Marco Aldinucci and Emilio Tuosto},
  editor      = {Thierry Priol and Marco Vanneschi},
  title       = {Towards a Formal Semantics for Autonomic Components},
  booktitle   = {From Grids To Service and Pervasive Computing (Proc. of the CoreGRID Symposium 2008)},
  series      = {CoreGRID},
  pages       = {31--45},
  publisher   = {Springer},
  address     = {Las Palmas, Spain},
  year        = {2008},
  date        = {2008-08-01},
  isbn        = {978-0-387-09454-0},
  doi         = {10.1007/978-0-387-09455-7_3},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2008_sem_cgsymph.pdf},
  abstract    = {Autonomic management can improve the QoS provided by parallel/distributed applications. Within the CoreGRID Component Model, the autonomic management is tailored to the automatic – monitoring-driven – alteration of the component assembly and, therefore, is defined as the effect of (distributed) management code. This work yields a semantics based on hypergraph rewriting suitable to model the dynamic evolution and non-functional aspects of Service Oriented Architectures and component-based autonomic applications. In this regard, our main goal is to provide a formal description of adaptation operations that are typically only informally specified. We advocate that our approach makes easier to raise the level of abstraction of management code in autonomic and adaptive applications.},
  keywords    = {grid},
  pubstate    = {published},
  tppubtype   = {inproceedings},
}
Ana-Maria Oprescu, Thilo Kielmann, Marco Danelutto, Marco Aldinucci
Autonomic Behavior of Grid Applications using Component Platforms Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0156, 2008.
@techreport{coregrid:tr0156,
  author      = {Ana-Maria Oprescu and Thilo Kielmann and Marco Danelutto and Marco Aldinucci},
  title       = {Autonomic Behavior of Grid Applications using Component Platforms},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  number      = {TR-0156},
  year        = {2008},
  date        = {2008-07-01},
  url         = {http://www.coregrid.net/mambo/images/stories/TechnicalReports/tr-0156.pdf},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Marco Aldinucci, Marco Danelutto, Hinde Lilia Bouziane, Christian Pérez
Towards Software Component Assembly Language Enhanced with Workflows and Skeletons Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0153, 2008.
@techreport{coregrid:tr0153,
  author      = {Marco Aldinucci and Marco Danelutto and Hinde Lilia Bouziane and Christian Pérez},
  title       = {Towards Software Component Assembly Language Enhanced with Workflows and Skeletons},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  number      = {TR-0153},
  year        = {2008},
  date        = {2008-07-01},
  url         = {http://www.coregrid.net/mambo/images/stories/TechnicalReports/tr-0153.pdf},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Marco Aldinucci, Sonia Campa, Massimo Coppola, Marco Danelutto, Giorgio Zoppi, Alessandro Basso, Alexander Bolotov, Francoise Baude, Hinde Lilia Bouziane, Denis Caromel, Ludovic Henrio, Christian Pérez, Jose Cunha, Michael Classen, Philipp Classen, Christian Lengauer, J. Cohen, S. Mc Gough, Natalia Currle-Linde, Patrizio Dazzi, Nicola Tonellotto, Jan Dünnweber, Sergei Gorlatch, Peter Kilpatrick, Nadia Ranaldo, Eugenio Zimeo
Proceedings of the Programming Model Institute Technical meeting 2008 Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0138, 2008.
@techreport{coregrid:tr0138,
  author      = {Marco Aldinucci and Sonia Campa and Massimo Coppola and Marco Danelutto and Giorgio Zoppi and Alessandro Basso and Alexander Bolotov and Francoise Baude and Hinde Lilia Bouziane and Denis Caromel and Ludovic Henrio and Christian Pérez and Jose Cunha and Michael Classen and Philipp Classen and Christian Lengauer and J. Cohen and S. {Mc Gough} and Natalia Currle-Linde and Patrizio Dazzi and Nicola Tonellotto and Jan Dünnweber and Sergei Gorlatch and Peter Kilpatrick and Nadia Ranaldo and Eugenio Zimeo},
  title       = {Proceedings of the Programming Model Institute Technical meeting 2008},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  number      = {TR-0138},
  year        = {2008},
  date        = {2008-05-01},
  url         = {http://www.coregrid.net/mambo/images/stories/TechnicalReports/tr-0138.pdf},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick, Patrizio Dazzi
From Orc Models to Distributed Grid Java code Proceedings Article
In: Gorlatch, Sergei, Fragopoulou, Paraskevi, Priol, Thierry (Ed.): Proc. of the Integrated Research in Grid Computing Workshop, pp. 2–13, Hersonissos, Crete, Greece, 2008.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{orc:IW:08,
  author      = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick and Patrizio Dazzi},
  editor      = {Sergei Gorlatch and Paraskevi Fragopoulou and Thierry Priol},
  title       = {From {Orc} Models to Distributed Grid {Java} code},
  booktitle   = {Proc. of the Integrated Research in Grid Computing Workshop},
  series      = {CoreGRID},
  pages       = {2--13},
  address     = {Hersonissos, Crete, Greece},
  year        = {2008},
  date        = {2008-04-01},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2008_IW_O2J.pdf},
  abstract    = {We present O2J, a Java library that allows implementation of Orc programs on distributed architectures including grids and clusters/networks of workstations. With minimal programming effort the grid programmer may implement Orc programs, as he/she is not required to write any low level code relating to distributed orchestration of the computation but only that required to implement Orc expressions. Using the prototype O2J implementation, grid application developers can reason about abstract grid orchestration code described in Orc. Once the required orchestration has been determined and its properties analysed, a grid application prototype can be simply, efficiently and quickly implemented by taking the Orc code, rewriting it into corresponding Java/O2J syntax and finally providing the functional code implementing the sites and processes involved. The proposed modus operandi brings a Model Driven Engineering approach to grid application development.},
  keywords    = {grid},
  pubstate    = {published},
  tppubtype   = {inproceedings},
}
Marco Aldinucci, Emilio Tuosto
Toward a Formal Semantics for Autonomic Components Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-08-08, 2008.
@techreport{sem:tr-08-08,
  author      = {Marco Aldinucci and Emilio Tuosto},
  title       = {Toward a Formal Semantics for Autonomic Components},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number      = {TR-08-08},
  year        = {2008},
  date        = {2008-04-01},
  url         = {http://compass2.di.unipi.it/TR/Files/TR-08-08.pdf.gz},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Marco Aldinucci, Anne Benoit
Automatic mapping of ASSIST applications using process algebra Journal Article
In: Parallel Processing Letters, vol. 18, no. 1, pp. 175–188, 2008, ISSN: 0129-6264.
Abstract | Links | BibTeX | Tags: parallel
@article{assist:pepa:ppl:08,
  author      = {Marco Aldinucci and Anne Benoit},
  title       = {Automatic mapping of {ASSIST} applications using process algebra},
  journal     = {Parallel Processing Letters},
  volume      = {18},
  number      = {1},
  pages       = {175--188},
  year        = {2008},
  date        = {2008-03-01},
  issn        = {0129-6264},
  doi         = {10.1142/S0129626408003302},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2008_pepa_ppl.pdf},
  abstract    = {Grid technologies aim to harness the computational capabilities of widely distributed collections of computers. Due to the heterogeneous and dynamic nature of the set of grid resources, the programming and optimisation burden of a low level approach to grid computing is clearly unacceptable for large scale, complex applications. The development of grid applications can be simplified by using high-level programming environments. In the present work, we address the problem of the mapping of a high-level grid application onto the computational resources. In order to optimise the mapping of the application, we propose to automatically generate performance models from the application using the process algebra PEPA. We target applications written with the high-level environment ASSIST, since the use of such a structured environment allows us to automate the study of the application more effectively.},
  keywords    = {parallel},
  pubstate    = {published},
  tppubtype   = {article},
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Hierarchical autonomic management: a case study with skeletal systems Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0127, 2008.
@techreport{coregrid:tr0127,
  author      = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
  title       = {Hierarchical autonomic management: a case study with skeletal systems},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  number      = {TR-0127},
  year        = {2008},
  date        = {2008-02-01},
  url         = {http://calvados.di.unipi.it/storage/paper_files/tr-0127.pdf},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Marco Aldinucci, Sonia Campa, Marco Danelutto, Marco Vanneschi, Patrizio Dazzi, Domenico Laforenza, Nicola Tonellotto, Peter Kilpatrick
Behavioural skeletons in GCM: autonomic management of grid components Proceedings Article
In: El Baz, Didier, Bourgeois, Julien, Spies, Francois (Ed.): Proc. of Intl. Euromicro PDP 2008: Parallel Distributed and network-based Processing, pp. 54–63, IEEE, Toulouse, France, 2008.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{orc:pdp:08,
  author      = {Marco Aldinucci and Sonia Campa and Marco Danelutto and Marco Vanneschi and Patrizio Dazzi and Domenico Laforenza and Nicola Tonellotto and Peter Kilpatrick},
  editor      = {Didier {El Baz} and Julien Bourgeois and Francois Spies},
  title       = {Behavioural skeletons in {GCM}: autonomic management of grid components},
  booktitle   = {Proc. of Intl. Euromicro PDP 2008: Parallel Distributed and network-based Processing},
  pages       = {54--63},
  publisher   = {IEEE},
  address     = {Toulouse, France},
  year        = {2008},
  date        = {2008-02-01},
  doi         = {10.1109/PDP.2008.46},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2008_orc_PDP.pdf},
  abstract    = {Autonomic management can be used to improve the QoS provided by parallel/distributed applications. We discuss behavioural skeletons introduced in earlier work: rather than relying on programmer ability to design "from scratch" efficient autonomic policies, we encapsulate general autonomic controller features into algorithmic skeletons. Then we leave to the programmer the duty of specifying the parameters needed to specialise the skeletons to the needs of the particular application at hand. This results in the programmer having the ability to fast prototype and tune distributed/parallel applications with non-trivial autonomic management capabilities. We discuss how behavioural skeletons have been implemented in the framework of GCM (the grid component model developed within the CoreGRID NoE and currently being implemented within the GridCOMP STREP project). We present results evaluating the overhead introduced by autonomic management activities as well as the overall behaviour of the skeletons. We also present results achieved with a long running application subject to autonomic management and dynamically adapting to changing features of the target architecture. Overall the results demonstrate both the feasibility of implementing autonomic control via behavioural skeletons and the effectiveness of our sample behavioural skeletons in managing the "functional replication" pattern(s).},
  keywords    = {grid},
  pubstate    = {published},
  tppubtype   = {inproceedings},
}
Marco Aldinucci, Massimo Torquati, Marco Vanneschi, Pierfrancesco Zuccato
The VirtuaLinux Storage Abstraction Layer for Efficient Virtual Clustering Proceedings Article
In: El Baz, Didier, Bourgeois, Julien, Spies, Francois (Ed.): Proc. of Intl. Euromicro PDP 2008: Parallel Distributed and network-based Processing, pp. 619–627, IEEE, Toulouse, France, 2008.
Abstract | Links | BibTeX | Tags:
@inproceedings{vlinux:pdp:08,
  author      = {Marco Aldinucci and Massimo Torquati and Marco Vanneschi and Pierfrancesco Zuccato},
  editor      = {Didier {El Baz} and Julien Bourgeois and Francois Spies},
  title       = {The {VirtuaLinux} Storage Abstraction Layer for Efficient Virtual Clustering},
  booktitle   = {Proc. of Intl. Euromicro PDP 2008: Parallel Distributed and network-based Processing},
  pages       = {619--627},
  publisher   = {IEEE},
  address     = {Toulouse, France},
  year        = {2008},
  date        = {2008-02-01},
  doi         = {10.1109/PDP.2008.86},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2008_VirtuaLinux_PDP.pdf},
  abstract    = {VirtuaLinux is a meta-distribution that enables a standard Linux distribution to support robust physical and virtualized clusters. VirtuaLinux helps in avoiding the "single point of failure" effect by means of a combination of architectural strategies, including the transparent support for disk-less and master-less cluster configuration. VirtuaLinux supports the creation and management of Virtual Clusters in seamless way: VirtuaLinux Virtual Cluster Manager enables the system administrator to create, save, restore Xen-based Virtual Clusters, and to map and dynamically re-map them onto the nodes of the physical cluster. In this paper we introduce and discuss VirtuaLinux virtualization architecture, features, and tools, and in particular, the novel disk abstraction layer, which permits the fast and space-efficient creation of Virtual Clusters.},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {inproceedings},
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick, Patrizio Dazzi
From Orc Models to Distributed Grid Java code Book Section
In: Gorlatch, Sergei, Fragopoulou, Paraskevi, Priol, Thierry (Ed.): Grid Computing: Achievements and Prospects, pp. 13–24, Springer, 2008, ISBN: 978-0-387-09456-4.
Abstract | Links | BibTeX | Tags: parallel
@incollection{orc:IW_book:08,
  author      = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick and Patrizio Dazzi},
  editor      = {Sergei Gorlatch and Paraskevi Fragopoulou and Thierry Priol},
  title       = {From {Orc} Models to Distributed Grid {Java} code},
  booktitle   = {Grid Computing: Achievements and Prospects},
  series      = {CoreGRID},
  pages       = {13--24},
  publisher   = {Springer},
  year        = {2008},
  date        = {2008-01-01},
  isbn        = {978-0-387-09456-4},
  doi         = {10.1007/978-0-387-09457-1_2},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2008_IW_book_O2J.pdf},
  abstract    = {We present O2J, a Java library that allows implementation of Orc programs on distributed architectures including grids and clusters/networks of workstations. With minimal programming effort the grid programmer may implement Orc programs, as he/she is not required to write any low level code relating to distributed orchestration of the computation but only that required to implement Orc expressions. Using the prototype O2J implementation, grid application developers can reason about abstract grid orchestration code described in Orc. Once the required orchestration has been determined and its properties analysed, a grid application prototype can be simply, efficiently and quickly implemented by taking the Orc code, rewriting it into corresponding Java/O2J syntax and finally providing the functional code implementing the sites and processes involved. The proposed modus operandi brings a Model Driven Engineering approach to grid application development.},
  keywords    = {parallel},
  pubstate    = {published},
  tppubtype   = {incollection},
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
A framework for prototyping and reasoning about grid systems Proceedings Article
In: Bischof, C., Bücker, M., Gibbon, P., Joubert, G. R., Lippert, T., Mohr, B., Peters, F. J. (Ed.): Parallel Computing: Architectures, Algorithms and Applications, pp. 235–242, IOS press, Germany, 2008, ISBN: 9781586037963.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{orc:parco:07,
  author      = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
  editor      = {C. Bischof and M. Bücker and P. Gibbon and G. R. Joubert and T. Lippert and B. Mohr and F. J. Peters},
  title       = {A framework for prototyping and reasoning about grid systems},
  booktitle   = {Parallel Computing: Architectures, Algorithms and Applications},
  series      = {Advances in Parallel Computing},
  volume      = {15},
  pages       = {235--242},
  publisher   = {IOS Press},
  address     = {Germany},
  year        = {2008},
  date        = {2008-01-01},
  isbn        = {9781586037963},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2007_orc_parco.pdf},
  abstract    = {A framework supporting fast prototyping as well as tuning of distributed applications is presented. The approach is based on the adoption of a formal model that is used to describe the orchestration of distributed applications. The formal model (Orc by Misra and Cook) can be used to support semi-formal reasoning about the applications at hand. The paper describes how the framework can be used to derive and evaluate alternative orchestrations of a well known parallel/distributed computation pattern; and shows how the same formal model can be used to support generation of prototypes of distributed applications skeletons directly from the application description.},
  keywords    = {grid},
  pubstate    = {published},
  tppubtype   = {inproceedings},
}
Carlo Bertolli, Romano Fantacci, Gabriele Mencagli, Daniele Tarchi, Marco Vanneschi
Next generation grids and wireless communication networks: towards a novel integrated approach Journal Article
In: Wireless Communications and Mobile Computing, 2008, (To appear).
BibTeX | Tags:
@article{position:insyeme:09,
  author      = {Carlo Bertolli and Romano Fantacci and Gabriele Mencagli and Daniele Tarchi and Marco Vanneschi},
  title       = {Next generation grids and wireless communication networks: towards a novel integrated approach},
  journal     = {Wireless Communications and Mobile Computing},
  year        = {2008},
  date        = {2008-01-01},
  note        = {To appear},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {article},
}
Marco Aldinucci, Marco Danelutto, Massimo Torquati, Francesco Polzella, Gianmarco Spinatelli, Marco Vanneschi, Alessandro Gervaso, Manuel Cacitti, Pierfrancesco Zuccato
VirtuaLinux: virtualized high-density clusters with no single point of failure Proceedings Article
In: Bischof, C., Bücker, M., Gibbon, P., Joubert, G. R., Lippert, T., Mohr, B., Peters, F. J. (Ed.): Parallel Computing: Architectures, Algorithms and Applications, pp. 355–362, IOS press, The Netherlands, 2008.
Abstract | Links | BibTeX | Tags:
@inproceedings{virtualinux:parco:07,
  author      = {Marco Aldinucci and Marco Danelutto and Massimo Torquati and Francesco Polzella and Gianmarco Spinatelli and Marco Vanneschi and Alessandro Gervaso and Manuel Cacitti and Pierfrancesco Zuccato},
  editor      = {C. Bischof and M. Bücker and P. Gibbon and G. R. Joubert and T. Lippert and B. Mohr and F. J. Peters},
  title       = {{VirtuaLinux}: virtualized high-density clusters with no single point of failure},
  booktitle   = {Parallel Computing: Architectures, Algorithms and Applications},
  series      = {Advances in Parallel Computing},
  volume      = {15},
  pages       = {355--362},
  publisher   = {IOS Press},
  address     = {The Netherlands},
  year        = {2008},
  date        = {2008-01-01},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2007_vlinux_parco.pdf},
  abstract    = {VirtuaLinux is a Linux meta-distribution that allows the creation, deployment and administration of both physical and virtualized clusters with no single point of failure. VirtuaLinux supports the creation and management of virtual clusters in seamless way: VirtuaLinux Virtual Cluster Manager enables the system administrator to create, save, restore Xen-based virtual clusters, and to map and dynamically remap them onto the nodes of the physical cluster. We introduce and discuss VirtuaLinux virtualization architecture, features, and tools. These rely on a novel disk abstraction layer, which enables the fast, space-efficient, dynamic creation of virtual clusters composed of fully independent complete virtual machines.},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {inproceedings},
}
2007
Marco Aldinucci, Marco Danelutto, Patrizio Dazzi
MUSKEL: an expandable skeleton environment Journal Article
In: Scalable Computing: Practice and Experience, vol. 8, no. 4, pp. 325–341, 2007.
Abstract | Links | BibTeX | Tags: parallel
@article{muskel:SCPE:07,
  author      = {Marco Aldinucci and Marco Danelutto and Patrizio Dazzi},
  title       = {{MUSKEL}: an expandable skeleton environment},
  journal     = {Scalable Computing: Practice and Experience},
  volume      = {8},
  number      = {4},
  pages       = {325--341},
  year        = {2007},
  date        = {2007-12-01},
  url         = {http://www.scpe.org/index.php/scpe/article/view/429},
  abstract    = {Programming models based on algorithmic skeletons promise to raise the level of abstraction perceived by programmers when implementing parallel applications, while guaranteeing good performance figures. At the same time, however, they restrict the freedom of programmers to implement arbitrary parallelism exploitation patterns. In fact, efficiency is achieved by restricting the parallelism exploitation patterns provided to the programmer to the useful ones for which efficient implementations, as well as useful and efficient compositions, are known. In this work we introduce muskel, a full Java library targeting workstation clusters, networks and grids and providing the programmers with a skeleton based parallel programming environment. muskel is implemented exploiting (macro) data flow technology, rather than the more usual skeleton technology relying on the use of implementation templates. Using data flow, muskel easily and efficiently implements both classical, predefined skeletons, and user-defined parallelism exploitation patterns. This provides a means to overcome some of the problems that Cole identified in his skeleton ``manifesto'' as the issues impairing skeleton success in the parallel programming arena. We discuss fully how user-defined skeletons are supported by exploiting a data flow implementation, experimental results and we also discuss extensions supporting the further characterization of skeletons with non-functional properties, such as security, through the use of Aspect Oriented Programming and annotations.},
  keywords    = {parallel},
  pubstate    = {published},
  tppubtype   = {article},
}
Marco Danelutto, Marcelo Pasin, Marco Vanneschi, Patrizio Dazzi, Luigi Presti, Domenico Laforenza
PAL: Exploiting Java Annotations for Parallelism Book Section
In: Bubak, Marian, Gorlatch, Sergei, Priol, Thierry (Ed.): Achievements in European Research on Grid Systems, pp. 83–96, Springer, Kraków, Poland, 2007.
@incollection{pal:IW_book:07,
  author      = {Marco Danelutto and Marcelo Pasin and Marco Vanneschi and Patrizio Dazzi and Luigi Presti and Domenico Laforenza},
  editor      = {Marian Bubak and Sergei Gorlatch and Thierry Priol},
  title       = {{PAL}: Exploiting {Java} Annotations for Parallelism},
  booktitle   = {Achievements in European Research on Grid Systems},
  series      = {CoreGRID},
  pages       = {83--96},
  publisher   = {Springer},
  address     = {Kraków, Poland},
  year        = {2007},
  date        = {2007-11-01},
  keywords    = {grid},
  pubstate    = {published},
  tppubtype   = {incollection},
}
Carlo Bertolli, Massimo Coppola, Corrado Zoccolo
The co-replication methodology and its application to structured parallel programs Proceedings Article
In: CompFrame '07: Proc. of the 2007 symposium on Component and framework technology in high-performance and scientific computing, pp. 39–48, ACM, Montreal, Quebec, Canada, 2007, ISBN: 978-1-59593-867-1.
@inproceedings{corep:bertolli:07,
  author      = {Carlo Bertolli and Massimo Coppola and Corrado Zoccolo},
  title       = {The co-replication methodology and its application to structured parallel programs},
  booktitle   = {CompFrame '07: Proc. of the 2007 symposium on Component and framework technology in high-performance and scientific computing},
  pages       = {39--48},
  publisher   = {ACM},
  address     = {Montreal, Quebec, Canada},
  year        = {2007},
  date        = {2007-10-01},
  isbn        = {978-1-59593-867-1},
  doi         = {10.1145/1297385.1297393},
  url         = {https://doi.acm.org/10.1145/1297385.1297393},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {inproceedings},
}
Marco Aldinucci, Marco Danelutto
Skeleton based parallel programming: functional and parallel semantic in a single shot Journal Article
In: Computer Languages, Systems and Structures, vol. 33, no. 3-4, pp. 179–192, 2007.
Abstract | Links | BibTeX | Tags: parallel
@article{lithium:sem:CLSS,
  author      = {Marco Aldinucci and Marco Danelutto},
  title       = {Skeleton based parallel programming: functional and parallel semantic in a single shot},
  journal     = {Computer Languages, Systems and Structures},
  volume      = {33},
  number      = {3-4},
  pages       = {179--192},
  year        = {2007},
  date        = {2007-10-01},
  doi         = {10.1016/j.cl.2006.07.004},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2005_semantics_CLSS.pdf},
  abstract    = {Semantics of skeleton-based parallel programming languages comes usually as two distinct items: a functional semantics, modeling the function computed by the skeleton program, and a parallel semantics describing the ways used to exploit parallelism during the execution of the skeleton program. The former is usually expressed using some kind of semantic formalism, while the latter is almost always given in an informal way. Such a separation of functional and parallel semantics seriously impairs the possibility of programmers to use the semantic tools to prove properties of programs. In this work, we show how a formal semantic framework can be set up that handles both functional and parallel aspects of skeleton-based parallel programs. The framework is based on a labeled transition system. We show how different properties related to skeleton programs can be proved using such a system. We use Lithium, a skeleton-based full Java parallel programming environment, as the case study.},
  keywords    = {parallel},
  pubstate    = {published},
  tppubtype   = {article},
}
Thierry Priol, Marco Vanneschi (Ed.)
Towards Next Generation Grids, Proc. of the CoreGRID Symposium 2007 Proceedings
Springer, Rennes, France, 2007.
BibTeX | Tags:
@proceedings{cgs:proc:07,
  editor      = {Thierry Priol and Marco Vanneschi},
  title       = {Towards Next Generation Grids, Proc. of the {CoreGRID} Symposium 2007},
  publisher   = {Springer},
  address     = {Rennes, France},
  year        = {2007},
  date        = {2007-09-01},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {proceedings},
}
Massimo Coppola, Domenico Laforenza, Nicola Tonellotto, Marco Danelutto, Marco Vanneschi, Corrado Zoccolo
Managing User Expectation with Component Performance Contracts Proceedings Article
In: Proc. of the Workshop on Usage of Service Level Agreements in Grids, Springer, Austin, TX, USA, 2007.
BibTeX | Tags:
@inproceedings{cop:usla:07,
  author      = {Massimo Coppola and Domenico Laforenza and Nicola Tonellotto and Marco Danelutto and Marco Vanneschi and Corrado Zoccolo},
  title       = {Managing User Expectation with Component Performance Contracts},
  booktitle   = {Proc. of the Workshop on Usage of Service Level Agreements in Grids},
  series      = {CoreGRID},
  publisher   = {Springer},
  address     = {Austin, TX, USA},
  year        = {2007},
  date        = {2007-09-01},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {inproceedings},
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Adding metadata to Orc to support reasoning about grid programming Proceedings Article
In: Priol, Thierry, Vanneschi, Marco (Ed.): Towards Next Generation Grids (Proc. of the CoreGRID Symposium 2007), pp. 205–214, Springer, Rennes, France, 2007, ISBN: 978-0-387-72497-3.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{orc:metadata:cgs:07,
  author      = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
  editor      = {Thierry Priol and Marco Vanneschi},
  title       = {Adding metadata to {Orc} to support reasoning about grid programming},
  booktitle   = {Towards Next Generation Grids (Proc. of the CoreGRID Symposium 2007)},
  series      = {CoreGRID},
  pages       = {205--214},
  publisher   = {Springer},
  address     = {Rennes, France},
  year        = {2007},
  date        = {2007-09-01},
  isbn        = {978-0-387-72497-3},
  doi         = {10.1007/978-0-387-72498-0_19},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2007_orc_CGSymph.pdf},
  abstract    = {Following earlier work demonstrating the utility of Orc as a means of specifying and reasoning about grid applications we propose the enhancement of such specifications with metadata that provide a means to extend an Orc specification with implementation oriented information. We argue that such specifications provide a useful refinement step in allowing reasoning about implementation related issues ahead of actual implementation or even prototyping. As examples, we demonstrate how such extended specifications can be used for investigating security related issues and for evaluating the cost of handling grid resource faults. The approach emphasises a semi-formal style of reasoning that makes maximum use of programmer domain knowledge and experience.},
  keywords    = {grid},
  pubstate    = {published},
  tppubtype   = {inproceedings},
}
Marco Danelutto, Marco Aldinucci, Peter Kilpatrick
Prototyping and reasoning about distributed systems: an Orc based framework Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0102, 2007.
@techreport{coregrid:tr0102,
  author      = {Marco Danelutto and Marco Aldinucci and Peter Kilpatrick},
  title       = {Prototyping and reasoning about distributed systems: an {Orc} based framework},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  number      = {TR-0102},
  year        = {2007},
  date        = {2007-08-01},
  url         = {http://www.coregrid.net/mambo/images/stories/TechnicalReports/tr-0102.pdf},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport},
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Management in distributed systems: a semi-formal approach Proceedings Article
In: Kermarrec, A.-M., Bougé, L., Priol, T. (Ed.): Proc. of 13th Intl. Euro-Par 2007 Parallel Processing, pp. 651–661, Springer, Rennes, France, 2007, ISBN: 978-3-540-74465-8.
Abstract | Links | BibTeX | Tags: parallel, semantics
@inproceedings{orc:europar:07,
title = {Management in distributed systems: a semi-formal approach},
author = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
editor = {A.-M. Kermarrec and L. Bougé and T. Priol},
url = {http://calvados.di.unipi.it/storage/paper_files/2007_orc_europar.pdf},
doi = {10.1007/978-3-540-74466-5_69},
isbn = {978-3-540-74465-8},
year = {2007},
date = {2007-08-01},
booktitle = {Proc. of 13th Intl. Euro-Par 2007 Parallel Processing},
volume = {4641},
pages = {651--661},
publisher = {Springer},
address = {Rennes, France},
series = {LNCS},
abstract = {The reverse engineering of a skeleton based programming environment and redesign to distribute management activities of the system and thereby remove a potential single point of failure is considered. The Orc notation is used to facilitate abstraction of the design and analysis of its properties. It is argued that Orc is particularly suited to this role as this type of management is essentially an orchestration activity. The Orc specification of the original version of the system is modified via a series of semi-formally justified derivation steps to obtain a specification of the decentralized management version which is then used as a basis for its implementation. Analysis of the two specifications allows qualitative prediction of the expected performance of the derived version with respect to the original, and this prediction is borne out in practice.},
keywords = {parallel, semantics},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Sonia Campa, Marco Danelutto, Patrizio Dazzi, Peter Kilpatrick, Domenico Laforenza, Nicola Tonellotto
Behavioural skeletons for component autonomic management on grids Proceedings Article
In: CoreGRID Workshop on Grid Programming Model, Grid and P2P Systems Architecture, Grid Systems, Tools and Environments, Heraklion, Crete, Greece, 2007.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{beske:cg:heraklion:07,
title = {Behavioural skeletons for component autonomic management on grids},
author = {Marco Aldinucci and Sonia Campa and Marco Danelutto and Patrizio Dazzi and Peter Kilpatrick and Domenico Laforenza and Nicola Tonellotto},
url = {http://compass2.di.unipi.it/TR/Files/TR-07-12.pdf.gz},
year = {2007},
date = {2007-06-01},
booktitle = {CoreGRID Workshop on Grid Programming Model, Grid and P2P Systems Architecture, Grid Systems, Tools and Environments},
address = {Heraklion, Crete, Greece},
abstract = {We present behavioural skeletons for the CoreGRID Component Model, which are an abstraction aimed at simplifying the development of GCM-based self-management applications. Behavioural skeletons abstract component self-management in component-based design as design patterns abstract class design in classic OO development. As here we just wish to introduce the behavioural skeleton framework, emphasis is placed on general skeleton structure rather than on their autonomic management policies.},
keywords = {parallel},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Pierfrancesco Zuccato
Virtual clusters with no single point of failure Proceedings Article
In: Intl. Supercomputing Conference (ISC2007), Poster session, Dresden, Germany, 2007.
Abstract | Links | BibTeX | Tags:
@inproceedings{virtualinux:poster:ics:07,
  author    = {Marco Aldinucci and Pierfrancesco Zuccato},
  title     = {Virtual clusters with no single point of failure},
  booktitle = {Intl. Supercomputing Conference (ISC2007), Poster session},
  address   = {Dresden, Germany},
  year      = {2007},
  date      = {2007-06-01},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2007_ICS_VirtuaLinux.pdf},
  abstract  = {VirtuaLinux is a Linux meta-distribution that allows the creation, deployment and administration of virtualized clusters with no single point of failure. VirtuaLinux architecture supports diskless configurations and provides an efficient, iSCSI based abstraction of the SAN. Clusters running VirtuaLinux exhibit no master node, thus boosting resilience and flexibility.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Massimo Torquati, Marco Vanneschi, Manuel Cacitti, Alessandro Gervaso, Pierfrancesco Zuccato
VirtuaLinux Design Principles Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-07-13, 2007.
@techreport{virtualinux:tr:07,
  author      = {Marco Aldinucci and Massimo Torquati and Marco Vanneschi and Manuel Cacitti and Alessandro Gervaso and Pierfrancesco Zuccato},
  title       = {VirtuaLinux Design Principles},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number      = {TR-07-13},
  year        = {2007},
  date        = {2007-06-01},
  url         = {http://calvados.di.unipi.it/storage/paper_files/2007_VirtuaLinux_TR-07-13.pdf},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Cristian Dittamo, Antonio Cisternino, Marco Danelutto
Parallelization of C# Programs Through Annotations Proceedings Article
In: Proc. of Practical Aspects of High-Level Parallel Programming Workshop (PAPP, co-located with ICCS 2007), pp. 585–592, Springer, Beijing, China, 2007.
@inproceedings{07:dcd:csharp,
title = {Parallelization of {C\#} Programs Through Annotations},
author = {Cristian Dittamo and Antonio Cisternino and Marco Danelutto},
url = {https://dx.doi.org/10.1007/978-3-540-72586-2_86},
doi = {10.1007/978-3-540-72586-2_86},
year = {2007},
date = {2007-05-01},
booktitle = {Proc. of Practical Aspects of High-Level Parallel Programming Workshop (PAPP, co-located with ICCS 2007)},
volume = {4488},
pages = {585--592},
publisher = {Springer},
address = {Beijing, China},
series = {LNCS},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Sonia Campa, Marco Danelutto, Peter Kilpatrick, Patrizio Dazzi, Domenico Laforenza, Nicola Tonellotto
Behavioural skeletons for component autonomic management on grids Technical Report
Università di Pisa, Dipartimento di Informatica no. TR-07-12, 2007.
@techreport{beske:TR-07-12,
  author      = {Marco Aldinucci and Sonia Campa and Marco Danelutto and Peter Kilpatrick and Patrizio Dazzi and Domenico Laforenza and Nicola Tonellotto},
  title       = {Behavioural skeletons for component autonomic management on grids},
  institution = {Università di Pisa, Dipartimento di Informatica},
  number      = {TR-07-12},
  year        = {2007},
  date        = {2007-05-01},
  doi         = {10.1007/978-0-387-78448-9_1},
  url         = {http://compass2.di.unipi.it/TR/Files/TR-07-12.pdf.gz},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Orc + metadata supporting grid programming Technical Report
Università di Pisa, Dipartimento di Informatica no. TR-07-10, 2007.
@techreport{orcmetadata:TR-07-10,
  author      = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
  title       = {Orc + metadata supporting grid programming},
  institution = {Università di Pisa, Dipartimento di Informatica},
  number      = {TR-07-10},
  year        = {2007},
  date        = {2007-05-01},
  url         = {http://compass2.di.unipi.it/TR/Files/TR-07-10.pdf.gz},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Peter Kilpatrick, Marco Danelutto, Marco Aldinucci
Deriving Grid Applications from Abstract Models Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0085, 2007.
@techreport{coregrid:tr0085,
  author      = {Peter Kilpatrick and Marco Danelutto and Marco Aldinucci},
  title       = {Deriving Grid Applications from Abstract Models},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  number      = {TR-0085},
  year        = {2007},
  date        = {2007-04-01},
  url         = {http://www.coregrid.net/mambo/images/stories/TechnicalReports/tr-0085.pdf},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Marco Aldinucci, Marco Danelutto, Peter Kilpatrick
Management in distributed systems: a semi-formal approach Technical Report
Università di Pisa, Dipartimento di Informatica no. TR-07-05, 2007.
@techreport{orc_muskel:TR-07-05,
  author      = {Marco Aldinucci and Marco Danelutto and Peter Kilpatrick},
  title       = {Management in distributed systems: a semi-formal approach},
  institution = {Università di Pisa, Dipartimento di Informatica},
  number      = {TR-07-05},
  year        = {2007},
  date        = {2007-02-01},
  doi         = {10.1007/978-3-540-74466-5_69},
  url         = {http://compass2.di.unipi.it/TR/Files/TR-07-05.pdf.gz},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Marco Aldinucci, Marco Danelutto
The cost of security in skeletal systems Proceedings Article
In: D'Ambra, Pasqua, Guarracino, Mario Rosario (Ed.): Proc. of Intl. Euromicro PDP 2007: Parallel Distributed and network-based Processing, pp. 213–220, IEEE, Napoli, Italia, 2007.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{security:euromicro:07,
title = {The cost of security in skeletal systems},
author = {Marco Aldinucci and Marco Danelutto},
editor = {Pasqua D'Ambra and Mario Rosario Guarracino},
url = {http://calvados.di.unipi.it/storage/paper_files/2007_security_PDP.pdf},
doi = {10.1109/PDP.2007.79},
year = {2007},
date = {2007-02-01},
booktitle = {Proc. of Intl. Euromicro PDP 2007: Parallel Distributed and network-based Processing},
pages = {213--220},
publisher = {IEEE},
address = {Napoli, Italia},
abstract = {Skeletal systems exploit algorithmical skeletons technology to provide the user very high level, efficient parallel programming environments. They have been recently demonstrated to be suitable for highly distributed architectures, such as workstation clusters, networks and grids. However, when using skeletal system for grid programming care must be taken to secure data and code transfers across non-dedicated, non-secure network links. In this work we take into account the cost of security introduction in muskel, a Java based skeletal system exploiting macro data flow implementation technology. We consider the adoption of mechanisms that allow securing all the communications taking place between remote, unreliable nodes and we evaluate the cost of such mechanisms. In particular, we consider the implications on the computational grains needed to scale secure and insecure skeletal computations.},
keywords = {grid},
pubstate = {published},
tppubtype = {inproceedings}
}
Nicola Tonellotto, Domenico Laforenza, Marco Danelutto, Marco Vanneschi, Corrado Zoccolo
A Performance Model for Stream-Based Computations Proceedings Article
In: D'Ambra, Pasqua, Guarracino, Mario Rosario (Ed.): Proc. of Intl. Euromicro PDP 2007: Parallel Distributed and network-based Processing, pp. 91–96, IEEE, Napoli, Italia, 2007.
BibTeX | Tags:
@inproceedings{zoccolo:streammodel:euromicro:07,
title = {A Performance Model for Stream-Based Computations},
author = {Nicola Tonellotto and Domenico Laforenza and Marco Danelutto and Marco Vanneschi and Corrado Zoccolo},
editor = {Pasqua D'Ambra and Mario Rosario Guarracino},
year = {2007},
date = {2007-02-01},
booktitle = {Proc. of Intl. Euromicro PDP 2007: Parallel Distributed and network-based Processing},
pages = {91--96},
publisher = {IEEE},
address = {Napoli, Italia},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Sonia Campa, Massimo Coppola, Marco Danelutto, Corrado Zoccolo, Francoise André, Jérémy Buisson
An abstract schema modeling adaptivity management Book Section
In: Gorlatch, Sergei, Danelutto, Marco (Ed.): Integrated Research in Grid Computing, pp. 89–102, Springer, 2007, ISBN: 978-0-387-47656-8.
Abstract | Links | BibTeX | Tags: grid
@incollection{adapt_rennes:IW_book:06,
title = {An abstract schema modeling adaptivity management},
author = {Marco Aldinucci and Sonia Campa and Massimo Coppola and Marco Danelutto and Corrado Zoccolo and Francoise André and Jérémy Buisson},
editor = {Sergei Gorlatch and Marco Danelutto},
url = {http://calvados.di.unipi.it/storage/paper_files/2006_IW_book_adapt.pdf},
doi = {10.1007/978-0-387-47658-2_7},
isbn = {978-0-387-47656-8},
year = {2007},
date = {2007-01-01},
booktitle = {Integrated Research in Grid Computing},
pages = {89--102},
publisher = {Springer},
series = {CoreGRID},
abstract = {Nowadays, component application adaptivity in Grid environments has been afforded in different ways, such those provided by the Dynaco/AFPAC framework and by the ASSIST environment. We propose an abstract schema that catches all the designing aspects a model for parallel component applications on Grid should define in order to uniformly handle the dynamic behavior of computing resources within complex parallel applications. The abstraction is validated by demonstrating how two different approaches to adaptivity, ASSIST and Dynaco/AFPAC, easily map to such schema.},
keywords = {grid},
pubstate = {published},
tppubtype = {incollection}
}
Marco Aldinucci, Anne Benoit
Towards the Automatic Mapping of ASSIST Applications for the Grid Book Section
In: Gorlatch, Sergei, Danelutto, Marco (Ed.): Integrated Research in Grid Computing, pp. 73–87, Springer, 2007, ISBN: 978-0-387-47656-8.
Abstract | Links | BibTeX | Tags: parallel
@incollection{assist:pepa:IW_book:06,
title = {Towards the Automatic Mapping of ASSIST Applications for the Grid},
author = {Marco Aldinucci and Anne Benoit},
editor = {Sergei Gorlatch and Marco Danelutto},
url = {http://calvados.di.unipi.it/storage/paper_files/2006_IW_book_pepa.pdf},
doi = {10.1007/978-0-387-47658-2_6},
isbn = {978-0-387-47656-8},
year = {2007},
date = {2007-01-01},
booktitle = {Integrated Research in Grid Computing},
pages = {73--87},
publisher = {Springer},
series = {CoreGRID},
abstract = {One of the most promising technical innovations in present-day computing is the invention of grid technologies which harness the computational power of widely distributed collections of computers. However, the programming and optimisation burden of a low level approach to grid computing is clearly unacceptable for large scale, complex applications. The development of grid applications can be simplified by using high-level programming environments. In the present work, we address the problem of the mapping of a high-level grid application onto the computational resources. In order to optimise the mapping of the application, we propose to automatically generate performance models from the application using the process algebra PEPA. We target in this work applications written with the high-level environment ASSIST, since the use of such a structured environment allows us to automate the study of the application more effectively.},
keywords = {parallel},
pubstate = {published},
tppubtype = {incollection}
}
Jan Dünnweber, Sergei Gorlatch, Sonia Campa, Marco Aldinucci, Marco Danelutto
Adaptable Parallel Components for Grid Programming Book Section
In: Gorlatch, Sergei, Danelutto, Marco (Ed.): Integrated Research in Grid Computing, pp. 43–57, Springer, 2007, ISBN: 978-0-387-47656-8.
Abstract | Links | BibTeX | Tags: grid
@incollection{codeadapt:IW_book:06,
title = {Adaptable Parallel Components for Grid Programming},
author = {Jan Dünnweber and Sergei Gorlatch and Sonia Campa and Marco Aldinucci and Marco Danelutto},
editor = {Sergei Gorlatch and Marco Danelutto},
url = {http://calvados.di.unipi.it/storage/paper_files/2006_IW_book_muester.pdf},
doi = {10.1007/978-0-387-47658-2_4},
isbn = {978-0-387-47656-8},
year = {2007},
date = {2007-01-01},
booktitle = {Integrated Research in Grid Computing},
pages = {43--57},
publisher = {Springer},
series = {CoreGRID},
abstract = {We suggest that parallel software components used for grid computing should be adaptable to application-specific requirements, instead of developing new components from scratch for each particular application. As an example, we take a parallel farm component which is "embarrassingly parallel", i.e., free of dependencies, and adapt it to the wavefront processing pattern with dependencies that impact its behavior. We describe our approach in the context of Higher-Order Components (HOCs), with the Java-based system Lithium as our implementation framework. The adaptation process relies on HOCs' mobile code parameters that are shipped over the network of the grid. We describe our implementation of the proposed component adaptation method and report first experimental results for a particular grid application – the alignment of DNA sequence pairs, a popular, time-critical problem in computational molecular biology.},
keywords = {grid},
pubstate = {published},
tppubtype = {incollection}
}
Massimo Coppola, Marco Danelutto, Nicola Tonellotto, Marco Vanneschi, Corrado Zoccolo
Execution Support of High Performance Heterogeneous Component-Based Applications on the Grid Proceedings Article
In: Lehner, Wolfgang, Meyer, Norbert, Streit, Achim, Stewart, Craig (Ed.): Proc. of Euro-Par 2006 Workshops: Parallel Processing, CoreGRID 2006, UNICORE Summit 2006, Petascale Computational Biology and Bioinformatics, Dresden, Germany, August 29-September 1, 2006, Revised Selected Papers, pp. 171–185, Springer, 2007.
BibTeX | Tags:
@inproceedings{DBLP:conf/europar/CoppolaDTVZ06,
title = {Execution Support of High Performance Heterogeneous Component-Based Applications on the Grid},
author = {Massimo Coppola and Marco Danelutto and Nicola Tonellotto and Marco Vanneschi and Corrado Zoccolo},
editor = {Wolfgang Lehner and Norbert Meyer and Achim Streit and Craig Stewart},
year = {2007},
date = {2007-01-01},
booktitle = {Proc. of Euro-Par 2006 Workshops: Parallel Processing, CoreGRID 2006, UNICORE Summit 2006, Petascale Computational Biology and Bioinformatics, Dresden, Germany, August 29-September 1, 2006, Revised Selected Papers},
volume = {4375},
pages = {171--185},
publisher = {Springer},
series = {LNCS},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Vanneschi, Luca Veraldi
Dynamicity in distributed applications: issues, problems and the ASSIST approach Journal Article
In: Parallel Computing, vol. 33, no. 12, pp. 822–845, 2007, ISSN: 0167-8191.
@article{dyn:van:pc:07,
title = {Dynamicity in distributed applications: issues, problems and the ASSIST approach},
author = {Marco Vanneschi and Luca Veraldi},
url = {http://dx.doi.org/10.1016/j.parco.2007.08.001},
doi = {10.1016/j.parco.2007.08.001},
issn = {0167-8191},
year = {2007},
date = {2007-01-01},
journal = {Parallel Computing},
volume = {33},
number = {12},
pages = {822--845},
publisher = {Elsevier},
address = {Amsterdam, The Netherlands},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Marcelo Pasin, Pierre Kuonen, Marco Danelutto, Marco Aldinucci
Skeleton Parallel Programming and Parallel Objects Book Section
In: Gorlatch, Sergei, Danelutto, Marco (Ed.): Integrated Research in Grid Computing, pp. 59–71, Springer, 2007, ISBN: 978-0-387-47656-8.
Abstract | Links | BibTeX | Tags: parallel
@incollection{pasin:IW_book:06,
title = {Skeleton Parallel Programming and Parallel Objects},
author = {Marcelo Pasin and Pierre Kuonen and Marco Danelutto and Marco Aldinucci},
editor = {Sergei Gorlatch and Marco Danelutto},
url = {http://calvados.di.unipi.it/storage/paper_files/2006_IW_book_popc.pdf},
doi = {10.1007/978-0-387-47658-2_5},
isbn = {978-0-387-47656-8},
year = {2007},
date = {2007-01-01},
booktitle = {Integrated Research in Grid Computing},
pages = {59--71},
publisher = {Springer},
series = {CoreGRID},
abstract = {This paper describes the ongoing work aimed at integrating the POP-C++ parallel object programming environment with the ASSIST component based parallel programming environment. Both these programming environments are shortly outlined, then several possibilities of integration are considered. For each one of these integration opportunities, the advantages and synergies that can be possibly achieved are outlined and discussed. The text explains how GEA, the ASSIST deployer can be considered as the basis for the integration of such different systems. An architecture is proposed, extending the existing tools to work together. The current status of integration of the two environments is discussed, along with the expected results and fallouts on the two programming environments.},
keywords = {parallel},
pubstate = {published},
tppubtype = {incollection}
}
Marco Aldinucci, Massimo Torquati, Pierfrancesco Zuccato
Virtualinux website Technical Manual
2007, (http://virtualinux.sourceforge.net/).
BibTeX | Tags:
@manual{virtualinux-web,
title = {Virtualinux website},
author = {Marco Aldinucci and Massimo Torquati and Pierfrancesco Zuccato},
url = {http://virtualinux.sourceforge.net/},
year = {2007},
date = {2007-01-01},
keywords = {},
pubstate = {published},
tppubtype = {manual}
}
2006
Marco Aldinucci, Francoise André, Jérémy Buisson, Sonia Campa, Massimo Coppola, Marco Danelutto, Corrado Zoccolo
Parallel program/component adaptivity management Proceedings Article
In: Joubert, G. R., Nagel, W. E., Peters, F. J., Plata, O., Tirado, P., Zapata, E. (Ed.): Parallel Computing: Current & Future Issues of High-End Computing (Proc. of PARCO 2005, Malaga, Spain), pp. 89–96, John von Neumann Institute for Computing, Germany, 2006.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{adaptivity:parco:05,
title = {Parallel program/component adaptivity management},
author = {Marco Aldinucci and Francoise André and Jérémy Buisson and Sonia Campa and Massimo Coppola and Marco Danelutto and Corrado Zoccolo},
editor = {G. R. Joubert and W. E. Nagel and F. J. Peters and O. Plata and P. Tirado and E. Zapata},
url = {http://calvados.di.unipi.it/storage/paper_files/2005_adaptivity_parco.pdf},
year = {2006},
date = {2006-12-01},
booktitle = {Parallel Computing: Current \& Future Issues of High-End Computing (Proc. of PARCO 2005, Malaga, Spain)},
volume = {33},
pages = {89--96},
publisher = {John von Neumann Institute for Computing},
address = {Germany},
series = {NIC},
abstract = {Grid computing platforms require to handle dynamic behaviour of computing resources within complex parallel applications. We introduce a formalization of adaptive behaviour that separates the abstract model of the application from the implementation design. We exemplify the abstract adaptation schema on two applications, and we show how two quite different approaches to adaptivity, the ASSIST environment and the AFPAC framework, easily map to this common schema.},
keywords = {parallel},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Gianni Giaccherini, Massimo Torquati, Marco Vanneschi
Towards a distributed scalable data service for the grid Proceedings Article
In: Joubert, G. R., Nagel, W. E., Peters, F. J., Plata, O., Tirado, P., Zapata, E. (Ed.): Parallel Computing: Current & Future Issues of High-End Computing (Proc. of PARCO 2005, Malaga, Spain), pp. 73–80, John von Neumann Institute for Computing, Germany, 2006.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{adhoc:parco:05,
title = {Towards a distributed scalable data service for the grid},
author = {Marco Aldinucci and Marco Danelutto and Gianni Giaccherini and Massimo Torquati and Marco Vanneschi},
editor = {G. R. Joubert and W. E. Nagel and F. J. Peters and O. Plata and P. Tirado and E. Zapata},
url = {https://iris.unito.it/retrieve/handle/2318/60375/711125/2005_adhoc_parco.pdf},
year = {2006},
date = {2006-12-01},
booktitle = {Parallel Computing: Current \& Future Issues of High-End Computing (Proc. of PARCO 2005, Malaga, Spain)},
volume = {33},
pages = {73--80},
publisher = {John von Neumann Institute for Computing},
address = {Germany},
series = {NIC},
abstract = {ADHOC (Adaptive Distributed Herd of Object Caches) is a Grid-enabled, fast, scalable object repository providing programmers with a general storage module. We present three different software tools based on ADHOC: A parallel cache for Apache, a DSM, and a main memory parallel file system. We also show that these tools exhibit a considerable performance and speedup both in absolute figures and w.r.t. other software tools exploiting the same features.},
keywords = {parallel},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Andrea Paternesi, Roberto Ravazzolo, Marco Vanneschi
Building interoperable grid-aware ASSIST applications via WebServices Proceedings Article
In: Joubert, G. R., Nagel, W. E., Peters, F. J., Plata, O., Tirado, P., Zapata, E. (Ed.): Parallel Computing: Current & Future Issues of High-End Computing (Proc. of PARCO 2005, Malaga, Spain), pp. 145–152, John von Neumann Institute for Computing, Germany, 2006, ISBN: 3000173528.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{assist:webs:parco:05,
title = {Building interoperable grid-aware ASSIST applications via WebServices},
author = {Marco Aldinucci and Marco Danelutto and Andrea Paternesi and Roberto Ravazzolo and Marco Vanneschi},
editor = {G. R. Joubert and W. E. Nagel and F. J. Peters and O. Plata and P. Tirado and E. Zapata},
url = {http://calvados.di.unipi.it/storage/paper_files/2005_ws_parco.pdf},
isbn = {3000173528},
year = {2006},
date = {2006-12-01},
booktitle = {Parallel Computing: Current \& Future Issues of High-End Computing (Proc. of PARCO 2005, Malaga, Spain)},
volume = {33},
pages = {145--152},
publisher = {John von Neumann Institute for Computing},
address = {Germany},
series = {NIC},
abstract = {The ASSIST environment provides a high-level programming toolkit for the grid. ASSIST applications are described by means of a coordination language, which can express arbitrary graphs of modules. These modules (or a graph of them) may be enclosed in components specifically designed for the grid (GRID.it components). In this paper we describe how ASSIST modules can be wired through standard Web Services, and how GRID.it components may be made available as standard Web Services.},
keywords = {grid},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Gabriel Antoniu, Marco Danelutto, Mathieu Jan
Fault-Tolerant Data Sharing for High-level Grid Programming: A Hierarchical Storage Architecture Proceedings Article
In: Bubak, Marian, Gorlatch, Sergei, Priol, Thierry (Ed.): Proc. of the Integrated Research in Grid Computing Workshop, pp. 177–188, Academic Computing Centre CYFRONET AGH, Kraków, Poland, 2006.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{assist:juxmem:IW:06,
title = {Fault-Tolerant Data Sharing for High-level Grid Programming: A Hierarchical Storage Architecture},
author = {Marco Aldinucci and Gabriel Antoniu and Marco Danelutto and Mathieu Jan},
editor = {Marian Bubak and Sergei Gorlatch and Thierry Priol},
url = {http://calvados.di.unipi.it/storage/paper_files/2006_IW_juxadhocmem.pdf},
year = {2006},
date = {2006-10-01},
booktitle = {Proc. of the Integrated Research in Grid Computing Workshop},
pages = {177--188},
publisher = {Academic Computing Centre CYFRONET AGH},
address = {Kraków, Poland},
series = {CoreGRID},
abstract = {Enabling high-level programming models on grids is today a major challenge. A way to achieve this goal relies on the use of environments able to transparently and automatically provide adequate support for low-level, grid-specific issues (fault-tolerance, scalability, etc.). This paper discusses the above approach when applied to grid data management. As a case study, we propose a 2-tier software architecture that supports transparent, fault-tolerant, grid-level data sharing in the ASSIST programming environment (University of Pisa), based on the JuxMem grid data sharing service (INRIA Rennes).},
keywords = {grid},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Gabriel Antoniu, Marco Danelutto, Mathieu Jan
Fault-Tolerant Data Sharing for High-level Grid Programming: A Hierarchical Storage Architecture Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0058, 2006.
@techreport{coregrid:tr0058,
  author      = {Marco Aldinucci and Gabriel Antoniu and Marco Danelutto and Mathieu Jan},
  title       = {Fault-Tolerant Data Sharing for High-level Grid Programming: A Hierarchical Storage Architecture},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  number      = {TR-0058},
  year        = {2006},
  date        = {2006-08-01},
  url         = {http://www.coregrid.net/mambo/images/stories/TechnicalReports/tr-0058.pdf},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Marco Aldinucci, Carlo Bertolli, Sonia Campa, Massimo Coppola, Marco Vanneschi, Luca Veraldi, Corrado Zoccolo
Self-Configuring and Self-Optimising Grid Components in the GCM model and their ASSIST Implementation Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-06-13, 2006.
@techreport{self:tr:06-13,
  author      = {Marco Aldinucci and Carlo Bertolli and Sonia Campa and Massimo Coppola and Marco Vanneschi and Luca Veraldi and Corrado Zoccolo},
  title       = {Self-Configuring and Self-Optimising Grid Components in the GCM model and their ASSIST Implementation},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number      = {TR-06-13},
  year        = {2006},
  date        = {2006-08-01},
  url         = {http://compass2.di.unipi.it/TR/Files/TR-06-13.pdf.gz},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Marco Aldinucci, Carlo Bertolli, Sonia Campa, Massimo Coppola, Marco Vanneschi, Luca Veraldi, Corrado Zoccolo
Self-configuring and self-optimizing grid components in the GCM model and their ASSIST implementation Proceedings Article
In: Proc. of HPC-GECO/Compframe (held in conjunction with HPDC-15), pp. 45–52, IEEE, Paris, France, 2006.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{selfadapt:hpcgeco:06,
title = {Self-configuring and self-optimizing grid components in the GCM model and their ASSIST implementation},
author = {Marco Aldinucci and Carlo Bertolli and Sonia Campa and Massimo Coppola and Marco Vanneschi and Luca Veraldi and Corrado Zoccolo},
url = {http://calvados.di.unipi.it/storage/paper_files/2006_self_HPC-GECO.pdf},
year = {2006},
date = {2006-06-01},
booktitle = {Proc. of HPC-GECO/Compframe (held in conjunction with HPDC-15)},
pages = {45--52},
publisher = {IEEE},
address = {Paris, France},
abstract = {We present the concept of autonomic super-component as a building block for Grid-aware applications. Super-components are parametric, higher-order components exhibiting a well-known parallel behaviour. The proposal of a super-component feature is part of the experience we gained in the implementation of the ASSIST environment, which allows the development of self-configuring and optimising component-based applications following a structured and hierarchical approach. We discuss how such approach to Grid programming influenced the design of the Grid Component Model (GCM).},
keywords = {grid},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Marco Vanneschi
Autonomic QoS in ASSIST Grid-aware components Proceedings Article
In: Proc. of Intl. Euromicro PDP 2006: Parallel Distributed and network-based Processing, pp. 221–230, IEEE, Montbéliard, France, 2006.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{assist:qos:euromicro:06,
title = {Autonomic QoS in ASSIST Grid-aware components},
author = {Marco Aldinucci and Marco Danelutto and Marco Vanneschi},
url = {http://calvados.di.unipi.it/storage/paper_files/2006_QoS_PDP.pdf},
doi = {10.1109/PDP.2006.25},
year = {2006},
date = {2006-02-01},
booktitle = {Proc. of Intl. Euromicro PDP 2006: Parallel Distributed and network-based Processing},
pages = {221--230},
publisher = {IEEE},
address = {Montbéliard, France},
abstract = {Current Grid-aware applications are developed on existing software infrastructures, such as Globus, by developers who are experts on Grid software implementation. Although many useful applications have been produced this way, this approach may hardly support the additional complexity to Quality of Service (QoS) control in real application. We describe the ASSIST programming environment, the prototype of parallel programming environment currently under development at our group, as a suitable basis to capture all the desired features for QoS control for the Grid. Grid applications, built as compositions of ASSIST components, are supported by an innovative Grid Abstract Machine, which includes essential abstractions of standard middleware services and a hierarchical Application Manager, which may be considered as an early prototype of Autonomic Manager.},
keywords = {grid},
pubstate = {published},
tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto
The cost of security in skeletal systems Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-06-03, 2006.
@techreport{self:tr:06-03,
  author = {Marco Aldinucci and Marco Danelutto},
  title = {The cost of security in skeletal systems},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number = {TR-06-03},
  year = {2006},
  date = {2006-02-01},
  url = {http://compass2.di.unipi.it/TR/Files/TR-06-03.pdf.gz},
  keywords = {},
  pubstate = {published},
  tppubtype = {techreport},
}
Marco Aldinucci, Marco Danelutto
Algorithmic skeletons meeting grids Journal Article
In: Parallel Computing, vol. 32, no. 7, pp. 449–462, 2006.
Abstract | Links | BibTeX | Tags: parallel
@article{advske:pc:06,
  title = {Algorithmic skeletons meeting grids},
  author = {Marco Aldinucci and Marco Danelutto},
  url = {http://calvados.di.unipi.it/storage/paper_files/2006_advske_PC.pdf},
  doi = {10.1016/j.parco.2006.04.001},
  year = {2006},
  date = {2006-01-01},
  journal = {Parallel Computing},
  volume = {32},
  number = {7},
  pages = {449--462},
  abstract = {In this work, we discuss an extension of the set of principles that should guide the future design and development of skeletal programming systems, as defined by Cole in his ``pragmatic manifesto'' paper. The three further principles introduced are related to the ability to exploit existing sequential code as well as to the ability to target typical modern architectures, those made out of heterogeneous processing elements with dynamically varying availability, processing power and connectivity features such as grids or heterogeneous, non-dedicated clusters. We outline two skeleton based programming environments currently developed at our university and we discuss how these environments adhere to the proposed set of principles. Eventually, we outline how some other relevant, well-known skeleton environments conform to the same set of principles.},
  keywords = {parallel},
  pubstate = {published},
  tppubtype = {article}
}
Marco Aldinucci, Massimo Coppola, Marco Danelutto, Nicola Tonellotto, Marco Vanneschi, Corrado Zoccolo
High level grid programming with ASSIST Journal Article
In: Computational Methods in Science and Technology, vol. 12, no. 1, pp. 21–32, 2006.
Abstract | Links | BibTeX | Tags: parallel
@article{assist:CMST:06,
  title = {High level grid programming with ASSIST},
  author = {Marco Aldinucci and Massimo Coppola and Marco Danelutto and Nicola Tonellotto and Marco Vanneschi and Corrado Zoccolo},
  url = {http://calvados.di.unipi.it/storage/paper_files/2006_assist_j_cmst.pdf},
  year = {2006},
  date = {2006-01-01},
  journal = {Computational Methods in Science and Technology},
  volume = {12},
  number = {1},
  pages = {21--32},
  abstract = {The development of efficient Grid applications usually requires writing huge portions of code directly at the level of abstraction provided by the underlying Grid middleware. In this work we discuss an alternative approach, raising the level of abstraction used when programming Grid applications. Our approach requires programmers just to describe in a qualitative way the kind of parallelism they want to express. Then, compiler tools, loader tools and run time system take complete care of running the application on a Grid target architecture. This allows to move most of the cumbersome tasks related to Grid targeting and management from programmer responsibility to tools. This paper introduces the structured parallel programming environment ASSIST, whose design is aimed at raising the level of abstraction in Grid programming and discusses how it can support transparent Grid programming while implementing Grid adaptivity.},
  keywords = {parallel},
  pubstate = {published},
  tppubtype = {article}
}
Marco Aldinucci, Massimo Coppola, Marco Danelutto, Marco Vanneschi, Corrado Zoccolo
ASSIST as a research framework for high-performance Grid programming environments Book Section
In: Cunha, J. C., Rana, O. F. (Ed.): Grid Computing: Software environments and Tools, pp. 230–256, Springer, 2006, ISBN: 978-1-85233-998-2.
Abstract | Links | BibTeX | Tags: grid
@incollection{assist:cunhabook:05,
  title = {ASSIST as a research framework for high-performance Grid programming environments},
  author = {Marco Aldinucci and Massimo Coppola and Marco Danelutto and Marco Vanneschi and Corrado Zoccolo},
  editor = {J. C. Cunha and O. F. Rana},
  url = {http://calvados.di.unipi.it/storage/paper_files/2005_assist_CuhnaBook.pdf},
  doi = {10.1007/1-84628-339-6_10},
  isbn = {978-1-85233-998-2},
  year = {2006},
  date = {2006-01-01},
  booktitle = {Grid Computing: Software environments and Tools},
  pages = {230--256},
  publisher = {Springer},
  chapter = {10},
  abstract = {ASSIST is a programming environment supporting the development of parallel and distributed high-performance applications on a wide range of target architectures including massively parallel clusters/networks of workstations and Grids. We discuss how ASSIST can act as a valid research vehicle to study, experiment and realize Grid-aware programming environments for high-performance applications. Special emphasis is put on the innovative methodologies, strategies and tools for dynamically adaptive applications that represent the necessary step for the success of Grid platforms. We start considering which are the fundamental features of Grid-aware programming environments, based upon structured parallel programming and components technology. Then we show how ASSIST evolved from its very first version, only targeting workstation clusters, to the current version, targeting Grids and solving many critical problems related to expressive power, flexibility, interoperability and efficiency. We also discuss how ASSIST deals with interoperability issues. Eventually we discuss how an ASSIST-based model for supporting dynamically adaptive applications can be derived.},
  keywords = {grid},
  pubstate = {published},
  tppubtype = {incollection}
}
Marco Aldinucci, Massimo Coppola, Sonia Campa, Marco Danelutto, Marco Vanneschi, Corrado Zoccolo
Structured implementation of component based grid programming environments Book Section
In: Getov, Vladimir, Laforenza, Domenico, Reinefeld, Alexander (Ed.): Future Generation Grids, pp. 217–239, Springer, 2006, ISBN: 978-0-387-27935-0.
Abstract | Links | BibTeX | Tags: grid
@incollection{assist:dagstuhl:05,
  title = {Structured implementation of component based grid programming environments},
  author = {Marco Aldinucci and Massimo Coppola and Sonia Campa and Marco Danelutto and Marco Vanneschi and Corrado Zoccolo},
  editor = {Vladimir Getov and Domenico Laforenza and Alexander Reinefeld},
  url = {http://calvados.di.unipi.it/storage/paper_files/2005_assist_Dagstuhl.pdf},
  doi = {10.1007/978-0-387-29445-2_12},
  isbn = {978-0-387-27935-0},
  year = {2006},
  date = {2006-01-01},
  booktitle = {Future Generation Grids},
  pages = {217--239},
  publisher = {Springer},
  series = {CoreGRID},
  abstract = {The design, implementation and deployment of efficient high performance applications on Grids is usually a quite hard task, even in the case that modern and efficient grid middleware systems are used. We claim that most of the difficulties involved in such process can be moved away from programmer responsibility by following a structured programming model approach. The proposed approach relies on the development of a layered, component based execution environment. Each layer deals with distinct features and problems related to the implementation of GRID applications, exploiting the more appropriate techniques. Static optimizations are introduced in the compile layer, dynamic optimization are introduced in the run time layer, whereas modern grid middleware features are simply exploited using standard middleware systems as the final target architecture. We first discuss the general idea, then we discuss the peculiarities of the approach and eventually we discuss the preliminary results achieved in the GRID.it project, where a prototype high performance, component based, GRID programming environment is being developed using this approach.},
  keywords = {grid},
  pubstate = {published},
  tppubtype = {incollection}
}
2005
Marco Aldinucci, Marco Danelutto, Andrea Paternesi, Roberto Ravazzolo, Marco Vanneschi
Building Interoperable Grid-aware ASSIST Applications via Web Services Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-05-24, 2005.
Abstract | Links | BibTeX | Tags:
@techreport{assist:webs:tr-05-24,
  author = {Marco Aldinucci and Marco Danelutto and Andrea Paternesi and Roberto Ravazzolo and Marco Vanneschi},
  title = {Building Interoperable Grid-aware ASSIST Applications via Web Services},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number = {TR-05-24},
  year = {2005},
  date = {2005-12-01},
  url = {http://compass2.di.unipi.it/TR/Files/TR-05-24.pdf.gz},
  abstract = {The ASSIST environment provides a high-level programming toolkit for the grid. ASSIST applications are described by means of a coordination language, which can express arbitrary graphs of modules. These modules (or a graph of them) may be enclosed in components specifically designed for the grid (GRID.it components). In this paper we describe how ASSIST modules can be wired through standard Web Services, and how GRID.it components may be made available as standard Web Services.},
  keywords = {},
  pubstate = {published},
  tppubtype = {techreport},
}
Marco Aldinucci, Francoise André, Jérémy Buisson, Sonia Campa, Massimo Coppola, Marco Danelutto, Corrado Zoccolo
Parallel program/component adaptivity management Proceedings Article
In: Gorlatch, Sergei, Danelutto, Marco (Ed.): Proc. of the Integrated Research in Grid Computing Workshop, pp. 95–104, Università di Pisa, Dipartimento di Informatica, Pisa, Italy, 2005.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{adaptivity:IW:05,
  title = {Parallel program/component adaptivity management},
  author = {Marco Aldinucci and Francoise André and Jérémy Buisson and Sonia Campa and Massimo Coppola and Marco Danelutto and Corrado Zoccolo},
  editor = {Sergei Gorlatch and Marco Danelutto},
  url = {http://calvados.di.unipi.it/storage/paper_files/2006_IW_adapt.pdf},
  year = {2005},
  date = {2005-11-01},
  booktitle = {Proc. of the Integrated Research in Grid Computing Workshop},
  volume = {TR-05-22},
  pages = {95--104},
  publisher = {Università di Pisa, Dipartimento di Informatica},
  address = {Pisa, Italy},
  abstract = {Grid computing platforms require to handle dynamic behaviour of computing resources within complex parallel applications. We introduce a formalization of adaptive behaviour that separates the abstract model of the application from the implementation design. We exemplify the abstract adaptation schema on two applications, and we show how two quite different approaches to adaptivity, the ASSIST environment and the AFPAC framework, easily map to this common schema.},
  keywords = {parallel},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Anne Benoit
Towards the Automatic Mapping of ASSIST Applications for the Grid Proceedings Article
In: Gorlatch, Sergei, Danelutto, Marco (Ed.): Proc. of the Integrated Research in Grid Computing Workshop, pp. 59–68, Università di Pisa, Dipartimento di Informatica, Pisa, Italy, 2005.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{assist:pepa:IW:05,
  title = {Towards the Automatic Mapping of ASSIST Applications for the Grid},
  author = {Marco Aldinucci and Anne Benoit},
  editor = {Sergei Gorlatch and Marco Danelutto},
  url = {http://calvados.di.unipi.it/storage/paper_files/2006_IW_pepa.pdf},
  year = {2005},
  date = {2005-11-01},
  booktitle = {Proc. of the Integrated Research in Grid Computing Workshop},
  volume = {TR-05-22},
  pages = {59--68},
  publisher = {Università di Pisa, Dipartimento di Informatica},
  address = {Pisa, Italy},
  abstract = {One of the most promising technical innovations in present day computing is the invention of grid technologies which harness the computational power of widely distributed collections of computers. However, the programming and optimisation burden of a low level approach to grid computing is clearly unacceptable for large scale, complex applications. The development of grid applications can be simplified by using high-level programming environments. In the present work, we address the problem of the mapping of a high-level grid application onto the computational resources. In order to optimise the mapping of the application, we propose to automatically generate performance models from the application using the process algebra PEPA. We target in this work applications written with the high-level environment ASSIST, since the use of such a structured environment allows us to automate the study of the application more effectively.},
  keywords = {grid},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Jan Dünnweber, Sergei Gorlatch, Sonia Campa, Marco Aldinucci, Marco Danelutto
Using Code Parameters for Component Adaptations Proceedings Article
In: Gorlatch, Sergei, Danelutto, Marco (Ed.): Proc. of the Integrated Research in Grid Computing Workshop, pp. 49–57, Università di Pisa, Dipartimento di Informatica, Pisa, Italy, 2005.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{codeadapt:IW:05,
  title = {Using Code Parameters for Component Adaptations},
  author = {Jan Dünnweber and Sergei Gorlatch and Sonia Campa and Marco Aldinucci and Marco Danelutto},
  editor = {Sergei Gorlatch and Marco Danelutto},
  url = {http://calvados.di.unipi.it/storage/paper_files/2006_IW_muenster.pdf},
  year = {2005},
  date = {2005-11-01},
  booktitle = {Proc. of the Integrated Research in Grid Computing Workshop},
  volume = {TR-05-22},
  pages = {49--57},
  publisher = {Università di Pisa, Dipartimento di Informatica},
  address = {Pisa, Italy},
  abstract = {Adaptation means that the behavior of a software component is adjusted to application or platform-specific requirements: new components required in a particular application do not need to be developed from scratch when available components can be adapted accordingly. Instead of introducing a new adaptation syntax (as it is done, e.g., in AOP), we describe adaptations in the context of Java-based Higher-Order Components (HOCs). HOCs incorporate a code parameter plugin mechanism enabling adaptations on the grid. Our approach is illustrated using a case study of sequence alignment. We show how a HOC with the required provisions for data dependencies in this application can be generated by adapting a farm component, which is "embarrassingly parallel", i.e., free of data dependencies. This way, we could reuse the efficient farm implementation from the Lithium library, although our case study exhibits the wavefront pattern of parallelism which is different from the farm.},
  keywords = {grid},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Marcelo Pasin, Pierre Kuonen, Marco Danelutto, Marco Aldinucci
Skeleton Parallel Programming and Parallel Objects Proceedings Article
In: Gorlatch, Sergei, Danelutto, Marco (Ed.): Proc. of the Integrated Research in Grid Computing Workshop, pp. 115–124, Università di Pisa, Dipartimento di Informatica, Pisa, Italy, 2005.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{pasin:IW:05,
  title = {Skeleton Parallel Programming and Parallel Objects},
  author = {Marcelo Pasin and Pierre Kuonen and Marco Danelutto and Marco Aldinucci},
  editor = {Sergei Gorlatch and Marco Danelutto},
  url = {http://calvados.di.unipi.it/storage/paper_files/2006_IW_popc.pdf},
  year = {2005},
  date = {2005-11-01},
  booktitle = {Proc. of the Integrated Research in Grid Computing Workshop},
  volume = {TR-05-22},
  pages = {115--124},
  publisher = {Università di Pisa, Dipartimento di Informatica},
  address = {Pisa, Italy},
  abstract = {We describe here the ongoing work aimed at integrating the POP-C++ parallel object programming environment with the ASSIST component based parallel programming environment. Both these programming environments are shortly outlined, first. Then several possibilities of integration are considered. For each one of these integration opportunities, the advantages and synergies that can be possibly achieved are outlined and discussed. Eventually, the current status of integration of the two environments is discussed, along with the expected results and fallouts on the two programming environments.},
  keywords = {grid},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Gianni Giaccherini, Massimo Torquati, Marco Vanneschi
Towards a distributed scalable data service for the Grid Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-05-21, 2005.
@techreport{adhoc:tr-05-21,
  author = {Marco Aldinucci and Marco Danelutto and Gianni Giaccherini and Massimo Torquati and Marco Vanneschi},
  title = {Towards a distributed scalable data service for the Grid},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number = {TR-05-21},
  year = {2005},
  date = {2005-10-01},
  url = {http://compass2.di.unipi.it/TR/Files/TR-05-21.pdf.gz},
  keywords = {},
  pubstate = {published},
  tppubtype = {techreport},
}
Marco Aldinucci, Anne Benoit
Automatic mapping of ASSIST applications using process algebra Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0016, 2005.
@techreport{coregrid:tr0016,
  author = {Marco Aldinucci and Anne Benoit},
  title = {Automatic mapping of ASSIST applications using process algebra},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  number = {TR-0016},
  year = {2005},
  date = {2005-10-01},
  url = {http://www.coregrid.net/mambo/images/stories/TechnicalReports/tr-0016.pdf},
  doi = {10.1142/S0129626408003302},
  keywords = {},
  pubstate = {published},
  tppubtype = {techreport},
}
Marco Aldinucci, Marco Vanneschi, Matteo Villa
Grid technologies and c-business for SMEs Proceedings Article
In: Cunningham, P., Cunningham, M. (Ed.): Innovation and the Knowledge Economy: Issues, Applications, Case Studies (Proc. of Intl. conference eChallenges 2005), IOS press, Amsterdam, The Netherlands, 2005.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{sfida:echallenges:05,
  title = {Grid technologies and c-business for SMEs},
  author = {Marco Aldinucci and Marco Vanneschi and Matteo Villa},
  editor = {P. Cunningham and M. Cunningham},
  url = {http://calvados.di.unipi.it/storage/paper_files/2005_SFIDA_echallenges.pdf},
  year = {2005},
  date = {2005-10-01},
  booktitle = {Innovation and the Knowledge Economy: Issues, Applications, Case Studies (Proc. of Intl. conference eChallenges 2005)},
  volume = {2},
  publisher = {IOS press},
  address = {Amsterdam, The Netherlands},
  series = {Information and Communication Technologies and the Knowledge Economy},
  abstract = {We describe the objectives of project SFIDA, aiming at developing a Grid-based interoperable platform able to support next generation applications specifically addressing the needs of SMEs. We sketch the architecture of the platform under development in SFIDA, which will support componentization (e-services), intelligence (mining), collaboration (c-business), and customer business-processes orientation concepts on top of ASSIST, a Grid-aware high-level programming environment. The SFIDA project outcomes will be validated on Supply Chain Management applications matching various typical industrial cases, spanning from automotive, textile, food, white goods, and media retail. Finally we show what business benefits it is expected to bring.},
  keywords = {grid},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Jan Dünnweber, Sergei Gorlatch
Optimization techniques for skeletons on grids Book Section
In: Grandinetti, L. (Ed.): Grid Computing and New Frontiers of High Performance Processing, vol. 14, pp. 255–273, Elsevier, 2005, ISSN: 09275452.
Abstract | Links | BibTeX | Tags: parallel
@incollection{vigoni:fut_rmi:book:05,
  title = {Optimization techniques for skeletons on grids},
  author = {Marco Aldinucci and Marco Danelutto and Jan Dünnweber and Sergei Gorlatch},
  editor = {L. Grandinetti},
  url = {http://calvados.di.unipi.it/storage/paper_files/2005_LithiumFutRMI_book.pdf},
  doi = {10.1016/S0927-5452(05)80014-0},
  issn = {0927-5452},
  year = {2005},
  date = {2005-10-01},
  booktitle = {Grid Computing and New Frontiers of High Performance Processing},
  volume = {14},
  pages = {255--273},
  publisher = {Elsevier},
  chapter = {2},
  series = {Advances in Parallel Computing},
  abstract = {Skeletons are common patterns of parallelism, such as farm and pipeline, that can be abstracted and offered to the application programmer as programming primitives. We describe the use and implementation of skeletons on emerging computational grids, with the skeleton system Lithium, based on Java and RMI, as our reference programming system. Our main contribution is the exploration of optimization techniques for implementing skeletons on grids based on an optimized, future-based RMI mechanism, which we integrate into the macro-dataflow evaluation mechanism of Lithium. We discuss three optimizations: 1) a lookahead mechanism that allows to process multiple tasks concurrently at each grid server and thereby increases the overall degree of parallelism, 2) a lazy taskbinding technique that reduces interactions between grid servers and the task dispatcher, and 3) dynamic improvements that optimize the collecting of results and the work-load balancing. We report experimental results that demonstrate the improvements due to our optimizations on various testbeds, including a heterogeneous grid-like environment.},
  keywords = {parallel},
  pubstate = {published},
  tppubtype = {incollection}
}
Marco Aldinucci, Francoise André, Jérémy Buisson, Sonia Campa, Massimo Coppola, Marco Danelutto, Corrado Zoccolo
Parallel program/component adaptivity management Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0014, 2005.
@techreport{coregrid:tr0014,
  author = {Marco Aldinucci and Francoise André and Jérémy Buisson and Sonia Campa and Massimo Coppola and Marco Danelutto and Corrado Zoccolo},
  title = {Parallel program/component adaptivity management},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  number = {TR-0014},
  year = {2005},
  date = {2005-09-01},
  url = {http://www.coregrid.net/mambo/images/stories/TechnicalReports/tr-0014.pdf},
  keywords = {},
  pubstate = {published},
  tppubtype = {techreport},
}
Marco Aldinucci, Alessandro Petrocelli, Edoardo Pistoletti, Massimo Torquati, Marco Vanneschi, Luca Veraldi, Corrado Zoccolo
Dynamic reconfiguration of grid-aware applications in ASSIST Proceedings Article
In: Cunha, J. C., Medeiros, P. D. (Ed.): Proc. of 11th Intl. Euro-Par 2005 Parallel Processing, pp. 771–781, Springer, 2005.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{dyn:europar:05,
  title = {Dynamic reconfiguration of grid-aware applications in ASSIST},
  author = {Marco Aldinucci and Alessandro Petrocelli and Edoardo Pistoletti and Massimo Torquati and Marco Vanneschi and Luca Veraldi and Corrado Zoccolo},
  editor = {J. C. Cunha and P. D. Medeiros},
  url = {http://calvados.di.unipi.it/storage/paper_files/2005_assist_dyn_europar.pdf},
  doi = {10.1007/11549468_84},
  year = {2005},
  date = {2005-08-01},
  booktitle = {Proc. of 11th Intl. Euro-Par 2005 Parallel Processing},
  volume = {3648},
  pages = {771--781},
  publisher = {Springer},
  series = {LNCS},
  abstract = {Current grid-aware applications are implemented on top of low-level libraries by developers who are experts on grid middleware architecture. This approach can hardly support the additional complexity of QoS control in real applications. We discuss a novel approach used in the ASSIST programming environment to implement/guarantee user provided QoS contracts in a transparent and effective way. Our approach is based on the implementation of automatic run-time reconfiguration of ASSIST application executions triggered by mismatch between the user provided QoS contract and the actual performance values achieved.},
  keywords = {grid},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Anne Benoit
Automatic mapping of ASSIST applications using process algebra Proceedings Article
In: Proc. of HLPP2005: Intl. Workshop on High-Level Parallel Programming, Warwick University, Coventry, UK, 2005.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{pepa_assist:hlpp:05,
  title = {Automatic mapping of ASSIST applications using process algebra},
  author = {Marco Aldinucci and Anne Benoit},
  url = {http://calvados.di.unipi.it/storage/paper_files/2005_pepa_hlpp.pdf},
  doi = {10.1142/S0129626408003302},
  year = {2005},
  date = {2005-07-01},
  booktitle = {Proc. of HLPP2005: Intl. Workshop on High-Level Parallel Programming},
  address = {Warwick University, Coventry, UK},
  abstract = {One of the most promising technical innovations in present-day computing is the invention of grid technologies which harness the computational power of widely distributed collections of computers. However, the programming and optimisation burden of a low level approach to grid computing is clearly unacceptable for large scale, complex applications. The development of grid applications can be simplified by using high-level programming environments. In the present work, we address the problem of the mapping of a high-level grid application onto the computational resources. In order to optimise the mapping of the application, we propose to automatically generate performance models from the application using the process algebra PEPA. We target applications written with the high-level environment ASSIST, since the use of such a structured environment allows us to automate the study of the application more effectively. Our methodology is presented through an example of a classical Divide\&Conquer algorithm, together with results which demonstrate the efficiency of this approach.},
  keywords = {grid},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Jan Dünnweber, Sergei Gorlatch, Sonia Campa, Marco Aldinucci, Marco Danelutto
Behavior Customization of Parallel Components Application Programming Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0002, 2005.
@techreport{coregrid:tr0002,
  author = {Jan Dünnweber and Sergei Gorlatch and Sonia Campa and Marco Aldinucci and Marco Danelutto},
  title = {Behavior Customization of Parallel Components Application Programming},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  number = {TR-0002},
  year = {2005},
  date = {2005-04-01},
  url = {http://www.coregrid.net/mambo/images/stories/TechnicalReports/tr-0002.pdf},
  keywords = {},
  pubstate = {published},
  tppubtype = {techreport},
}
Marco Aldinucci, Alessandro Petrocelli, Edoardo Pistoletti, Massimo Torquati, Marco Vanneschi, Luca Veraldi, Corrado Zoccolo
Dynamic reconfiguration of Grid-aware applications in ASSIST Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-05-05, 2005.
@techreport{dyn:tr-05-05,
  author = {Marco Aldinucci and Alessandro Petrocelli and Edoardo Pistoletti and Massimo Torquati and Marco Vanneschi and Luca Veraldi and Corrado Zoccolo},
  title = {Dynamic reconfiguration of Grid-aware applications in ASSIST},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  number = {TR-05-05},
  year = {2005},
  date = {2005-02-01},
  url = {http://compass2.di.unipi.it/TR/Files/TR-05-05.pdf.gz},
  keywords = {},
  pubstate = {published},
  tppubtype = {techreport},
}
Marco Aldinucci, Sergio Gusmeroli, Marco Vanneschi, Matteo Villa
SFIDA: interoperability in innovative c-business models for SMEs through an enabling Grid platform Proceedings Article
In: Pre-proc. of INTEROP-ESA: Intl. Conference on Interoperability on Enterprise Software and Applications, pp. 547–557, Geneva, Switzerland, 2005.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{sfida:interop:05,
  title = {SFIDA: interoperability in innovative c-business models for SMEs through an enabling Grid platform},
  author = {Marco Aldinucci and Sergio Gusmeroli and Marco Vanneschi and Matteo Villa},
  url = {http://calvados.di.unipi.it/storage/paper_files/2005_SFIDA_InteropESA.pdf},
  year = {2005},
  date = {2005-02-01},
  booktitle = {Pre-proc. of INTEROP-ESA: Intl. Conference on Interoperability on Enterprise Software and Applications},
  pages = {547--557},
  address = {Geneva, Switzerland},
  abstract = {This position paper describes the objectives of project "SFIDA" (co-funded by the Italian Government), aiming at developing a GRID-based inter-operability platform able to support next generation Supply Chain Management applications specifically addressing the needs of SMEs belonging to industrial districts and dynamic supply networks. Next generation SCM applications are intended in SFIDA to be based on componentization (e-services), intelligence (mining), collaboration (c-business) and customer business-processes orientation. The platform and the next generation SCM applications running on top of it will be tested in various typical industrial cases, spanning from automotive, textile, food, white goods and media retail.},
  keywords = {grid},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Sonia Campa, Massimo Coppola, Marco Danelutto, Domenico Laforenza, Diego Puppin, Luca Scarponi, Marco Vanneschi, Corrado Zoccolo
Components for high performance Grid programming in Grid.it Proceedings Article
In: Getov, V., Kielmann, T. (Ed.): Proc. of the Intl. Workshop on Component Models and Systems for Grid Applications, pp. 19–38, Springer, Saint-Malo, France, 2005, ISBN: 978-0-387-23351-2.
Abstract | Links | BibTeX | Tags: grid
@inproceedings{assist:stmalo:05,
  title = {Components for high performance Grid programming in Grid.it},
  author = {Marco Aldinucci and Sonia Campa and Massimo Coppola and Marco Danelutto and Domenico Laforenza and Diego Puppin and Luca Scarponi and Marco Vanneschi and Corrado Zoccolo},
  editor = {V. Getov and T. Kielmann},
  url = {http://calvados.di.unipi.it/storage/paper_files/2005_assist_ics_stmalo.pdf},
  doi = {10.1007/0-387-23352-0_2},
  isbn = {978-0-387-23351-2},
  year = {2005},
  date = {2005-01-01},
  booktitle = {Proc. of the Intl. Workshop on Component Models and Systems for Grid Applications},
  pages = {19--38},
  publisher = {Springer},
  address = {Saint-Malo, France},
  series = {CoreGRID},
  abstract = {This paper presents the main ideas of the high-performance component-based Grid programming environment of the Grid.it project. High-performance components are characterized by a programming model that integrates the concepts of structured parallelism, component interaction, compositionality, and adaptivity. We show that ASSIST, the prototype of parallel programming environment currently under development at our group, is a suitable basis to capture all the desired features of the component model in a flexible and efficient manner. For the sake of interoperability, ASSIST modules or programs are automatically encapsulated in standard frameworks; currently, we are experimenting Web Services and the CORBA Component Model. Grid applications, built as compositions of ASSIST components and possibly other existing (legacy) components, are supported by an innovative Grid Abstract Machine, that includes essential abstractions of standard middleware services and a hierarchical Application Manager (AM). AM supports static allocation and dynamic reallocation of adaptive applications according to a performance contract, a reconfiguration strategy, and a performance model.},
  keywords = {grid},
  pubstate = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Jan Dünnweber, Sergei Gorlatch
Optimization Techniques for Implementing Parallel Skeletons in Distributed Environments Technical Report
Institute on Programming Model, CoreGRID - Network of Excellence no. TR-0001, 2005.
@techreport{coregrid:tr0001,
  title       = {Optimization Techniques for Implementing Parallel Skeletons in Distributed Environments},
  author      = {Marco Aldinucci and Marco Danelutto and Jan Dünnweber and Sergei Gorlatch},
  url         = {http://www.coregrid.net/mambo/images/stories/TechnicalReports/tr-0001.pdf},
  year        = {2005},
  date        = {2005-01-01},
  number      = {TR-0001},
  institution = {Institute on Programming Model, CoreGRID - Network of Excellence},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
2004
Marco Aldinucci, Massimo Torquati
Accelerating apache farms through ad-HOC distributed scalable object repository Proceedings Article
In: Danelutto, Marco, Vanneschi, Marco, Laforenza, Domenico (Ed.): Proc. of 10th Intl. Euro-Par 2004 Parallel Processing, pp. 596–605, Springer, 2004.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{assist:adhoc:europar:04,
  title     = {Accelerating {Apache} farms through {ad-HOC} distributed scalable object repository},
  author    = {Marco Aldinucci and Massimo Torquati},
  editor    = {Marco Danelutto and Marco Vanneschi and Domenico Laforenza},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2004_hoc_europar.pdf},
  doi       = {10.1007/978-3-540-27866-5_78},
  year      = {2004},
  date      = {2004-08-01},
  booktitle = {Proc. of 10th Intl. Euro-Par 2004 Parallel Processing},
  volume    = {3149},
  pages     = {596--605},
  publisher = {Springer},
  series    = {LNCS},
  abstract  = {We present HOC: a fast, scalable object repository providing programmers with a general storage module. HOC may be used to implement DSMs as well as distributed cache subsystems. HOC is composed of a set of hot-pluggable cooperating processes that may sustain a close to optimal network traffic rate. We designed an HOC-based Web cache that extends the Apache Web server and remarkably improves Apache farms performances with no modification to the Apache core code.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Sonia Campa, Massimo Coppola, Silvia Magini, Paolo Pesciullesi, Laura Potiti, Roberto Ravazzolo, Massimo Torquati, Corrado Zoccolo
Targeting heterogeneous architectures in ASSIST: Experimental results Proceedings Article
In: Danelutto, Marco, Vanneschi, Marco, Laforenza, Domenico (Ed.): Proc. of 10th Intl. Euro-Par 2004 Parallel Processing, pp. 638–643, Springer, 2004, ISBN: 978-3-540-22924-7.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{assist:hetero:europar:04,
  title     = {Targeting heterogeneous architectures in {ASSIST}: Experimental results},
  author    = {Marco Aldinucci and Sonia Campa and Massimo Coppola and Silvia Magini and Paolo Pesciullesi and Laura Potiti and Roberto Ravazzolo and Massimo Torquati and Corrado Zoccolo},
  editor    = {Marco Danelutto and Marco Vanneschi and Domenico Laforenza},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2004_hetero_europar.pdf},
  doi       = {10.1007/978-3-540-27866-5_83},
  isbn      = {978-3-540-22924-7},
  year      = {2004},
  date      = {2004-08-01},
  booktitle = {Proc. of 10th Intl. Euro-Par 2004 Parallel Processing},
  volume    = {3149},
  pages     = {638--643},
  publisher = {Springer},
  series    = {LNCS},
  abstract  = {We describe how the ASSIST parallel programming environment can be used to run parallel programs on collections of heterogeneous workstations and evaluate the scalability of one task-farm real application and a data-parallel benchmark, comparing the actual performance figures measured when using homogeneous and heterogeneous workstation clusters. We describe also the ASSIST approach to heterogeneous distributed shared memory and provide preliminary performance figures of the current implementation.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Jan Dünnweber
Optimization Techniques for Implementing Parallel Skeletons in Grid Environments Proceedings Article
In: Gorlatch, S. (Ed.): Proc. of CMPP: Intl. Workshop on Constructive Methods for Parallel Programming, pp. 35–47, Universität Münster, Germany, Stirling, Scotland, UK, 2004.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{lith_rmi:cmpp:04,
  title     = {Optimization Techniques for Implementing Parallel Skeletons in Grid Environments},
  author    = {Marco Aldinucci and Marco Danelutto and Jan Dünnweber},
  editor    = {S. Gorlatch},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2004_RMI_cmpp.pdf},
  year      = {2004},
  date      = {2004-07-01},
  booktitle = {Proc. of CMPP: Intl. Workshop on Constructive Methods for Parallel Programming},
  pages     = {35--47},
  publisher = {Universität Münster, Germany},
  address   = {Stirling, Scotland, UK},
  abstract  = {Skeletons are common patterns of parallelism like, e.g., farm, pipeline that can be abstracted and offered to the application programmer as programming primitives. We describe the use and implementation of skeletons in a distributed grid environment, with the Java-based system Lithium as our reference implementation. Our main contribution are optimization techniques based on an asynchronous, optimized RMI interaction mechanism, which we integrated into the macro data flow (MDF) implementation technology of Lithium. We report initial experimental results that demonstrate the achieved improvements through the proposed optimizations on a simple grid testbed.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Massimo Torquati
Accelerating Apache farms through ad-HOC distributed scalable objects repository Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-04-08, 2004.
@techreport{adhoc:tr-04-08,
  title       = {Accelerating {Apache} farms through {ad-HOC} distributed scalable objects repository},
  author      = {Marco Aldinucci and Massimo Torquati},
  url         = {http://compass2.di.unipi.it/TR/files/TR-04-08.ps.gz},
  year        = {2004},
  date        = {2004-02-01},
  number      = {TR-04-08},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Marco Aldinucci, Massimo Coppola, Marco Danelutto, Marco Vanneschi, Corrado Zoccolo
ASSIST as a Research Framework for High-performance Grid Programming Environments Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-04-09, 2004.
@techreport{assist:tr-04-09,
  title       = {{ASSIST} as a Research Framework for High-performance Grid Programming Environments},
  author      = {Marco Aldinucci and Massimo Coppola and Marco Danelutto and Marco Vanneschi and Corrado Zoccolo},
  url         = {http://compass2.di.unipi.it/TR/files/TR-04-09.ps.gz},
  year        = {2004},
  date        = {2004-02-01},
  number      = {TR-04-09},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Marco Aldinucci, Sonia Campa, Pierpaolo Ciullo, Massimo Coppola, Marco Danelutto, Paolo Pesciullesi, Roberto Ravazzolo, Massimo Torquati, Marco Vanneschi, Corrado Zoccolo
A framework for experimenting with structured parallel programming environment design Proceedings Article
In: Joubert, G. R., Nagel, W. E., Peters, F. J., Walter, W. V. (Ed.): Parallel Computing: Software Technology, Algorithms, Architectures and Applications (Proc. of PARCO 2003, Dresden, Germany), pp. 617–624, Elsevier, 2004, ISSN: 0927-5452.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{assist:parco:03,
  title     = {A framework for experimenting with structured parallel programming environment design},
  author    = {Marco Aldinucci and Sonia Campa and Pierpaolo Ciullo and Massimo Coppola and Marco Danelutto and Paolo Pesciullesi and Roberto Ravazzolo and Massimo Torquati and Marco Vanneschi and Corrado Zoccolo},
  editor    = {G. R. Joubert and W. E. Nagel and F. J. Peters and W. V. Walter},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2004_assist_parco03.pdf},
  doi       = {10.1016/S0927-5452(04)80077-7},
  issn      = {0927-5452},
  year      = {2004},
  date      = {2004-01-01},
  booktitle = {Parallel Computing: Software Technology, Algorithms, Architectures and Applications (Proc. of PARCO 2003, Dresden, Germany)},
  volume    = {13},
  pages     = {617--624},
  publisher = {Elsevier},
  series    = {Advances in Parallel Computing},
  abstract  = {ASSIST is a parallel programming environment aimed at providing programmers of complex parallel application with a suitable and effective programming tool. Being based on algorithmical skeletons and coordination languages technologies, the programming environment relieves the programmer from a number of cumbersome, error prone activities that are required when using traditional parallel programming environments. ASSIST has been specifically designed to be easily customizable in order to experiment different implementation techniques, solutions, algorithms or back-ends any time new features are required or new technologies become available. In this work we discuss how this goal has been achieved and how the current ASSIST programming environment has been already used to experiment solutions not implemented in the first version of the tool.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto
An operational semantics for skeletons Proceedings Article
In: Joubert, G. R., Nagel, W. E., Peters, F. J., Walter, W. V. (Ed.): Parallel Computing: Software Technology, Algorithms, Architectures and Applications (Proc. of PARCO 2003, Dresden, Germany), pp. 63–70, Elsevier, Germany, 2004.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{lith:sem:parco:03,
  title     = {An operational semantics for skeletons},
  author    = {Marco Aldinucci and Marco Danelutto},
  editor    = {G. R. Joubert and W. E. Nagel and F. J. Peters and W. V. Walter},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2004_sem_parco03.pdf},
  doi       = {10.1016/S0927-5452(04)80011-X},
  year      = {2004},
  date      = {2004-01-01},
  booktitle = {Parallel Computing: Software Technology, Algorithms, Architectures and Applications (Proc. of PARCO 2003, Dresden, Germany)},
  volume    = {13},
  pages     = {63--70},
  publisher = {Elsevier},
  address   = {Germany},
  series    = {Advances in Parallel Computing},
  abstract  = {A major weakness of the current programming systems based on skeletons is that parallel semantics is usually provided in an informal way, thus preventing any formal comparison about program behavior. We describe a schema suitable for the description of both functional and parallel semantics of skeletal languages which is aimed at filling this gap. The proposed schema of semantics represents a handy framework to prove the correctness and validate different rewriting rules. These can be used to transform a skeleton program into a functionally equivalent but possibly faster version.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
2003
Marco Aldinucci
Dynamic shared data in structured parallel programming frameworks PhD Thesis
Computer Science Dept., University of Pisa, 2003.
@phdthesis{phd:marco:2003,
  title     = {Dynamic shared data in structured parallel programming frameworks},
  author    = {Marco Aldinucci},
  year      = {2003},
  date      = {2003-12-01},
  school    = {Computer Science Dept., University of Pisa},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {phdthesis}
}
Marco Aldinucci
eskimo: experimenting with Skeletons in the Shared Address Model Journal Article
In: Parallel Processing Letters, vol. 13, no. 3, pp. 449–460, 2003, ISSN: 0129-6264.
Abstract | Links | BibTeX | Tags: parallel
@article{eskimo:PPL:03,
  title     = {eskimo: experimenting with Skeletons in the Shared Address Model},
  author    = {Marco Aldinucci},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2003_eskimo_ppl.pdf},
  doi       = {10.1142/S0129626403001410},
  issn      = {0129-6264},
  year      = {2003},
  date      = {2003-09-01},
  journal   = {Parallel Processing Letters},
  volume    = {13},
  number    = {3},
  pages     = {449--460},
  abstract  = {We discuss the lack of expressivity in some skeleton-based parallel programming frameworks. The problem is further exacerbated when approaching irregular problems and dealing with dynamic data structures. Shared memory programming has been argued to have substantial ease of programming advantages for this class of problems. We present the eskimo library which represents an attempt to merge the two programming models by introducing skeletons in a shared memory framework.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {article}
}
Marco Aldinucci, Sonia Campa, Pierpaolo Ciullo, Massimo Coppola, Marco Danelutto, Paolo Pesciullesi, Roberto Ravazzolo, Massimo Torquati, Marco Vanneschi, Corrado Zoccolo
ASSIST demo: a high level, high performance, portable, structured parallel programming environment at work Proceedings Article
In: Kosch, H., Böszörményi, L., Hellwagner, H. (Ed.): Proc. of 9th Intl. Euro-Par 2003 Parallel Processing, pp. 1295–1300, Springer, Klagenfurt, Austria, 2003.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{assist:demo:europar:03,
  title     = {{ASSIST} demo: a high level, high performance, portable, structured parallel programming environment at work},
  author    = {Marco Aldinucci and Sonia Campa and Pierpaolo Ciullo and Massimo Coppola and Marco Danelutto and Paolo Pesciullesi and Roberto Ravazzolo and Massimo Torquati and Marco Vanneschi and Corrado Zoccolo},
  editor    = {H. Kosch and L. Böszörményi and H. Hellwagner},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2003_assist_demo_europar.pdf},
  doi       = {10.1007/978-3-540-45209-6_176},
  year      = {2003},
  date      = {2003-08-01},
  booktitle = {Proc. of 9th Intl. Euro-Par 2003 Parallel Processing},
  volume    = {2790},
  pages     = {1295--1300},
  publisher = {Springer},
  address   = {Klagenfurt, Austria},
  series    = {LNCS},
  abstract  = {This work summarizes the possibilities offered by parallel programming environment ASSIST by outlining some of the features that will be demonstrated at the conference demo session. We'll substantially show how this environment can be deployed on a Linux workstation network/cluster, how applications can be compiled and run using ASSIST and eventually, we'll discuss some ASSIST scalability and performance features. We'll also outline how the ASSIST environment can be used to target GRID architectures.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Sonia Campa, Pierpaolo Ciullo, Massimo Coppola, Silvia Magini, Paolo Pesciullesi, Laura Potiti, Roberto Ravazzolo, Massimo Torquati, Marco Vanneschi, Corrado Zoccolo
The Implementation of ASSIST, an Environment for Parallel and Distributed Programming Proceedings Article
In: Kosch, H., Böszörményi, L., Hellwagner, H. (Ed.): Proc. of 9th Intl. Euro-Par 2003 Parallel Processing, pp. 712–721, Springer, Klagenfurt, Austria, 2003, ISBN: 978-3-540-40788-1.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{assist:imp:europar:03,
  title     = {The Implementation of {ASSIST}, an Environment for Parallel and Distributed Programming},
  author    = {Marco Aldinucci and Sonia Campa and Pierpaolo Ciullo and Massimo Coppola and Silvia Magini and Paolo Pesciullesi and Laura Potiti and Roberto Ravazzolo and Massimo Torquati and Marco Vanneschi and Corrado Zoccolo},
  editor    = {H. Kosch and L. Böszörményi and H. Hellwagner},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2003_assist_imp_europar.pdf},
  doi       = {10.1007/b12024},
  isbn      = {978-3-540-40788-1},
  year      = {2003},
  date      = {2003-08-01},
  booktitle = {Proc. of 9th Intl. Euro-Par 2003 Parallel Processing},
  volume    = {2790},
  pages     = {712--721},
  publisher = {Springer},
  address   = {Klagenfurt, Austria},
  series    = {LNCS},
  abstract  = {We describe the implementation of ASSIST, a programming environment for parallel and distributed programs. Its coordination language is based of the parallel skeleton model, extended with new features to enhance expressiveness, parallel software reuse, software component integration and interfacing to external resources. The compilation process and the structure of the run-time support of ASSIST are discussed with respect to the issues introduced by the new characteristics, presenting an analysis of the first test results.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Marco Aldinucci, Marco Danelutto, Paolo Teti
An advanced environment supporting structured parallel programming in Java Journal Article
In: Future Generation Computer Systems, vol. 19, no. 5, pp. 611–626, 2003.
Abstract | Links | BibTeX | Tags: parallel
@article{lithium:fgcs:03,
  title     = {An advanced environment supporting structured parallel programming in {Java}},
  author    = {Marco Aldinucci and Marco Danelutto and Paolo Teti},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2003_lithium_fgcs.pdf},
  doi       = {10.1016/S0167-739X(02)00172-3},
  year      = {2003},
  date      = {2003-07-01},
  journal   = {Future Generation Computer Systems},
  volume    = {19},
  number    = {5},
  pages     = {611--626},
  abstract  = {In this work we present Lithium, a pure Java structured parallel programming environment based on skeletons (common, reusable and efficient parallelism exploitation patterns). Lithium is implemented as a Java package and represents both the first skeleton based programming environment in Java and the first complete skeleton based Java environment exploiting macro-data flow implementation techniques. Lithium supports a set of user code optimizations which are based on skeleton rewriting techniques. These optimizations improve both absolute performance and resource usage with respect to original user code. Parallel programs developed using the library run on any network of workstations provided the workstations support plain JRE. The paper describes the library implementation, outlines the optimization techniques used and eventually presents the performance results obtained on both synthetic and real applications.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {article}
}
Marco Aldinucci
eskimo: experimenting skeletons on the shared address model Proceedings Article
In: Proc. of HLPP2003: Intl. Workshop on High-Level Parallel Programming, pp. 89–100, Paris, France, 2003.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{eskimo:hlpp:03,
  title     = {eskimo: experimenting skeletons on the shared address model},
  author    = {Marco Aldinucci},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2003_eskimo_ppl.pdf},
  year      = {2003},
  date      = {2003-06-01},
  booktitle = {Proc. of HLPP2003: Intl. Workshop on High-Level Parallel Programming},
  pages     = {89--100},
  address   = {Paris, France},
  abstract  = {We discuss the lack of expressivity in some skeleton-based parallel programming frameworks. The problem is further exacerbated when approaching irregular problems and dealing with dynamic data structures. Shared memory programming has been argued to have substantial ease of programming advantages for this class of problems. We present the eskimo library which represents an attempt to merge the two programming models by introducing skeletons in a shared memory framework.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
2002
Marco Aldinucci, Marco Danelutto
An operational semantic for skeletons Technical Report
Università di Pisa, Dipartimento di Informatica, Italy no. TR-02-13, 2002.
@techreport{semantics:tr-02-13,
  title       = {An operational semantic for skeletons},
  author      = {Marco Aldinucci and Marco Danelutto},
  url         = {http://compass2.di.unipi.it/TR/files/TR-02-13.ps.gz},
  year        = {2002},
  date        = {2002-07-01},
  number      = {TR-02-13},
  institution = {Università di Pisa, Dipartimento di Informatica, Italy},
  keywords    = {},
  pubstate    = {published},
  tppubtype   = {techreport}
}
Marco Aldinucci
Automatic Program Transformation: The Meta Tool for Skeleton-based Languages Book Section
In: Gorlatch, Sergei, Lengauer, Christian (Ed.): Constructive Methods for Parallel Programming, pp. 59–78, Nova Science Publishers, NY, USA, 2002, ISBN: 1-59033-374-8.
Abstract | Links | BibTeX | Tags: parallel
@incollection{meta:CMPP:book:02,
  title     = {Automatic Program Transformation: The {Meta} Tool for Skeleton-based Languages},
  author    = {Marco Aldinucci},
  editor    = {Sergei Gorlatch and Christian Lengauer},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2002_meta_book.a4.pdf},
  isbn      = {1-59033-374-8},
  year      = {2002},
  date      = {2002-01-01},
  booktitle = {Constructive Methods for Parallel Programming},
  pages     = {59--78},
  publisher = {Nova Science Publishers},
  address   = {NY, USA},
  chapter   = {5},
  series    = {Advances in Computation: Theory and Practice},
  abstract  = {Academic and commercial experience with skeleton-based systems has demonstrated the benefits of the approach but also the lack of methods and tools for algorithm design and performance prediction. We propose a (graphical) transformation tool based on a novel internal representation of programs that enables the user to effectively deal with program transformation. Given a skeleton-based language and a set of semantic-preserving transformation rules, the tool locates applicable transformations and provides performance estimates, thereby helping the programmer in navigating through the program refinement space.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {incollection}
}
2001
Marco Aldinucci, Sergei Gorlatch, Christian Lengauer, Susanna Pelagatti
Towards Parallel Programming by Transformation: The FAN Skeleton Framework Journal Article
In: Parallel Algorithms and Applications, vol. 16, no. 2-3, pp. 87–121, 2001.
Abstract | Links | BibTeX | Tags: parallel
@article{FAN:PPA:01,
  title     = {Towards Parallel Programming by Transformation: The {FAN} Skeleton Framework},
  author    = {Marco Aldinucci and Sergei Gorlatch and Christian Lengauer and Susanna Pelagatti},
  url       = {http://calvados.di.unipi.it/storage/paper_files/2001_FAN_paa.pdf},
  doi       = {10.1080/01495730108935268},
  year      = {2001},
  date      = {2001-03-01},
  journal   = {Parallel Algorithms and Applications},
  volume    = {16},
  number    = {2--3},
  pages     = {87--121},
  abstract  = {A Functional Abstract Notation (FAN) is proposed for the specification and design of parallel algorithms by means of skeletons - high-level patterns with parallel semantics. The main weakness of the current programming systems based on skeletons is that the user is still responsible for finding the most appropriate skeleton composition for a given application and a given parallel architecture. We describe a transformational framework for the development of skeletal programs which is aimed at filling this gap. The framework makes use of transformation rules which are semantic equivalences among skeleton compositions. For a given problem, an initial, possibly inefficient skeleton specification is refined by applying a sequence of transformations. Transformations are guided by a set of performance prediction models which forecast the behavior of each skeleton and the performance benefits of different rules. The design process is supported by a graphical tool which locates applicable transformations and provides performance estimates, thereby helping the programmer in navigating through the program refinement space. We give an overview of the FAN framework and exemplify its use with performance-directed program derivations for simple case studies. Our experience can be viewed as a first feasibility study of methods and tools for transformational, performance-directed parallel programming using skeletons.},
  keywords  = {parallel},
  pubstate  = {published},
  tppubtype = {article}
}
2000
Marco Aldinucci
The Meta Transformation Tool for Skeleton-Based Languages Proceedings Article
In: Gorlatch, S., Lengauer, C. (Ed.): Proc. of CMPP: Intl. Workshop on Constructive Methods for Parallel Programming, pp. 53–68, Fakultät für Mathematik und Informatik Uni. Passau, Germany, 2000.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{aldinuc:meta:00,
  title        = {The {Meta} Transformation Tool for Skeleton-Based Languages},
  author       = {Marco Aldinucci},
  editor       = {S. Gorlatch and C. Lengauer},
  url          = {http://calvados.di.unipi.it/storage/paper_files/2000_meta_cmpp.pdf},
  year         = {2000},
  date         = {2000-07-01},
  booktitle    = {Proc. of CMPP: Intl. Workshop on Constructive Methods for Parallel Programming},
  pages        = {53--68},
  publisher    = {Uni. Passau, Germany},
  organization = {Fakultät für Mathematik und Informatik},
  abstract     = {Academic and commercial experience with skeleton-based systems has demonstrated the benefits of the approach but also the lack of methods and tools for algorithm design and performance prediction. We propose a (graphical) transformation tool based on a novel internal representation of programs that enables the user to effectively deal with program transformation. Given a skeleton-based language and a set of semantic-preserving transformation rules, the tool locates applicable transformations and provides performance estimates, thereby helping the programmer in navigating through the program refinement space.},
  keywords     = {parallel},
  pubstate     = {published},
  tppubtype    = {inproceedings}
}
Marco Danelutto
Task Farm Computations in Java Proceedings Article
In: Bubak, Marian, Afsarmanesh, Hamideh, Williams, Roy, Hertzberger, Louis O. (Ed.): Proc. of the 8th Intl. Conference on High-Performance Computing and Networking (HPCN Europe 2000), pp. 385–394, Springer, Amsterdam, The Netherlands, 2000, ISBN: 3-540-67553-1.
@inproceedings{DBLP:conf/hpcn/Danelutto00,
  title     = {Task Farm Computations in {Java}},
  author    = {Marco Danelutto},
  editor    = {Marian Bubak and Hamideh Afsarmanesh and Roy Williams and Louis O. Hertzberger},
  url       = {http://link.springer.de/link/service/series/0558/bibs/1823/18230385.htm},
  isbn      = {3-540-67553-1},
  year      = {2000},
  date      = {2000-05-01},
  booktitle = {Proc. of the 8th Intl. Conference on High-Performance Computing and Networking (HPCN Europe 2000)},
  volume    = {1823},
  pages     = {385--394},
  publisher = {Springer},
  address   = {Amsterdam, The Netherlands},
  series    = {LNCS},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Marco Danelutto, Geppino Pucci
A Compact, Thread-Safe Communication Library for Efficient Cluster Computing Proceedings Article
In: Bubak, Marian, Afsarmanesh, Hamideh, Williams, Roy, Hertzberger, Louis O. (Ed.): Proc. of the 8th Intl. Conference on High-Performance Computing and Networking (HPCN Europe 2000), pp. 407–416, Springer, Amsterdam, The Netherlands, 2000, ISBN: 3-540-67553-1.
@inproceedings{DBLP:conf/hpcn/DaneluttoP00,
  title     = {A Compact, Thread-Safe Communication Library for Efficient Cluster Computing},
  author    = {Marco Danelutto and Geppino Pucci},
  editor    = {Marian Bubak and Hamideh Afsarmanesh and Roy Williams and Louis O. Hertzberger},
  url       = {http://link.springer.de/link/service/series/0558/bibs/1823/18230407.htm},
  isbn      = {3-540-67553-1},
  year      = {2000},
  date      = {2000-05-01},
  booktitle = {Proc. of the 8th Intl. Conference on High-Performance Computing and Networking (HPCN Europe 2000)},
  volume    = {1823},
  pages     = {407--416},
  publisher = {Springer},
  address   = {Amsterdam, The Netherlands},
  series    = {LNCS},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
1999
Marco Aldinucci, Marco Danelutto
Stream parallel skeleton optimization Proceedings Article
In: Proc. of PDCS: Intl. Conference on Parallel and Distributed Computing and Systems, pp. 955–962, IASTED ACTA press, Cambridge, Massachusetts, USA, 1999.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{pdcs:nf:99,
  title        = {Stream parallel skeleton optimization},
  author       = {Marco Aldinucci and Marco Danelutto},
  url          = {http://calvados.di.unipi.it/storage/paper_files/1999_NF_pdcs.pdf},
  year         = {1999},
  date         = {1999-11-01},
  booktitle    = {Proc. of PDCS: Intl. Conference on Parallel and Distributed Computing and Systems},
  pages        = {955--962},
  publisher    = {ACTA press},
  address      = {Cambridge, Massachusetts, USA},
  organization = {IASTED},
  abstract     = {We discuss the properties of the composition of stream parallel skeletons such as pipelines and farms. By looking at the ideal performance figures assumed to hold for these skeletons, we show that any stream parallel skeleton composition can always be rewritten into an equivalent ``normal form'' skeleton composition, delivering a service time which is equal or even better to the service time of the original skeleton composition, and achieving a better utilization of the processors used. The normal form is defined as a single farm built around a sequential worker code. Experimental results are discussed that validate this normal form.},
  keywords     = {parallel},
  pubstate     = {published},
  tppubtype    = {inproceedings}
}
1998
Marco Aldinucci, Massimo Coppola, Marco Danelutto
Rewriting skeleton programs: How to evaluate the data-parallel stream-parallel tradeoff Proceedings Article
In: Gorlatch, S. (Ed.): Proc. of CMPP: Intl. Workshop on Constructive Methods for Parallel Programming, pp. 44–58, Fakultät für Mathematik und Informatik Uni. Passau, Germany, 1998.
Abstract | Links | BibTeX | Tags: parallel
@inproceedings{aldinuc:stream-data:98,
  title        = {Rewriting skeleton programs: How to evaluate the data-parallel stream-parallel tradeoff},
  author       = {Marco Aldinucci and Massimo Coppola and Marco Danelutto},
  editor       = {S. Gorlatch},
  url          = {http://calvados.di.unipi.it/storage/paper_files/1998_transf_cmpp.pdf},
  year         = {1998},
  date         = {1998-05-01},
  booktitle    = {Proc. of CMPP: Intl. Workshop on Constructive Methods for Parallel Programming},
  pages        = {44--58},
  publisher    = {Uni. Passau, Germany},
  organization = {Fakultät für Mathematik und Informatik},
  abstract     = {Some skeleton based parallel programming models allow the programmer to use both data and stream parallel skeletons within the same program. It is known that particular skeleton nestings can be formally rewritten into different nestings that preserve the functional semantics. Indeed, the kind and possibly the amount of parallelism usefully exploitable may change while rewriting takes place. Here we discuss an original framework allowing the user (and/or the compiling tools) of a skeleton based parallel programming language to evaluate whether or not the transformation of a skeleton program is worthwhile in terms of the final program performance. We address, in particular, the evaluation of transformations exchanging data parallel and stream parallel skeleton subtrees.},
  keywords     = {parallel},
  pubstate     = {published},
  tppubtype    = {inproceedings}
}