% Journal article: Journal of Information and Data Management, vol. 2, no. 1 (Aug 2011).
% Key note: the exported key contained spaces ("da Cruz_..._de Oliveira_..."), which
% classic BibTeX cannot parse; the spaces were removed and nothing else was changed.
% NOTE(review): "pages" holds the single value supplied by the exporter (43); this is
% presumably only the first page -- confirm the full page range against the publisher.
@article{daCruz_Paulino_deOliveira_Campos_Mattoso_2011,
  author   = {da Cruz, Sergio Manuel Serra and Paulino, Carlos Eduardo and de Oliveira, Daniel and Campos, Maria Luiza Machado and Mattoso, Marta},
  title    = {Capturing Distributed Provenance Metadata from Cloud-Based Scientific Workflows},
  journal  = {Journal of Information and Data Management},
  volume   = {2},
  number   = {1},
  pages    = {43},
  year     = {2011},
  month    = aug,
  doi      = {10.5753/jidm.2011.1384},
  url      = {https://sol.sbc.org.br/journals/index.php/jidm/article/view/1384},
  abstract = {Workflows are scientific abstractions used in the modeling of scientific
              experiments. High performance computing environments such as clusters and
              grids are often required to run the experiments. Cloud computing is starting
              to be adopted by the scientific community. However, the cloud environment is
              still incipient in collecting and recording retrospective workflow
              provenance. This paper presents an approach to capturing distributed
              provenance metadata from cloud-based scientific workflows. The approach was
              implemented through an evolution of the Matrioshka architecture that was
              refactored for cloud environments. Preliminary results show that provenance
              metadata captured from the virtual components running at the cloud can aid
              scientists to manage and reproduce their large scale \emph{in silico}
              experiments.},
}