@proceedings {Bruneo201598, title = {An SRN-based resiliency quantification approach}, journal = {Proceedings of the 36th International Conference on Application and Theory of Petri Nets and Concurrency (Petri Nets)}, volume = {9115 Lecture Notes in Computer Science}, year = {2015}, note = {cited By 0; Conference of 36th International Conference on Application and Theory of Petri Nets and Concurrency, Petri Nets 2015 ; Conference Date: 21 June 2015 Through 26 June 2015; Conference Code:119609}, pages = {98-116}, publisher = {Springer Verlag}, address = {Brussels, Belgium, 21-26 June 2015}, abstract = {

Resiliency is often considered as a synonym for faulttolerance and reliability/availability. We start from a different definition of resiliency as the ability to deliver services when encountering unexpected changes. Semantics of change is of extreme importance in order to accurately capture the real behavior of a system. We propose a resiliency analysis technique based on stochastic reward nets that allows the modeler: (1) to reuse an already existing dependability or performance model for a specific system with minimal modifications, and (2) to adapt the given model for specific change semantics. To automate the model analysis an algorithm is designed and the modeler is provided with a formalism that corresponds to the semantics. Our algorithm and approach is implemented to demonstrate the proposed resiliency quantification approach. Finally, we discuss the differences between our approach and an alternative technique based on deterministic and stochastic Petri nets and highlight the advantages of the proposed approach in terms of semantics specification. {\textcopyright} Springer International Publishing Switzerland 2015.

}, keywords = {Analysis techniques, Deterministic and stochastic Petri nets, Model analysis, Performance Model, Petri nets, Resiliency, Semantics, Stochastic models, Stochastic reward nets, Stochastic systems}, isbn = {9783319194875}, issn = {03029743}, doi = {10.1007/978-3-319-19488-2_5}, url = {http://www.scopus.com/inward/record.url?eid=2-s2.0-84937428490\&partnerID=40\&md5=7d0bbe99afba1a79df65b4e35e86a02c}, author = {Dario Bruneo and Francesco Longo and Marco Scarpa and Antonio Puliafito and Rahul Ghosh and Kishor S. Trivedi} } @proceedings {Distefano2014255, title = {Non-Markovian modeling of a BladeCenter chassis midplane}, journal = {Proceedings of the 11th European Workshop on Computer Performance Engineering (EPEW)}, volume = {8721 Lecture Notes in Computer Science}, year = {2014}, note = {cited By 0; Conference of 11th European Workshop on Computer Performance Engineering, EPEW 2014 ; Conference Date: 11 September 2014 Through 12 September 2014; Conference Code:107431}, pages = {255-269}, publisher = {Springer Verlag}, address = {Florence, Italy, 11-12 September 2014}, abstract = {

In distributed contexts such as Cloud computing, the reliability and availability of the provided resources and services have to be assured in order to meet user requirements. At the infrastructure level, this specification is translated into tighter ones on the datacenter hosting physical resources. In this paper, starting from a real case study of the IBM BladeCenter, we provide a technique for the quantitative evaluation of datacenter infrastructure availability. The proposed technique allows one to take into account both aging phenomena and multiple operating conditions. In particular, one subsystem of the BladeCenter, the chassis midplane, is studied. Indeed, based on the stochastic characterization of the midplane reliability through statistic measurements, a model dealing with the non-exponential failure time distribution thus obtained is evaluated to demonstrate the suitability and the effectiveness of the proposed technique. {\textcopyright} 2014 Springer International Publishing.

}, keywords = {Aging phenomena, Chassis, Failure-time distribution, Non-Markovian modeling, Operating condition, Physical resources, Quantitative evaluation, Reliability and availability, Stochastic models, Stochastic systems, User requirements}, isbn = {9783319108841}, issn = {03029743}, doi = {10.1007/978-3-319-10885-8_18}, url = {http://www.scopus.com/inward/record.url?eid=2-s2.0-84906969232\&partnerID=40\&md5=6840d4a28b6ed80a602f4db06c10343b}, author = {Salvatore Distefano and Francesco Longo and Marco Scarpa and Kishor S. Trivedi} } @article {Ghosh201457, title = {Scalable analytics for IaaS cloud availability}, journal = {IEEE Transactions on Cloud Computing - IEEE Computer Society}, volume = {2}, number = {1}, year = {2014}, note = {cited By 5}, pages = {57-70}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, abstract = {

In a large Infrastructure-as-a-Service (IaaS) cloud, component failures are quite common. Such failures may lead to occasional system downtime and eventual violation of Service Level Agreements (SLAs) on the cloud service availability. The availability analysis of the underlying infrastructure is useful to the service provider to design a system capable of providing a defined SLA, as well as to evaluate the capabilities of an existing one. This paper presents a scalable, stochastic model-driven approach to quantify the availability of a large-scale IaaS cloud, where failures are typically dealt with through migration of physical machines among three pools: hot (running), warm (turned on, but not ready), and cold (turned off). Since monolithic models do not scale for large systems, we use an interacting Markov chain based approach to demonstrate the reduction in the complexity of analysis and the solution time. The three pools are modeled by interacting sub-models. Dependencies among them are resolved using fixed-point iteration, for which existence of a solution is proved. The analytic-numeric solutions obtained from the proposed approach and from the monolithic model are compared. We show that the errors introduced by interacting sub-models are insignificant and that our approach can handle very large size IaaS clouds. The simulative solution is also considered for the proposed model, and solution time of the methods are compared. {\textcopyright} 2014 IEEE.

}, keywords = {Availability, availability analysis, cloud computing, Downtime, Existence of a solutions, Infrastructure as a service (IaaS), Iterative methods, Lakes, Maintenance, Markov processes, Model driven approach, Numeric solutions, Service level agreement (SLAs), simulation, Stochastic models, Stochastic reward nets, Stochastic systems}, issn = {21687161}, doi = {10.1109/TCC.2014.2310737}, url = {http://www.scopus.com/inward/record.url?eid=2-s2.0-84906976356\&partnerID=40\&md5=a63dc67c92ef7620c8a3b33aca08348b}, author = {Rahul Ghosh and Francesco Longo and Flavio Frattini and Stefano Russo and Kishor S. Trivedi} } @article {Ghosh2014667, title = {Stochastic model driven capacity planning for an infrastructure-as-a-service cloud}, journal = {IEEE Transactions on Services Computing - IEEE Computer Society}, volume = {7}, number = {4}, year = {2014}, note = {cited By 1}, pages = {667-680}, publisher = {Institute of Electrical and Electronics Engineers}, abstract = {

From an enterprise perspective, one key motivation to transform the traditional IT management into Cloud is the cost reduction of the hosted services. In an Infrastructure-as-a-Service (IaaS) Cloud, virtual machine (VM) instances share the physical machines (PMs) in the provider{\textquoteright}s data center. With large number of PMs, providers can maintain low cost of service downtime at the expense of higher infrastructure and other operational costs (e.g., power consumption and cooling costs). Hence, determining the optimal PM capacity requirements that minimize the overall cost is of interest. In this paper, we show how a cost analysis and optimization framework can be developed using stochastic availability and performance models of an IaaS Cloud. Specifically, we study two cost minimization problems to address the capacity planning in an IaaS Cloud: 1) what is the optimal number of PMs that minimizes the total cost of ownership for a given downtime requirement set by service level agreements? and, 2) is it more economical to use cheaper but less reliable PMs or to use costlier but more reliable PMs for insuring the same availability characteristics? We use simulated annealing, a well-known stochastic search algorithm, to solve these optimization problems. Results from our analysis show that the optimal solutions are found within reasonable time. {\textcopyright} 2013 IEEE.

}, keywords = {Capacity planning, Capacity requirement, Clouds, Cost benefit analysis, Cost reduction, Downtime, Infrastructure as a service (IaaS), Maintenance, Optimization, Optimization framework, Optimization problems, Service Level Agreements, Simulated annealing, Stochastic models, Stochastic search algorithms, Stochastic systems, Total cost of ownership}, issn = {19391374}, doi = {10.1109/TSC.2013.44}, url = {http://www.scopus.com/inward/record.url?eid=2-s2.0-84919717849\&partnerID=40\&md5=34c70f14a9a3f838562335050a628985}, author = {Rahul Ghosh and Francesco Longo and Ruofan Xia and Vijay K. Naik and Kishor S. Trivedi} } @article {Ghosh20131216, title = {Modeling and performance analysis of large scale IaaS clouds}, journal = {Future Generation Computer Systems - Elsevier}, volume = {29}, number = {5}, year = {2013}, note = {cited By 10}, pages = {1216-1234}, abstract = {

For Cloud based services to support enterprise class production workloads, Mainframe like predictable performance is essential. However, the scale, complexity, and inherent resource sharing across workloads make the Cloud management for predictable performance difficult. As a first step towards designing Cloud based systems that achieve such performance and realize the service level objectives, we develop a scalable stochastic analytic model for performance quantification of Infrastructure-as-a-Service (IaaS) Cloud. Specifically, we model a class of IaaS Clouds that offer tiered services by configuring physical machines into three pools with different provisioning delay and power consumption characteristics. Performance behaviors in such IaaS Clouds are affected by a large set of parameters, e.g., workload, system characteristics and management policies. Thus, traditional analytic models for such systems tend to be intractable. To overcome this difficulty, we propose a multi-level interacting stochastic sub-models approach where the overall model solution is obtained iteratively over individual sub-model solutions. By comparing with a single-level monolithic model, we show that our approach is scalable, tractable, and yet retains high fidelity. Since the dependencies among the sub-models are resolved via fixed-point iteration, we prove the existence of a solution. Results from our analysis show the impact of workload and system characteristics on two performance measures: mean response delay and job rejection probability. {\textcopyright} 2012 Elsevier B.V. All rights reserved.

}, keywords = {Analytic modeling, Analytical models, Clouds, CTMC, Fixed-point iterations, IaaS, Infrastructure as a service (IaaS), Performance, Provisioning, Stochastic models, Stochastic systems, Submodels}, issn = {0167739X}, doi = {10.1016/j.future.2012.06.005}, url = {http://www.scopus.com/inward/record.url?eid=2-s2.0-84887062784\&partnerID=40\&md5=5aa7bb3aa9d27ba52b585a03501c8e18}, author = {Rahul Ghosh and Francesco Longo and Vijay K. Naik and Kishor S. Trivedi} }