% Jafar, Mounaf Al-hamad and Ghazal (2019): model of a checkpointing/rollback
% strategy for parallel applications (journal article, vol. 41, no. 3).
% Key note: the original key had a space between "Mounaf" and "Al-hamad";
% BibTeX keys cannot contain whitespace, so it is now an underscore. Any
% \cite command that used the old spelling must be updated to match.
% The abstract is kept verbatim from the source record, with only the HTML
% paragraph markup removed. The record carried no pages or DOI.
@article{Jafar_Mounaf_Al-hamad_Ghazal_2019,
  author   = {Jafar, Samir and Mounaf Al-hamad, Mohammed and Ghazal, Rahaf},
  title    = {Modeling of checkpointing/rollback strategy towards optimal run time in parallel applications},
  journal  = {Tishreen University Journal -Basic Sciences Series},
  volume   = {41},
  number   = {3},
  year     = {2019},
  month    = jul,
  url      = {https://journal.tishreen.edu.sy/index.php/bassnc/article/view/8823},
  abstract = {We present a mathematical model of checkpointing/rollback strategy, in order to ensure that execution of parallel applications in High Performance Computing (HPC) platform are completed in as little time as possible, which is achieved through minimize the computations loss due to expected failures or unnecessary overhead of fault tolerant mechanisms.

    In our study, we are interested in special failure of components, which is called (crash fault), that shows a constant behavior of system during the work, either failure or work at for a moment, and we study a coordinated checkpointing strategy for fault tolerance to achieve continuity of the application despite the failures.},
}