X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/9d500525ae7ff21cb8bbdb255e80d7e172a69fcf..8ab67fea317b43cb0f64495ff0f1972080b8ed1d:/examples/msg/masterslave/masterslave_failure.tesh diff --git a/examples/msg/masterslave/masterslave_failure.tesh b/examples/msg/masterslave/masterslave_failure.tesh index 58dc8d0d07..3c4ebcd51f 100644 --- a/examples/msg/masterslave/masterslave_failure.tesh +++ b/examples/msg/masterslave/masterslave_failure.tesh @@ -2,93 +2,94 @@ p Testing a simple master/slave example application handling failures -$ masterslave/masterslave_failure$EXEEXT --log=xbt_cfg.thres:critical --log=no_loc ${srcdir:=.}/small_platform_with_failures.xml ${srcdir:=.}/masterslave/deployment_masterslave.xml --cfg=path:${srcdir} -> [0.000000] [simix_process/WARNING] Cannot launch process 'slave' on failed host 'Fafard' -> [Tremblay:master:(1) 0.000000] [msg_test/INFO] Got 5 slave(s) : -> [Tremblay:master:(1) 0.000000] [msg_test/INFO] Jupiter -> [Tremblay:master:(1) 0.000000] [msg_test/INFO] Fafard -> [Tremblay:master:(1) 0.000000] [msg_test/INFO] Ginette -> [Tremblay:master:(1) 0.000000] [msg_test/INFO] Bourassa -> [Tremblay:master:(1) 0.000000] [msg_test/INFO] Tremblay -> [Tremblay:master:(1) 0.000000] [msg_test/INFO] Got 20 task to process : -> [Tremblay:master:(1) 0.147613] [msg_test/INFO] Send completed -> [Jupiter:slave:(3) 0.147613] [msg_test/INFO] Received "Task" -> [Jupiter:slave:(3) 0.147613] [msg_test/INFO] Communication time : "0.147613" -> [Jupiter:slave:(3) 0.147613] [msg_test/INFO] Processing "Task" -> [Jupiter:slave:(3) 0.802956] [msg_test/INFO] "Task" done -> [Jupiter:slave:(3) 1.100000] [msg_test/INFO] Gloups. The cpu on which I'm running just turned off!. See you! -> [Tremblay:master:(1) 10.147613] [msg_test/INFO] Mmh. Something went wrong with 'Fafard'. Nevermind. Let's keep going! -> [Tremblay:master:(1) 10.276113] [msg_test/INFO] Send completed -> [Ginette:slave:(4) 10.276113] [msg_test/INFO] Received "Task" -> [Ginette:slave:(4) 10.276113] [msg_test/INFO] Communication time : "0.128500" -> [Ginette:slave:(4) 10.276113] [msg_test/INFO] Processing "Task" -> [Tremblay:master:(1) 10.473605] [msg_test/INFO] Send completed -> [Bourassa:slave:(5) 10.473605] [msg_test/INFO] Received "Task" -> [Bourassa:slave:(5) 10.473605] [msg_test/INFO] Communication time : "0.197492" -> [Bourassa:slave:(5) 10.473605] [msg_test/INFO] Processing "Task" -> [Tremblay:master:(1) 10.475628] [msg_test/INFO] Send completed -> [Tremblay:slave:(2) 10.475628] [msg_test/INFO] Received "Task" -> [Tremblay:slave:(2) 10.475628] [msg_test/INFO] Communication time : "0.002023" -> [Tremblay:slave:(2) 10.475628] [msg_test/INFO] Processing "Task" -> [Tremblay:slave:(2) 10.985338] [msg_test/INFO] "Task" done -> [Ginette:slave:(4) 11.307211] [msg_test/INFO] "Task" done -> [Bourassa:slave:(5) 11.504703] [msg_test/INFO] "Task" done -> [Tremblay:master:(1) 20.475628] [msg_test/INFO] Mmh. Something went wrong with 'Jupiter'. Nevermind. Let's keep going! -> [Tremblay:master:(1) 30.475628] [msg_test/INFO] Mmh. Something went wrong with 'Fafard'. Nevermind. Let's keep going! -> [Tremblay:master:(1) 30.475628] [msg_test/INFO] Mmh. Something went wrong with 'Ginette'. Nevermind. Let's keep going! -> [Ginette:slave:(4) 30.475628] [msg_test/INFO] Mmh. Something went wrong. Nevermind. Let's keep going! -> [Tremblay:master:(1) 30.673120] [msg_test/INFO] Send completed -> [Bourassa:slave:(5) 30.673120] [msg_test/INFO] Received "Task" -> [Bourassa:slave:(5) 30.673120] [msg_test/INFO] Communication time : "0.197492" -> [Bourassa:slave:(5) 30.673120] [msg_test/INFO] Processing "Task" -> [Tremblay:master:(1) 30.675143] [msg_test/INFO] Send completed -> [Tremblay:slave:(2) 30.675143] [msg_test/INFO] Received "Task" -> [Tremblay:slave:(2) 30.675143] [msg_test/INFO] Communication time : "0.002023" -> [Tremblay:slave:(2) 30.675143] [msg_test/INFO] Processing "Task" -> [Tremblay:slave:(2) 31.184853] [msg_test/INFO] "Task" done -> [Bourassa:slave:(5) 31.704218] [msg_test/INFO] "Task" done -> [Tremblay:master:(1) 40.675143] [msg_test/INFO] Mmh. Something went wrong with 'Jupiter'. Nevermind. Let's keep going! -> [Tremblay:master:(1) 50.675143] [msg_test/INFO] Mmh. Something went wrong with 'Fafard'. Nevermind. Let's keep going! -> [Tremblay:master:(1) 50.803643] [msg_test/INFO] Send completed -> [Ginette:slave:(4) 50.803643] [msg_test/INFO] Received "Task" -> [Ginette:slave:(4) 50.803643] [msg_test/INFO] Communication time : "0.128500" -> [Ginette:slave:(4) 50.803643] [msg_test/INFO] Processing "Task" -> [Tremblay:master:(1) 51.001135] [msg_test/INFO] Send completed -> [Bourassa:slave:(5) 51.001135] [msg_test/INFO] Received "Task" -> [Bourassa:slave:(5) 51.001135] [msg_test/INFO] Communication time : "0.197492" -> [Bourassa:slave:(5) 51.001135] [msg_test/INFO] Processing "Task" -> [Tremblay:master:(1) 51.003158] [msg_test/INFO] Send completed -> [Tremblay:slave:(2) 51.003158] [msg_test/INFO] Received "Task" -> [Tremblay:slave:(2) 51.003158] [msg_test/INFO] Communication time : "0.002023" -> [Tremblay:slave:(2) 51.003158] [msg_test/INFO] Processing "Task" -> [Tremblay:slave:(2) 51.512868] [msg_test/INFO] "Task" done -> [Ginette:slave:(4) 51.834741] [msg_test/INFO] "Task" done -> [Bourassa:slave:(5) 52.032233] [msg_test/INFO] "Task" done -> [Tremblay:master:(1) 61.003158] [msg_test/INFO] Mmh. Something went wrong with 'Jupiter'. Nevermind. Let's keep going! -> [Tremblay:master:(1) 71.003158] [msg_test/INFO] Mmh. Something went wrong with 'Fafard'. Nevermind. Let's keep going! -> [Tremblay:master:(1) 71.131658] [msg_test/INFO] Send completed -> [Ginette:slave:(4) 71.131658] [msg_test/INFO] Received "Task" -> [Ginette:slave:(4) 71.131658] [msg_test/INFO] Communication time : "0.128500" -> [Ginette:slave:(4) 71.131658] [msg_test/INFO] Processing "Task" -> [Tremblay:master:(1) 71.329150] [msg_test/INFO] Send completed -> [Bourassa:slave:(5) 71.329150] [msg_test/INFO] Received "Task" -> [Bourassa:slave:(5) 71.329150] [msg_test/INFO] Communication time : "0.197492" -> [Bourassa:slave:(5) 71.329150] [msg_test/INFO] Processing "Task" -> [Tremblay:master:(1) 71.331173] [msg_test/INFO] Send completed -> [Tremblay:master:(1) 71.331173] [msg_test/INFO] All tasks have been dispatched. Let's tell everybody the computation is over. -> [Tremblay:slave:(2) 71.331173] [msg_test/INFO] Received "Task" -> [Tremblay:slave:(2) 71.331173] [msg_test/INFO] Communication time : "0.002023" -> [Tremblay:slave:(2) 71.331173] [msg_test/INFO] Processing "Task" -> [Tremblay:slave:(2) 71.840883] [msg_test/INFO] "Task" done -> [Ginette:slave:(4) 72.162756] [msg_test/INFO] "Task" done -> [Tremblay:master:(1) 72.331173] [msg_test/INFO] Mmh. Can't reach 'Jupiter'! Nevermind. Let's keep going! -> [Bourassa:slave:(5) 72.360248] [msg_test/INFO] "Task" done -> [Tremblay:master:(1) 73.331173] [msg_test/INFO] Mmh. Can't reach 'Fafard'! Nevermind. Let's keep going! -> [Ginette:slave:(4) 73.332446] [msg_test/INFO] Received "finalize" -> [Ginette:slave:(4) 73.332446] [msg_test/INFO] I'm done. See you! -> [Bourassa:slave:(5) 73.334401] [msg_test/INFO] Received "finalize" -> [Bourassa:slave:(5) 73.334401] [msg_test/INFO] I'm done. See you! -> [Tremblay:master:(1) 73.334416] [msg_test/INFO] Goodbye now! -> [Tremblay:slave:(2) 73.334416] [msg_test/INFO] Received "finalize" -> [Tremblay:slave:(2) 73.334416] [msg_test/INFO] I'm done. See you! -> [73.334416] [msg_test/INFO] Simulation time 73.3344 +! output sort +$ masterslave/masterslave_failure$EXEEXT --log=xbt_cfg.thres:critical --log=no_loc ${srcdir:=.}/small_platform_with_failures.xml ${srcdir:=.}/masterslave/deployment_masterslave.xml --cfg=path:${srcdir} --cfg=network/crosstraffic:0 "--log=root.fmt:[%10.6r]%e(%i:%P@%h)%e%m%n" +> [ 0.000000] (0:@) Cannot launch process 'slave' on failed host 'Fafard' +> [ 0.000000] (1:master@Tremblay) Got 5 slave(s) : +> [ 0.000000] (1:master@Tremblay) Jupiter +> [ 0.000000] (1:master@Tremblay) Fafard +> [ 0.000000] (1:master@Tremblay) Ginette +> [ 0.000000] (1:master@Tremblay) Bourassa +> [ 0.000000] (1:master@Tremblay) Tremblay +> [ 0.000000] (1:master@Tremblay) Got 20 task to process : +> [ 0.165166] (1:master@Tremblay) Send completed +> [ 0.165166] (3:slave@Jupiter) Received "Task" +> [ 0.165166] (3:slave@Jupiter) Communication time : "0.165166" +> [ 0.165166] (3:slave@Jupiter) Processing "Task" +> [ 0.820508] (3:slave@Jupiter) "Task" done +> [ 1.100000] (3:slave@Jupiter) Gloups. The cpu on which I'm running just turned off!. See you! +> [ 10.165166] (1:master@Tremblay) Mmh. Got timeouted while speaking to 'Fafard'. Nevermind. Let's keep going! +> [ 10.308946] (1:master@Tremblay) Send completed +> [ 10.308946] (4:slave@Ginette) Received "Task" +> [ 10.308946] (4:slave@Ginette) Communication time : "0.143780" +> [ 10.308946] (4:slave@Ginette) Processing "Task" +> [ 10.529922] (1:master@Tremblay) Send completed +> [ 10.529922] (5:slave@Bourassa) Received "Task" +> [ 10.529922] (5:slave@Bourassa) Communication time : "0.220976" +> [ 10.529922] (5:slave@Bourassa) Processing "Task" +> [ 10.532187] (1:master@Tremblay) Send completed +> [ 10.532187] (2:slave@Tremblay) Received "Task" +> [ 10.532187] (2:slave@Tremblay) Communication time : "0.002265" +> [ 10.532187] (2:slave@Tremblay) Processing "Task" +> [ 11.041897] (2:slave@Tremblay) "Task" done +> [ 11.340044] (4:slave@Ginette) "Task" done +> [ 11.561020] (5:slave@Bourassa) "Task" done +> [ 20.532187] (1:master@Tremblay) Mmh. Got timeouted while speaking to 'Jupiter'. Nevermind. Let's keep going! +> [ 30.532187] (1:master@Tremblay) Mmh. Got timeouted while speaking to 'Fafard'. Nevermind. Let's keep going! +> [ 30.532187] (1:master@Tremblay) Mmh. Something went wrong with 'Ginette'. Nevermind. Let's keep going! +> [ 30.532187] (4:slave@Ginette) Mmh. Something went wrong. Nevermind. Let's keep going! +> [ 30.753163] (1:master@Tremblay) Send completed +> [ 30.753163] (5:slave@Bourassa) Received "Task" +> [ 30.753163] (5:slave@Bourassa) Communication time : "0.220976" +> [ 30.753163] (5:slave@Bourassa) Processing "Task" +> [ 30.755428] (1:master@Tremblay) Send completed +> [ 30.755428] (2:slave@Tremblay) Received "Task" +> [ 30.755428] (2:slave@Tremblay) Communication time : "0.002265" +> [ 30.755428] (2:slave@Tremblay) Processing "Task" +> [ 31.265138] (2:slave@Tremblay) "Task" done +> [ 31.784261] (5:slave@Bourassa) "Task" done +> [ 40.755428] (1:master@Tremblay) Mmh. Got timeouted while speaking to 'Jupiter'. Nevermind. Let's keep going! +> [ 50.755428] (1:master@Tremblay) Mmh. Got timeouted while speaking to 'Fafard'. Nevermind. Let's keep going! +> [ 50.899209] (1:master@Tremblay) Send completed +> [ 50.899209] (4:slave@Ginette) Received "Task" +> [ 50.899209] (4:slave@Ginette) Communication time : "0.143780" +> [ 50.899209] (4:slave@Ginette) Processing "Task" +> [ 51.120185] (1:master@Tremblay) Send completed +> [ 51.120185] (5:slave@Bourassa) Received "Task" +> [ 51.120185] (5:slave@Bourassa) Communication time : "0.220976" +> [ 51.120185] (5:slave@Bourassa) Processing "Task" +> [ 51.122450] (1:master@Tremblay) Send completed +> [ 51.122450] (2:slave@Tremblay) Received "Task" +> [ 51.122450] (2:slave@Tremblay) Communication time : "0.002265" +> [ 51.122450] (2:slave@Tremblay) Processing "Task" +> [ 51.632160] (2:slave@Tremblay) "Task" done +> [ 51.930307] (4:slave@Ginette) "Task" done +> [ 52.151282] (5:slave@Bourassa) "Task" done +> [ 61.122450] (1:master@Tremblay) Mmh. Got timeouted while speaking to 'Jupiter'. Nevermind. Let's keep going! +> [ 71.122450] (1:master@Tremblay) Mmh. Got timeouted while speaking to 'Fafard'. Nevermind. Let's keep going! +> [ 71.266230] (1:master@Tremblay) Send completed +> [ 71.266230] (4:slave@Ginette) Received "Task" +> [ 71.266230] (4:slave@Ginette) Communication time : "0.143780" +> [ 71.266230] (4:slave@Ginette) Processing "Task" +> [ 71.487206] (1:master@Tremblay) Send completed +> [ 71.487206] (5:slave@Bourassa) Received "Task" +> [ 71.487206] (5:slave@Bourassa) Communication time : "0.220976" +> [ 71.487206] (5:slave@Bourassa) Processing "Task" +> [ 71.489471] (1:master@Tremblay) Send completed +> [ 71.489471] (1:master@Tremblay) All tasks have been dispatched. Let's tell everybody the computation is over. +> [ 71.489471] (2:slave@Tremblay) Received "Task" +> [ 71.489471] (2:slave@Tremblay) Communication time : "0.002265" +> [ 71.489471] (2:slave@Tremblay) Processing "Task" +> [ 71.999181] (2:slave@Tremblay) "Task" done +> [ 72.297328] (4:slave@Ginette) "Task" done +> [ 72.489471] (1:master@Tremblay) Mmh. Got timeouted while speaking to 'Jupiter'. Nevermind. Let's keep going! +> [ 72.518304] (5:slave@Bourassa) "Task" done +> [ 73.489471] (1:master@Tremblay) Mmh. Got timeouted while speaking to 'Fafard'. Nevermind. Let's keep going! +> [ 73.506023] (4:slave@Ginette) Received "finalize" +> [ 73.506023] (4:slave@Ginette) I'm done. See you! +> [ 73.531463] (5:slave@Bourassa) Received "finalize" +> [ 73.531463] (5:slave@Bourassa) I'm done. See you! +> [ 73.531658] (0:@) Simulation time 73.5317 +> [ 73.531658] (1:master@Tremblay) Goodbye now! +> [ 73.531658] (2:slave@Tremblay) Received "finalize" +> [ 73.531658] (2:slave@Tremblay) I'm done. See you!