Name | hadsm3dhet2_jo01_006594099_0 |
Workunit | 6797472 |
Created | 15 Mar 2010, 11:59:36 UTC |
Sent | 11 Oct 2010, 0:01:49 UTC |
Report deadline | 23 Sep 2011, 5:21:49 UTC |
Received | 16 Oct 2010, 21:51:14 UTC |
Server state | Over |
Outcome | Computation error |
Client state | Compute error |
Exit status | 22 (0x00000016) Unknown error code |
Computer ID | 948401 |
Run time | |
CPU time | 2 days 23 hours 42 min 29 sec |
Validate state | Invalid |
Credit | 2,481.08 |
Device peak FLOPS | 2.86 GFLOPS |
Application version | UK Met Office HadSM3 Slab Model v6.07 windows_intelx86 |
Stderr | <core_client_version>6.4.5</core_client_version> <![CDATA[ <message> The device does not recognize the command. (0x16) - exit code 22 (0x16) </message> <stderr_txt> CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=7332, selfPID=7332, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=8124, selfPID=8124, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=7144, selfPID=7144, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=8676, selfPID=8676, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=8336, selfPID=8336, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=5508, selfPID=5508, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=7068, selfPID=7068, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=6476, selfPID=6476, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=8180, selfPID=8180, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=4068, selfPID=4068, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=7972, selfPID=7972, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=8560, selfPID=8560, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=7800, selfPID=7800, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=3140, selfPID=3140, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=8772, selfPID=8772, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=632, selfPID=632, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=2560, selfPID=2560, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=9168, selfPID=9168, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=7372, selfPID=7372, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=6256, selfPID=6256, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=6276, selfPID=6276, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=2628, selfPID=2628, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=6168, selfPID=6168, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=7940, selfPID=7940, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=6948, selfPID=6948, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=8484, selfPID=8484, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=4348, selfPID=4348, iMonCtr=1 No heartbeat from core client for 30 sec - exiting CPDN Monitor - No 'heartbeat' from BOINC... No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting CPDN process is not running, exiting, bRetVal = 1, checkPID=3816, selfPID=3816, iMonCtr=1 No heartbeat from core client for 30 sec - exiting CPDN Monitor - No 'heartbeat' from BOINC... No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting No heartbeat from core client for 30 sec - exiting CPDN process is not running, exiting, bRetVal = 1, checkPID=4088, selfPID=4088, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=6704, selfPID=6704, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=7872, selfPID=7872, iMonCtr=1 CPDN Monitor - Quit request from BOINC... CPDN process is not running, exiting, bRetVal = 1, checkPID=7900, selfPID=7900, iMonCtr=1 MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. MainError: 06:56:22 PM No files match the supplied pattern. CPDN Monitor - Quit request from BOINC... forrtl: Access is denied. CPDN process is not running, exiting, bRetVal = 1, checkPID=0, selfPID=1488, iMonCtr=1 Model crash detected, will try to restart... forrtl: Access is denied. CPDN process is not running, exiting, bRetVal = 1, checkPID=0, selfPID=1488, iMonCtr=1 Model crash detected, will try to restart... forrtl: Access is denied. CPDN process is not running, exiting, bRetVal = 1, checkPID=0, selfPID=1488, iMonCtr=1 Model crash detected, will try to restart... forrtl: Access is denied. CPDN process is not running, exiting, bRetVal = 1, checkPID=0, selfPID=1488, iMonCtr=1 Model crash detected, will try to restart... forrtl: Access is denied. CPDN process is not running, exiting, bRetVal = 1, checkPID=0, selfPID=1488, iMonCtr=1 Model crash detected, will try to restart... forrtl: Access is denied. CPDN process is not running, exiting, bRetVal = 1, checkPID=0, selfPID=1488, iMonCtr=1 Model crash detected, will try to restart... Sorry, too many model crashes! :-( called boinc_finish </stderr_txt> ]]> |
Latest Trickles Received | ||||||
---|---|---|---|---|---|---|
Time Sent (UTC) | Host ID | Result ID | Result Name | Timestep | CPU Time (sec) | Average (sec/TS) |
16 Oct 2010 21:44:20 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 10,802 | 257,839 | 0.9548 |
16 Oct 2010 19:00:14 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 259,248 | 247,869 | 0.9561 |
16 Oct 2010 16:03:08 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 248,446 | 237,920 | 0.9576 |
16 Oct 2010 10:23:40 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 237,644 | 228,006 | 0.9594 |
16 Oct 2010 07:21:21 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 226,842 | 217,761 | 0.9600 |
16 Oct 2010 04:09:15 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 216,040 | 206,579 | 0.9562 |
15 Oct 2010 09:36:15 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 205,238 | 196,474 | 0.9573 |
15 Oct 2010 06:30:48 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 194,436 | 186,298 | 0.9581 |
15 Oct 2010 02:54:28 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 183,634 | 176,007 | 0.9585 |
14 Oct 2010 12:42:28 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 172,832 | 165,812 | 0.9594 |
14 Oct 2010 06:51:38 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 162,030 | 155,520 | 0.9598 |
14 Oct 2010 03:41:02 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 151,228 | 144,985 | 0.9587 |
13 Oct 2010 19:45:49 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 140,426 | 134,543 | 0.9581 |
13 Oct 2010 06:24:44 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 129,624 | 124,277 | 0.9587 |
13 Oct 2010 03:15:31 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 118,822 | 113,472 | 0.9550 |
12 Oct 2010 23:47:11 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 108,020 | 101,742 | 0.9419 |
12 Oct 2010 20:53:04 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 97,218 | 91,516 | 0.9413 |
12 Oct 2010 18:00:09 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 86,416 | 81,404 | 0.9420 |
12 Oct 2010 14:26:10 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 75,614 | 71,257 | 0.9424 |
12 Oct 2010 06:18:42 | 948401 | 11002717 | hadsm3dhet2_jo01_006594099_0 | 64,812 | 61,204 | 0.9443 |
©2024 cpdn.org