Name | iF1NDmkZBavnShfckohDCDFpABFKDmABFKDmTuvUDmABFKDm5kynTm_1 |
Workunit | 1943037 |
Created | 4 Oct 2019, 8:03:22 UTC |
Sent | 7 Oct 2019, 10:14:11 UTC |
Report deadline | 14 Oct 2019, 10:14:11 UTC |
Received | 8 Oct 2019, 7:46:59 UTC |
Server state | Over |
Outcome | Success |
Client state | Done |
Exit status | 0 (0x00000000) |
Computer ID | 3682 |
Run time | 5 hours 47 min 34 sec |
CPU time | 22 hours 48 min 4 sec |
Validate state | Valid |
Credit | 860.51 |
Device peak FLOPS | 17.83 GFLOPS |
Application version | ATLAS Simulation v0.74 (native_mt) x86_64-pc-linux-gnu |
Peak working set size | 1.80 GB |
Peak swap size | 2.58 GB |
Peak disk usage | 650.86 MB |
<core_client_version>7.16.1</core_client_version> <![CDATA[ <stderr_txt> 03:59:15 (399207): wrapper (7.7.26015): starting 03:59:15 (399207): wrapper: running run_atlas (--nthreads 4) 2019-10-08 03:59:15,509: singularity image is /cvmfs/atlas.cern.ch/repo/containers/images/singularity/x86_64-centos7.img 2019-10-08 03:59:15,509: sys.argv = ['run_atlas', '--nthreads', '4'] 2019-10-08 03:59:15,510: THREADS=4 2019-10-08 03:59:15,510: Checking for CVMFS 2019-10-08 03:59:16,179: CVMFS is installed 2019-10-08 03:59:16,179: Checking Singularity... 2019-10-08 03:59:16,203: Singularity is installed, version singularity version 3.4.0-1.2.el7 2019-10-08 03:59:16,203: Testing the function of Singularity... 2019-10-08 03:59:16,203: Checking singularity with cmd:singularity exec -B /cvmfs /cvmfs/atlas.cern.ch/repo/containers/images/singularity/x86_64-centos7.img hostname 2019-10-08 03:59:16,299: Singularity Works... 2019-10-08 03:59:16,299: copy /home/dcameron/boinc/slots/1/shared/ATLAS.root_0 2019-10-08 03:59:16,738: copy /home/dcameron/boinc/slots/1/shared/input.tar.gz 2019-10-08 03:59:16,738: copy /home/dcameron/boinc/slots/1/shared/RTE.tar.gz 2019-10-08 03:59:16,738: copy /home/dcameron/boinc/slots/1/shared/start_atlas.sh 2019-10-08 03:59:16,738: export ATHENA_PROC_NUMBER=4; 2019-10-08 03:59:16,750: start atlas job with PandaID=4495528160 2019-10-08 03:59:16,751: cmd = singularity exec --pwd /home/dcameron/boinc/slots/1 -B /cvmfs,/home /cvmfs/atlas.cern.ch/repo/containers/images/singularity/x86_64-centos7.img sh start_atlas.sh > runtime_log 2> runtime_log.err 2019-10-08 09:46:46,375: running cmd return value is 0 2019-10-08 09:46:46,376: Moving ./HITS.19056367._006186.pool.root.1 to shared/HITS.pool.root.1 2019-10-08 09:46:46,376: HITS result file: 2019-10-08 09:46:46,381: -rw-------. 1 dcameron zp 242345156 Oct 8 09:45 shared/HITS.pool.root.1 2019-10-08 09:46:46,382: *****************The last 200 lines of the pilot log****************** 2019-10-08 09:46:46,385: "wallTime": 1 }, "total": { "cpuTime": 46, "wallTime": 78 }, "validation": { "cpuTime": 0, "wallTime": 0 }, "wallTime": 76 } }, "machine": { "cpu_family": "6", "linux_distribution": [ "CentOS Linux", "7.6.1810", "Core" ], "model": "60", "model_name": "Intel(R) Core(TM) i7-4790 CPU @ 3.60GHz", "node": "pcoslo5.cern.ch", "platform": "Linux-3.10.0-1062.1.1.el7.x86_64-x86_64-with-centos-7.6.1810-Core" }, "transform": { "cpuEfficiency": 0.9871, "cpuPWEfficiency": 0.9889, "cpuTime": 5, "cpuTimeTotal": 82095, "externalCpuTime": 174, "processedEvents": 200, "trfPredata": null, "wallTime": 20738 } } } 2019-10-08 07:45:42,909 | DEBUG | queue_monitor | pilot.util.auxiliary.4495528160 | update_server | xml:will send fileinfo 2019-10-08 07:45:42,909 | INFO | queue_monitor | pilot.control.job.4495528160 | send_state | pilot will not update the server (heartbeat message will be written to file) 2019-10-08 07:45:42,909 | INFO | queue_monitor | pilot.control.job.4495528160 | send_state | job 4495528160 has finished - writing final server update 2019-10-08 07:45:42,911 | WARNING | queue_monitor | pilot.api.analytics | get_fitted_data | wrong length of table data, x=[1570499986.0, 1570500047.0, 1570500108.0, 1570500169.0, 1570500230.0, 1570500291.0, 1570500352.0, 1570500413.0, 1570500474.0, 1570500535.0, 1570500596.0, 1570500657.0, 1570500718.0, 1570500779.0, 1570500840.0, 1570500901.0, 1570500962.0, 1570501023.0, 1570501084.0, 1570501145.0, 1570501206.0, 1570501267.0, 1570501328.0, 1570501389.0, 1570501450.0, 1570501511.0, 1570501572.0, 1570501633.0, 1570501694.0, 1570501755.0, 1570501816.0, 1570501877.0, 1570501938.0, 1570501999.0, 1570502060.0, 1570502121.0, 1570502182.0, 1570502243.0, 1570502304.0, 1570502365.0, 1570502426.0, 1570502487.0, 1570502548.0, 1570502609.0, 1570502670.0, 1570502731.0, 1570502792.0, 1570502853.0, 1570502914.0, 1570502975.0, 1570503036.0, 1570503097.0, 1570503158.0, 1570503219.0, 1570503280.0, 1570503341.0, 1570503402.0, 1570503463.0, 1570503524.0, 1570503585.0, 1570503646.0, 1570503707.0, 1570503768.0, 1570503829.0, 1570503890.0, 1570503951.0, 1570504012.0, 1570504073.0, 1570504134.0, 1570504195.0, 1570504256.0, 1570504317.0, 1570504378.0, 1570504439.0, 1570504500.0, 1570504561.0, 1570504622.0, 1570504683.0, 1570504744.0, 1570504805.0, 1570504866.0, 1570504927.0, 1570504988.0, 1570505049.0, 1570505110.0, 1570505171.0, 1570505232.0, 1570505293.0, 1570505354.0, 1570505415.0, 1570505476.0, 1570505537.0, 1570505598.0, 1570505659.0, 1570505720.0, 1570505781.0, 1570505842.0, 1570505903.0, 1570505964.0, 1570506025.0, 1570506086.0, 1570506147.0, 1570506208.0, 1570506269.0, 1570506330.0, 1570506391.0, 1570506452.0, 1570506513.0, 1570506574.0, 1570506635.0, 1570506696.0, 1570506757.0, 1570506818.0, 1570506879.0, 1570506940.0, 1570507001.0, 1570507062.0, 1570507123.0, 1570507184.0, 1570507245.0, 1570507306.0, 1570507367.0, 1570507428.0, 1570507489.0, 1570507550.0, 1570507611.0, 1570507672.0, 1570507733.0, 1570507794.0, 1570507855.0, 1570507916.0, 1570507977.0, 1570508038.0, 1570508099.0, 1570508160.0, 1570508221.0, 1570508282.0, 1570508343.0, 1570508404.0, 1570508465.0, 1570508526.0, 1570508587.0, 1570508648.0, 1570508709.0, 1570508770.0, 1570508831.0, 1570508892.0, 1570508953.0, 1570509014.0, 1570509075.0, 1570509136.0, 1570509197.0, 1570509258.0, 1570509319.0, 1570509380.0, 1570509441.0, 1570509502.0, 1570509563.0, 1570509624.0, 1570509685.0, 1570509746.0, 1570509807.0, 1570509868.0, 1570509929.0, 1570509990.0, 1570510051.0, 1570510112.0, 1570510173.0, 1570510234.0, 1570510295.0, 1570510356.0, 1570510417.0, 1570510478.0, 1570510539.0, 1570510600.0, 1570510661.0, 1570510722.0, 1570510783.0, 1570510844.0, 1570510905.0, 1570510966.0, 1570511027.0, 1570511088.0, 1570511149.0, 1570511210.0, 1570511271.0, 1570511332.0, 1570511393.0, 1570511454.0, 1570511515.0, 1570511576.0, 1570511637.0, 1570511698.0, 1570511759.0, 1570511820.0, 1570511881.0, 1570511942.0, 1570512003.0, 1570512064.0, 1570512125.0, 1570512186.0, 1570512247.0, 1570512308.0, 1570512369.0, 1570512430.0, 1570512491.0, 1570512552.0, 1570512613.0, 1570512674.0, 1570512735.0, 1570512796.0, 1570512857.0, 1570512918.0, 1570512979.0, 1570513040.0, 1570513101.0, 1570513162.0, 1570513223.0, 1570513284.0, 1570513345.0, 1570513406.0, 1570513467.0, 1570513528.0, 1570513589.0, 1570513650.0, 1570513711.0, 1570513772.0, 1570513833.0, 1570513894.0, 1570513955.0, 1570514016.0, 1570514077.0, 1570514138.0, 1570514199.0, 1570514260.0, 1570514321.0, 1570514382.0, 1570514443.0, 1570514504.0, 1570514565.0, 1570514626.0, 1570514687.0, 1570514748.0, 1570514809.0, 1570514870.0, 1570514931.0, 1570514992.0, 1570515053.0, 1570515114.0, 1570515175.0, 1570515236.0, 1570515297.0, 1570515358.0, 1570515419.0, 1570515480.0, 1570515541.0, 1570515602.0, 1570515663.0, 1570515724.0, 1570515785.0, 1570515846.0, 1570515907.0, 1570515968.0, 1570516029.0, 1570516090.0, 1570516151.0, 1570516212.0, 1570516273.0, 1570516334.0, 1570516395.0, 1570516456.0, 1570516517.0, 1570516578.0, 1570516639.0, 1570516700.0, 1570516761.0, 1570516822.0, 1570516883.0, 1570516944.0, 1570517005.0, 1570517066.0, 1570517127.0, 1570517188.0, 1570517249.0, 1570517310.0, 1570517371.0, 1570517432.0, 1570517493.0, 1570517554.0, 1570517615.0, 1570517676.0, 1570517737.0, 1570517798.0, 1570517859.0, 1570517920.0, 1570517981.0, 1570518042.0, 1570518103.0, 1570518164.0, 1570518225.0, 1570518286.0, 1570518347.0, 1570518408.0, 1570518469.0, 1570518530.0, 1570518591.0, 1570518652.0, 1570518713.0, 1570518774.0, 1570518835.0, 1570518896.0, 1570518957.0, 1570519018.0, 1570519079.0, 1570519140.0, 1570519201.0, 1570519262.0, 1570519323.0, 1570519384.0, 1570519445.0, 1570519506.0, 1570519567.0, 1570519628.0, 1570519689.0, 1570519750.0, 1570519811.0, 1570519872.0, 1570519933.0, 1570519994.0, 1570520055.0, 1570520116.0, 1570520177.0, 1570520238.0, 1570520299.0, 1570520360.0, 1570520421.0, 1570520482.0, 1570520543.0, 1570520604.0, 1570520665.0, 1570520726.0], y=[] (must be same and length>=2) 2019-10-08 07:45:42,911 | DEBUG | queue_monitor | pilot.util.auxiliary.4495528160 | get_job_metrics | job metrics="coreCount=4 actualCoreCount=4 nEvents=200 workDirSize=48997467" 2019-10-08 07:45:42,911 | INFO | queue_monitor | pilot.control.job.4495528160 | get_data_structure | total number of processed events: 200 (read) 2019-10-08 07:45:42,912 | INFO | queue_monitor | pilot.user.atlas.utilities | get_memory_values | using path: /home/dcameron/boinc/slots/1/PanDA_Pilot-4495528160/memory_monitor_summary.json (trf name=prmon) 2019-10-08 07:45:42,912 | DEBUG | queue_monitor | pilot.user.atlas.utilities | get_memory_monitor_info | summary_dictionary={'Max': {'rx_packets': 894184, 'nprocs': 12, 'nthreads': 1, 'rx_bytes': 1154033721, 'wtime': 20745, 'rss': 9412332, 'write_bytes': 0, 'vmem': 14141832, 'read_bytes': 0, 'stime': 164, 'tx_bytes': 916530194, 'pss': 2699830, 'wchar': 0, 'rchar': 0, 'tx_packets': 573333, 'swap': 0, 'utime': 82722}, 'Avg': {'write_bytes': 0, 'nprocs': 8, 'nthreads': 0, 'rx_bytes': 55627, 'rx_packets': 43, 'vmem': 13874811, 'read_bytes': 0, 'swap': 0, 'tx_bytes': 44179, 'pss': 2597040, 'wchar': 0, 'rchar': 0, 'tx_packets': 27, 'rss': 9223178}} 2019-10-08 07:45:42,912 | INFO | queue_monitor | pilot.user.atlas.utilities | get_memory_monitor_info | extracted standard info from prmon json 2019-10-08 07:45:42,912 | INFO | queue_monitor | pilot.user.atlas.utilities | get_memory_monitor_info | extracted standard memory fields from prmon json 2019-10-08 07:45:42,912 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | .............................. 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . Timing measurements: 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . get job = 0 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . initial setup = 0 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . payload setup = 0 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . total setup = 0 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . stage-in = 0 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . payload execution = 20757 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . stage-out = 1 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | .............................. 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | get_log_extracts | building log extracts (sent to the server as 'pilotLog') 2019-10-08 07:45:42,913 | DEBUG | queue_monitor | pilot.util.auxiliary.4495528160 | get_panda_tracer_log | PanDA tracer log does not exist: /home/dcameron/boinc/slots/1/PanDA_Pilot-4495528160/pandatracerlog.txt (ignoring) 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.container | execute | executing command: tail -n 20 /home/dcameron/boinc/slots/1/PanDA_Pilot-4495528160/pilotlog.txt 2019-10-08 07:45:42,924 | WARNING | queue_monitor | pilot.util.auxiliary.4495528160 | get_log_extracts | detected the following tail of warning/fatal messages in the pilot log: - Log from pilotlog.txt -2019-10-08 07:45:42,911 | WARNING | queue_monitor | pilot.api.analytics | get_fitted_data | wrong length of table data, x=[1570499986.0, 1570500047.0, 1570500108.0, 1570500169.0, 1570500230.0, 1570500291.0, 1570500352.0, 1570500413.0, 1570500474.0, 1570500535.0, 1570500596.0, 1570500657.0, 1570500718.0, 1570500779.0, 1570500840.0, 1570500901.0, 1570500962.0, 1570501023.0, 1570501084.0, 1570501145.0, 1570501206.0, 1570501267.0, 1570501328.0, 1570501389.0, 1570501450.0, 1570501511.0, 1570501572.0, 1570501633.0, 1570501694.0, 1570501755.0, 1570501816.0, 1570501877.0, 1570501938.0, 1570501999.0, 1570502060.0, 1570502121.0, 1570502182.0, 1570502243.0, 1570502304.0, 1570502365.0, 1570502426.0, 1570502487.0, 1570502548.0, 1570502609.0, 1570502670.0, 1570502731.0, 1570502792.0, 1570502853.0, 1570502914.0, 1570502975.0, 1570503036.0, 1570503097.0, 1570503158.0, 1570503219.0, 1570503280.0, 1570503341.0, 1570503402.0, 1570503463.0, 1570503524.0, 1570503585.0, 1570503646.0, 1570503707.0, 1570503768.0, 1570503829.0, 1570503890.0, 1570503951.0, 1570504012.0, 1570504073.0, 1570504134.0, 1570504195.0, 1570504256.0, 1570504317.0, 1570504378.0, 1570504439.0, 1570504500.0, 1570504561.0, 1570504622.0, 1570504683.0, 1570504744.0, 1570504805.0, 1570504866.0, 1570504927.0, 1570504988.0, 1570505049.0, 1570505110.0, 1570505171.0, 1570505232.0, 1570505293.0, 1570505354.0, 1570505415.0, 1570505476.0, 1570505537.0, 1570505598.0, 1570505659.0, 1570505720.0, 1570505781.0, 1570505842.0, 1570505903.0, 1570505964.0, 1570506025.0, 1570506086.0, 1570506147.0, 1570506208.0, 1570506269.0, 1570506330.0, 1570506391.0, 1570506452.0, 1570506513.0, 1570506574.0, 1570506635.0, 1570506696.0, 1570506757.0, 1570506818.0, 1570506879.0, 1570506940.0, 1570507001.0, 1570507062.0, 1570507123.0, 1570507184.0, 1570507245.0, 1570507306.0, 1570507367.0, 1570507428.0, 1570507489.0, 1570507550.0, 1570507611.0, 1570507672.0, 1570507733.0, 1570507794.0, 1570507855.0, 1570507916.0, 1570507977.0, 1570508038.0, 1570508099.0, 1570508160.0, 1570508221.0, 1570508282.0, 1570508343.0, 1570508404.0, 1570508465.0, 1570508526.0, 1570508587.0, 1570508648.0, 1570508709.0, 1570508770.0, 1570508831.0, 1570508892.0, 1570508953.0, 1570509014.0, 1570509075.0, 1570509136.0, 1570509197.0, 1570509258.0, 1570509319.0, 1570509380.0, 1570509441.0, 1570509502.0, 1570509563.0, 1570509624.0, 1570509685.0, 1570509746.0, 1570509807.0, 1570509868.0, 1570509929.0, 1570509990.0, 1570510051.0, 1570510112.0, 1570510173.0, 1570510234.0, 1570510295.0, 1570510356.0, 1570510417.0, 1570510478.0, 1570510539.0, 1570510600.0, 1570510661.0, 1570510722.0, 1570510783.0, 1570510844.0, 1570510905.0, 1570510966.0, 1570511027.0, 1570511088.0, 1570511149.0, 1570511210.0, 1570511271.0, 1570511332.0, 1570511393.0, 1570511454.0, 1570511515.0, 1570511576.0, 1570511637.0, 1570511698.0, 1570511759.0, 1570511820.0, 1570511881.0, 1570511942.0, 1570512003.0, 1570512064.0, 1570512125.0, 1570512186.0, 1570512247.0, 1570512308.0, 1570512369.0, 1570512430.0, 1570512491.0, 1570512552.0, 1570512613.0, 1570512674.0, 1570512735.0, 1570512796.0, 1570512857.0, 1570512918.0, 1570512979.0, 1570513040.0, 1570513101.0, 1570513162.0, 1570513223.0, 1570513284.0, 1570513345.0, 1570513406.0, 1570513467.0, 1570513528.0, 1570513589.0, 1570513650.0, 1570513711.0, 1570513772.0, 1570513833.0, 1570513894.0, 1570513955.0, 1570514016.0, 1570514077.0, 1570514138.0, 1570514199.0, 1570514260.0, 1570514321.0, 1570514382.0, 1570514443.0, 1570514504.0, 1570514565.0, 1570514626.0, 1570514687.0, 1570514748.0, 1570514809.0, 1570514870.0, 1570514931.0, 1570514992.0, 1570515053.0, 1570515114.0, 1570515175.0, 1570515236.0, 1570515297.0, 1570515358.0, 1570515419.0, 1570515480.0, 1570515541.0, 1570515602.0, 1570515663.0, 1570515724.0, 1570515785.0, 1570515846.0, 1570515907.0, 1570515968.0, 1570516029.0, 1570516090.0, 1570516151.0, 1570516212.0, 1570516273.0, 1570516334.0, 1570516395.0, 1570516456.0, 1570516517.0, 1570516578.0, 1570516639.0, 1570516700.0, 1570516761.0, 1570516822.0, 1570516883.0, 1570516944.0, 1570517005.0, 1570517066.0, 1570517127.0, 1570517188.0, 1570517249.0, 1570517310.0, 1570517371.0, 1570517432.0, 1570517493.0, 1570517554.0, 1570517615.0, 1570517676.0, 1570517737.0, 1570517798.0, 1570517859.0, 1570517920.0, 1570517981.0, 1570518042.0, 1570518103.0, 1570518164.0, 1570518225.0, 1570518286.0, 1570518347.0, 1570518408.0, 1570518469.0, 1570518530.0, 1570518591.0, 1570518652.0, 1570518713.0, 1570518774.0, 1570518835.0, 1570518896.0, 1570518957.0, 1570519018.0, 1570519079.0, 1570519140.0, 1570519201.0, 1570519262.0, 1570519323.0, 1570519384.0, 1570519445.0, 1570519506.0, 1570519567.0, 1570519628.0, 1570519689.0, 1570519750.0, 1570519811.0, 1570519872.0, 1570519933.0, 1570519994.0, 1570520055.0, 1570520116.0, 1570520177.0, 1570520238.0, 1570520299.0, 1570520360.0, 1570520421.0, 1570520482.0, 1570520543.0, 1570520604.0, 1570520665.0, 1570520726.0], y=[] (must be same and length>=2) 2019-10-08 07:45:42,911 | DEBUG | queue_monitor | pilot.util.auxiliary.4495528160 | get_job_metrics | job metrics="coreCount=4 actualCoreCount=4 nEvents=200 workDirSize=48997467" 2019-10-08 07:45:42,911 | INFO | queue_monitor | pilot.control.job.4495528160 | get_data_structure | total number of processed events: 200 (read) 2019-10-08 07:45:42,912 | INFO | queue_monitor | pilot.user.atlas.utilities | get_memory_values | using path: /home/dcameron/boinc/slots/1/PanDA_Pilot-4495528160/memory_monitor_summary.json (trf name=prmon) 2019-10-08 07:45:42,912 | DEBUG | queue_monitor | pilot.user.atlas.utilities | get_memory_monitor_info | summary_dictionary={'Max': {'rx_packets': 894184, 'nprocs': 12, 'nthreads': 1, 'rx_bytes': 1154033721, 'wtime': 20745, 'rss': 9412332, 'write_bytes': 0, 'vmem': 14141832, 'read_bytes': 0, 'stime': 164, 'tx_bytes': 916530194, 'pss': 2699830, 'wchar': 0, 'rchar': 0, 'tx_packets': 573333, 'swap': 0, 'utime': 82722}, 'Avg': {'write_bytes': 0, 'nprocs': 8, 'nthreads': 0, 'rx_bytes': 55627, 'rx_packets': 43, 'vmem': 13874811, 'read_bytes': 0, 'swap': 0, 'tx_bytes': 44179, 'pss': 2597040, 'wchar': 0, 'rchar': 0, 'tx_packets': 27, 'rss': 9223178}} 2019-10-08 07:45:42,912 | INFO | queue_monitor | pilot.user.atlas.utilities | get_memory_monitor_info | extracted standard info from prmon json 2019-10-08 07:45:42,912 | INFO | queue_monitor | pilot.user.atlas.utilities | get_memory_monitor_info | extracted standard memory fields from prmon json 2019-10-08 07:45:42,912 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | .............................. 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . Timing measurements: 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . get job = 0 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . initial setup = 0 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . payload setup = 0 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . total setup = 0 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . stage-in = 0 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . payload execution = 20757 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | . stage-out = 1 s 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | timing_report | .............................. 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.auxiliary.4495528160 | get_log_extracts | building log extracts (sent to the server as 'pilotLog') 2019-10-08 07:45:42,913 | DEBUG | queue_monitor | pilot.util.auxiliary.4495528160 | get_panda_tracer_log | PanDA tracer log does not exist: /home/dcameron/boinc/slots/1/PanDA_Pilot-4495528160/pandatracerlog.txt (ignoring) 2019-10-08 07:45:42,913 | INFO | queue_monitor | pilot.util.container | execute | executing command: tail -n 20 /home/dcameron/boinc/slots/1/PanDA_Pilot-4495528160/pilotlog.txt 2019-10-08 07:45:42,925 | DEBUG | queue_monitor | pilot.control.job.4495528160 | send_state | wrote heartbeat to file /home/dcameron/boinc/slots/1/heartbeat.json 2019-10-08 07:45:42,925 | INFO | queue_monitor | pilot.control.job | queue_monitor | job 4495528160 was dequeued from the monitored payloads queue 2019-10-08 07:45:43,522 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | 2019-10-08 07:45:43,522 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | job summary report 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | -------------------------------------------------- 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | PanDA job id: 4495528160 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | task id: 19056367 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | errors: (none) 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | status: LOG_TRANSFER = DONE 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | pilot state: finished 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | transexitcode: 0 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | exeerrorcode: 0 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | exeerrordiag: 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | exitcode: 0 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | exitmsg: OK 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | cpuconsumptiontime: 82421 s 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | nevents: 200 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | neventsw: 0 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | pid: 406113 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | pgrp: 406113 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | corecount: 4 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | event service: False 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | -------------------------------------------------- 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.util.auxiliary.4495528160 | make_job_report | 2019-10-08 07:45:43,523 | INFO | retrieve | pilot.control.job.4495528160 | has_job_completed | job 4495528160 has completed 2019-10-08 07:45:43,524 | INFO | retrieve | pilot.util.processes | cleanup | overall cleanup function is called 2019-10-08 07:45:43,527 | DEBUG | retrieve | pilot.util.processes | cleanup | work directory was removed: /home/dcameron/boinc/slots/1/PanDA_Pilot-4495528160 2019-10-08 07:45:44,532 | INFO | retrieve | pilot.info.jobdata | collect_zombies | --- collectZombieJob: --- 10, [406113] 2019-10-08 07:45:44,532 | INFO | retrieve | pilot.info.jobdata | collect_zombies | zombie collector trying to kill pid 406113 2019-10-08 07:45:44,532 | INFO | retrieve | pilot.info.jobdata | collect_zombies | harmless exception when collecting zombies: [Errno 10] No child processes 2019-10-08 07:45:44,616 | WARNING | job_monitor | pilot.control.job | check_job_monitor_waiting_time | no jobs in monitored_payloads queue (waited for 72 s) 2019-10-08 07:45:45,536 | INFO | retrieve | pilot.util.processes | cleanup | collected zombie processes 2019-10-08 07:45:45,536 | INFO | retrieve | pilot.util.processes | cleanup | will now attempt to kill all subprocesses of pid=406113 2019-10-08 07:45:45,605 | INFO | retrieve | pilot.util.processes | kill_processes | process IDs to be killed: [406113] (in reverse order) 2019-10-08 07:45:45,638 | WARNING | retrieve | pilot.util.processes | kill_processes | found no corresponding commands to process id(s) 2019-10-08 07:45:45,638 | INFO | retrieve | pilot.util.processes | kill_orphans | Do not look for orphan processes in BOINC jobs 2019-10-08 07:45:45,638 | INFO | retrieve | pilot.control.job | retrieve | ready for new job 2019-10-08 07:45:45,638 | INFO | retrieve | root | retrieve | pilot has finished for previous job - re-establishing logging No handlers could be found for logger "pilot.util.mpi" 2019-10-08 07:45:45,640 | INFO | retrieve | pilot.util.auxiliary | pilot_version_banner | ***************************************** 2019-10-08 07:45:45,640 | INFO | retrieve | pilot.util.auxiliary | pilot_version_banner | *** PanDA Pilot version 2.1.25 (11) *** 2019-10-08 07:45:45,640 | INFO | retrieve | pilot.util.auxiliary | pilot_version_banner | ***************************************** 2019-10-08 07:45:45,640 | INFO | retrieve | pilot.util.auxiliary | pilot_version_banner | 2019-10-08 07:45:45,641 | INFO | retrieve | pilot.util.auxiliary | display_architecture_info | architecture information: 2019-10-08 07:45:45,676 | INFO | retrieve | pilot.util.auxiliary | display_architecture_info | LSB Version: :core-4.1-amd64:core-4.1-noarch Distributor ID: CentOS Description: CentOS Linux release 7.6.1810 (Core) Release: 7.6.1810 Codename: Core 2019-10-08 07:45:45,677 | INFO | retrieve | pilot.util.auxiliary | pilot_version_banner | ***************************************** 2019-10-08 07:45:46,179 | DEBUG | retrieve | pilot.util.monitoring | check_local_space | checking local space on /home/dcameron/boinc/slots/1 2019-10-08 07:45:46,191 | INFO | retrieve | pilot.util.monitoring | check_local_space | sufficient remaining disk space (70701285376 B) 2019-10-08 07:45:46,191 | WARNING | retrieve | pilot.control.job | proceed_with_getjob | since timefloor is set to 0, pilot was only allowed to run one job 2019-10-08 07:45:46,191 | DEBUG | retrieve | pilot.control.job | retrieve | [job] retrieve thread has finished 2019-10-08 07:45:46,211 | DEBUG | create_data_payload | pilot.control.job | create_data_payload | [job] create_data_payload thread has finished 2019-10-08 07:45:46,212 | INFO | validate_pre | pilot.control.payload | validate_pre | [payload] validate_pre thread has finished 2019-10-08 07:45:46,212 | DEBUG | copytool_in | pilot.control.data | copytool_in | [data] copytool_in thread has finished 2019-10-08 07:45:46,220 | WARNING | copytool_out | pilot.util.common | should_abort | data:copytool_out:received graceful stop - abort after this iteration 2019-10-08 07:45:46,234 | INFO | monitor | pilot.control.monitor | control | [monitor] control thread has ended 2019-10-08 07:45:46,497 | INFO | execute_payloads | pilot.control.payload | execute_payloads | [payload] execute_payloads thread has finished 2019-10-08 07:45:46,509 | DEBUG | validate | pilot.control.job | validate | [job] validate thread has finished 2019-10-08 07:45:46,532 | DEBUG | MainThread | pilot.workflow.generic | run | thread count now at 10 threads 2019-10-08 07:45:46,532 | DEBUG | MainThread | pilot.workflow.generic | run | enumerate: [<_MainThread(MainThread, started 140087538149184)>, <ExcThread(job, started 140087376516864)>, <ExcThread(job_monitor, started 140086523979520)>, <ExcThread(payload, started 140087136352000)>, <ExcThread(validate_post, started 140087085995776)>, <ExcThread(failed_post, started 140086515586816)>, <ExcThread(queue_monitor, started 140086507194112)>, <ExcThread(queue_monitoring, started 140087119566592)>, <ExcThread(data, started 140087359731456)>, <ExcThread(copytool_out, started 140087127959296)>] 2019-10-08 07:45:47,036 | DEBUG | data | pilot.control.data | control | data control ending since graceful_stop has been set 2019-10-08 07:45:47,036 | DEBUG | data | pilot.control.data | control | [data] control thread has finished 2019-10-08 07:45:47,221 | DEBUG | copytool_out | pilot.control.data | copytool_out | [data] copytool_out thread has finished 2019-10-08 07:45:47,234 | DEBUG | MainThread | pilot.workflow.generic | run | thread count now at 8 threads 2019-10-08 07:45:47,235 | DEBUG | MainThread | pilot.workflow.generic | run | enumerate: [<_MainThread(MainThread, started 140087538149184)>, <ExcThread(job, started 140087376516864)>, <ExcThread(job_monitor, started 140086523979520)>, <ExcThread(payload, started 140087136352000)>, <ExcThread(validate_post, started 140087085995776)>, <ExcThread(failed_post, started 140086515586816)>, <ExcThread(queue_monitor, started 140086507194112)>, <ExcThread(queue_monitoring, started 140087119566592)>] 2019-10-08 07:45:47,252 | DEBUG | payload | pilot.control.payload | control | payload control ending since graceful_stop has been set 2019-10-08 07:45:47,252 | DEBUG | payload | pilot.control.payload | control | [payload] control thread has finished 2019-10-08 07:45:47,291 | WARNING | queue_monitor | pilot.util.common | should_abort | job:queue_monitor:received graceful stop - abort after this iteration 2019-10-08 07:45:47,291 | DEBUG | queue_monitor | pilot.control.job | queue_monitor | [job] queue monitor thread has finished 2019-10-08 07:45:47,362 | WARNING | queue_monitoring | pilot.util.common | should_abort | data:queue_monitoring:received graceful stop - abort after this iteration 2019-10-08 07:45:47,435 | DEBUG | MainThread | pilot.workflow.generic | run | thread count now at 6 threads 2019-10-08 07:45:47,435 | DEBUG | MainThread | pilot.workflow.generic | run | enumerate: [<_MainThread(MainThread, started 140087538149184)>, <ExcThread(job, started 140087376516864)>, <ExcThread(job_monitor, started 140086523979520)>, <ExcThread(validate_post, started 140087085995776)>, <ExcThread(failed_post, started 140086515586816)>, <ExcThread(queue_monitoring, started 140087119566592)>] 2019-10-08 07:45:47,484 | DEBUG | job | pilot.control.job | control | job control ending since graceful_stop has been set 2019-10-08 07:45:47,484 | DEBUG | job | pilot.control.job | control | [job] control thread has finished 2019-10-08 07:45:47,520 | INFO | validate_post | pilot.control.payload | validate_post | [payload] validate_post thread has finished 2019-10-08 07:45:47,536 | DEBUG | MainThread | pilot.workflow.generic | run | thread count now at 4 threads 2019-10-08 07:45:47,536 | DEBUG | MainThread | pilot.workflow.generic | run | enumerate: [<_MainThread(MainThread, started 140087538149184)>, <ExcThread(job_monitor, started 140086523979520)>, <ExcThread(failed_post, started 140086515586816)>, <ExcThread(queue_monitoring, started 140087119566592)>] 2019-10-08 07:45:47,591 | INFO | failed_post | pilot.control.payload | failed_post | [payload] failed_post thread has finished 2019-10-08 07:45:47,636 | DEBUG | MainThread | pilot.workflow.generic | run | thread count now at 3 threads 2019-10-08 07:45:47,637 | DEBUG | MainThread | pilot.workflow.generic | run | enumerate: [<_MainThread(MainThread, started 140087538149184)>, <ExcThread(job_monitor, started 140086523979520)>, <ExcThread(queue_monitoring, started 140087119566592)>] 2019-10-08 07:45:50,363 | DEBUG | queue_monitoring | pilot.control.data | queue_monitoring | [data] queue_monitor thread has finished 2019-10-08 07:45:50,454 | DEBUG | MainThread | pilot.workflow.generic | run | thread count now at 2 threads 2019-10-08 07:45:50,454 | DEBUG | MainThread | pilot.workflow.generic | run | enumerate: [<_MainThread(MainThread, started 140087538149184)>, <ExcThread(job_monitor, started 140086523979520)>] 2019-10-08 07:46:46,192 | WARNING | job_monitor | pilot.control.job | check_job_monitor_waiting_time | no jobs in monitored_payloads queue (waited for 134 s) 2019-10-08 07:46:46,192 | DEBUG | job_monitor | pilot.control.job | job_monitor | [job] job monitor thread has finished 2019-10-08 07:46:46,211 | INFO | MainThread | pilot.workflow.generic | run | end of generic workflow (traces error code: 0) 2019-10-08 07:46:46,212 | INFO | MainThread | root | wrap_up | traces error code: 0 2019-10-08 07:46:46,212 | INFO | MainThread | root | wrap_up | pilot has finished 2019-10-08 07:46:46 UTC [wrapper] ==== pilot stdout END ==== 2019-10-08 07:46:46 UTC [wrapper] ==== wrapper stdout RESUME ==== 2019-10-08 07:46:46 UTC [wrapper] Pilot exit status: 0 2019-10-08 07:46:46 UTC [wrapper] STATUSCODE: 0 2019-10-08 07:46:46 UTC [wrapper] apfmon messages muted ---- find pandaIDs.out ---- total 56 -rw-------. 1 dcameron zp 11357 Jul 25 16:38 LICENSE -rw-------. 1 dcameron zp 20 Sep 9 13:04 MANIFEST.IN -rw-------. 1 dcameron zp 11 Oct 8 03:59 pandaIDs.out drwx------. 14 dcameron zp 216 Oct 8 03:59 pilot -rwx------. 1 dcameron zp 20136 Sep 9 13:04 pilot.py -rw-------. 1 dcameron zp 9 Sep 9 13:04 PILOTVERSION -rw-------. 1 dcameron zp 2251 Jul 25 16:38 README.md -rw-------. 1 dcameron zp 760 Aug 22 11:01 setup.py -rw-------. 1 dcameron zp 221 Jul 25 16:38 TODO.md 2019-10-08 07:46:46 UTC [wrapper] pandaIDs.out files: -rw-------. 1 dcameron zp 11 Oct 8 03:59 /home/dcameron/boinc/slots/1/pilot2/pandaIDs.out 2019-10-08 07:46:46 UTC [wrapper] pandaIDs.out content: 4495528160 2019-10-08 07:46:46 UTC [wrapper] Test setup, not cleaning 2019-10-08 07:46:46 UTC [wrapper] ==== wrapper stdout END ==== 2019-10-08 07:46:46 UTC [wrapper] ==== wrapper stderr END ==== 2019-10-08 07:46:46 UTC [wrapper] wrapper wrapperexiting ec=0, duration=20850 2019-10-08 07:46:46 UTC [wrapper] apfmon messages muted 2019-10-08 09:46:46,388: ***************diag file************ 2019-10-08 09:46:46,388: runtimeenvironments=APPS/HEP/ATLAS-SITE; Processors=1 WallTime=20849.45s KernelTime=515.04s UserTime=82084.58s CPUUsage=396% MaxResidentMemory=1947636kB AverageResidentMemory=0kB AverageTotalMemory=0kB AverageUnsharedMemory=0kB AverageUnsharedStack=0kB AverageSharedMemory=0kB PageSize=4096B MajorPageFaults=25628 MinorPageFaults=22216611 Swaps=0 ForcedSwitches=562792 WaitSwitches=11930780 Inputs=8154730 Outputs=1021800 SocketReceived=0 SocketSent=0 Signals=0 nodename=David_Cameron@pcoslo5.cern.ch exitcode=0 2019-10-08 09:46:46,392: ******************************WorkDir*********************** 2019-10-08 09:46:46,392: total 220768 drwxrwx--x. 7 dcameron zp 4096 Oct 8 09:46 . drwxrwx--x. 4 dcameron zp 24 Oct 7 12:10 .. -rw-------. 1 dcameron zp 7595462 Oct 8 03:59 agis_ddmendpoints.json -rw-------. 1 dcameron zp 3936675 Oct 8 03:59 agis_schedconf.cvmfs.json drwx------. 2 dcameron zp 6 Oct 8 03:59 .alrb drwxr-xr-x. 3 dcameron zp 17 Oct 8 03:59 APPS -rw-------. 1 dcameron zp 548 Oct 8 03:59 .asetup -rw-------. 1 dcameron zp 4130 Oct 8 03:59 .asetup.save drwx------. 2 dcameron zp 6 Oct 8 03:59 .asetup-sysbin_406116 -rw-r--r--. 1 dcameron zp 0 Oct 8 03:59 boinc_lockfile -rw-r--r--. 1 dcameron zp 8192 Oct 8 09:46 boinc_mmap_file -rw-r--r--. 1 dcameron zp 537 Oct 8 09:40 boinc_task_state.xml -rw-r--r--. 1 dcameron zp 211651493 Oct 8 03:59 EVNT.18605811._000120.pool.root.1 -rw-------. 1 dcameron zp 71035 Oct 8 09:45 heartbeat.json -rw-------. 1 dcameron zp 513 Oct 8 09:46 iF1NDmkZBavnShfckohDCDFpABFKDmABFKDmTuvUDmABFKDm5kynTm.diag -rw-r--r--. 1 dcameron zp 6245 Oct 8 03:59 init_data.xml -rw-r--r--. 1 dcameron zp 267513 Oct 8 03:59 input.tar.gz -rw-r--r--. 1 dcameron zp 112 Oct 8 03:59 job.xml -rw-------. 1 dcameron zp 1195523 Oct 8 09:46 log.19056367._006186.job.log.1 -rw-------. 1 dcameron zp 882402 Oct 8 09:45 log.19056367._006186.job.log.tgz.1 -rw-------. 1 dcameron zp 797 Oct 8 09:45 memory_monitor_summary.json -rw-------. 1 dcameron zp 463 Oct 8 09:46 output.list -rw-------. 1 dcameron zp 2886 Oct 3 10:23 pandaJobData.out drwx------. 3 dcameron zp 229 Oct 8 03:59 pilot2 -rw-r--r--. 1 dcameron zp 259319 Oct 3 09:27 pilot2.tar.gz -rw-------. 1 dcameron zp 9465 Oct 8 09:46 pilotlog.txt -rw-r--r--. 1 dcameron zp 4480 Oct 3 10:22 queuedata.json -rw-r--r--. 1 dcameron zp 815 Oct 8 03:59 RTE.tar.gz -rwxr-xr-x. 1 dcameron zp 7950 Oct 8 03:59 run_atlas -rwx------. 1 dcameron zp 12762 Oct 3 10:23 runpilot2-wrapper.sh -rw-r--r--. 1 dcameron zp 692 Oct 8 09:46 runtime_log -rw-r--r--. 1 dcameron zp 8048 Oct 8 09:46 runtime_log.err -rw-------. 1 dcameron zp 240 Oct 8 03:59 setup.sh.local drwxrwx--x. 2 dcameron zp 131 Oct 8 09:46 shared -rw-r--r--. 1 dcameron zp 8688 Oct 8 03:59 start_atlas.sh -rw-r--r--. 1 dcameron zp 38136 Oct 8 09:46 stderr.txt -rw-r--r--. 1 dcameron zp 107 Oct 8 03:59 wrapper_26015_x86_64-pc-linux-gnu -rw-r--r--. 1 dcameron zp 28 Oct 8 09:46 wrapper_checkpoint.txt 2019-10-08 09:46:46,392: running start_atlas return value is 0 2019-10-08 09:46:46,392: Parent exit 0 2019-10-08 09:46:46,392: child process exit 0 09:46:46 (399207): run_atlas exited; CPU time 82084.892452 09:46:46 (399207): called boinc_finish(0) </stderr_txt> ]]>
©2024 CERN