Hi,
We are using cta-ops-verify-tape to carry out full and partial (10,1000,10) verification of tapes. We have observed the following:
- Files that failed to be verified with the message
{"epoch_time":1777455703.653701997,"local_time":"2026-04-29T10:41:43+0100","hostname":"getafix-ts10","program":"cta-taped","log_level":"ERROR","pid":2531628,"tid":2535720,"message":"File verification failed","drive_name":"obelix_ts1170_31","instance":"antares","sched_backend":"cephUser","thread":"DiskWrite","tapeDrive":"obelix_ts1170_31","tapeVid":"TD4290","mountId":"3599726","vo":"storaged_dls","tapePool":"dia_structsurf","threadCount":10,"threadID":1,"fileId":4383897767,"dstURL":"file://dummy","fSeq":58743,"errorMessage":"In DriveGeneric::readBlock: Failed ST read (with checksum) Errno=5: Input/output error","readWriteTime":0.0,"checksumingTime":0.0,"waitDataTime":875.922771,"waitReportingTime":0.001098,"checkingErrorTime":0.0,"openingTime":0.0,"closingTime":0.0,"transferTime":0.0,"totalTime":0.0,"dataVolume":0,"globalPayloadTransferSpeedMBps":0.0,"diskPerformanceMBps":0.0,"openRWCloseToTransferTimeRatio":0.0}
were successfully extracted with cta-readtp
- Running directly
cta-verify-file on a single file generated the same error (including some warnings that there was “No tape block movement for too long”)
[root@getafix-ts14 ~]# cat /var/log/cta/cta-taped-obelix_ts1170_27.log | grep 4388468672
{"epoch_time":1778056954.407529676,"local_time":"2026-05-06T09:42:34+0100","hostname":"getafix-ts14","program":"cta-taped","log_level":"INFO","pid":3282061,"tid":3282216,"message":"Successfully positioned for reading","drive_name":"obelix_ts1170_27","instance":"antares","sched_backend":"cephUser","thread":"TapeRead","tapeDrive":"obelix_ts1170_27","tapeVid":"TD4345","mountId":"3616509","vo":"storaged_dls","tapePool":"diamond_i03","mediaType":"TS1170","logicalLibrary":"obelix_ts1170","mountType":"Retrieve","labelFormat":"0000","vendor":"IBM","capacityInBytes":50000000000000,"fileId":4388468672,"BlockId":146929882,"fSeq":6430,"dstURL":"file://dummy","isRepack":false,"isVerifyOnly":true}
{"epoch_time":1778058625.899924148,"local_time":"2026-05-06T10:10:25+0100","hostname":"getafix-ts14","program":"cta-taped","log_level":"WARN","pid":3282061,"tid":3282215,"message":"No tape block movement for too long during recalling","drive_name":"obelix_ts1170_27","instance":"antares","sched_backend":"cephUser","thread":"Watchdog","tapeDrive":"obelix_ts1170_27","tapeVid":"TD4345","mountId":"3616509","vo":"storaged_dls","tapePool":"diamond_i03","TimeSinceLastBlockMove":600.049411,"TimeSinceLastBlockMoveReport":1848.173852,"NoBlockMoveMaxSecs":600.0,"fileId":4388468672,"fSeq":6430}
{"epoch_time":1778059347.941049972,"local_time":"2026-05-06T10:22:27+0100","hostname":"getafix-ts14","program":"cta-taped","log_level":"WARN","pid":3282061,"tid":3282215,"message":"No tape block movement for too long during recalling","drive_name":"obelix_ts1170_27","instance":"antares","sched_backend":"cephUser","thread":"Watchdog","tapeDrive":"obelix_ts1170_27","tapeVid":"TD4345","mountId":"3616509","vo":"storaged_dls","tapePool":"diamond_i03","TimeSinceLastBlockMove":600.085557,"TimeSinceLastBlockMoveReport":722.04083,"NoBlockMoveMaxSecs":600.0,"fileId":4388468672,"fSeq":6430}
{"epoch_time":1778059655.712842825,"local_time":"2026-05-06T10:27:35+0100","hostname":"getafix-ts14","program":"cta-taped","log_level":"ERROR","pid":3282061,"tid":3282216,"message":"Error reading a file in TapeReadFileTask","drive_name":"obelix_ts1170_27","instance":"antares","sched_backend":"cephUser","thread":"TapeRead","tapeDrive":"obelix_ts1170_27","tapeVid":"TD4345","mountId":"3616509","vo":"storaged_dls","tapePool":"diamond_i03","mediaType":"TS1170","logicalLibrary":"obelix_ts1170","mountType":"Retrieve","labelFormat":"0000","vendor":"IBM","capacityInBytes":50000000000000,"fileId":4388468672,"BlockId":146929882,"fSeq":6430,"dstURL":"file://dummy","isRepack":false,"isVerifyOnly":true,"fileBlock":72,"ErrorMessage":"In DriveGeneric::readBlock: Failed ST read (with checksum) Errno=5: Input/output error"}
{"epoch_time":1778059655.713455697,"local_time":"2026-05-06T10:27:35+0100","hostname":"getafix-ts14","program":"cta-taped","log_level":"ERROR","pid":3282061,"tid":3282217,"message":"In DriveGeneric::readBlock: Failed ST read (with checksum) Errno=5: Input/output error","drive_name":"obelix_ts1170_27","instance":"antares","sched_backend":"cephUser","thread":"DiskWrite","tapeDrive":"obelix_ts1170_27","tapeVid":"TD4345","mountId":"3616509","vo":"storaged_dls","tapePool":"diamond_i03","threadCount":10,"threadID":0,"fileId":4388468672,"dstURL":"file://dummy","fSeq":6430,"received_archiveFileID":4388468672,"expected_NSBLOCKId":0,"received_NSBLOCKId":null,"failed_Status":true}
{"epoch_time":1778059655.714488000,"local_time":"2026-05-06T10:27:35+0100","hostname":"getafix-ts14","program":"cta-taped","log_level":"ERROR","pid":3282061,"tid":3282217,"message":"File verification failed","drive_name":"obelix_ts1170_27","instance":"antares","sched_backend":"cephUser","thread":"DiskWrite","tapeDrive":"obelix_ts1170_27","tapeVid":"TD4345","mountId":"3616509","vo":"storaged_dls","tapePool":"diamond_i03","threadCount":10,"threadID":0,"fileId":4388468672,"dstURL":"file://dummy","fSeq":6430,"errorMessage":"In DriveGeneric::readBlock: Failed ST read (with checksum) Errno=5: Input/output error","readWriteTime":0.0,"checksumingTime":0.0,"waitDataTime":2831.242039,"waitReportingTime":0.000987,"checkingErrorTime":0.0,"openingTime":0.0,"closingTime":0.0,"transferTime":0.0,"totalTime":0.0,"dataVolume":0,"globalPayloadTransferSpeedMBps":0.0,"diskPerformanceMBps":0.0,"openRWCloseToTransferTimeRatio":0.0}
{"epoch_time":1778059655.716557071,"local_time":"2026-05-06T10:27:35+0100","hostname":"getafix-ts14","program":"cta-taped","log_level":"ERROR","pid":3282061,"tid":3282227,"message":"In RecallReportPacker::ReportError::execute(): failing retrieve job after exception.","drive_name":"obelix_ts1170_27","instance":"antares","sched_backend":"cephUser","thread":"RecallReportPacker","tapeDrive":"obelix_ts1170_27","tapeVid":"TD4345","mountId":"3616509","vo":"storaged_dls","tapePool":"diamond_i03","failureLog":"May 6 10:27:35.715120 getafix-ts14 In DriveGeneric::readBlock: Failed ST read (with checksum) Errno=5: Input/output error","fileId":4388468672}
{"epoch_time":1778059655.783726379,"local_time":"2026-05-06T10:27:35+0100","hostname":"getafix-ts14","program":"cta-taped","log_level":"INFO","pid":3282061,"tid":3282227,"message":"In OStoreDB::RetrieveJob::failTransfer(): enqueued job for reporting","drive_name":"obelix_ts1170_27","instance":"antares","sched_backend":"cephUser","thread":"RecallReportPacker","tapeDrive":"obelix_ts1170_27","mountId":"3616509","vo":"storaged_dls","tapePool":"diamond_i03","fileId":4388468672,"copyNb":1,"failureReason":"May 6 10:27:35.715120 getafix-ts14 In DriveGeneric::readBlock: Failed ST read (with checksum) Errno=5: Input/output error","requestObject":"RetrieveRequest-Frontend-cta-front01.scd.rl.ac.uk-368749-20260413-11:31:35-0-155632","retriesWithinMount":1,"maxRetriesWithinMount":3,"totalRetries":1,"maxTotalRetries":6}
- In the most recent case of a file that failed to be verified with the above message, apart from successfully extracting it with
cta-readtp, the file was also successfully recalled to EOS via xrdfs prepare -s
Our questions: does cta-verify-tape use a mechanism to read a file from tape to a dummy destination that is different from the one used by cta-readtp and cta-taped? Is this mechanism a reliable indicator of a failed file verification, or is it prone to generating false positives?
Thanks,
George