TapeReadTask.hpp 10.6 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
/******************************************************************************
 *
 * This file is part of the Castor project.
 * See http://castor.web.cern.ch/castor
 *
 * Copyright (C) 2003  CERN
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
 *
 * 
 *
 * @author Castor Dev team, castor-dev@cern.ch
 *****************************************************************************/

#pragma once

26

David COME's avatar
David COME committed
27
#include "castor/tape/tapeserver/daemon/DataPipeline.hpp"
28
29
#include "castor/tape/tapeserver/daemon/RecallMemoryManager.hpp"
#include "castor/tape/tapeserver/daemon/DataConsumer.hpp"
30
#include "castor/exception/Exception.hpp"
31
#include "castor/tape/tapeserver/daemon/AutoReleaseBlock.hpp"
32
#include "castor/tape/tapeserver/daemon/TaskWatchDog.hpp"
33
#include "castor/tape/tapeserver/daemon/TapeSessionStats.hpp"
34
#include "castor/utils/Timer.hpp"
35

36
37
38
39
namespace castor {
namespace tape {
namespace tapeserver {
namespace daemon {
40
41
42
43
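  /**
   * This class is in charge of reading one file from tape: it fills memory
   * blocks obtained from the memory manager with the data of the file and
   * hands them over to the data consumer (the disk write task).
   */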
44
class TapeReadTask {
45
public:
46
47
48
49
50
51
  /**
   * COnstructor
   * @param ftr The file being recalled. We acquire the ownership on the pointer
   * @param destination the task that will consume the memory blocks
   * @param mm The memory manager to get free block
   */
52
  TapeReadTask(cta::RetrieveJob *retrieveJob,
53
    DataConsumer & destination, RecallMemoryManager & mm): 
54
    m_retrieveJob(retrieveJob), m_fifo(destination), m_mm(mm) {}
55
    
56
57
58
59
60
61
62
    /**
     * @param rs the read session holding all we need to be able to read from the tape
     * @param lc the log context for .. logging purpose
     * The actual function that will do the job.
     * The main loop is :
     * Acquire a free memory block from the memory manager , fill it, push it 
     */
63
  void execute(castor::tape::tapeFile::ReadSession & rs,
64
    castor::log::LogContext & lc,RecallWatchDog& watchdog,
65
    TapeSessionStats & stats, castor::utils::Timer & timer) {
66

67
68
69
    using castor::log::Param;
    typedef castor::log::LogContext::ScopedParam ScopedParam;
    
70
    // Set the common context for all the coming logs (file info)
71
    log::ScopedParamContainer params(lc);
72
    params.add("NSHOSTNAME", m_retrieveJob->archiveFile.nsHostName)
73
          .add("NSFILEID", m_retrieveJob->archiveFile.fileId)
74
75
76
          .add("BlockId", m_retrieveJob->tapeFileLocation.blockId)
          .add("fSeq", m_retrieveJob->tapeFileLocation.fSeq)
          .add("path", m_retrieveJob->archiveFile.path);
77
    
78
79
    // We will clock the stats for the file itself, and eventually add those
    // stats to the session's.
80
    TapeSessionStats localStats;
81
    castor::utils::Timer localTime;
82
    castor::utils::Timer totalTime(localTime);
83

84
85
    // Read the file and transmit it
    bool stillReading = true;
86
87
    //for counting how many mem blocks have used and how many tape blocks
    //(because one mem block can hold several tape blocks
88
89
    int fileBlock = 0;
    int tapeBlock = 0;
90
91
92
93
94
    // This out-of-try-catch variables allows us to record the stage of the 
    // process we're in, and to count the error if it occurs.
    // We will not record errors for an empty string. This will allow us to
    // prevent counting where error happened upstream.
    std::string currentErrorToCount = "";
95
96
    MemBlock* mb=NULL;
    try {
97
      currentErrorToCount = "Error_tapePositionForRead";
98
      std::unique_ptr<castor::tape::tapeFile::ReadFile> rf(openReadFile(rs,lc));
99
100
101
      // At that point we already read the header.
      localStats.headerVolume += TapeSessionStats::headerVolumePerFile;

102
      lc.log(LOG_INFO, "Successfully positioned for reading");
103
      localStats.positionTime += timer.secs(castor::utils::Timer::resetCounter);
104
      watchdog.notifyBeginNewJob();
105
      localStats.waitReportingTime += timer.secs(castor::utils::Timer::resetCounter);
106
      currentErrorToCount = "Error_tapeReadData";
107
108
109
      while (stillReading) {
        // Get a memory block and add information to its metadata
        mb=m_mm.getFreeBlock();
110
        localStats.waitFreeMemoryTime += timer.secs(castor::utils::Timer::resetCounter);
111
        
112
        mb->m_fSeq = m_retrieveJob->tapeFileLocation.fSeq;
113
        mb->m_fileBlock = fileBlock++;
114
        mb->m_fileid = m_retrieveJob->archiveFile.fileId;
115
116
117
118
119
120
121
        mb->m_tapeFileBlock = tapeBlock;
        mb->m_tapeBlockSize = rf->getBlockSize();
        try {
          // Fill up the memory block with tape block
          // append conveniently returns false when there will not be more space
          // for an extra tape block, and throws an exception if we reached the
          // end of file. append() also protects against reading too big tape blocks.
122
123
124
          while (mb->m_payload.append(*rf)) {
            tapeBlock++;
          }
125
        } catch (const castor::exception::EndOfFile&) {
126
127
128
          // append() signaled the end of the file.
          stillReading = false;
        }
129
        localStats.readWriteTime += timer.secs(castor::utils::Timer::resetCounter);
130
131
132
        localStats.dataVolume += mb->m_payload.size();
        // Pass the block to the disk write task
        m_fifo.pushDataBlock(mb);
133
        mb=NULL;
134
        watchdog.notify();
135
        localStats.waitReportingTime += timer.secs(castor::utils::Timer::resetCounter);
136
      } //end of while(stillReading)
137
138
      //  we have to signal the end of the tape read to the disk write task.
      m_fifo.pushDataBlock(NULL);
139
      // Log the successful transfer
140
      localStats.totalTime = localTime.secs();
141
142
143
144
      // Count the trailer size
      localStats.headerVolume += TapeSessionStats::trailerVolumePerFile;
      // We now transmitted one file:
      localStats.filesCount++;
145
      params.add("positionTime", localStats.positionTime)
146
            .add("readWriteTime", localStats.readWriteTime)
147
148
            .add("waitFreeMemoryTime",localStats.waitFreeMemoryTime)
            .add("waitReportingTime",localStats.waitReportingTime)
149
            .add("transferTime",localStats.transferTime())
150
            .add("totalTime", localStats.totalTime)
151
            .add("dataVolume",localStats.dataVolume)
152
            .add("headerVolume",localStats.headerVolume)
153
            .add("driveTransferSpeedMBps",
154
155
                    localStats.totalTime?(1.0*localStats.dataVolume+1.0*localStats.headerVolume)
                     /1000/1000/localStats.totalTime:0)
156
            .add("payloadTransferSpeedMBps",
157
                     localStats.totalTime?1.0*localStats.dataVolume/1000/1000/localStats.totalTime:0);
Eric Cano's avatar
Eric Cano committed
158
      lc.log(LOG_INFO, "File successfully read from tape");
159
160
161
      // Add the local counts to the session's
      stats.add(localStats);
    } //end of try
162
    catch (const castor::exception::Exception & ex) {
163
      //we end up there because :
164
      //-- openReadFile brought us here (cant position to the file)
165
      //-- m_payload.append brought us here (error while reading the file)
166
167
168
169
      // Record the error in the watchdog
      if (currentErrorToCount.size()) {
        watchdog.addToErrorCount(currentErrorToCount);
      }
170
171
172
173
174
      // This is an error case. Log and signal to the disk write task
      { 
        castor::log::LogContext::ScopedParam sp0(lc, Param("fileBlock", fileBlock));
        castor::log::LogContext::ScopedParam sp1(lc, Param("ErrorMessage", ex.getMessageValue()));
        castor::log::LogContext::ScopedParam sp2(lc, Param("ErrorCode", ex.code()));
175
        lc.log(LOG_ERR, "Error reading a file in TapeReadFileTask (backtrace follows)");
176
177
178
179
180
181
      }
      {
        castor::log::LogContext lc2(lc.logger());
        lc2.logBacktrace(LOG_ERR, ex.backtrace());
      }
      
182
183
      // mb might or might not be allocated at this point, but 
      // reportErrorToDiskTask will deal with the allocation if required.
184
      reportErrorToDiskTask(ex.getMessageValue(),ex.code(),mb);
185
    } //end of catch
186
    watchdog.fileFinished();
187
  }
188
189
190
191
  /**
   * Get a valid block and ask to cancel the disk write task
   */
  void reportCancellationToDiskTask(){
192
    MemBlock* mb =m_mm.getFreeBlock();
193
    mb->m_fSeq = m_retrieveJob->tapeFileLocation.fSeq;
194
    mb->m_fileid = m_retrieveJob->archiveFile.fileId;
195
196
197
    //mark the block cancelled and push it (plus signal the end)
     mb->markAsCancelled();
     m_fifo.pushDataBlock(mb);
198
  }
199
200
201
private:
  /**
   * Do the actual report to the disk write task
202
203
   * @param errorMsg The error message we will give to the client
   * @param mb The mem block we will use
204
   */
205
  void reportErrorToDiskTask(const std::string& msg,int code,MemBlock* mb = NULL){
206
207
208
209
    //If we are not provided with a block, allocate it and
    // fill it up
    if (!mb) {
      mb=m_mm.getFreeBlock();
210
      mb->m_fSeq = m_retrieveJob->tapeFileLocation.fSeq;
211
      mb->m_fileid = m_retrieveJob->archiveFile.fileId;
212
213
    }
    //mark the block failed and push it (plus signal the end)
214
     mb->markAsFailed(msg,code);
215
216
217
     m_fifo.pushDataBlock(mb);
     m_fifo.pushDataBlock(NULL);
   }
218
219
  /** 
   * Open the file on the tape. In case of failure, log and throw
220
   * Copying the unique_ptr on the calling point will give us the ownership of the 
221
   * object.
222
   * @return if successful, return an unique_ptr on the ReadFile we want
223
   */
224
  std::unique_ptr<castor::tape::tapeFile::ReadFile> openReadFile(
225
226
227
228
229
  castor::tape::tapeFile::ReadSession & rs, castor::log::LogContext & lc){

    using castor::log::Param;
    typedef castor::log::LogContext::ScopedParam ScopedParam;

230
    std::unique_ptr<castor::tape::tapeFile::ReadFile> rf;
231
    try {
232
      rf.reset(new castor::tape::tapeFile::ReadFile(&rs, *m_retrieveJob));
233
234
235
236
237
238
239
240
241
242
      lc.log(LOG_DEBUG, "Successfully opened the tape file");
    } catch (castor::exception::Exception & ex) {
      // Log the error
      ScopedParam sp0(lc, Param("ErrorMessage", ex.getMessageValue()));
      ScopedParam sp1(lc, Param("ErrorCode", ex.code()));
      lc.log(LOG_ERR, "Failed to open tape file for reading");
      throw;
    }
    return rf;
  }
243
244
245
246
  
  /**
   * All we need to know about the file we are recalling
   */
247
  std::unique_ptr<cta::RetrieveJob> m_retrieveJob;
248
249
250
251
  
  /**
   * The task (seen as a Y) that will consume all the blocks we read
   */
252
  DataConsumer & m_fifo;
253
254
255
256
  
  /**
   *  The MemoryManager from whom we get free memory blocks 
   */
257
258
  RecallMemoryManager & m_mm;

259
};
260
261
262
263
}
}
}
}
264