00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013
00014
00015
00016
00017
00018
00019
00020
00021
00022
00023
00024
00025
00026
00027
00028
00029
00030
00031
00032
00033
00034 #include "SequenceReaderMulti.h"
00035
00036
00037
00038
00039
00040
00041
00042 SequenceReaderMulti::SequenceReaderMulti( ostream& monitoringStream )
00043 : SequenceReader( monitoringStream ), thisReader_( allReaders_.begin() ),
00044 isFirstSeq_(true)
00045 {
00046 monitoringStream_ << "constructing SequenceReaderMulti" << endl;
00047 }
00048
00049 SequenceReaderMulti::~SequenceReaderMulti()
00050 {
00051 monitoringStream_ << "destructing SequenceReaderMulti" << endl;
00052 for ( vector<SeqReaderInfo>::iterator i( allReaders_.begin() );
00053 i != allReaders_.end() ; i++ ) delete i->ptr_;
00054 }
00055
00056 SequenceReaderMulti::SequenceReaderMulti( const SequenceReaderMulti& rhs)
00057 : SequenceReader( rhs.monitoringStream_ ),
00058 allReaders_( rhs.allReaders_ ),
00059 thisReader_( allReaders_.begin() ),
00060 isFirstSeq_( rhs.isFirstSeq_ ),
00061 bitsPerSymbol_( rhs.bitsPerSymbol_ ),
00062 sourceDataType_( rhs.sourceDataType_ )
00063 {
00064 monitoringStream_ << "copy constructing SequenceReaderMulti\n";
00065 for ( vector<SeqReaderInfo>::const_iterator i(rhs.allReaders_.begin());
00066 i!=rhs.allReaders_.end(); i++)
00067 {
00068 allReaders_.push_back( SeqReaderInfo() );
00069 allReaders_.back().ptr_=i->ptr_->clone();
00070 }
00071
00072 }
00073
00074
00075
00076
00077
00078
00079
00080
00081
00082
00083
00084 void SequenceReaderMulti::rewind( void )
00085 {
00086
00087 for ( vector<SeqReaderInfo>::iterator i
00088 = allReaders_.begin();
00089 i != allReaders_.end();
00090 i++ )
00091 {
00092 (i->ptr_)->rewind();
00093 }
00094 thisReader_ = allReaders_.begin();
00095 lastSequenceNumber_ = 0;
00096 }
00097
00098
00099
00100
00101
00102
00103
00104
00105
00106
00107 void SequenceReaderMulti::addReader( SequenceReader& seq )
00108 {
00109 if (isFirstSeq_)
00110 {
00111 isFirstSeq_ = false;
00112 bitsPerSymbol_ = seq.getBitsPerSymbol();
00113 sourceDataType_ = seq.getSourceDataType();
00114 }
00115 else
00116 {
00117 assert(bitsPerSymbol_ == seq.getBitsPerSymbol());
00118 assert(sourceDataType_ == seq.getSourceDataType());
00119 }
00120
00121
00122 allReaders_.push_back( SeqReaderInfo() );
00123 allReaders_.back().ptr_=seq.clone();
00124 thisReader_
00125 = static_cast<vector<SeqReaderInfo>::iterator>(&allReaders_.back());
00126 }
00127
00128
00129
00130
00131
00132
00133 void SequenceReaderMulti::addReader( SequenceReader* pSeq )
00134 {
00135 if (isFirstSeq_)
00136 {
00137 isFirstSeq_ = false;
00138 bitsPerSymbol_ = pSeq->getBitsPerSymbol();
00139 sourceDataType_ = pSeq->getSourceDataType();
00140 }
00141 else
00142 {
00143 assert(bitsPerSymbol_ == pSeq->getBitsPerSymbol());
00144 assert(sourceDataType_ == pSeq->getSourceDataType());
00145 }
00146
00147 allReaders_.push_back( SeqReaderInfo() );
00148 allReaders_.back().ptr_=pSeq;
00149 thisReader_
00150 = static_cast<vector<SeqReaderInfo>::iterator>(&allReaders_.back());
00151 }
00152
00153
00154
00155
00156
00157
00158
00159 bool SequenceReaderMulti::findSequence( SequenceNumber seqNum )
00160 {
00161
00162
00163 currentSeqNum_ = seqNum;
00164 for ( thisReader_ = allReaders_.begin();
00165 thisReader_ != allReaders_.end(); thisReader_++ )
00166 {
00167 if (thisReader_->allSeqsRead_)
00168 {
00169 if ( currentSeqNum_ <= thisReader_->size_ )
00170 {
00171
00172 lastSequenceNumber_ = --seqNum;
00173 return true;
00174 }
00175 }
00176 else
00177 {
00178 if ( thisReader_->ptr_->findSequence( currentSeqNum_ ) == true )
00179 {
00180 lastSequenceNumber_ = --seqNum;
00181 return true;
00182 }
00183 else
00184 thisReader_->size_ = thisReader_->ptr_->getNumSequencesInFile();
00185
00186 }
00187
00188
00189 currentSeqNum_ -= thisReader_->ptr_->getNumSequencesInFile();
00190
00191
00192 }
00193
00194 return false;
00195
00196
00197
00198
00199
00200
00201
00202
00203
00204
00205
00206
00207
00208
00209
00210
00211
00212
00213 }
00214
00215
00216
00217
00218
00219
00220
00221
00222
00223 bool SequenceReaderMulti::findReader( SequenceNumber& seqNum )
00224 {
00225 DEBUG_L3( "SequenceReaderMulti::findReader" );
00226
00227
00228
00229
00230 if ( seqNum > getNumSequencesInFile() )
00231 {
00232 return false;
00233
00234
00235
00236
00237
00238 }
00239
00240 for ( vector<SeqReaderInfo>::iterator i = allReaders_.begin();
00241 i != allReaders_.end(); i++ )
00242 {
00243 if ( seqNum <= i->size_ ) { thisReader_ = i; break; }
00244 seqNum -= i->size_;
00245 }
00246
00247 return true;
00248
00249
00250 }
00251
00252
00253
00254
00255 void SequenceReaderMulti::changeMode( SequenceReaderMode* pMode )
00256 {
00257 for ( vector<SeqReaderInfo>::iterator i = allReaders_.begin();
00258 i != allReaders_.end(); i++ )
00259 {
00260 (i->ptr_)->changeMode(pMode);
00261 }
00262 }
00263
00264
00265
00266
00267
00268
00269
00270
00271
00272
00273
00274 int SequenceReaderMulti::getNextSequence
00275 ( WordSequence& nextSeq, int wordLength )
00276 {
00277 DEBUG_L2( "SequenceReaderMulti::getNextSequence" );
00278
00279 int numInLast;
00280
00281 while
00282 ( ( thisReader_
00283 != allReaders_.end() )
00284 && ( ( numInLast
00285 = thisReader_->ptr_->getNextSequence( nextSeq, wordLength ) )
00286 == -1 ) )
00287 {
00288 if ( thisReader_->allSeqsRead_ == false )
00289 {
00290 thisReader_->size_ = (thisReader_->ptr_)->getNumSequencesInFile();
00291 thisReader_->allSeqsRead_ = true;
00292 }
00293 thisReader_++;
00294
00295 }
00296
00297 if (thisReader_ == allReaders_.end())
00298 {
00299 monitoringStream_
00300 << "SequenceReaderMulti::getNextSequence - last seq has been read.\n";
00301 return -1;
00302 }
00303
00304 if ( numInLast != -1 ) lastSequenceNumber_++;
00305
00306 return numInLast;
00307
00308 }
00309
00310
00311
00312
00313
00314
00315
00316 int SequenceReaderMulti::getSequence
00317 ( WordSequence& nextSeq, SequenceNumber sequenceNumber, int wordLength )
00318 {
00319 DEBUG_L2( "SequenceReaderMulti::getSequence" );
00320
00321
00322 if (!findReader( sequenceNumber )) return -1;
00323
00324 lastSequenceNumber_ = sequenceNumber;
00325 (thisReader_->ptr_)->rewind();
00326
00327 return (thisReader_->ptr_)->getSequence
00328 ( nextSeq, sequenceNumber, wordLength );
00329
00330 }
00331
00332
00333
00334
00335
00336 void SequenceReaderMulti::getLastSequenceName( string& seqName ) const
00337 {
00338 (thisReader_->ptr_)->getLastSequenceName( seqName );
00339 }
00340
00341
00342
00343
00344
00345
00346
00347 SequenceNumber SequenceReaderMulti::computeNumSequencesInFile( void )
00348 {
00349 SequenceNumber numSeqs = 0;
00350 for ( vector<SeqReaderInfo>::iterator i
00351 = allReaders_.begin();
00352 i != allReaders_.end();
00353 i++ )
00354 {
00355 if ( i->allSeqsRead_ == false )
00356 {
00357 i->size_ = (i->ptr_)->getNumSequencesInFile();
00358 i->allSeqsRead_ = true;
00359 }
00360 numSeqs += i->size_;
00361 }
00362 thisReader_ = allReaders_.end();
00363 lastSequenceNumber_ = numSeqs;
00364 return numSeqs;
00365 }
00366
00367
00368
00369
00370
00371 int SequenceReaderMulti::getBitsPerSymbol ( void ) const
00372 {
00373 if (isFirstSeq_) assert(1==0);
00374 return bitsPerSymbol_;
00375
00376
00377 }
00378
00379
00380
00381
00382
00383 SourceDataType SequenceReaderMulti::getSourceDataType( void ) const
00384 {
00385 if (isFirstSeq_) assert(1==0);
00386 return sourceDataType_;
00387
00388
00389 }
00390
00391
00392
00393
00394
00395 bool SequenceReaderMulti::printName( ostream& os, SequenceNumber seqNum )
00396 {
00397
00398 lastSequenceNumber_ = seqNum;
00399
00400 if (!findReader(seqNum)) return false;
00401 (thisReader_->ptr_)->printName( os, seqNum );
00402 return true;
00403 }
00404
00405
00406
00407
00408
00409 bool SequenceReaderMulti::printSideInfo( ostream& os, SequenceNumber seqNum )
00410 {
00411
00412 lastSequenceNumber_ = seqNum;
00413
00414 if (!findReader(seqNum)) return false;
00415 (thisReader_->ptr_)->printSideInfo( os, seqNum );
00416 return true;
00417 }
00418
00419
00420
00421
00422
00423
00424 bool SequenceReaderMulti::printSource( ostream& os, SequenceNumber seqNum )
00425 {
00426 lastSequenceNumber_ = seqNum;
00427
00428 if (!findReader(seqNum)) return false;
00429 (thisReader_->ptr_)->printSource( os, seqNum );
00430 return true;
00431 }
00432
00433
00434
00435
00436 void SequenceReaderMulti::extractSource
00437 ( char** pSource,
00438 SequenceNumber seqNum,
00439 SequenceOffset seqStart,
00440 SequenceOffset seqEnd )
00441 {
00442
00443
00444
00445
00446
00447
00448 SequenceReaderState* pState(saveState());
00449
00450 if (!findSequence(seqNum))
00451 {
00452 monitoringStream_ << "extSource: Requested sequence number (" << seqNum
00453 << ") exceeds number of sequences in collection ("
00454 << getNumSequencesInFile() << ")." << endl;
00455 throw SSAHAException
00456 ("Invalid sequence number in SequenceReaderMulti::extractSource");
00457 }
00458
00459 (thisReader_->ptr_)->extractSource
00460 ( pSource, currentSeqNum_, seqStart, seqEnd );
00461
00462
00463
00464
00465
00466
00467 restoreState(pState);
00468
00469
00470
00471
00472 }
00473
00474
00475 void SequenceReaderMulti::saveIndexImp
00476 ( ostream& fileFile,
00477 ostream& indexFile,
00478 int& fileNumber )
00479 {
00480 computeNumSequencesInFile();
00481 for ( vector<SeqReaderInfo>::iterator i
00482 = allReaders_.begin();
00483 i != allReaders_.end();
00484 i++ )
00485 {
00486 (i->ptr_)->saveIndexImp( fileFile, indexFile, fileNumber );
00487 fileNumber++;
00488 }
00489
00490 }
00491
00492
00493
00494
00495
00496