29 #include "boost/thread/thread.hpp"
30 #include "boost/thread/barrier.hpp"
31 #include "boost/exception/all.hpp"
32 #include "boost/foreach_field.hpp"
36 using namespace pwiz::util;
37 using namespace pwiz::proteome;
46 const vector<string>& cleavageAgentNames = Digestion::getCleavageAgentNames();
50 *
os_ <<
"Cleavage agents:" << endl;
51 BOOST_FOREACH(CVID agentCvid, cleavageAgents)
54 << Digestion::getCleavageAgentRegex(agentCvid)
58 *
os_ <<
"\nCleavage agent names" << endl;
59 BOOST_FOREACH(
string agentName, cleavageAgentNames)
61 *
os_ << agentName << endl;
120 const string& expectedSequence,
121 size_t expectedOffset,
122 size_t expectedMissedCleavages,
123 size_t expectedSpecificTermini,
124 const string& expectedPrefix,
125 const string& expectedSuffix)
139 cerr <<
"Testing peptide " << peptide.
sequence() <<
": " << e.what() << endl;
146 if (
os_) *
os_ <<
"Fully-specific BSA digest (offset, missed cleavages, specific termini, length, sequence)" << endl;
148 vector<DigestedPeptide> trypticPeptides(trypticDigestion.
begin(), trypticDigestion.
end());
149 set<DigestedPeptide, DigestedPeptideLessThan> trypticPeptideSet(trypticPeptides.begin(), trypticPeptides.end());
171 unit_assert(!trypticPeptideSet.count(
"MKWVTFISLLLL"));
175 unit_assert(trypticPeptideSet.count(
"RDTHKSEIAHRFK"));
176 unit_assert(trypticPeptideSet.count(
"DTHKSEIAHRFK"));
179 unit_assert(trypticPeptideSet.count(
"EACFAVEGPKLVVSTQTALA"));
180 unit_assert(trypticPeptides.back().sequence() ==
"LVVSTQTALA");
183 unit_assert(!trypticPeptideSet.count(
"MKWVTFISLLLLFSSAYSRGVFRRDTHK"));
184 unit_assert(!trypticPeptideSet.count(
"LKPDPNTLCDEFKADEKKFWGKYLYEIARR"));
189 unit_assert(trypticPeptideSet.count(
"VLASSARQRLR"));
192 unit_assert(!trypticPeptideSet.count(
"MKWVTFISLLLLFSSAYSRGVFRRDTHKSEIAHRFKDLGEEHFK"));
195 unit_assert(trypticPeptideSet.count(
"KWVTFISLLLLFSSAYSR"));
200 if (
os_) *
os_ <<
"Semi-specific BSA digest (offset, missed cleavages, specific termini, length, sequence)" << endl;
202 set<DigestedPeptide, DigestedPeptideLessThan>::const_iterator peptideItr;
204 vector<DigestedPeptide> semitrypticPeptides(semitrypticDigestion.
begin(), semitrypticDigestion.
end());
205 set<DigestedPeptide, DigestedPeptideLessThan> semitrypticPeptideSet(semitrypticPeptides.begin(), semitrypticPeptides.end());
237 unit_assert(semitrypticPeptides[0].NTerminusIsSpecific() &&
238 !semitrypticPeptides[0].CTerminusIsSpecific());
240 peptideItr = semitrypticPeptideSet.find(
"MKWVTFISLLLLFSSAYSR");
241 unit_assert(peptideItr != semitrypticPeptideSet.end());
246 peptideItr->CTerminusIsSpecific());
248 peptideItr = semitrypticPeptideSet.find(
"KWVTFISLLLLFSSAYSR");
249 unit_assert(peptideItr != semitrypticPeptideSet.end());
254 peptideItr->CTerminusIsSpecific());
256 peptideItr = semitrypticPeptideSet.find(
"KWVTFISLLLLFSSAYSRG");
257 unit_assert(peptideItr == semitrypticPeptideSet.end());
259 peptideItr = semitrypticPeptideSet.find(
"WVTFISLLLLFSSAYSR");
260 unit_assert(peptideItr != semitrypticPeptideSet.end());
265 peptideItr->CTerminusIsSpecific());
267 peptideItr = semitrypticPeptideSet.find(
"WVTFISLLLLFSSAYSRG");
268 unit_assert(peptideItr != semitrypticPeptideSet.end());
273 !peptideItr->CTerminusIsSpecific());
275 peptideItr = semitrypticPeptideSet.find(
"VTFISLLLLFSSAYSRG");
276 unit_assert(peptideItr == semitrypticPeptideSet.end());
279 unit_assert(semitrypticPeptideSet.count(
"WVTFISLLLLFSSAYSR"));
280 unit_assert(semitrypticPeptideSet.count(
"VTFISLLLLFSSAYSR"));
281 unit_assert(!semitrypticPeptideSet.count(
"VTFISLLLLFSSAYS"));
284 unit_assert(semitrypticPeptideSet.count(
"FAVEGPKLVVSTQTALA"));
285 unit_assert(!semitrypticPeptideSet.count(
"FAVEGPKLVVSTQTAL"));
290 if (
os_) *
os_ <<
"Non-specific BSA digest (offset, missed cleavages, specific termini, length, sequence)" << endl;
292 set<DigestedPeptide, DigestedPeptideLessThan>::const_iterator peptideItr;
294 vector<DigestedPeptide> nontrypticPeptides(nontrypticDigestion.
begin(), nontrypticDigestion.
end());
295 set<DigestedPeptide, DigestedPeptideLessThan> nontrypticPeptideSet(nontrypticPeptides.begin(), nontrypticPeptides.end());
319 unit_assert(nontrypticPeptides[0].NTerminusIsSpecific() &&
320 !nontrypticPeptides[0].CTerminusIsSpecific());
322 peptideItr = nontrypticPeptideSet.find(
"MKWVTFISLLLLFSSAYSR");
323 unit_assert(peptideItr != nontrypticPeptideSet.end());
328 peptideItr->CTerminusIsSpecific());
330 peptideItr = nontrypticPeptideSet.find(
"KWVTFISLLLLFSSAYSR");
331 unit_assert(peptideItr != nontrypticPeptideSet.end());
336 peptideItr->CTerminusIsSpecific());
338 peptideItr = nontrypticPeptideSet.find(
"KWVTFISLLLLFSSAYSRG");
339 unit_assert(peptideItr == nontrypticPeptideSet.end());
341 peptideItr = nontrypticPeptideSet.find(
"WVTFISLLLLFSSAYSR");
342 unit_assert(peptideItr != nontrypticPeptideSet.end());
347 peptideItr->CTerminusIsSpecific());
349 peptideItr = nontrypticPeptideSet.find(
"WVTFISLLLLFSSAYSRG");
350 unit_assert(peptideItr != nontrypticPeptideSet.end());
355 !peptideItr->CTerminusIsSpecific());
357 peptideItr = nontrypticPeptideSet.find(
"VTFISLLLLFSSAYSRG");
358 unit_assert(peptideItr != nontrypticPeptideSet.end());
363 !peptideItr->CTerminusIsSpecific());
366 unit_assert(nontrypticPeptideSet.count(
"WVTFISLLLLFSSAYSR"));
367 unit_assert(nontrypticPeptideSet.count(
"VTFISLLLLFSSAYSR"));
368 unit_assert(nontrypticPeptideSet.count(
"VTFISLLLLFSSAYS"));
371 unit_assert(nontrypticPeptideSet.count(
"FAVEGPKLVVSTQTALA"));
372 unit_assert(nontrypticPeptideSet.count(
"FAVEGPKLVVSTQTAL"));
376 unit_assert(nontrypticPeptideSet.count(
"KWVTFISLLLLFSSAYSR"));
377 unit_assert(!nontrypticPeptideSet.count(
"KWVTFISLLLLFSSAYSRG"));
382 unit_assert(nontrypticPeptideSet.count(
"VLASSAR"));
385 unit_assert(!nontrypticPeptideSet.count(
"EYEATLEECCAKDDPHACYSTVFDK"));
390 if (
os_) *
os_ <<
"Semi-specific BSA digest w/ methionine clipping (offset, missed cleavages, specific termini, length, sequence)" << endl;
392 set<DigestedPeptide, DigestedPeptideLessThan>::const_iterator peptideItr;
394 vector<DigestedPeptide> semitrypticPeptides(semitrypticDigestion.
begin(), semitrypticDigestion.
end());
395 set<DigestedPeptide, DigestedPeptideLessThan> semitrypticPeptideSet(semitrypticPeptides.begin(), semitrypticPeptides.end());
428 unit_assert(semitrypticPeptides[0].NTerminusIsSpecific() &&
429 !semitrypticPeptides[0].CTerminusIsSpecific());
431 peptideItr = semitrypticPeptideSet.find(
"KWVTFISLLLLFSSAYS");
432 unit_assert(peptideItr != semitrypticPeptideSet.end());
438 peptideItr = semitrypticPeptideSet.find(
"KWVTFISLLLLFSSAYSR");
439 unit_assert(peptideItr != semitrypticPeptideSet.end());
444 peptideItr->CTerminusIsSpecific());
446 peptideItr = semitrypticPeptideSet.find(
"KWVTFISLLLLFSSAYSRG");
447 unit_assert(peptideItr == semitrypticPeptideSet.end());
449 peptideItr = semitrypticPeptideSet.find(
"WVTFISLLLLFSSAYSR");
450 unit_assert(peptideItr != semitrypticPeptideSet.end());
455 peptideItr->CTerminusIsSpecific());
457 peptideItr = semitrypticPeptideSet.find(
"WVTFISLLLLFSSAYSRG");
458 unit_assert(peptideItr != semitrypticPeptideSet.end());
463 !peptideItr->CTerminusIsSpecific());
465 peptideItr = semitrypticPeptideSet.find(
"VTFISLLLLFSSAYSRG");
466 unit_assert(peptideItr == semitrypticPeptideSet.end());
469 unit_assert(semitrypticPeptideSet.count(
"WVTFISLLLLFSSAYSR"));
470 unit_assert(semitrypticPeptideSet.count(
"KWVTFISLLLLFSSAYSR"));
471 unit_assert(semitrypticPeptideSet.count(
"KWVTFISLLLLFSSAYS"));
472 unit_assert(!semitrypticPeptideSet.count(
"VTFISLLLLFSSAYS"));
475 unit_assert(semitrypticPeptideSet.count(
"FAVEGPKLVVSTQTALA"));
476 unit_assert(!semitrypticPeptideSet.count(
"FAVEGPKLVVSTQTAL"));
481 if (
os_) *
os_ <<
"BSA digestion test" << endl;
484 Peptide bsa(
"MKWVTFISLLLLFSSAYSRGVFRRDTHKSEIAHRFKDLGEEHFKGLVLIAFSQYLQQCPF"
485 "DEHVKLVNELTEFAKTCVADESHAGCEKSLHTLFGDELCKVASLRETYGDMADCCEKQEP"
486 "ERNECFLSHKDDSPDLPKLKPDPNTLCDEFKADEKKFWGKYLYEIARRHPYFYAPELLYY"
487 "ANKYNGVFQECCQAEDKGACLLPKIETMREKVLASSARQRLRCASIQKFGERALKAWSVA"
488 "RLSQKFPKAEFVEVTKLVTDLTKVHKECCHGDLLECADDRADLAKYICDNQDTISSKLKE"
489 "CCDKPLLEKSHCIAEVEKDAIPENLPPLTADFAEDKDVCKNYQEAKDAFLGSFLYEYSRR"
490 "HPEYAVSVLLRLAKEYEATLEECCAKDDPHACYSTVFDKLKHLVDEPQNLIKQNCDQFEK"
491 "LGEYGFQNALIVRYTRKVPQVSTPTLVEVSRSLGKVGTRCCTKPESERMPCTEDYLSLIL"
492 "NRLCVLHEKTPVSEKVTKCCTESLVNRRPCFSALTPDETYVPKAFDEKLFTFHADICTLP"
493 "DTEKQIKKQTALVELLKHKPKATEEQLKTVMENFVAFVDKCCAADDKEACFAVEGPKLVV"
513 Digestion funkyDigestion(bsa, boost::regex(
"(?<=A[DE])(?=[FG])"),
Digestion::Config(0, 5, 100000, Digestion::FullySpecific,
false));
514 vector<Peptide> funkyPeptides(funkyDigestion.
begin(), funkyDigestion.
end());
516 unit_assert_operator_equal(
"MKWVTFISLLLLFSSAYSRGVFRRDTHKSEIAHRFKDLGEEHFKGLVLIAFSQYLQQCPFDEHVKLVNELTEFAKTCVADESHAGCEKSLHTLFGDELCKVASLRETYGDMADCCEKQEPERNECFLSHKDDSPDLPKLKPDPNTLCDEFKADEKKFWGKYLYEIARRHPYFYAPELLYYANKYNGVFQECCQAEDKGACLLPKIETMREKVLASSARQRLRCASIQKFGERALKAWSVARLSQKFPKAE", funkyPeptides[0].sequence());
517 unit_assert_operator_equal(
"FVEVTKLVTDLTKVHKECCHGDLLECADDRADLAKYICDNQDTISSKLKECCDKPLLEKSHCIAEVEKDAIPENLPPLTAD", funkyPeptides[1].sequence());
518 unit_assert_operator_equal(
"FAEDKDVCKNYQEAKDAFLGSFLYEYSRRHPEYAVSVLLRLAKEYEATLEECCAKDDPHACYSTVFDKLKHLVDEPQNLIKQNCDQFEKLGEYGFQNALIVRYTRKVPQVSTPTLVEVSRSLGKVGTRCCTKPESERMPCTEDYLSLILNRLCVLHEKTPVSEKVTKCCTESLVNRRPCFSALTPDETYVPKAFDEKLFTFHADICTLPDTEKQIKKQTALVELLKHKPKATEEQLKTVMENFVAFVDKCCAADDKEACFAVEGPKLVVSTQTALA", funkyPeptides[2].sequence());
522 vector<Peptide> aspnPeptides(aspnDigestion.
begin(), aspnDigestion.
end());
531 vector<Peptide> noCleavagePeptides(noCleavageDigestion.
begin(), noCleavageDigestion.
end());
538 vector<Peptide> unspecificCleavagePeptides(unspecificCleavageDigestion.
begin(), unspecificCleavageDigestion.
end());
647 status.
exception = boost::copy_exception(runtime_error(e.what()));
651 status.
exception = boost::copy_exception(runtime_error(
"Unhandled exception in worker thread."));
659 boost::barrier testBarrier(testThreadCount);
660 list<pair<boost::shared_ptr<thread>,
ThreadStatus> > threads;
661 for (
int i=0; i < testThreadCount; ++i)
663 threads.push_back(make_pair(boost::shared_ptr<thread>(),
ThreadStatus()));
664 threads.back().first.reset(
new thread(
testThreadSafetyWorker, &testBarrier, boost::ref(threads.back().second)));
667 set<boost::shared_ptr<thread> > finishedThreads;
668 while (finishedThreads.size() < threads.size())
669 BOOST_FOREACH_FIELD((boost::shared_ptr<thread>& t)(
ThreadStatus& status), threads)
671 if (t->timed_join(boost::posix_time::seconds(1)))
672 finishedThreads.insert(t);
674 if (status.exception != NULL)
675 boost::rethrow_exception(status.exception);
680 int main(
int argc,
char* argv[])
684 if (argc>1 && !strcmp(argv[1],
"-v"))
os_ = &cout;
685 if (
os_) *
os_ <<
"DigestionTest\n";