Source of file MsgfPlusSearchParameters.php
Size: 16,067 Bytes - Last Modified: 2019-05-10T12:24:09+01:00
src/Search/Parameters/MsgfPlusSearchParameters.php
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172
Covered by 1 test(s):
73
Covered by 1 test(s):
747576777879808182
Covered by 1 test(s):
83848586878889909192939495
Covered by 1 test(s):
96
Covered by 1 test(s):
979899100
Covered by 1 test(s):
101102103104105106107108109110111112113114
Covered by 2 test(s):
115
Covered by 1 test(s):
116117118
Covered by 1 test(s):
119
Covered by 1 test(s):
120121122123
Covered by 1 test(s):
124125126127128129130131132133134135136137138139140141142143144
Covered by 2 test(s):
145
Covered by 1 test(s):
146147148
Covered by 1 test(s):
149
Covered by 1 test(s):
150151152153
Covered by 1 test(s):
154155156157158159160161162163164165166167168169170171172
Covered by 2 test(s):
173
Covered by 1 test(s):
174175176
Covered by 1 test(s):
177
Covered by 1 test(s):
178179180181
Covered by 1 test(s):
182183184185186187188189190191192193194195196
Covered by 2 test(s):
197
Covered by 1 test(s):
198199200
Covered by 1 test(s):
201
Covered by 1 test(s):
202203204205206207208209210211212213214215216
Covered by 2 test(s):
217
Covered by 1 test(s):
218219220
Covered by 1 test(s):
221
Covered by 1 test(s):
222223224225
Covered by 1 test(s):
226227228229230231232233234235236237238239240
Covered by 2 test(s):
241
Covered by 1 test(s):
242243244
Covered by 1 test(s):
245
Covered by 1 test(s):
246247248249
Covered by 1 test(s):
250251252253254255256257258259260261262263
Covered by 2 test(s):
264
Covered by 1 test(s):
265266267
Covered by 1 test(s):
268
Covered by 1 test(s):
269270271272273274275276277
Covered by 1 test(s):
278279280281282283284285286287288
Covered by 2 test(s):
289
Covered by 1 test(s):
290291292
Covered by 1 test(s):
293
Covered by 1 test(s):
294295296297
Covered by 1 test(s):
298299300301302303304305306307308
Covered by 2 test(s):
309
Covered by 1 test(s):
310311312
Covered by 1 test(s):
313
Covered by 1 test(s):
314315316317
Covered by 1 test(s):
318319320321322323324325326327328329
Covered by 2 test(s):
330
Covered by 1 test(s):
331332333
Covered by 1 test(s):
334
Covered by 1 test(s):
335336337338
Covered by 1 test(s):
339340341342343344345346347348349350
Covered by 2 test(s):
351
Covered by 1 test(s):
352353354
Covered by 1 test(s):
355
Covered by 1 test(s):
356357358359
Covered by 1 test(s):
360361362363364365366367368369370
Covered by 2 test(s):
371
Covered by 1 test(s):
372373374
Covered by 1 test(s):
375
Covered by 1 test(s):
376377378379
Covered by 1 test(s):
380381382383384385386387388389390391392393394
Covered by 2 test(s):
395
Covered by 1 test(s):
396397398
Covered by 1 test(s):
399
Covered by 1 test(s):
400401402403
Covered by 1 test(s):
404405406407408409410411412413414415
Covered by 2 test(s):
416
Covered by 1 test(s):
417418419
Covered by 1 test(s):
420
Covered by 1 test(s):
421422423424
Covered by 1 test(s):
425426427428429430431432433434435
Covered by 2 test(s):
436
Covered by 1 test(s):
437438439
Covered by 1 test(s):
440
Covered by 1 test(s):
441442443444
Covered by 1 test(s):
445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501
| <?php /** * Copyright 2016 University of Liverpool * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ namespace pgb_liv\php_ms\Search\Parameters; use pgb_liv\php_ms\Core\Modification; /** * Encapsulation class for MS-GF+ search parameters * * @author Andrew Collins */ class MsgfPlusSearchParameters extends AbstractSearchParameters implements SearchParametersInterface { private $outputFile; private $isotopeErrorRange; private $numOfThreads; private $fragmentationMethodId; private $ms2DetectorId; private $protocolId; private $tolerableTrypticTermini; private $modificationFile; private $minPeptideLength; private $maxPeptideLength; private $minPrecursorCharge; private $maxPrecursorCharge; private $numMatchesPerSpec; private $additionalFeatures; private $showQValue; private $chargeCarrierMass; /** * Filename where the output (mzIdentML 1.1 format) will be written. * File extension must be "mzid" (case sensitive). * By default, the output file name will be "[SpectrumFileName].mzid". * E.g. for the input spectrum file "test.mzML", the output will be written to "test.mzid" if this parameter is not specified. * * @param string $filePath * Full file path to the file that MS-GF+ should create */ public function setOutputFile($filePath) { $this->outputFile = $filePath; } /** * Gets the current output file path * * @return string */ public function getOutputFile() { return $this->outputFile; } /** * Takes into account of the error introduced by choosing non-monoisotopic peak for fragmentation. * If the parent mass tolerance is equal to or larger than 0.5Da or 500ppm, this parameter will be ignored. * The combination of -t and -ti determines the precursor mass tolerance. * E.g. "-t 20ppm -ti -1,2" tests abs(exp-calc-n*1.00335Da)<20ppm for n=-1, 0, 1, 2. * * @param string $range */ public function setIsotopeErrorRange($range) { $this->isotopeErrorRange = $range; } public function getIsotopeErrorRange() { return $this->isotopeErrorRange; } /** * (Number of concurrent threads to be executed, Default: Number of available cores) * * Number of concurrent threads to be executed together. * Default value is the number of available logical cores (e.g. 8 for quad-core processor with hyper-threading support). * * @param int $threadCount * Number of concurrent threads to be executed */ public function setNumOfThreads($threadCount) { if (! is_int($threadCount) || $threadCount < 0) { throw new \InvalidArgumentException('Argument 1 must be a positive integer'); } $this->numOfThreads = $threadCount; } public function getNumOfThreads() { return $this->numOfThreads; } /** * (0: as written in the spectrum or CID if no info (Default), 1: CID, 2: ETD, 3: HCD, 4: Merge spectra from the same precursor) * * Fragmentation method identifier (used to determine the scoring model). * If the identifier is 0 and fragmentation method is written in the spectrum file (e.g. mzML files), MS-GF+ will recognize the fragmentation method and use * a relevant scoring model. * If the identifier is 0 and there is no fragmentation method information in the spectrum (e.g. mgf files), CID model will be used by default. * If the identifier is non-zero and the spectrum has fragmentation method information, only the spectra that match with the identifier will be processed. * If the identifier is non-zero and the spectrum has no fragmentation method information, MS-GF+ will process all spectra assuming the specified * fragmentation method. * If the identifier is 4, MS/MS spectra from the same precursor ion (e.g. CID/ETD pairs, CID/HCD/ETD triplets) will be merged and the "merged" spectrum * will be used for searching instead of individual spectra. See Kim et al., MCP 2010 for details. * * @param int $method * Fragmentation method identifier */ public function setFragmentationMethodId($method) { if (! is_int($method) || $method < 0 || $method > 4) { throw new \InvalidArgumentException('Argument 1 must be an integer between 0 and 4'); } $this->fragmentationMethodId = $method; } public function getFragmentationMethodId() { return $this->fragmentationMethodId; } /** * (0: Low-res LCQ/LTQ (Default for CID and ETD), 1: High-res LTQ (Default for HCD), 2: TOF, 3: Q-Exactive) * * Identifier of the instrument to generate MS/MS spectra (used to determine the scoring model). * For "hybrid" spectra with high-precision MS1 and low-precision MS2, use 0. * For usual low-precision instruments (e.g. Thermo LTQ), use 0. * If MS/MS fragment ion peaks are of high-precision (e.g. tolerance = 10ppm), use 2. * For TOF instruments, use 2. * For Q-Exactive HCD spectra, use 3. * For other HCD spectra, use 1. * * @param int $identifier * Identifier of the instrument to generate MS/MS spectra */ public function setMs2DetectorId($identifier) { if (! is_int($identifier) || $identifier < 0 || $identifier > 3) { throw new \InvalidArgumentException('Argument 1 must be an integer between 0 and 3'); } $this->ms2DetectorId = $identifier; } public function getMs2DetectorId() { return $this->ms2DetectorId; } /** * Enzyme identifier. * Trypsin (1) will be used by default. * 0: unspecific cleavage, 1: Trypsin (default), 2: Chymotrypsin, 3: Lys-C, 4: Lys-N, 5: glutamyl endopeptidase (Glu-C), 6: Arg-C, 7: Asp-N, 8: alphaLP, 9: * no cleavage * Use 9 for peptidomics studies * * @param int $enzyme * Enzyme identifier */ public function setEnzyme($enzyme) { if (! is_int($enzyme) || $enzyme < 0 || $enzyme > 9) { throw new \InvalidArgumentException('Argument 1 must be an integer between 0 and 9'); } parent::setEnzyme($enzyme); } /** * Protocol identifier. * Protocols are used to enable scoring parameters for enriched and/or labeled samples. * 0: No protocol (Default) * 1: Phosphorylation: for phosphopeptide enriched samples * 2: iTRAQ: for iTRAQ-labeled samples * 3: iTRAQPhospho: for phosphopeptide enriched and iTRAQ-labeled samples * * @param int $identifier * Protocol identifier */ public function setProtocolId($identifier) { if (! is_int($identifier) || $identifier < 0 || $identifier > 3) { throw new \InvalidArgumentException('Argument 1 must be an integer between 0 and 3'); } $this->protocolId = $identifier; } public function getProtocolId() { return $this->protocolId; } /** * This parameter is used to apply the enzyme cleavage specificity rule when searching the database. * Specifies the minimum number of termini matching the enzyme specificity rule. * For example, for trypsin, K.ACDEFGHR.C (NTT=2), G.ACDEFGHR.C (NTT=1), K.ACDEFGHI.C (NTT=1) and G.ACDEFGHR.C (NTT=0). * '-ntt 2' will search for fully tryptic peptides only. * By default, -ntt 2 will be used. Using -ntt 1 (or 0) will make the search significantly slower. * * @param int $identifier * Number of tolerable (tryptic) termini */ public function setTolerableTrypticTermini($identifier) { if (! is_int($identifier) || $identifier < 0 || $identifier > 2) { throw new \InvalidArgumentException('Argument 1 must be an integer between 0 and 2'); } $this->tolerableTrypticTermini = $identifier; } public function getTolerableTrypticTermini() { return $this->tolerableTrypticTermini; } /** * Modification file name. * ModificationFile contains the modifications to be considered in the search. * If -mod option is not specified, standard amino acids with fixed Carboamidomethylation C will be used. * * @see https://raw.githubusercontent.com/sangtaekim/msgfplus/master/doc/examples/Mods.txt Example modification file. * @param string $filePath * Modification file path */ public function setModificationFile($filePath) { if (! file_exists($filePath)) { throw new \InvalidArgumentException('Argument 1 must be a validation modification file'); } $this->modificationFile = $filePath; } /** * Returns the modification file specified by setModificationFile. * * @return string The path to the modification file set by setModificationFile. Else returns null. */ public function getModificationFile() { return $this->modificationFile; } /** * Minimum length of the peptide to be considered. * (Default: 6) * * @param int $length */ public function setMinPeptideLength($length) { if (! is_int($length) || $length < 0) { throw new \InvalidArgumentException('Argument 1 must be a positive integer'); } $this->minPeptideLength = $length; } public function getMinPeptideLength() { return $this->minPeptideLength; } /** * Maximum length of the peptide to be considered. * (Default: 40) * * @param int $length */ public function setMaxPeptideLength($length) { if (! is_int($length) || $length < 0) { throw new \InvalidArgumentException('Argument 1 must be a positive integer'); } $this->maxPeptideLength = $length; } public function getMaxPeptideLength() { return $this->maxPeptideLength; } /** * Minimum precursor charge to consider. * This parameter is used only for spectra with no charge. * (Default: 2) * * @param int $charge */ public function setMinPrecursorCharge($charge) { if (! is_int($charge) || $charge < 0) { throw new \InvalidArgumentException('Argument 1 must be a positive integer'); } $this->minPrecursorCharge = $charge; } public function getMinPrecursorCharge() { return $this->minPrecursorCharge; } /** * Maximum precursor charge to consider. * This parameter is used only for spectra with no charge. * (Default: 3) * * @param int $charge */ public function setMaxPrecursorCharge($charge) { if (! is_int($charge) || $charge < 0) { throw new \InvalidArgumentException('Argument 1 must be a positive integer'); } $this->maxPrecursorCharge = $charge; } public function getMaxPrecursorCharge() { return $this->maxPrecursorCharge; } /** * Expected false discovery rates (EFDRs) will be reported only when this value is 1. * * @param int $psmCount * Number of peptide matches per spectrum to report. */ public function setNumMatchesPerSpectrum($psmCount) { if (! is_int($psmCount) || $psmCount < 0) { throw new \InvalidArgumentException('Argument 1 must be a positive integer'); } $this->numMatchesPerSpec = $psmCount; } public function getNumMatchesPerSpectrum() { return $this->numMatchesPerSpec; } /** * If 0, only basic scores are reported. * If 1, the following features are reported * MS2IonCurrent: Summed intensity of all product ions * ExplainedIonCurrentRatio: Summed intensity of all matched product ions (e.g. b, b-H2O, y, etc.) divided by MS2IonCurrent * NTermIonCurrentRatio: Summed intensity of all matched prefix ions (e.g. b, b-H2O, etc.) divided by MS2IonCurrent * CTermIonCurrentRatio: Summed intensity of all matched suffix ions (e.g. y, y-H2O, etc.) divided by MS2IonCurrent * * @param bool $bool */ public function setAdditionalFeatures($bool) { if (! is_bool($bool)) { throw new \InvalidArgumentException('Argument 1 must be a boolean'); } $this->additionalFeatures = $bool; } public function getAdditionalFeatures() { return $this->additionalFeatures; } /** * If false, QValue and PepQValue are not reported. * If true, QValue (PSM-level Q-value) and PepQValue (peptide-level Q-value) are reported (Default). * This parameter is ignored when "-tda 0". * * @param bool $bool */ public function setShowQValue($bool) { if (! is_bool($bool)) { throw new \InvalidArgumentException('Argument 1 must be a boolean'); } $this->showQValue = $bool; } public function getShowQValue() { return $this->showQValue; } /** * Mass of charge carrier, Default: mass of proton (1.00727649) * * @param float $mass * Mass of charge carrier */ public function setChargeCarrierMass($mass) { if (! is_float($mass)) { throw new \InvalidArgumentException('Argument 1 must be a float'); } $this->chargeCarrierMass = $mass; } public function getChargeCarrierMass() { return $this->chargeCarrierMass; } /** * Creates a modification file from an array of modifications * * @param Modification[] $modifications * @param number $numMods * Max number of modifications to search per peptide * @return string File path the newly created modification file */ public static function createModificationFile(array $modifications, $numMods = 2) { // TODO: // All array must be this class // NumMods must be uint $data = 'NumMods=' . $numMods . PHP_EOL; foreach ($modifications as $modification) { $entry = $modification->getMonoisotopicMass() . ','; $entry .= count($modification->getResidues()) == 0 ? '*' : implode('', $modification->getResidues()); $entry .= ','; $entry .= $modification->isFixed() ? 'fix,' : 'opt,'; $position = ''; switch ($modification->getPosition()) { case Modification::POSITION_PROTEIN_NTERM: $position = 'Prot-N-term'; break; case Modification::POSITION_PROTEIN_CTERM: $position = 'Prot-C-term'; break; case Modification::POSITION_NTERM: $position = 'N-term'; break; case Modification::POSITION_CTERM: $position = 'C-term'; break; case Modification::POSITION_ANY: default: $position = 'any'; break; } $entry .= $position . ','; $entry .= $modification->getName(); $data .= $entry . PHP_EOL; } $modFile = tempnam(sys_get_temp_dir(), 'php-msMsgfMods'); file_put_contents($modFile, $data); return $modFile; } } |