Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Read CID/EAD mode from wiff2 files #3087

Merged
merged 15 commits into from
Aug 1, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
245 changes: 193 additions & 52 deletions pwiz/data/common/cv.cpp

Large diffs are not rendered by default.

82 changes: 73 additions & 9 deletions pwiz/data/common/cv.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -41,12 +41,10 @@
// [psi-ms.obo]
#define _PSI_MS_OBO_
// format-version: 1.2
// data-version: 4.1.136
// date: 10:11:2023 11:30
// saved-by: Chris Bielow
// data-version: 4.1.163
// date: 19:07:2024 07:15
// saved-by: Joshua Klein
// auto-generated-by: OBO-Edit 2.3.1
// import: http://purl.obolibrary.org/obo/pato.obo
// import: http://purl.obolibrary.org/obo/stato.owl
// default-namespace: MS
// namespace-id-rule: * MS:$sequence(7,0,9999999)$
// namespace-id-rule: * PEFF:$sequence(7,0,9999999)$
Expand Down Expand Up @@ -79,7 +77,7 @@
// [unimod.obo]
#define _UNIMOD_OBO_
// format-version: 1.4
// date: 05:10:2023 14:38
// date: 29:02:2024 10:49
//
// [unit.obo]
#define _UNIT_OBO_
Expand Down Expand Up @@ -307,6 +305,9 @@ enum PWIZ_API_DECL CVID
/// Duration: The period of time during which something continues.
NCIT_Duration = 100325330,

/// Number: A numeral or string of numerals expressing value, quantity, or identification.
NCIT_Number = 100325337,

/// Action: A thing done.
NCIT_Action = 100325404,

Expand Down Expand Up @@ -1822,6 +1823,9 @@ enum PWIZ_API_DECL CVID
/// laser desorption ionization: The formation of gas-phase ions by the interaction of a pulsed laser with a solid or liquid material.
MS_laser_desorption_ionization = 1000393,

/// no sequence database: No reference sequence database was used in the search process to determine the identified peptide sequence, for example as with de novo sequencing.
MS_no_sequence_database = 1000394,

/// liquid secondary ionization: The ionization of any species by the interaction of a focused beam of ions with a sample that is dissolved in a solvent matrix. See also fast atom bombardment and secondary ionization.
MS_liquid_secondary_ionization = 1000395,

Expand Down Expand Up @@ -2719,6 +2723,9 @@ enum PWIZ_API_DECL CVID
/// 4000 Series Explorer Software: SCIEX or Applied Biosystems software for data acquisition and analysis.
MS_4000_Series_Explorer_Software = 1000659,

/// Xevo MRT MS: Waters Corporation Xevo MRT Mass Spectrometer.
MS_Xevo_MRT_MS = 1000660,

/// GPS Explorer: SCIEX or Applied Biosystems software for data acquisition and analysis.
MS_GPS_Explorer = 1000661,

Expand Down Expand Up @@ -3256,6 +3263,9 @@ enum PWIZ_API_DECL CVID
/// isolation window upper offset: The extent of the isolation window in m/z above the isolation window target m/z. The lower and upper offsets may be asymmetric about the target m/z.
MS_isolation_window_upper_offset = 1000829,

/// precision: Precision is the degree of how close repeated measurements are to each other. This can, for example, be expressed using the standard deviation.
MS_precision = 1000830,

/// sample preparation: Properties of the preparation steps which took place before the measurement was performed.
MS_sample_preparation = 1000831,

Expand Down Expand Up @@ -3373,8 +3383,8 @@ enum PWIZ_API_DECL CVID
/// structural formula: A chemical formula showing the number of atoms of each element in a molecule, their spatial arrangement, and their linkage to each other.
MS_structural_formula = 1000867,

/// SMILES formula: The simplified molecular input line entry specification or SMILES is a specification for unambiguously describing the structure of a chemical compound using a short ASCII string.
MS_SMILES_formula = 1000868,
/// SMILES string: The simplified molecular input line entry specification or SMILES is a specification for unambiguously describing the structure of a chemical compound using a short ASCII string.
MS_SMILES_string = 1000868,

/// collision gas pressure: The gas pressure of the collision gas used for collisional excitation.
MS_collision_gas_pressure = 1000869,
Expand Down Expand Up @@ -8713,6 +8723,12 @@ enum PWIZ_API_DECL CVID
/// FLASHDeconv: Ultrafast, High-Quality Feature Deconvolution for Top-Down Proteomics.
MS_FLASHDeconv = 1002714,

/// temperature chromatogram: Representation of temperature versus time.
MS_temperature_chromatogram = 1002715,

/// measured element: The component or dimension of an object being measured, for example the temperature of an instrument component over time.
MS_measured_element = 1002716,

/// Pegasus BT: LECO bench-top GC time-of-flight mass spectrometer.
MS_Pegasus_BT = 1002719,

Expand Down Expand Up @@ -10594,7 +10610,7 @@ enum PWIZ_API_DECL CVID
/// identification based on multiple spectra: Provides an identifier to encode identifications based on multiple spectra.
MS_identification_based_on_multiple_spectra = 1003332,

/// regular expression for encoding identifications based on multiple spectra.: ^(?<MULTIPLE_SPECTRA_IDENTIFIER>[0-9]+)(?::(?<PARENT_OR_CHILD>P|C))$
/// regular expression for encoding identifications based on multiple spectra.: ^(?<MULTIPLE_SPECTRA_IDENTIFIER>[0-9]+)(?::(?<PARENT_OR_CHILD>P|C))?$
MS_regular_expression_for_encoding_identifications_based_on_multiple_spectra_ = 1003333,

/// parent term for PSM-level scores for identifications based on multiple spectra: Parent term for PSM-level scores for identifications based on multiple spectra.
Expand Down Expand Up @@ -10813,6 +10829,33 @@ enum PWIZ_API_DECL CVID
/// pymzqc: A Python package for reading, validating, and writing mzQC files.
MS_pymzqc = 1003402,

/// InChI: IUPAC International Chemical Identifier.
MS_InChI = 1003403,

/// timsTOF HT: Bruker Daltonics' timsTOF HT.
MS_timsTOF_HT = 1003404,

/// mzRecal: MS1 recalibration using identified peptides as internal calibrants.
MS_mzRecal = 1003405,

/// spectrum clustering software: Software designed to group multiple mass spectra by high similarity, generally with the goal of grouping replicate spectra derived from the same analyte.
MS_spectrum_clustering_software = 1003406,

/// Scout: Identifying crosslinked peptides in complex protein mixtures
MS_Scout = 1003407,

/// Scout score: Scout identification search engine score
MS_Scout_score = 1003408,

/// Stellar: Thermo Scientific Stellar mass spectrometer contains a quadrupole mass filter, a collision cell, and a quadrupole linear ion trap mass analyzer.
MS_Stellar = 1003409,

/// electron beam energy: The kinetic energy of the electron beam used in dissociation methods induced by a free electron beam, such as electron-capture dissociation (ECD), electron-detachment dissociation (EDD), and electron-activated dissociation (EAD).
MS_electron_beam_energy = 1003410,

/// Number of Occurrences: The number of times something happened.
NCIT_Number_of_Occurrences = 103150827,

/// PSI-MS CV Quality Control Vocabulary: PSI Quality Control controlled vocabulary term.
MS_PSI_MS_CV_Quality_Control_Vocabulary = 4000000,

Expand Down Expand Up @@ -11302,6 +11345,21 @@ enum PWIZ_API_DECL CVID
/// median MS2 precursor charge in identified spectra: Median MS2 precursor charge in identified spectra. The used type of identification should be noted in the metadata or analysis methods section of the recording file for the respective run. In case of multiple acceptance criteria (FDR) available in proteomics, PSM-level FDR should be used for better comparability.
MS_median_MS2_precursor_charge_in_identified_spectra = 4000176,

/// contaminant protein abundance fraction: The fraction of total protein abundance in a mass spectrometry run or a group of runs which can be attributed to a user-defined list of contaminant proteins (e.g. using the cRAP contaminant database).
MS_contaminant_protein_abundance_fraction = 4000177,

/// precursor ppm deviation mean: The mean of the distribution of observed precursor mass accuracies (MS:4000072) [in ppm] of identified MS2 spectra after user-defined acceptance criteria (FDR) are applied
MS_precursor_ppm_deviation_mean = 4000178,

/// precursor ppm deviation sigma: The standard deviation of the distribution of observed precursor mass accuracies (MS:4000072) [in ppm] of identified MS2 spectra after user-defined acceptance criteria (FDR) are applied
MS_precursor_ppm_deviation_sigma = 4000179,

/// table of missed cleavage counts: The number of identified peptides with corresponding number of missed cleavages after user-defined acceptance criteria are applied. The number of missed cleavages per peptide is given in the 'number of missed cleavages' column, the respective count of such peptides identified in the 'Number of Occurrences' column. The highest 'missed cleavages' row is to be interpreted as that number of missed cleavages or higher.
MS_table_of_missed_cleavage_counts = 4000180,

/// identified MS2 quarter RT fraction: The interval used for acquisition of the first, second, third, and fourth quarter of all identified MS2 events divided by retention time duration.
MS_identified_MS2_quarter_RT_fraction = 4000181,

/// unimod root node: The root node of the unimod modifications ontology.
UNIMOD_unimod_root_node = 300000000,

Expand Down Expand Up @@ -15871,6 +15929,12 @@ enum PWIZ_API_DECL CVID
/// DVFQQQTGG: SUMOylation by Endogenous SUMO2/3 following Lys C and Asp-N serial digestion.
UNIMOD_DVFQQQTGG = 300002085,

/// iST-NHS specific cysteine modification: Preomics iST-NHS Kit specific cysteine modification.
UNIMOD_iST_NHS_specific_cysteine_modification = 300002086,

/// Label:13C(2)15N(1): 13C(2) 15N(1) Silac label.
UNIMOD_Label_13C_2_15N_1_ = 300002088,

/// unit: A unit of measurement is a standardized quantity of a physical quality.
UO_unit = 400000000,

Expand Down
Loading
Loading