11 #include <OpenMS/config.h>
53 const std::vector<ProteinIdentification>& protein_identifications,
55 bool export_all_psms = false);
70 const std::vector<ProteinIdentification>& protein_identifications,
72 bool export_all_psms = false);
85 const std::vector<ProteinIdentification>& protein_identifications,
87 const std::string& filename,
88 bool export_all_psms = false,
105 const std::shared_ptr<arrow::Table>& table,
106 const std::string& filename,
142 const std::vector<ProteinIdentification>& protein_identifications,
143 const std::vector<const PeptideIdentification*>& peptide_identification_ptrs,
144 const std::string& filename,
145 bool export_all_psms = false,
146 size_t batch_size = 1000000,
165 const std::shared_ptr<arrow::Table>& table,
166 std::vector<ProteinIdentification>& protein_identifications,
Container for peptide identifications from multiple spectra.
Definition PeptideIdentificationList.h:66
Export PSM (Peptide Spectrum Match) data to Apache Arrow format following QPX PSM schema.
Definition QPXFile.h:43
static std::shared_ptr< arrow::Table > exportToArrow(const std::vector< ProteinIdentification > &protein_identifications, const PeptideIdentificationList &peptide_identifications, bool export_all_psms=false)
Export PSMs to Arrow table using PSMSchema for lossless round-trips.
static bool exportToParquet(const std::vector< ProteinIdentification > &protein_identifications, const PeptideIdentificationList &peptide_identifications, const std::string &filename, bool export_all_psms=false, const ParquetWriteConfig &config=ParquetWriteConfig{})
Export PSM data to Parquet file.
static bool exportToParquetStreaming(const std::vector< ProteinIdentification > &protein_identifications, const std::vector< const PeptideIdentification * > &peptide_identification_ptrs, const std::string &filename, bool export_all_psms=false, size_t batch_size=1000000, const ParquetWriteConfig &config=ParquetWriteConfig{}, int n_threads=1)
Stream PSMs to a QPX Parquet file in row-batches to cap peak memory.
static bool exportToParquet(const std::shared_ptr< arrow::Table > &table, const std::string &filename, const ParquetWriteConfig &config=ParquetWriteConfig{})
Write a pre-built QPX PSM Arrow table to a Parquet file.
static bool importFromArrow(const std::shared_ptr< arrow::Table > &table, std::vector< ProteinIdentification > &protein_identifications, PeptideIdentificationList &peptide_identifications)
Import PSMs from a PSMSchema Arrow table.
static std::shared_ptr< arrow::Table > exportPSMsToQPXArrow(const std::vector< ProteinIdentification > &protein_identifications, const PeptideIdentificationList &peptide_identifications, bool export_all_psms=false)
Export PSMs to QPX Parquet eXchange format Arrow table (QPXPSMSchema).
Main OpenMS namespace.
Definition openswathalgo/include/OpenMS/OPENSWATHALGO/DATAACCESS/ISpectrumAccess.h:19
Definition ArrowIOHelpers.h:22
Configuration for Parquet file writing.
Definition MSExperimentArrowExport.h:136