Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

snip those raw files #732

Open
wants to merge 30 commits into
base: master
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
30 commits
Select commit Hold shift + click to select a range
a6b1639
correct Within calculation
Nov 18, 2021
fa4da8b
update unit tests
Nov 18, 2021
3246567
conflicts resolved back to upstream
Feb 4, 2022
a018d4d
Merge remote-tracking branch 'upstream/master'
Feb 15, 2022
15a37d0
Merge remote-tracking branch 'upstream/master'
Feb 17, 2022
892fa45
this is the spot
Feb 18, 2022
211013c
Merge remote-tracking branch 'upstream/master'
Feb 25, 2022
68104ee
Merge branch 'master' of https://github.com/trishorts/mzLib
trishorts Mar 9, 2022
d715a08
Merge remote-tracking branch 'upstream/master'
Mar 16, 2022
3565522
Merge remote-tracking branch 'upstream/master'
Mar 23, 2022
72e7b53
Merge remote-tracking branch 'upstream/master'
Mar 29, 2022
593872a
Merge remote-tracking branch 'upstream/master'
trishorts Apr 13, 2022
42dd034
Merge branch 'master' of https://github.com/trishorts/mzLib
trishorts Apr 13, 2022
fbeaec0
Merge remote-tracking branch 'upstream/master'
trishorts Jun 1, 2022
614ded7
Merge remote-tracking branch 'upstream/master'
Jun 14, 2022
47307c8
Merge branch 'master' of https://github.com/trishorts/mzLib
Jun 14, 2022
28e05ae
Merge remote-tracking branch 'upstream/master'
Jul 6, 2022
0a7c609
Merge remote-tracking branch 'upstream/master'
Jul 26, 2022
630d8c7
Merge remote-tracking branch 'upstream/master'
trishorts Jul 27, 2022
f6a386b
Merge branch 'master' of https://github.com/trishorts/mzLib
trishorts Jul 27, 2022
d673800
Merge remote-tracking branch 'upstream/master'
Sep 11, 2022
675a0ae
Merge branch 'master' of https://github.com/trishorts/mzLib
Sep 11, 2022
15d4baf
Merge remote-tracking branch 'upstream/master'
Sep 27, 2022
03ca9f7
Merge remote-tracking branch 'upstream/master'
Oct 4, 2022
d0a4c79
Merge remote-tracking branch 'upstream/master'
Jan 30, 2023
894b998
Merge remote-tracking branch 'upstream/master'
Mar 15, 2023
88269a1
Merge remote-tracking branch 'upstream/master'
trishorts Apr 24, 2023
9a9b24a
Merge remote-tracking branch 'upstream/master'
trishorts Jun 29, 2023
b4ad231
add space
trishorts Jun 29, 2023
b417087
snipper
trishorts Sep 21, 2023
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
82 changes: 82 additions & 0 deletions mzLib/Readers/MzML/SnipCreator.cs
Original file line number Diff line number Diff line change
@@ -0,0 +1,82 @@
using MassSpectrometry;

namespace Readers;

/// <summary>
/// Copies a contiguous range of scans out of a mass-spectrometry data file into a new,
/// smaller mzML file whose scans are renumbered so that the first requested scan becomes scan 1.
/// </summary>
public class SnipCreator
{
    /// <summary>
    /// Loads <paramref name="origDataFile"/>, keeps every scan whose one-based scan number lies in
    /// [<paramref name="startScan"/>, <paramref name="endScan"/>], renumbers the kept scans
    /// (<paramref name="startScan"/> maps to 1) and writes them to "&lt;original path without
    /// extension&gt;_snip.mzML".
    /// </summary>
    /// <param name="origDataFile">Path of the data file to snip.</param>
    /// <param name="startScan">One-based number of the first scan to keep (inclusive).</param>
    /// <param name="endScan">One-based number of the last scan to keep (inclusive).</param>
    public void Snipper(string origDataFile, int startScan, int endScan)
    {
        FilteringParams filter = new FilteringParams(200, 0.01, 1, null, false, false, true);
        var reader = MsDataFileReader.GetDataFile(origDataFile);
        reader.LoadAllStaticData(filter, 1);

        List<MsDataScan> scansForTheNewFile = new List<MsDataScan>();

        foreach (MsDataScan scan in reader.GetAllScansList())
        {
            if (scan.OneBasedScanNumber < startScan || scan.OneBasedScanNumber > endScan)
            {
                continue;
            }

            // Shift scan numbers so that startScan becomes 1 in the new file.
            int newOneBasedScanNumber = scan.OneBasedScanNumber - startScan + 1;

            // Scans without a precursor are kept as well. A precursor that falls before the
            // snipped range has no counterpart in the new file, so the reference is cleared
            // rather than mapped to a zero or negative scan number.
            int? newOneBasedPrecursorScanNumber = null;
            if (scan.OneBasedPrecursorScanNumber.HasValue
                && scan.OneBasedPrecursorScanNumber.Value >= startScan)
            {
                newOneBasedPrecursorScanNumber = scan.OneBasedPrecursorScanNumber.Value - startScan + 1;
            }

            MsDataScan newDataScan = new MsDataScan(
                scan.MassSpectrum,
                newOneBasedScanNumber,
                scan.MsnOrder,
                scan.IsCentroid,
                scan.Polarity,
                scan.RetentionTime,
                scan.ScanWindowRange,
                scan.ScanFilter,
                scan.MzAnalyzer,
                scan.TotalIonCurrent,
                scan.InjectionTime,
                scan.NoiseData,
                // The native id carries the scan's own number, so that is the number to rewrite.
                scan.NativeId.Replace(scan.OneBasedScanNumber.ToString(), newOneBasedScanNumber.ToString()),
                scan.SelectedIonMZ,
                scan.SelectedIonChargeStateGuess,
                scan.SelectedIonIntensity,
                scan.IsolationMz,
                scan.IsolationWidth,
                scan.DissociationType,
                newOneBasedPrecursorScanNumber,
                scan.SelectedIonMonoisotopicGuessMz,
                scan.HcdEnergy
            );
            scansForTheNewFile.Add(newDataScan);
        }

        // Strip whatever extension the input has before appending the suffix, so the output
        // path can never be identical to the input path (e.g. for a ".raw" input).
        string outPath = System.IO.Path.ChangeExtension(origDataFile, null) + "_snip.mzML";

        SourceFile sourceFile = new SourceFile(
            reader.SourceFile.NativeIdFormat,
            reader.SourceFile.MassSpectrometerFileFormat,
            reader.SourceFile.CheckSum,
            reader.SourceFile.FileChecksumType,
            reader.SourceFile.Uri,
            reader.SourceFile.Id,
            reader.SourceFile.FileName);

        MzmlMethods.CreateAndWriteMyMzmlWithCalibratedSpectra(
            new GenericMsDataFile(scansForTheNewFile.ToArray(), sourceFile), outPath, false);
    }
}
91 changes: 91 additions & 0 deletions mzLib/Test/FileReadingTests/TestMzML.cs
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,7 @@
using System.Collections.Generic;
using System.IO;
using System.Linq;
using System.Security;
using System.Threading.Tasks;
using System.Xml.Serialization;
using Chemistry;
Expand Down Expand Up @@ -96,6 +97,96 @@ public static void ReadMzMlInNewEra()
Assert.AreEqual(20, scans[1].MassSpectrum.XArray.Count());
}

/// <summary>
/// Snips scans 5715-5915 out of a local raw file, writes them to a "_snip.mzML" file beside it,
/// and checks that the renumbered scans are consistent. The test is skipped when the input
/// file is not present on the machine running the tests.
/// </summary>
[Test]
public static void SnipMzMl()
{
    // Reviewer question carried over from the pull-request thread:
    // "Should this test implement the class you wrote above?"
    string origDataFile = @"E:\Projects\GlycoNickLei_PXD017646\2019_07_30_GlycoPepMix_35trig_EThcD35_rep2.raw";
    if (!File.Exists(origDataFile))
    {
        // The input lives at a machine-specific location; skip instead of failing elsewhere.
        Assert.Ignore("Input data file not found: " + origDataFile);
    }

    int startScan = 5715;
    int endScan = 5915;
    FilteringParams filter = new FilteringParams(200, 0.01, 1, null, false, false, true);
    var reader = MsDataFileReader.GetDataFile(origDataFile);
    reader.LoadAllStaticData(filter, 1);

    var scans = reader.GetAllScansList();
    var scansToKeep = scans.Where(x => x.OneBasedScanNumber >= startScan && x.OneBasedScanNumber <= endScan).ToList();

    List<MsDataScan> scansForTheNewFile = new List<MsDataScan>();

    foreach (MsDataScan scan in scansToKeep)
    {
        // Shift scan numbers so that startScan becomes 1 in the new file.
        int newOneBasedScanNumber = scan.OneBasedScanNumber - startScan + 1;

        // A precursor located before the snipped range cannot be referenced in the new file.
        int? newOneBasedPrecursorScanNumber = null;
        if (scan.OneBasedPrecursorScanNumber.HasValue && scan.OneBasedPrecursorScanNumber.Value >= startScan)
        {
            newOneBasedPrecursorScanNumber = scan.OneBasedPrecursorScanNumber.Value - startScan + 1;
        }

        MsDataScan newDataScan = new MsDataScan(
            scan.MassSpectrum,
            newOneBasedScanNumber,
            scan.MsnOrder,
            scan.IsCentroid,
            scan.Polarity,
            scan.RetentionTime,
            scan.ScanWindowRange,
            scan.ScanFilter,
            scan.MzAnalyzer,
            scan.TotalIonCurrent,
            scan.InjectionTime,
            scan.NoiseData,
            scan.NativeId.Replace(scan.OneBasedScanNumber.ToString(), newOneBasedScanNumber.ToString()),
            scan.SelectedIonMZ,
            scan.SelectedIonChargeStateGuess,
            scan.SelectedIonIntensity,
            scan.IsolationMz,
            scan.IsolationWidth,
            scan.DissociationType,
            newOneBasedPrecursorScanNumber,
            scan.SelectedIonMonoisotopicGuessMz,
            scan.HcdEnergy
        );
        scansForTheNewFile.Add(newDataScan);
    }

    // Remove the input's extension before appending the suffix so the output path
    // always differs from the input path.
    string outPath = Path.ChangeExtension(origDataFile, null) + "_snip.mzML";

    SourceFile sourceFile = new SourceFile(reader.SourceFile.NativeIdFormat,
        reader.SourceFile.MassSpectrometerFileFormat, reader.SourceFile.CheckSum, reader.SourceFile.FileChecksumType, reader.SourceFile.Uri, reader.SourceFile.Id, reader.SourceFile.FileName);

    MzmlMethods.CreateAndWriteMyMzmlWithCalibratedSpectra(new GenericMsDataFile(scansForTheNewFile.ToArray(), sourceFile), outPath, false);

    Assert.IsTrue(File.Exists(outPath));
    Assert.AreEqual(scansToKeep.Count, scansForTheNewFile.Count);

    // Every renumbered scan must fall inside the new one-based range.
    int snippedRangeLength = endScan - startScan + 1;
    Assert.IsTrue(scansForTheNewFile.All(s => s.OneBasedScanNumber >= 1 && s.OneBasedScanNumber <= snippedRangeLength));

    // Precursor references, where present, must also be valid one-based numbers.
    Assert.IsTrue(scansForTheNewFile.All(s => !s.OneBasedPrecursorScanNumber.HasValue || s.OneBasedPrecursorScanNumber.Value >= 1));
}

[Test]
public void LoadBadMzml()
{
Expand Down
1 change: 1 addition & 0 deletions mzLib/Test/TestBayesianEstimation.cs
Original file line number Diff line number Diff line change
Expand Up @@ -95,6 +95,7 @@ public static void TestOneSampleBayesianEstimation()
Assert.That(Math.Round(highestDensityInterval.hdi_end, 3) == 1.062);
}


[Test]
/// <summary>
/// Bayesian estimation of the difference in means between two samples.
Expand Down