Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Transcriptomics Digestion and Fragmentation #801

Merged
merged 19 commits into from
Oct 15, 2024
Merged
Show file tree
Hide file tree
Changes from 18 commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions mzLib/Chemistry/ClassExtensions.cs
Original file line number Diff line number Diff line change
Expand Up @@ -48,6 +48,7 @@ public static double ToMass(this double massToChargeRatio, int charge)
return Math.Abs(charge) * massToChargeRatio - charge * Constants.ProtonMass;
}

/// <summary>
/// Convenience overload for non-nullable values: converts <paramref name="myNumber"/> to a
/// <c>double?</c> and forwards it, together with <paramref name="places"/>, to the nullable
/// <c>RoundedDouble</c> overload.
/// </summary>
/// <param name="myNumber">The value to hand to the nullable overload.</param>
/// <param name="places">Passed through unchanged to the nullable overload; defaults to 9.</param>
/// <returns>Whatever the nullable overload returns for the wrapped value.</returns>
public static double? RoundedDouble(this double myNumber, int places = 9)
{
    // Typing the local as double? makes overload resolution pick the nullable overload.
    double? nullableNumber = myNumber;
    return RoundedDouble(nullableNumber, places);
}
public static double? RoundedDouble(this double? myNumber, int places = 9)
{
if (myNumber != null)
Expand Down
5 changes: 5 additions & 0 deletions mzLib/MassSpectrometry/Enums/DissociationType.cs
Original file line number Diff line number Diff line change
Expand Up @@ -109,6 +109,11 @@ public enum DissociationType
/// </summary>
LowCID,

/// <summary>
/// activated ion electron photo detachment dissociation
/// </summary>
aEPD,

Unknown,
AnyActivationType,
Custom,
Expand Down
9 changes: 2 additions & 7 deletions mzLib/MzLibUtil/MzLibException.cs
Original file line number Diff line number Diff line change
Expand Up @@ -3,11 +3,6 @@
namespace MzLibUtil
{
[Serializable]
public class MzLibException : Exception
{
public MzLibException(string message)
: base(message)
{
}
}
/// <summary>
/// Exception type carrying a message and, optionally, the exception that caused it.
/// </summary>
public class MzLibException : Exception
{
    /// <summary>
    /// Creates the exception, passing both arguments straight to <see cref="Exception"/>.
    /// </summary>
    /// <param name="message">Text describing the error.</param>
    /// <param name="innerException">Underlying cause, or <c>null</c> (the default) when there is none.</param>
    public MzLibException(string message, Exception innerException = null)
        : base(message, innerException)
    {
    }
}
}
19 changes: 6 additions & 13 deletions mzLib/Omics/Fragmentation/FragmentationTerminus.cs
Original file line number Diff line number Diff line change
@@ -1,19 +1,12 @@
using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using System.Threading.Tasks;

namespace Omics.Fragmentation
namespace Omics.Fragmentation
{
public enum FragmentationTerminus
{
Both, //N- and C-terminus
N, //N-terminus only
C, //C-terminus only
{
Both, //N- and C-terminus
N, //N-terminus only
C, //C-terminus only
None, //used for internal fragments, could be used for top down intact mass?
FivePrime, // 5' for NucleicAcids
ThreePrime, // 3' for NucleicAcids
}

}
}
162 changes: 161 additions & 1 deletion mzLib/Omics/Fragmentation/Oligo/DissociationTypeCollection.cs

Large diffs are not rendered by default.

141 changes: 141 additions & 0 deletions mzLib/Omics/Fragmentation/Oligo/TerminusSpecificProductTypes.cs
Original file line number Diff line number Diff line change
@@ -0,0 +1,141 @@
using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using System.Threading.Tasks;

namespace Omics.Fragmentation.Oligo
{
public static class TerminusSpecificProductTypes
{
    /// <summary>
    /// Looks up the product ion types registered for <paramref name="fragmentationTerminus"/>
    /// in <see cref="ProductIonTypesFromSpecifiedTerminus"/>.
    /// </summary>
    /// <param name="fragmentationTerminus">Terminus whose product ion types are requested.</param>
    /// <returns>The list instance stored in the lookup table (not a copy).</returns>
    /// <exception cref="KeyNotFoundException">
    /// Thrown by the dictionary indexer when the table has no entry for the given terminus.
    /// </exception>
    public static List<ProductType> GetRnaTerminusSpecificProductTypes(
        this FragmentationTerminus fragmentationTerminus)
        => ProductIonTypesFromSpecifiedTerminus[fragmentationTerminus];

    /// <summary>
    /// Lookup table from a fragmentation terminus to the oligo product ion types that can be
    /// produced from it. Entries exist for FivePrime, ThreePrime, Both and None.
    /// </summary>
    public static Dictionary<FragmentationTerminus, List<ProductType>> ProductIonTypesFromSpecifiedTerminus = new Dictionary<FragmentationTerminus, List<ProductType>>
    {
        // a/b/c/d series, each with its water-loss and base-loss variants
        [FragmentationTerminus.FivePrime] = new List<ProductType>
        {
            ProductType.a, ProductType.aWaterLoss, ProductType.aBaseLoss,
            ProductType.b, ProductType.bWaterLoss, ProductType.bBaseLoss,
            ProductType.c, ProductType.cWaterLoss, ProductType.cBaseLoss,
            ProductType.d, ProductType.dWaterLoss, ProductType.dBaseLoss,
        },

        // w/x/y/z series, each with its water-loss and base-loss variants
        [FragmentationTerminus.ThreePrime] = new List<ProductType>
        {
            ProductType.w, ProductType.wWaterLoss, ProductType.wBaseLoss,
            ProductType.x, ProductType.xWaterLoss, ProductType.xBaseLoss,
            ProductType.y, ProductType.yWaterLoss, ProductType.yBaseLoss,
            ProductType.z, ProductType.zWaterLoss, ProductType.zBaseLoss,
        },

        // every type from the two lists above, followed by M
        [FragmentationTerminus.Both] = new List<ProductType>
        {
            ProductType.a, ProductType.aWaterLoss, ProductType.aBaseLoss,
            ProductType.b, ProductType.bWaterLoss, ProductType.bBaseLoss,
            ProductType.c, ProductType.cWaterLoss, ProductType.cBaseLoss,
            ProductType.d, ProductType.dWaterLoss, ProductType.dBaseLoss,
            ProductType.w, ProductType.wWaterLoss, ProductType.wBaseLoss,
            ProductType.x, ProductType.xWaterLoss, ProductType.xBaseLoss,
            ProductType.y, ProductType.yWaterLoss, ProductType.yBaseLoss,
            ProductType.z, ProductType.zWaterLoss, ProductType.zBaseLoss,
            ProductType.M
        },

        // no product types are registered for None
        [FragmentationTerminus.None] = new List<ProductType>(),
    };

    /// <summary>
    /// Resolves the terminus an oligo product ion type belongs to, using
    /// <see cref="ProductTypeToFragmentationTerminus"/>.
    /// </summary>
    /// <param name="fragmentType">Product ion type to resolve.</param>
    /// <returns>The terminus stored in the lookup table for <paramref name="fragmentType"/>.</returns>
    /// <exception cref="ArgumentOutOfRangeException">
    /// <paramref name="fragmentType"/> is not one of the a/b/c/d/w/x/y/z types (plain, water-loss
    /// or base-loss) or M; this includes aStar, aDegree, bAmmoniaLoss, yAmmoniaLoss, zPlusOne,
    /// D, Ycore and Y.
    /// </exception>
    public static FragmentationTerminus GetRnaTerminusType(this ProductType fragmentType) => fragmentType switch
    {
        ProductType.a or ProductType.aWaterLoss or ProductType.aBaseLoss or
        ProductType.b or ProductType.bWaterLoss or ProductType.bBaseLoss or
        ProductType.c or ProductType.cWaterLoss or ProductType.cBaseLoss or
        ProductType.d or ProductType.dWaterLoss or ProductType.dBaseLoss or
        ProductType.w or ProductType.wWaterLoss or ProductType.wBaseLoss or
        ProductType.x or ProductType.xWaterLoss or ProductType.xBaseLoss or
        ProductType.y or ProductType.yWaterLoss or ProductType.yBaseLoss or
        ProductType.z or ProductType.zWaterLoss or ProductType.zBaseLoss or
        ProductType.M
            => ProductTypeToFragmentationTerminus[fragmentType],

        // every other product type is rejected
        _ => throw new ArgumentOutOfRangeException(nameof(fragmentType), fragmentType, null),
    };

    /// <summary>
    /// Lookup table from an oligo product ion type to the terminus it is generated from:
    /// a/b/c/d types map to FivePrime, w/x/y/z types map to ThreePrime, and M maps to Both.
    /// </summary>
    public static Dictionary<ProductType, FragmentationTerminus> ProductTypeToFragmentationTerminus = new Dictionary<ProductType, FragmentationTerminus>
    {
        [ProductType.a] = FragmentationTerminus.FivePrime,
        [ProductType.aWaterLoss] = FragmentationTerminus.FivePrime,
        [ProductType.aBaseLoss] = FragmentationTerminus.FivePrime,
        [ProductType.b] = FragmentationTerminus.FivePrime,
        [ProductType.bWaterLoss] = FragmentationTerminus.FivePrime,
        [ProductType.bBaseLoss] = FragmentationTerminus.FivePrime,
        [ProductType.c] = FragmentationTerminus.FivePrime,
        [ProductType.cWaterLoss] = FragmentationTerminus.FivePrime,
        [ProductType.cBaseLoss] = FragmentationTerminus.FivePrime,
        [ProductType.d] = FragmentationTerminus.FivePrime,
        [ProductType.dWaterLoss] = FragmentationTerminus.FivePrime,
        [ProductType.dBaseLoss] = FragmentationTerminus.FivePrime,

        [ProductType.w] = FragmentationTerminus.ThreePrime,
        [ProductType.wWaterLoss] = FragmentationTerminus.ThreePrime,
        [ProductType.wBaseLoss] = FragmentationTerminus.ThreePrime,
        [ProductType.x] = FragmentationTerminus.ThreePrime,
        [ProductType.xWaterLoss] = FragmentationTerminus.ThreePrime,
        [ProductType.xBaseLoss] = FragmentationTerminus.ThreePrime,
        [ProductType.y] = FragmentationTerminus.ThreePrime,
        [ProductType.yWaterLoss] = FragmentationTerminus.ThreePrime,
        [ProductType.yBaseLoss] = FragmentationTerminus.ThreePrime,
        [ProductType.z] = FragmentationTerminus.ThreePrime,
        [ProductType.zWaterLoss] = FragmentationTerminus.ThreePrime,
        [ProductType.zBaseLoss] = FragmentationTerminus.ThreePrime,

        [ProductType.M] = FragmentationTerminus.Both,
    };
}
}
18 changes: 18 additions & 0 deletions mzLib/Test/Test.csproj
Original file line number Diff line number Diff line change
Expand Up @@ -494,6 +494,24 @@
</None>
<None Update="FileReadingTests\SearchResults\VariantCrossTest.psmtsv">
<CopyToOutputDirectory>Always</CopyToOutputDirectory>
</None>
<None Update="Transcriptomics\TestData\20mer1.fasta">
<CopyToOutputDirectory>Always</CopyToOutputDirectory>
</None>
<None Update="Transcriptomics\TestData\20mer1.fasta.gz">
<CopyToOutputDirectory>PreserveNewest</CopyToOutputDirectory>
</None>
<None Update="Transcriptomics\TestData\20mer1.xml">
<CopyToOutputDirectory>Always</CopyToOutputDirectory>
</None>
<None Update="Transcriptomics\TestData\20mer1.xml.gz">
<CopyToOutputDirectory>Always</CopyToOutputDirectory>
</None>
<None Update="Transcriptomics\TestData\ModomicsUnmodifiedTrimmed.fasta">
<CopyToOutputDirectory>PreserveNewest</CopyToOutputDirectory>
</None>
<None Update="Transcriptomics\TestData\ModomicsUnmodifiedTrimmed.fasta.gz">
<CopyToOutputDirectory>PreserveNewest</CopyToOutputDirectory>
</None>
<None Update="DataFiles\centroid_1x_MS1_4x_autoMS2.d\**">
<CopyToOutputDirectory>Always</CopyToOutputDirectory>
Expand Down
2 changes: 2 additions & 0 deletions mzLib/Test/Transcriptomics/TestData/20mer1.fasta
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
>id:2|Name:20mer1|SOterm:20mer1|Type:tRNA|Subtype:Ala|Feature:VGC|Cellular_Localization:freezer|Species:standard
GUACUGCCUCUAGUGAAGCA
Binary file added mzLib/Test/Transcriptomics/TestData/20mer1.fasta.gz
Binary file not shown.
17 changes: 17 additions & 0 deletions mzLib/Test/Transcriptomics/TestData/20mer1.xml
Original file line number Diff line number Diff line change
@@ -0,0 +1,17 @@
<?xml version="1.0" encoding="utf-8"?>
<mzLibProteinDb>
<entry>
<accession>20mer1</accession>
<name>20mer1</name>
<protein>
<recommendedName>
<fullName>20mer1</fullName>
</recommendedName>
</protein>
<gene />
<organism>
<name type="scientific">standard</name>
</organism>
<sequence length="20">GUACUGCCUCUAGUGAAGCA</sequence>
</entry>
</mzLibProteinDb>
Binary file added mzLib/Test/Transcriptomics/TestData/20mer1.xml.gz
Binary file not shown.
Original file line number Diff line number Diff line change
@@ -0,0 +1,10 @@
>id:1|Name:tdbR00000010|SOterm:SO:0000254|Type:tRNA|Subtype:Ala|Feature:VGC|Cellular_Localization:prokaryotic cytosol|Species:Escherichia coli
GGGGCUAUAGCUCAGCUGGGAGAGCGCCUGCUUUGCACGCAGGAGGUCUGCGGUUCGAUCCCGCAUAGCUCCACCA
>id:2|Name:tdbR00000008|SOterm:SO:0000254|Type:tRNA|Subtype:Ala|Feature:GGC|Cellular_Localization:prokaryotic cytosol|Species:Escherichia coli
GGGGCUAUAGCUCAGCUGGGAGAGCGCUUGCAUGGCAUGCAAGAGGUCAGCGGUUCGAUCCCGCUUAGCUCCACCA
>id:3|Name:tdbR00000356|SOterm:SO:0001036|Type:tRNA|Subtype:Arg|Feature:ICG|Cellular_Localization:prokaryotic cytosol|Species:Escherichia coli
GCAUCCGUAGCUCAGCUGGAUAGAGUACUCGGCUACGAACCGAGCGGUCGGAGGUUCGAAUCCUCCCGGAUGCACCA
>id:4|Name:tdbR00000359|SOterm:SO:0001036|Type:tRNA|Subtype:Arg|Feature:CCG|Cellular_Localization:prokaryotic cytosol|Species:Escherichia coli
GCGCCCGUAGCUCAGCUGGAUAGAGCGCUGCCCUCCGGAGGCAGAGGUCUCAGGUUCGAAUCCUGUCGGGCGCGCCA
>id:5|Name:tdbR00000358|SOterm:SO:0001036|Type:tRNA|Subtype:Arg|Feature:UCU|Cellular_Localization:prokaryotic cytosol|Species:Escherichia coli
GCGCCCUUAGCUCAGUUGGAUAGAGCAACGACCUUCUAAGUCGUGGGCCGCAGGUUCGAAUCCUGCAGGGCGCGCCA
Binary file not shown.
Loading
Loading