use of com.compomics.util.experiment.biology.modifications.Modification in project peptide-shaker by compomics.
the class ModificationLocalizationScorer method attachDeltaScore.
/**
* Scores the modification locations using the delta score.
*
* @param identification Identification object containing the matches.
* @param spectrumMatch The spectrum match of interest.
* @param sequenceMatchingParameters The sequence matching preferences.
* @param modificationProvider The modification provider to use.
*/
public void attachDeltaScore(Identification identification, SpectrumMatch spectrumMatch, SequenceMatchingParameters sequenceMatchingParameters, ModificationProvider modificationProvider) {
PSModificationScores modificationScores = (PSModificationScores) spectrumMatch.getUrParam(PSModificationScores.dummy);
if (modificationScores == null) {
modificationScores = new PSModificationScores();
spectrumMatch.addUrParam(modificationScores);
}
Peptide psPeptide = spectrumMatch.getBestPeptideAssumption().getPeptide();
HashMap<Integer, TreeMap<Double, ArrayList<PeptideAssumption>>> assumptions = spectrumMatch.getPeptideAssumptionsMap();
String mainSequence = psPeptide.getSequence();
HashMap<String, List<Integer>> modificationParameters = Arrays.stream(psPeptide.getVariableModifications()).collect(Collectors.groupingBy(ModificationMatch::getModification, HashMap::new, Collectors.mapping(ModificationMatch::getSite, Collectors.toList())));
for (Entry<String, List<Integer>> entry : modificationParameters.entrySet()) {
String modName = entry.getKey();
List<Integer> sites = entry.getValue();
Modification modification1 = modificationProvider.getModification(modName);
for (int modSite : sites) {
double refP = 1, secondaryP = 1;
for (TreeMap<Double, ArrayList<PeptideAssumption>> algorithmAssumptions : assumptions.values()) {
for (ArrayList<PeptideAssumption> assumptionsAtScore : algorithmAssumptions.values()) {
for (PeptideAssumption peptideAssumption : assumptionsAtScore) {
if (peptideAssumption.getPeptide().getSequence().equals(mainSequence)) {
boolean modificationAtSite = false, modificationFound = false;
Peptide peptide = peptideAssumption.getPeptide();
for (ModificationMatch modMatch : peptide.getVariableModifications()) {
Modification modification2 = modificationProvider.getModification(modMatch.getModification());
if (modification1.getMass() == modification2.getMass()) {
modificationFound = true;
PSParameter psParameter = (PSParameter) peptideAssumption.getUrParam(PSParameter.dummy);
double p = psParameter.getProbability();
if (modMatch.getSite() == modSite) {
modificationAtSite = true;
if (p < refP) {
refP = p;
}
}
}
}
if (!modificationAtSite && modificationFound) {
PSParameter psParameter = (PSParameter) peptideAssumption.getUrParam(PSParameter.dummy);
double p = psParameter.getProbability();
if (p < secondaryP) {
secondaryP = p;
}
}
}
}
}
}
ModificationScoring modificationScoring = modificationScores.getModificationScoring(modName);
if (modificationScoring == null) {
modificationScoring = new ModificationScoring(modName);
modificationScores.addModificationScoring(modName, modificationScoring);
}
if (secondaryP < refP) {
secondaryP = refP;
}
double deltaScore = (secondaryP - refP) * 100;
modificationScoring.setDeltaScore(modSite, deltaScore);
}
identification.updateObject(spectrumMatch.getKey(), spectrumMatch);
}
}
use of com.compomics.util.experiment.biology.modifications.Modification in project peptide-shaker by compomics.
the class ModificationLocalizationScorer method scorePTMs.
/**
* Scores PTMs in a protein match.
*
* @param identification The identification object containing the matches.
* @param proteinMatch The protein match.
* @param identificationParameters The identification parameters.
* @param scorePeptides If true, peptides will be scored as well.
* @param modificationProvider The modification provider to use.
* @param waitingHandler The waiting handler to sue, ignored if null.
*/
public void scorePTMs(Identification identification, ProteinMatch proteinMatch, IdentificationParameters identificationParameters, boolean scorePeptides, ModificationProvider modificationProvider, WaitingHandler waitingHandler) {
HashMap<Integer, ArrayList<String>> confidentSites = new HashMap<>();
HashMap<Integer, HashMap<Integer, HashSet<String>>> ambiguousSites = new HashMap<>();
for (long peptideKey : proteinMatch.getPeptideMatchesKeys()) {
PeptideMatch peptideMatch = identification.getPeptideMatch(peptideKey);
Peptide peptide = peptideMatch.getPeptide();
PSParameter psParameter = (PSParameter) peptideMatch.getUrParam(PSParameter.dummy);
if (psParameter.getMatchValidationLevel().isValidated() && peptide.getNVariableModifications() > 0) {
PSModificationScores peptideScores = (PSModificationScores) peptideMatch.getUrParam(PSModificationScores.dummy);
if (peptideScores == null || scorePeptides) {
scorePTMs(identification, peptideMatch, identificationParameters, modificationProvider, waitingHandler);
peptideScores = (PSModificationScores) peptideMatch.getUrParam(PSModificationScores.dummy);
}
if (peptideScores != null) {
int[] peptideStart = peptide.getProteinMapping().get(proteinMatch.getLeadingAccession());
for (int confidentSite : peptideScores.getConfidentSites()) {
for (int peptideTempStart : peptideStart) {
int siteOnProtein = peptideTempStart + confidentSite - 1;
ArrayList<String> modificationsAtSite = confidentSites.get(siteOnProtein);
if (modificationsAtSite == null) {
modificationsAtSite = new ArrayList<>();
confidentSites.put(siteOnProtein, modificationsAtSite);
}
for (String modName : peptideScores.getConfidentModificationsAt(confidentSite)) {
if (!modificationsAtSite.contains(modName)) {
modificationsAtSite.add(modName);
}
}
}
}
for (int representativeSite : peptideScores.getRepresentativeSites()) {
HashMap<Integer, HashSet<String>> peptideAmbiguousSites = peptideScores.getAmbiguousModificationsAtRepresentativeSite(representativeSite);
for (int peptideTempStart : peptideStart) {
int proteinRepresentativeSite = peptideTempStart + representativeSite - 1;
HashMap<Integer, HashSet<String>> proteinAmbiguousSites = ambiguousSites.get(proteinRepresentativeSite);
if (proteinAmbiguousSites == null) {
proteinAmbiguousSites = new HashMap<>(peptideAmbiguousSites.size());
ambiguousSites.put(proteinRepresentativeSite, proteinAmbiguousSites);
}
for (int peptideSite : peptideAmbiguousSites.keySet()) {
int siteOnProtein = peptideTempStart + peptideSite - 1;
proteinAmbiguousSites.put(siteOnProtein, peptideAmbiguousSites.get(peptideSite));
}
}
}
}
}
}
// remove ambiguous sites where a confident was found and merge overlapping groups
PSModificationScores proteinScores = new PSModificationScores();
ArrayList<Integer> representativeSites = new ArrayList<>(ambiguousSites.keySet());
Collections.sort(representativeSites);
for (Integer representativeSite : representativeSites) {
HashMap<Integer, HashSet<String>> secondarySitesMap = ambiguousSites.get(representativeSite);
ArrayList<Integer> secondarySites = new ArrayList<>(secondarySitesMap.keySet());
for (int secondarySite : secondarySites) {
ArrayList<String> confidentModifications = confidentSites.get(secondarySite);
if (confidentModifications != null) {
boolean sameModification = confidentModifications.stream().map(modName -> modificationProvider.getModification(modName)).anyMatch(confidentModification -> secondarySitesMap.get(secondarySite).stream().map(modName -> modificationProvider.getModification(modName)).anyMatch(secondaryModification -> secondaryModification.getMass() == confidentModification.getMass()));
if (sameModification) {
ambiguousSites.remove(representativeSite);
break;
}
}
if (secondarySite != representativeSite) {
ArrayList<Integer> tempRepresentativeSites = new ArrayList<>(ambiguousSites.keySet());
Collections.sort(tempRepresentativeSites);
for (Integer previousSite : tempRepresentativeSites) {
if (previousSite >= representativeSite) {
break;
}
if (previousSite == secondarySite) {
HashMap<Integer, HashSet<String>> previousSites = ambiguousSites.get(previousSite);
HashSet<String> previousModifications = previousSites.get(previousSite);
boolean sameModification = previousModifications.stream().map(modName -> modificationProvider.getModification(modName)).anyMatch(previousModification -> secondarySitesMap.get(secondarySite).stream().map(modName -> modificationProvider.getModification(modName)).anyMatch(secondaryModification -> secondaryModification.getMass() == previousModification.getMass()));
if (sameModification) {
for (int tempSecondarySite : secondarySitesMap.keySet()) {
if (!previousSites.containsKey(secondarySite)) {
previousSites.put(tempSecondarySite, secondarySitesMap.get(tempSecondarySite));
}
}
ambiguousSites.remove(representativeSite);
}
}
}
}
}
}
for (int confidentSite : confidentSites.keySet()) {
for (String modName : confidentSites.get(confidentSite)) {
proteinScores.addConfidentModificationSite(modName, confidentSite);
}
}
for (int representativeSite : ambiguousSites.keySet()) {
proteinScores.addAmbiguousModificationSites(representativeSite, ambiguousSites.get(representativeSite));
}
proteinMatch.addUrParam(proteinScores);
}
use of com.compomics.util.experiment.biology.modifications.Modification in project peptide-shaker by compomics.
the class ModificationLocalizationScorer method attachProbabilisticScore.
/**
* Attaches the selected probabilistic modification score.
*
* @param spectrumMatch The spectrum match studied, the score will be
* calculated for the best assumption only.
* @param sequenceProvider The protein sequence provider to use.
* @param spectrumProvider The spectrum provider to use.
* @param modificationProvider The modification provider to use.
* @param identificationParameters The identification parameters.
* @param peptideSpectrumAnnotator The peptide spectrum annotator to use.
* @param identification The identification object containing the matches.
*/
private void attachProbabilisticScore(SpectrumMatch spectrumMatch, SequenceProvider sequenceProvider, SpectrumProvider spectrumProvider, ModificationProvider modificationProvider, IdentificationParameters identificationParameters, PeptideSpectrumAnnotator peptideSpectrumAnnotator, Identification identification) {
SearchParameters searchParameters = identificationParameters.getSearchParameters();
AnnotationParameters annotationParameters = identificationParameters.getAnnotationParameters();
ModificationLocalizationParameters scoringParameters = identificationParameters.getModificationLocalizationParameters();
SequenceMatchingParameters sequenceMatchingParameters = identificationParameters.getSequenceMatchingParameters();
SequenceMatchingParameters modificationSequenceMatchingParameters = scoringParameters.getSequenceMatchingParameters();
ModificationParameters modificationParameters = searchParameters.getModificationParameters();
PSModificationScores modificationScores = (PSModificationScores) spectrumMatch.getUrParam(PSModificationScores.dummy);
if (modificationScores != null) {
modificationScores = new PSModificationScores();
spectrumMatch.addUrParam(modificationScores);
}
HashMap<Double, ArrayList<Modification>> modificationsMap = new HashMap<>(1);
HashMap<Double, Integer> nMod = new HashMap<>(1);
PeptideAssumption bestPeptideAssumption = spectrumMatch.getBestPeptideAssumption();
Peptide peptide = bestPeptideAssumption.getPeptide();
for (ModificationMatch modificationMatch : peptide.getVariableModifications()) {
Modification refMod = modificationProvider.getModification(modificationMatch.getModification());
double modMass = refMod.getMass();
if (!modificationsMap.containsKey(modMass)) {
ArrayList<Modification> modifications = modificationFactory.getSameMassNotFixedModifications(modMass, searchParameters).stream().map(modification -> modificationProvider.getModification(modification)).collect(Collectors.toCollection(ArrayList::new));
modificationsMap.put(modMass, modifications);
nMod.put(modMass, 1);
} else {
nMod.put(modMass, nMod.get(modMass) + 1);
}
}
if (!modificationsMap.isEmpty()) {
String spectrumFile = spectrumMatch.getSpectrumFile();
String spectrumTitle = spectrumMatch.getSpectrumTitle();
Spectrum spectrum = spectrumProvider.getSpectrum(spectrumFile, spectrumTitle);
SpecificAnnotationParameters specificAnnotationParameters = annotationParameters.getSpecificAnnotationParameters(spectrumFile, spectrumTitle, bestPeptideAssumption, modificationParameters, sequenceProvider, modificationSequenceMatchingParameters, peptideSpectrumAnnotator);
for (double modMass : modificationsMap.keySet()) {
HashMap<Integer, Double> scores = null;
if (scoringParameters.getSelectedProbabilisticScore() == ModificationLocalizationScore.PhosphoRS) {
scores = PhosphoRS.getSequenceProbabilities(peptide, modificationsMap.get(modMass), modificationParameters, spectrum, sequenceProvider, annotationParameters, specificAnnotationParameters, scoringParameters.isProbabilisticScoreNeutralLosses(), sequenceMatchingParameters, modificationSequenceMatchingParameters, peptideSpectrumAnnotator);
if (scores == null) {
throw new IllegalArgumentException("An error occurred while scoring spectrum " + spectrumTitle + " of file " + spectrumFile + " with PhosphoRS.");
// Most likely a compatibility issue with utilities
}
}
if (scores != null) {
// remap to searched modifications
Modification mappedModification = null;
String peptideSequence = peptide.getSequence();
for (int site : scores.keySet()) {
if (site == 0) {
// N-term mod
for (Modification modification : modificationsMap.get(modMass)) {
if (modification.getModificationType().isNTerm()) {
mappedModification = modification;
break;
}
}
if (mappedModification == null) {
throw new IllegalArgumentException("Could not map the PTM of mass " + modMass + " on the N-terminus of the peptide " + peptideSequence + ".");
}
} else if (site == peptideSequence.length() + 1) {
// C-term mod
for (Modification modification : modificationsMap.get(modMass)) {
if (modification.getModificationType().isCTerm()) {
mappedModification = modification;
break;
}
}
if (mappedModification == null) {
throw new IllegalArgumentException("Could not map the PTM of mass " + modMass + " on the C-terminus of the peptide " + peptideSequence + ".");
}
} else {
for (Modification modification : modificationsMap.get(modMass)) {
mappedModification = modification;
break;
}
if (mappedModification == null) {
throw new IllegalArgumentException("Could not map the PTM of mass " + modMass + " at site " + site + " in peptide " + peptide.getSequence() + ".");
}
}
String modName = mappedModification.getName();
ModificationScoring modificationScoring = modificationScores.getModificationScoring(modName);
if (modificationScoring == null) {
modificationScoring = new ModificationScoring(modName);
modificationScores.addModificationScoring(modName, modificationScoring);
}
modificationScoring.setProbabilisticScore(site, scores.get(site));
}
}
}
identification.updateObject(spectrumMatch.getKey(), spectrumMatch);
}
}
use of com.compomics.util.experiment.biology.modifications.Modification in project peptide-shaker by compomics.
the class ModificationLocalizationScorer method modificationSiteInference.
/**
* Infers the modification site of the best peptide assumption of the given
* spectrum match.
*
* @param spectrumMatch The spectrum match.
* @param sequenceProvider The sequence provider to use.
* @param modificationProvider The modification provider to use.
* @param identificationParameters The identification parameters.
*/
public void modificationSiteInference(SpectrumMatch spectrumMatch, SequenceProvider sequenceProvider, ModificationProvider modificationProvider, IdentificationParameters identificationParameters) {
Peptide peptide = spectrumMatch.getBestPeptideAssumption().getPeptide();
int nVariableModifications = peptide.getNVariableModifications();
if (nVariableModifications > 0) {
SearchParameters searchParameters = identificationParameters.getSearchParameters();
PSModificationScores modificationScores = (PSModificationScores) spectrumMatch.getUrParam(PSModificationScores.dummy);
HashMap<Double, ArrayList<ModificationMatch>> modMatchesMap = new HashMap<>(nVariableModifications);
HashMap<Double, HashMap<Integer, String>> possiblePositions = new HashMap<>(nVariableModifications);
HashMap<Double, HashMap<Integer, ArrayList<String>>> confidentSites = new HashMap<>(nVariableModifications);
for (ModificationMatch modificationMatch : peptide.getVariableModifications()) {
String modName = modificationMatch.getModification();
Modification modification = modificationProvider.getModification(modName);
double modMass = modification.getMass();
ArrayList<ModificationMatch> modOccurence = modMatchesMap.get(modMass);
if (modOccurence == null) {
modOccurence = new ArrayList<>(1);
modMatchesMap.put(modMass, modOccurence);
}
HashMap<Integer, String> modPossibleSites = possiblePositions.get(modMass);
if (modPossibleSites == null) {
modPossibleSites = new HashMap<>(1);
possiblePositions.put(modMass, modPossibleSites);
}
boolean maybeNotTerminal = modification.getModificationType() == ModificationType.modaa;
if (!maybeNotTerminal) {
ArrayList<String> expectedModifications = modificationFactory.getExpectedVariableModifications(searchParameters);
for (String otherModName : expectedModifications) {
if (!otherModName.equals(modName)) {
Modification otherModification = modificationProvider.getModification(otherModName);
if (otherModification.getMass() == modMass && modification.getModificationType() != otherModification.getModificationType()) {
maybeNotTerminal = true;
break;
}
}
}
}
if (maybeNotTerminal) {
modOccurence.add(modificationMatch);
for (String similarModName : modificationFactory.getSameMassNotFixedModifications(modMass, searchParameters)) {
Modification similarModification = modificationProvider.getModification(similarModName);
if (modification.getMass() == modMass) {
int[] possibleSites = ModificationUtils.getPossibleModificationSites(peptide, similarModification, sequenceProvider, identificationParameters.getModificationLocalizationParameters().getSequenceMatchingParameters());
for (int pos : possibleSites) {
modPossibleSites.put(pos, similarModName);
}
}
}
} else {
ModificationScoring modificationScoring = modificationScores.getModificationScoring(modName);
if (modificationScoring == null) {
modificationScoring = new ModificationScoring(modName);
modificationScores.addModificationScoring(modName, modificationScoring);
}
modificationScoring.setSiteConfidence(modificationMatch.getSite(), ModificationScoring.VERY_CONFIDENT);
modificationMatch.setConfident(true);
HashMap<Integer, ArrayList<String>> modificationSites = confidentSites.get(modification.getMass());
if (modificationSites == null) {
modificationSites = new HashMap<>(1);
confidentSites.put(modMass, modificationSites);
}
int site = modificationMatch.getSite();
ArrayList<String> modNames = modificationSites.get(site);
if (modNames == null) {
modNames = new ArrayList<>(1);
modificationSites.put(site, modNames);
}
modNames.add(modName);
}
}
ModificationLocalizationParameters modificationScoringParameters = identificationParameters.getModificationLocalizationParameters();
Set<Double> modMasses = modMatchesMap.keySet();
// p score -> d-score -> Map mod mass -> site -> list of modifications
TreeMap<Double, TreeMap<Double, TreeMap<Double, HashMap<Integer, HashSet<String>>>>> ambiguousScoreToSiteMap = new TreeMap<>();
HashMap<Double, Integer> nRepresentativesMap = new HashMap<>(modMasses.size());
ArrayList<ModificationMatch> assignedModifications = new ArrayList<>(peptide.getNVariableModifications());
// p-score -> d-score -> mod mass -> list of posssible sites
TreeMap<Double, TreeMap<Double, TreeMap<Double, TreeSet<Integer>>>> scoreToSiteMap = new TreeMap<>();
for (double modMass : modMasses) {
ArrayList<ModificationMatch> modificationMatches = modMatchesMap.get(modMass);
int nMods = modificationMatches.size();
HashMap<Integer, String> modificationPossibleSites = possiblePositions.get(modMass);
int nPossibleSites = modificationPossibleSites.size();
HashMap<Integer, ArrayList<String>> modificationConfidentSites = confidentSites.get(modMass);
if (modificationConfidentSites == null) {
modificationConfidentSites = new HashMap<>(1);
confidentSites.put(modMass, modificationConfidentSites);
}
if (nPossibleSites < nMods) {
throw new IllegalArgumentException("The occurence of modification of mass " + modMass + " (" + modificationMatches.size() + ") is higher than the number of possible sites (" + modificationPossibleSites.size() + ") on sequence " + peptide.getSequence() + " in spectrum " + spectrumMatch.getKey() + ".");
} else if (modificationPossibleSites.size() == modificationMatches.size()) {
for (ModificationMatch modMatch : modificationMatches) {
String modName = modMatch.getModification();
int site = modMatch.getSite();
ModificationScoring modificationScoring = modificationScores.getModificationScoring(modName);
if (modificationScoring == null) {
modificationScoring = new ModificationScoring(modName);
modificationScores.addModificationScoring(modName, modificationScoring);
}
modificationScoring.setSiteConfidence(site, ModificationScoring.VERY_CONFIDENT);
modMatch.setConfident(true);
ArrayList<String> modificationsAtAA = modificationConfidentSites.get(site);
if (modificationsAtAA == null) {
modificationsAtAA = new ArrayList<>(1);
modificationConfidentSites.put(site, modificationsAtAA);
}
modificationsAtAA.add(modName);
assignedModifications.add(modMatch);
}
} else if (!modificationScoringParameters.isProbabilisticScoreCalculation()) {
// no probabilistic score in that case
double pScore = 0;
for (ModificationMatch modificationMatch : modificationMatches) {
String modName = modificationMatch.getModification();
ModificationScoring modificationScoring = modificationScores.getModificationScoring(modName);
int site = modificationMatch.getSite();
Double dScore = modificationScoring.getDeltaScore(site);
if (dScore == 0.0) {
modificationScoring.setSiteConfidence(site, ModificationScoring.RANDOM);
modificationMatch.setConfident(false);
} else if (dScore <= 95) {
modificationScoring.setSiteConfidence(site, ModificationScoring.DOUBTFUL);
modificationMatch.setConfident(false);
} else {
modificationScoring.setSiteConfidence(site, ModificationScoring.CONFIDENT);
modificationMatch.setConfident(true);
ArrayList<String> modificationsAtAA = modificationConfidentSites.get(site);
if (modificationsAtAA == null) {
modificationsAtAA = new ArrayList<>(1);
modificationConfidentSites.put(site, modificationsAtAA);
}
modificationsAtAA.add(modName);
}
if (!modificationMatch.getConfident()) {
TreeMap<Double, TreeMap<Double, HashMap<Integer, HashSet<String>>>> pScoreAmbiguousMap = ambiguousScoreToSiteMap.get(pScore);
if (pScoreAmbiguousMap == null) {
pScoreAmbiguousMap = new TreeMap<>();
ambiguousScoreToSiteMap.put(pScore, pScoreAmbiguousMap);
}
TreeMap<Double, HashMap<Integer, HashSet<String>>> dScoreAmbiguousMap = pScoreAmbiguousMap.get(dScore);
if (dScoreAmbiguousMap == null) {
dScoreAmbiguousMap = new TreeMap<>();
pScoreAmbiguousMap.put(dScore, dScoreAmbiguousMap);
}
HashMap<Integer, HashSet<String>> massAmbiguousMap = dScoreAmbiguousMap.get(modMass);
if (massAmbiguousMap == null) {
massAmbiguousMap = new HashMap<>(nPossibleSites);
dScoreAmbiguousMap.put(modMass, massAmbiguousMap);
}
HashSet<String> modifications = massAmbiguousMap.get(site);
if (modifications == null) {
modifications = new HashSet<>(1);
massAmbiguousMap.put(site, modifications);
}
modifications.add(modName);
}
assignedModifications.add(modificationMatch);
}
} else {
for (int site : modificationPossibleSites.keySet()) {
String modName = modificationPossibleSites.get(site);
ModificationScoring modificationScoring = modificationScores.getModificationScoring(modName);
double pScore = 0;
double dScore = 0;
if (modificationScoring != null) {
pScore = modificationScoring.getProbabilisticScore(site);
dScore = modificationScoring.getDeltaScore(site);
}
TreeMap<Double, TreeMap<Double, TreeSet<Integer>>> pScoreMap = scoreToSiteMap.get(pScore);
if (pScoreMap == null) {
pScoreMap = new TreeMap<>();
scoreToSiteMap.put(pScore, pScoreMap);
}
TreeMap<Double, TreeSet<Integer>> dScoreMap = pScoreMap.get(dScore);
if (dScoreMap == null) {
dScoreMap = new TreeMap<>();
pScoreMap.put(dScore, dScoreMap);
}
TreeSet<Integer> dScoreSites = dScoreMap.get(modMass);
if (dScoreSites == null) {
dScoreSites = new TreeSet<>();
dScoreMap.put(modMass, dScoreSites);
}
dScoreSites.add(site);
}
}
}
// Assign modifications to the sites passing the threshold.
if (!scoreToSiteMap.isEmpty()) {
HashMap<Double, Integer> processedSitesMap = new HashMap<>(modMasses.size());
for (Entry<Double, TreeMap<Double, TreeMap<Double, TreeSet<Integer>>>> entry1 : scoreToSiteMap.descendingMap().entrySet()) {
double pScore = entry1.getKey();
TreeMap<Double, TreeMap<Double, TreeSet<Integer>>> pScoreMap = entry1.getValue();
for (Entry<Double, TreeMap<Double, TreeSet<Integer>>> entry2 : pScoreMap.descendingMap().entrySet()) {
double dScore = entry2.getKey();
TreeMap<Double, TreeSet<Integer>> dScoreMap = entry2.getValue();
for (Entry<Double, TreeSet<Integer>> entry : dScoreMap.entrySet()) {
double modificationMass = entry.getKey();
ArrayList<ModificationMatch> modificationMatches = modMatchesMap.get(modificationMass);
HashMap<Integer, String> modificationPossibleSites = possiblePositions.get(modificationMass);
HashMap<Integer, ArrayList<String>> modificationConfidentSites = confidentSites.get(modificationMass);
int nMods = modificationMatches.size();
int nPossibleSites = modificationPossibleSites.size();
double randomScoreThreshold = modificationScoringParameters.getSelectedProbabilisticScore().getRandomThreshold(nMods, nPossibleSites);
double confidenceThreshold = modificationScoringParameters.getProbabilisticScoreThreshold();
TreeSet<Integer> sites = dScoreMap.get(modificationMass);
Integer nAssignedSites = processedSitesMap.get(modificationMass);
if (nAssignedSites == null) {
nAssignedSites = 0;
}
for (int site : sites) {
String modName = modificationPossibleSites.get(site);
ModificationScoring modificationScoring = modificationScores.getModificationScoring(modName);
if (modificationScoring == null) {
modificationScoring = new ModificationScoring(modName);
modificationScores.addModificationScoring(modName, modificationScoring);
}
ModificationMatch modificationMatch = null;
if (nAssignedSites < nMods) {
boolean alreadyOccupied = false;
for (ModificationMatch assignedMatch : assignedModifications) {
if (assignedMatch.getSite() == site) {
alreadyOccupied = true;
break;
}
}
if (!alreadyOccupied) {
if (pScore >= confidenceThreshold) {
modificationMatch = modificationMatches.get(nAssignedSites);
modificationMatch.setSite(site);
modificationMatch.setModification(modName);
assignedModifications.add(modificationMatch);
modificationScoring.setSiteConfidence(site, ModificationScoring.VERY_CONFIDENT);
modificationMatch.setConfident(true);
ArrayList<String> modificationsAtAA = modificationConfidentSites.get(site);
if (modificationsAtAA == null) {
modificationsAtAA = new ArrayList<>(1);
modificationConfidentSites.put(site, modificationsAtAA);
}
modificationsAtAA.add(modName);
nAssignedSites++;
processedSitesMap.put(modificationMass, nAssignedSites);
} else if (pScore > randomScoreThreshold) {
modificationScoring.setSiteConfidence(site, ModificationScoring.DOUBTFUL);
} else {
modificationScoring.setSiteConfidence(site, ModificationScoring.RANDOM);
}
}
}
if (modificationMatch == null) {
TreeMap<Double, TreeMap<Double, HashMap<Integer, HashSet<String>>>> pScoreAmbiguousMap = ambiguousScoreToSiteMap.get(pScore);
if (pScoreAmbiguousMap == null) {
pScoreAmbiguousMap = new TreeMap<>();
ambiguousScoreToSiteMap.put(pScore, pScoreAmbiguousMap);
}
TreeMap<Double, HashMap<Integer, HashSet<String>>> dScoreAmbiguousMap = pScoreAmbiguousMap.get(dScore);
if (dScoreAmbiguousMap == null) {
dScoreAmbiguousMap = new TreeMap<>();
pScoreAmbiguousMap.put(dScore, dScoreAmbiguousMap);
}
HashMap<Integer, HashSet<String>> massAmbiguousMap = dScoreAmbiguousMap.get(modificationMass);
if (massAmbiguousMap == null) {
massAmbiguousMap = new HashMap<>(nPossibleSites);
dScoreAmbiguousMap.put(modificationMass, massAmbiguousMap);
}
HashSet<String> modifications = massAmbiguousMap.get(site);
if (modifications == null) {
modifications = new HashSet<>(1);
massAmbiguousMap.put(site, modifications);
}
modifications.add(modName);
}
}
}
}
}
}
// See whether there are sites that are not confidently assigned.
for (double modMass : confidentSites.keySet()) {
HashMap<Integer, ArrayList<String>> modConfidentSitesMap = confidentSites.get(modMass);
ArrayList<Integer> modConfidentSites = new ArrayList<>(modConfidentSitesMap.keySet());
int nConfident = 0;
for (int site : modConfidentSites) {
ArrayList<String> modifications = modConfidentSitesMap.get(site);
for (String modName : modifications) {
modificationScores.addConfidentModificationSite(modName, site);
}
nConfident += modifications.size();
}
modConfidentSites.size();
ArrayList<ModificationMatch> modificationMatches = modMatchesMap.get(modMass);
int nMods = modificationMatches.size();
if (nConfident < nMods) {
int nRepresentatives = nMods - nConfident;
if (nRepresentatives > 0) {
nRepresentativesMap.put(modMass, nRepresentatives);
}
}
}
// Create ambiguous site groups and assign the remaining modifications to the best scoring sites.
if (!nRepresentativesMap.isEmpty()) {
HashMap<Double, HashMap<Integer, HashMap<Integer, HashSet<String>>>> representativeToSecondaryMap = getRepresentativeToSecondaryMap(ambiguousScoreToSiteMap, nRepresentativesMap);
for (Entry<Double, HashMap<Integer, HashMap<Integer, HashSet<String>>>> entry1 : representativeToSecondaryMap.entrySet()) {
double modMass = entry1.getKey();
HashMap<Integer, HashMap<Integer, HashSet<String>>> massMap = entry1.getValue();
ArrayList<ModificationMatch> modificationMatches = modMatchesMap.get(modMass);
int nMods = modificationMatches.size();
int nRepresentativeSites = nRepresentativesMap.get(modMass);
if (nRepresentativeSites != massMap.size()) {
throw new IllegalArgumentException("Unexpected number of representative sites.");
}
int nConfident = nMods - nRepresentativeSites;
int modMatchIndex = nConfident;
for (Entry<Integer, HashMap<Integer, HashSet<String>>> entry : massMap.entrySet()) {
int representativeSite = entry.getKey();
HashMap<Integer, HashSet<String>> sites = entry.getValue();
modificationScores.addAmbiguousModificationSites(representativeSite, sites);
ModificationMatch modificationMatch = modificationMatches.get(modMatchIndex);
String modName = null;
for (String possibleModName : sites.get(representativeSite)) {
Modification possibleModification = modificationProvider.getModification(possibleModName);
if (possibleModification.getMass() == modMass) {
modName = possibleModName;
break;
}
}
if (modName == null) {
throw new IllegalArgumentException("No candidate modification of mass " + modMass + " found at site " + representativeSite + " on peptide " + peptide.getSequence() + ".");
}
modificationMatch.setModification(modName);
modificationMatch.setSite(representativeSite);
modificationMatch.setConfident(false);
modMatchIndex++;
}
}
}
}
}
use of com.compomics.util.experiment.biology.modifications.Modification in project peptide-shaker by compomics.
the class QCPanel method getPeptideModificationEnrichmentSpecificityDataset.
/**
* Returns the dataset for the peptide modification rate QC plot.
*
* @return the dataset for the peptide modification rate QC plot
*/
private DefaultCategoryDataset getPeptideModificationEnrichmentSpecificityDataset() {
ModificationFactory modificationFactory = ModificationFactory.getInstance();
Identification identification = peptideShakerGUI.getIdentification();
SequenceProvider sequenceProvider = peptideShakerGUI.getSequenceProvider();
IdentificationParameters identificationParameters = peptideShakerGUI.getIdentificationParameters();
ModificationParameters modificationParameters = identificationParameters.getSearchParameters().getModificationParameters();
SequenceMatchingParameters modificationSequenceMatchingParameters = identificationParameters.getModificationLocalizationParameters().getSequenceMatchingParameters();
ArrayList<String> modNames = modificationParameters.getAllNotFixedModifications();
HashMap<String, Integer> modifiedPeptidesMap = new HashMap<>(modNames.size());
HashMap<String, Integer> possiblyModifiedPeptidesMap = new HashMap<>(modNames.size());
progressDialog.setPrimaryProgressCounterIndeterminate(false);
progressDialog.setMaxPrimaryProgressCounter(identification.getPeptideIdentification().size());
progressDialog.setValue(0);
PeptideMatchesIterator peptideMatchesIterator = identification.getPeptideMatchesIterator(progressDialog);
PeptideMatch peptideMatch;
while ((peptideMatch = peptideMatchesIterator.next()) != null) {
PSParameter psParameter = (PSParameter) peptideMatch.getUrParam(PSParameter.dummy);
if (psParameter.getMatchValidationLevel().isValidated()) {
Peptide peptide = peptideMatch.getPeptide();
for (String modName : modificationParameters.getAllNotFixedModifications()) {
Modification modification = modificationFactory.getModification(modName);
int[] possibleSites = ModificationUtils.getPossibleModificationSites(peptide, modification, sequenceProvider, modificationSequenceMatchingParameters);
if (possibleSites.length != 0) {
Integer nPossiblePeptides = possiblyModifiedPeptidesMap.get(modName);
if (nPossiblePeptides == null) {
possiblyModifiedPeptidesMap.put(modName, 1);
} else {
possiblyModifiedPeptidesMap.put(modName, nPossiblePeptides + 1);
}
boolean modified = false;
for (ModificationMatch modificationMatch : peptide.getVariableModifications()) {
if (modificationMatch.getModification().equals(modName)) {
modified = true;
break;
}
}
if (modified) {
Integer nModifiedPeptides = modifiedPeptidesMap.get(modName);
if (nModifiedPeptides == null) {
modifiedPeptidesMap.put(modName, 1);
} else {
modifiedPeptidesMap.put(modName, nModifiedPeptides + 1);
}
}
}
}
}
if (progressDialog.isRunCanceled()) {
break;
}
progressDialog.increaseSecondaryProgressCounter();
}
DefaultCategoryDataset dataset = new DefaultCategoryDataset();
for (String modName : modificationParameters.getAllNotFixedModifications()) {
Integer nFound = modifiedPeptidesMap.get(modName);
if (nFound == null) {
nFound = 0;
}
Integer nPossible = possiblyModifiedPeptidesMap.get(modName);
Double rate = 0.0;
if (nPossible != null) {
rate = (100.0 * nFound) / nPossible;
}
dataset.addValue(rate, "Modified", modName);
double rest = 0.0;
if (nPossible != null) {
rest = 100 - rate;
}
dataset.addValue(rest, "Not Modified", modName);
}
return dataset;
}
Aggregations