Source code for relion.convert

# **************************************************************************
# *
# * Authors:     J.M. De la Rosa Trevin [1]
# *
# * [1] SciLifeLab, Stockholm University
# *
# * This program is free software; you can redistribute it and/or modify
# * it under the terms of the GNU General Public License as published by
# * the Free Software Foundation; either version 3 of the License, or
# * (at your option) any later version.
# *
# * This program is distributed in the hope that it will be useful,
# * but WITHOUT ANY WARRANTY; without even the implied warranty of
# * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# * GNU General Public License for more details.
# *
# * You should have received a copy of the GNU General Public License
# * along with this program; if not, write to the Free Software
# * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
# * 02111-1307  USA
# *
# *  All comments concerning this program package may be sent to the
# *  e-mail address ''
# *
# **************************************************************************

import math

from .convert_utils import *
from .convert_deprecated import *
from .convert_coordinates import *
from .dataimport import *

# Writing of star files will be handled by the Writer class.
# We have a new implementation of it for Relion >= 3.1, since
# the star file format changed in 3.1.
from . import convert30
from . import convert31

def createReader(**kwargs):
    """ Build and return a STAR file Reader.

    The Reader class is taken from convert31 (format 3.1 or newer) unless
    the keyword argument format='30' is given, in which case the one from
    convert30 is used. All keyword arguments (including 'format') are
    forwarded unchanged to the selected Reader constructor.
    """
    if kwargs.get('format', '') == '30':
        readerClass = convert30.Reader
    else:
        readerClass = convert31.Reader

    return readerClass(**kwargs)
def createWriter(**kwargs):
    """ Build and return a STAR file Writer.

    The Writer class is taken from convert31 (format 3.1 or newer) unless
    the keyword argument format='30' is given, in which case the one from
    convert30 is used. All keyword arguments (including 'format') are
    forwarded unchanged to the selected Writer constructor.
    """
    if kwargs.get('format', '') == '30':
        writerClass = convert30.Writer
    else:
        writerClass = convert31.Writer

    return writerClass(**kwargs)
def writeSetOfParticles(imgSet, starFile, **kwargs):
    """ Convenience function to write a SetOfImages as Relion metadata
    using a Writer.

    The same keyword arguments are used both to create the Writer and
    in the call to its writeSetOfParticles method.

    Params:
        imgSet: the SetOfImages instance.
        starFile: the filename where to write the metadata.

    Keyword Arguments:
        outputDir: where binary files will be converted or linked.
        blockName: The name of the data block (default particles)
        fillMagnification: If True set magnification values (default False)
        alignType:
        extraLabels:
        postprocessImageRow:
        format: string value to specify STAR format, if '30' it will use
            Relion3.0 format
    """
    writer = createWriter(**kwargs)
    return writer.writeSetOfParticles(imgSet, starFile, **kwargs)
def readSetOfParticles(starFile, partsSet, **kwargs):
    """ Convert a star file into a set of particles using a Reader.

    The same keyword arguments are used both to create the Reader and
    in the call to its readSetOfParticles method.

    Params:
        starFile: the filename of the star file
        partsSet: output particles set

    Keyword Arguments:
        blockName: The name of the data block (default particles)
        alignType:
        removeDisabled:
        format: string value to specify STAR format, if '30' it will use
            Relion3.0 format
    """
    reader = createReader(**kwargs)
    return reader.readSetOfParticles(starFile, partsSet, **kwargs)
class ClassesLoader:
    """ Helper class to read classes information from star files produced
    by Relion classification runs (2D or 3D).
    """
    def __init__(self, protocol, alignType):
        self._protocol = protocol
        self._alignType = alignType
        self._reader = None  # Will be created later
        # True until the first particle has been handled by the current
        # reader; see _updateParticle.
        self._updatingFirst = True

    def _loadClassesInfo(self, iteration):
        """ Read the per-class information of the given iteration from the
        'model_classes' table of the protocol's model star file.

        The result is stored in self._classesInfo as a dict mapping the
        1-based position of each row in that table to a tuple
        (index, filename, row), where index and filename come from the
        row's rlnReferenceImage value.
        """
        self._classesInfo = {}  # store classes info, indexed by class id

        modelFn = self._protocol._getFileName('model', iter=iteration)
        modelIter = Table.iterRows('model_classes@' + modelFn)

        for classNumber, row in enumerate(modelIter, start=1):
            index, fn = relionToLocation(row.rlnReferenceImage)
            # Store info indexed by id
            self._classesInfo[classNumber] = (index, fn, row)

    def fillClassesFromIter(self, clsSet, iteration):
        """ Fill the given set of classes from a given iteration.

        Params:
            clsSet: the output set of classes; its classifyItems method is
                called with this loader's callbacks.
            iteration: the iteration whose model and data star files are read.
        """
        prot = self._protocol  # shortcut
        self._loadClassesInfo(iteration)

        dataStar = prot._getFileName('data', iter=iteration)
        pixelSize = prot.inputParticles.get().getSamplingRate()
        self._reader = createReader(alignType=self._alignType,
                                    pixelSize=pixelSize)
        # A new reader was just created, so the extra labels have to be
        # created again with the first particle it processes.
        self._updatingFirst = True

        mdIter = Table.iterRows('particles@' + dataStar, key='rlnImageId')
        clsSet.classifyItems(updateItemCallback=self._updateParticle,
                             updateClassCallback=self._updateClass,
                             itemDataIterator=mdIter,
                             doClone=False)

    def _updateParticle(self, item, row):
        """ Callback for each particle: set its class id and transform from
        the star file row, and its extra labels.

        The extra labels are created (createExtraLabels) only for the first
        particle and just set (setExtraLabels) for the following ones.
        """
        item.setClassId(row.rlnClassNumber)
        self._reader.setParticleTransform(item, row)

        # NOTE: the flag uses a single leading underscore on purpose. With
        # two underscores the assignment below is name-mangled by Python
        # while the string given to getattr is not, so the flag would never
        # be read back as False.
        if getattr(self, '_updatingFirst', True):
            self._reader.createExtraLabels(item, row, PARTICLE_EXTRA_LABELS)
            self._updatingFirst = False
        else:
            self._reader.setExtraLabels(item, row)

    def _updateClass(self, item):
        """ Callback for each class: if information was loaded for its id,
        set the alignment, the representative location and the
        distribution/accuracy values read from the model star file.
        """
        classId = item.getObjId()
        if classId in self._classesInfo:
            index, fn, row = self._classesInfo[classId]
            item.setAlignment(self._alignType)
            if self._alignType == ALIGN_PROJ:
                fn += ':mrc'  # mark reference as a MRC volume
            item.getRepresentative().setLocation(index, fn)
            item._rlnClassDistribution = Float(row.rlnClassDistribution)
            item._rlnAccuracyRotations = Float(row.rlnAccuracyRotations)
            item._rlnAccuracyTranslationsAngst = Float(
                row.rlnAccuracyTranslationsAngst)
class DefocusGroups:
    """ Helper class to create defocus groups for particles.

    Groups are kept in a list in creation order; the instance supports
    len(), iteration over its groups and str() for a summary table.
    """

    class Group:
        """ Single CTF group. """
        def __init__(self, id):
            self.id = id
            self.count = 0
            # Start with an empty range, any added defocus will replace both
            self.minDefocus = math.inf
            self.maxDefocus = -math.inf

        def addDefocus(self, defocus):
            """ Count one more particle in this group and extend the
            group's defocus range to include the given value.
            """
            self.count += 1
            self.minDefocus = min(self.minDefocus, defocus)
            self.maxDefocus = max(self.maxDefocus, defocus)

    def __initGroups(self):
        self._groups = []

    def __addGroup(self):
        """ Append a new empty group (ids start at 1) and return it. """
        group = self.Group(len(self._groups) + 1)
        self._groups.append(group)
        return group

    def __init__(self):
        self._groups = []

    def __len__(self):
        return len(self._groups)

    def __iter__(self):
        return iter(self._groups)

    def __str__(self):
        row_format = u"{:>15}{:>15}{:>10}\n"
        parts = [">>> Defocus groups: %d\n" % len(self),
                 row_format.format("Min (A)", "Max (A)", "Count")]
        parts.extend(row_format.format("%0.3f" % group.minDefocus,
                                       "%0.3f" % group.maxDefocus,
                                       group.count)
                     for group in self._groups)
        return "".join(parts)

    def splitByDiff(self, inputParts, defocusDiff=1000, minGroupSize=10):
        """ Discard any existing groups and create new ones from the
        defocusU values of the input particles.

        Params:
            inputParts: particles set; it is iterated with
                iterItems(orderBy=['_ctfModel._defocusU']).
            defocusDiff: a new group is started only when the defocus
                exceeds the current group's minimum by more than this value.
            minGroupSize: a new group is started only when the current
                group already has at least this number of particles.

        A first group is always created, even if there are no particles.
        """
        self.__initGroups()
        group = self.__addGroup()

        for part in inputParts.iterItems(orderBy=['_ctfModel._defocusU']):
            defocus = part.getCTF().getDefocusU()
            # Only when we reach the min number of particles
            # and the defocus difference, we create a new group
            if (group.count >= minGroupSize
                    and defocus - group.minDefocus > defocusDiff):
                group = self.__addGroup()

            group.addDefocus(defocus)

    def getGroup(self, defocus):
        """ Return the group that this defocus belongs to.

        None is returned if there are no groups, or if the value is below
        the minimum of the first group or above the maximum of the last
        one. Otherwise the first group whose maximum is not lower than the
        value is returned, so a value falling between two groups is
        assigned to the higher one.
        """
        if not self._groups:
            return None

        if (defocus < self._groups[0].minDefocus
                or defocus > self._groups[-1].maxDefocus):
            return None

        for group in self._groups:
            if defocus <= group.maxDefocus:
                return group

        return None