Gemfury

theresearchsoftwarecompany / dplus-api python

Repository URL to install this package:
Details
dplus-api / CalculationInput.py
from __future__ import print_function

import json
import warnings
import csv
from dplus.Signal import Signal
from dplus.State import State


class CalculationInput(State):
    """
    A base class of the parameters for dplus generate or fit.

    On top of the inherited State it stores the ``use_gpu`` option, exposes
    shortcuts to the signal kept in ``DomainPreferences`` and offers several
    loaders (args file, state file, PDB and EPDB files).
    """

    def __init__(self, use_gpu=True, is2D=False):
        """
        :param use_gpu: whether the calculation should run on the GPU
        :param is2D: forwarded unchanged to ``State.__init__``
        """
        super().__init__(is2D)
        self._use_gpu = use_gpu

    @property
    def use_gpu(self):
        """
        boolean flag, determines whether run the fit/generate calculation with or without gpu.

        :return: boolean value
        """
        return self._use_gpu

    @use_gpu.setter
    def use_gpu(self, flag):
        # Kept as an assert so callers still see the AssertionError they always got.
        assert isinstance(flag, bool)
        self._use_gpu = flag
        # Turning the GPU on switches use_grid on as well (and tells the user).
        if flag and not self.DomainPreferences.use_grid:
            print("When using GPU, use_grid must be enabled. Enabling automatically.")
            self.DomainPreferences.use_grid = True

    @property
    def x(self):
        """The ``x`` value stored in ``DomainPreferences``."""
        return self.DomainPreferences.x

    @property
    def y(self):
        """The ``y`` value stored in ``DomainPreferences``."""
        return self.DomainPreferences.y

    @property
    def signal(self):
        """The signal stored in ``DomainPreferences``."""
        return self.DomainPreferences.signal

    @signal.setter
    def signal(self, signal):
        assert isinstance(signal, Signal)
        self.DomainPreferences.signal = signal

    @property
    def args(self):
        """
        build the arguments params for the D+ backend from CalculationInput fields.

        :return: The json dict that is sent to the D+ backend
        """
        self.validate_use_grid()
        return dict(args=dict(state=self.serialize(),
                              x=self.x,
                              y=self.y,
                              mask=self._mask),
                    options=dict(useGPU=self.use_gpu))

    @property
    def _filenames(self):
        return self._get_all_filenames()

    @property
    def _mask(self):
        # as of right now, the c++ code only has nomask, which is an array of zeros
        try:
            return [0] * len(self.y)
        except TypeError:  # y=None
            return None

    @staticmethod
    def copy_from_state(state):
        '''
        creates a CalculationInput based on an existing state

        :param state: a State class instance
        :return: new CalculationInput instance
        '''
        old_dict = state.serialize()
        new_input = CalculationInput()
        new_input.load_from_dictionary(old_dict)
        return new_input

    @staticmethod
    def _web_load(args_dict):
        """
        Build a CalculationInput from the ``args`` section of an args dictionary.

        :param args_dict: dictionary with a ``state`` entry, an ``x`` entry and an optional ``y`` entry
        :return: CalculationInput instance
        :raises ValueError: if the state cannot be loaded
        """
        stateInput = CalculationInput()
        try:
            stateInput.load_from_dictionary(args_dict["state"])
        except Exception as e:
            # Chain the cause so the original traceback is not lost.
            raise ValueError("Invalid state: " + str(e)) from e
        x = args_dict["x"]
        y = args_dict.get("y")

        args_signal = Signal(x, y)
        state_signal = stateInput.DomainPreferences.signal
        if args_signal.x != state_signal.x or args_signal.y != state_signal.y:
            # order of priorities:
            if stateInput.DomainPreferences.signal_file:
                # 1. if a signal file is loaded, that takes precedence
                warnings.warn(
                    "the arguments supplied with the args file do not match the signal file. using signal file")
            else:
                # 2. if no signal file is loaded, then the provided x/y arrays take precedence over the
                #    qmin/qmax/res_steps provided in state
                warnings.warn("the arguments supplied in the state do not match the x/y args provided. using x/y args")
                stateInput.signal = args_signal
        return stateInput

    @staticmethod
    def _load_from_args_file(filename):
        """
        Build a CalculationInput from a json args file (``args`` plus optional ``options``).

        :param filename: location of the args file
        :return: CalculationInput instance
        """
        with open(filename, 'r') as statefile:
            args_file = json.load(statefile)
        # TODO: add reading from options
        # A file without an "options" section is treated as having no options.
        options = args_file.get("options") or {}
        use_gpu = options.get("useGPU")
        calc_input = CalculationInput._web_load(args_file["args"])
        # Apply the flag whenever the file states it, so an explicit false is
        # honoured instead of silently falling back to the default (True).
        if use_gpu is not None:
            calc_input.use_gpu = bool(use_gpu)
        return calc_input

    @staticmethod
    def load_from_state_file(filename, use_gpu=True, is2D=False):
        """
        receives the location of a file that contains a serialized parameter tree (state) and creates instance of
        CalculationInput from the file.

        :param filename: location of a state file
        :param use_gpu: passed to the CalculationInput constructor
        :param is2D: passed to ``load_from_dictionary`` together with the loaded state
        :return: CalculationInput instance
        """
        with open(filename, 'r') as statefile:
            state_dict = json.load(statefile)
        stateInput = CalculationInput(use_gpu)
        stateInput.load_from_dictionary(state_dict, is2D)
        return stateInput

    @staticmethod
    def _get_x_y_z_window(lines):
        """
        Return the x, y and z extents spanned by the ATOM/HETATM records of a PDB file.

        :param lines: iterable of PDB text lines (e.g. an open file)
        :return: tuple ``(x_len, y_len, z_len)``
        :raises ValueError: if there are no ATOM/HETATM records or a coordinate field is not a number
        """
        x_coords = []
        y_coords = []
        z_coords = []
        for line in lines:
            if line[0:6] in ("ATOM  ", "HETATM"):
                # fixed-width coordinate columns of the PDB format
                x_coords.append(float(line[30:38]))
                y_coords.append(float(line[38:46]))
                z_coords.append(float(line[46:54]))
        if not x_coords:
            raise ValueError("No ATOM/HETATM records found in the pdb file")
        return (max(x_coords) - min(x_coords),
                max(y_coords) - min(y_coords),
                max(z_coords) - min(z_coords))

    @staticmethod
    def _calculate_grid_size(pdbfile, q):
        """
        Guess a grid size from the atom coordinates of an open PDB file and qmax.

        The result is a multiple of 10 and never smaller than 20.

        :param pdbfile: iterable of PDB text lines
        :param q: the max q value
        :return: the guessed grid size (int)
        """
        import numpy as np
        x, y, z = CalculationInput._get_x_y_z_window(pdbfile)
        max_len = np.sqrt(x * x + y * y + z * z)
        max_len /= 10  # PDB coordinates are in angstrom; convert to nm
        density = int(max_len) / np.pi
        grid_size = int(2 * q * density + 3)
        # round up to the next multiple of 10
        grid_size = int(grid_size / 10 + 1) * 10
        return max(grid_size, 20)  # 20 is the minimum grid size

    @staticmethod
    def _grid_size_from_pdb_file(filename, qmax):
        """
        Open ``filename`` and guess the grid size from its content.

        :raises NameError: if the file name does not end with ``.pdb``
        """
        with open(filename) as pdbfile:  # checks file exists
            if not filename.endswith(".pdb"):
                raise NameError("Not a pdb file")
            return CalculationInput._calculate_grid_size(pdbfile, qmax)

    @staticmethod
    def _from_grid_model(model, grid_size, qmax):
        """
        Create a CalculationInput holding ``model`` with the settings shared by the PDB and EPDB loaders.
        """
        c = CalculationInput()
        model.centered = True
        model.anomfilename = ""
        model.use_grid = True
        c.add_model(model)
        c.DomainPreferences.grid_size = grid_size
        c.DomainPreferences.convergence = 0.001
        c.DomainPreferences.orientation_iterations = 1000000
        c.DomainPreferences.use_grid = True
        c.DomainPreferences.q_max = qmax
        c.use_gpu = True
        return c

    @staticmethod
    def load_from_PDB(filename, qmax):
        """
        receives the location of a PDB file and qmax, and automatically creates a guess at the grid size based on the pdb.

        :param filename: location of a PDB file
        :param qmax: The max q value for the creation of the pdb grid size
        :return: instance of CalculationInput
        :raises NameError: if the file name does not end with ``.pdb``
        :raises ValueError: if the file contains no ATOM/HETATM records
        """
        grid_size = CalculationInput._grid_size_from_pdb_file(filename, qmax)

        from dplus.DataModels.models import PDB
        return CalculationInput._from_grid_model(PDB(filename), grid_size, qmax)

    @staticmethod
    def load_from_EPDB(filename, qmax):
        """
        receives the location of a PDB file and qmax, and automatically creates a guess at the grid size based on the pdb.
        Same as load_from_PDB, but the file is added to the state as an EPDB model.

        :param filename: location of a PDB file
        :param qmax: The max q value for the creation of the pdb grid size
        :return: instance of CalculationInput
        :raises NameError: if the file name does not end with ``.pdb``
        :raises ValueError: if the file contains no ATOM/HETATM records
        """
        grid_size = CalculationInput._grid_size_from_pdb_file(filename, qmax)

        from dplus.DataModels.models import EPDB
        return CalculationInput._from_grid_model(EPDB(filename), grid_size, qmax)

    def write_to_dol(self):
        '''
        Write one tab separated ``.dol`` file per Manual Symmetry model in the state.

        The file is named after the model, or after its ``model_ptr`` (zero padded to 8 digits) when the
        model has no name. Every row is the layer index followed by the layer's values.
        For now works only with states built inside the API.

        :raises ValueError: if the state has no Manual Symmetry models
        '''
        manual_symmetries = self.get_models_by_type('Manual Symmetry')
        if len(manual_symmetries) == 0:
            raise ValueError('Your state has no Manual Symmetries')

        for man_sym in manual_symmetries:
            if man_sym.name == '':
                dol_name = '%08d.dol' % (man_sym.model_ptr)
            else:
                dol_name = man_sym.name + '.dol'

            with open(dol_name, 'w+', encoding='utf-8', newline='') as file:
                dol = csv.writer(file, delimiter='\t', quoting=csv.QUOTE_NONNUMERIC)
                for layer_num, layer in enumerate(man_sym.serialize()['Parameters']):
                    dol.writerow([layer_num, *layer])

def suggest_parameters(x, y, z, q, use_GPU=False):
    '''Given model size in direction x, y, z and qmax, return the suggested parameters to input into the state as a
    dictionary.

    :param x: model size in the x direction
    :param y: model size in the y direction
    :param z: model size in the z direction
    :param q: the max q value
    :param use_GPU: when True the suggested integration method is the one chosen for GPU runs
    :return: dictionary with the keys 'Generation_params', 'Fitting Parameters' and 'Required Memory'
             (an estimate in whole megabytes)
    '''

    import numpy as np

    max_len = np.sqrt(x**2 + y**2 + z**2)
    density = max_len / np.pi

    # Round up to the next multiple of 10. The truncation to int is what makes
    # the divide / add one / multiply sequence a rounding step; in pure float
    # arithmetic it only adds 10 and can yield an odd grid size.
    grid_size = (int(2 * q * density + 3) // 10 + 1) * 10

    largest = max(x, y, z)
    smallest = min(x, y, z)
    # a strongly elongated model gets the adaptive integration method on CPU
    should_be_adaptive = (largest > 5. * smallest)

    # memory estimate for a grid of that size
    i = (grid_size / 2) + 3
    total_size = (6 * i * (i + 1) * (3 + 3 + 2 * 6 * i)) / 6
    total_size += 1
    total_size *= 2

    num_bytes = 8 * total_size  # 8 is from the size of a double in cpp
    mbs = float(num_bytes) / (1024. * 1024.)

    if mbs > 1000.:
        print("Caution: You should consider using the hybrid method.")
    elif mbs > 250.:
        print("Note: You may want to consider using the hybrid method.")

    if use_GPU:
        integration_method = 'Adaptive (VEGAS) Monte Carlo'
    elif should_be_adaptive:
        integration_method = 'Adaptive Gauss Kronrod'
    else:
        integration_method = 'Monte Carlo (Mersenne Twister)'

    return {
        'Generation_params': {
            'Grid_size': grid_size,
            'Integration_method': integration_method,
            'Integration_iterations': int(1e6),
            'Convergence': 1e-3,
            'Generated_points': int(q * 100),
        },
        'Fitting Parameters': {
            'Fitting_method': 'Levenberg-Marquardt',
            'Iterations': 6,
            'Convergence': 1e-2,
            'Ratio_residuals': 'Trivial Loss',
            'Step_size': 0.1,
            'Der_eps': 0.1,
        },
        'Required Memory': int(mbs),
    }
theresearchsoftwarecompany / dplus-api python

Products

About

Resources

Contact Gemfury