# python-sscha/Modules/Minimizer.py at 27c8853e55010b496a5fc3a0e9206f49517f07c6 · SSCHAcode/python-sscha · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
import numpy as np
import sys, os
import difflib


from sscha.Parallel import pprint as print

# Numerical tolerance used by Minimizer.update_dyn: a Kong-Liu ratio is accepted
# as long as it exceeds 1 by less than this amount.
__ERROR_THR__ = 1e-7

class Minimizer:
    """
    Steepest-descent minimizer with an adaptive step (line minimization).

    The dynamical matrices at all the q points (optionally followed by the
    atomic coordinates) are flattened into a single complex vector
    (``current_x``), which is moved against the direction of the gradient.
    The step is enlarged every time a new direction is taken and reduced when
    the trial step turns out to be too large.

    After ``__init__`` the set of attributes is frozen: assigning a name that
    does not exist raises an AttributeError (this catches typos in the
    parameter names). Set ``fixed_attributes = False`` to unlock it.
    """

    def __init__(self, minim_struct = True, algorithm = "sdes", root_representation = "normal", step = 1, verbose = True, fixed_step = False, struct_step_ratio = 1):
        """
        This class is a minimizer that performs the optimization given the gradient of the dynamical matrix.

        Parameters
        ----------
            minim_struct : bool
                If true minimizes also the structure
            algorithm : string
                The algorithm used for the minimization.
                Only the steepest descent ('sdes', 'sd' or 'steepest descend') is implemented.
            root_representation : string
                One between 'normal', 'sqrt' (or 'root2') and 'root4'.
                If normal the minimization is performed in the force constant matrix space, otherwise on the space of
                one of the root of the force constant matrix.
            step : double
                The initial step of the minimization. It cannot be negative.
            verbose : bool
                If True, print the outcome of each line minimization step.
            fixed_step : bool
                If True, skip the line minimization and keep the step fixed during the whole minimization.
            struct_step_ratio : float
                Default 1. It is a manual precondition to slow down or accelerate the minimization of the structure with
                respect to the dynamical matrix. If bigger than 1, the structure minimization has a bigger step, and vice versa.
                It must be positive
        """

        self.minim_struct = minim_struct
        self.algorithm = algorithm
        self.step = step
        self.step_index = 0 # The index of the minimization
        self.root_representation = root_representation
        self.verbose = verbose

        self.old_direction = None
        self.current_direction = None

        # Current position, and position (and Kong-Liu ratio) at the
        # beginning of the current line minimization
        self.current_x = None
        self.old_x = None
        self.old_kl = None
        self.dyn = None
        self.nq = 0
        self.n_modes = 0
        self.fixed_step = fixed_step
        self.struct_step_ratio = struct_step_ratio

        # If True the next call to run_step picks a new direction
        self.new_direction = True
        self.direction = None

        # Some parameter to optimize the evolution

        # Maximum step of the kl ratio for the minimization
        self.kl_ratio_thr = 0.9

        # The default combinations assures that 3 steps are required to decrement the same incremented step.
        # How much try to increase the step when a good step is found (must be > 1)
        self.increment_step = 1.5
        # How much decrease the step when it is too big (must be < 1)
        self.decrement_step = .87358046475

        # Setup the attribute control
        self.__total_attributes__ = list(self.__dict__)
        self.fixed_attributes = True # This must be the last attribute to be setted

    def __setattr__(self, name, value):
        """
        This method is used to set an attribute.
        It will raise an exception if the attribute does not exists (with a suggestion of similar entries)

        Raises
        ------
            AssertionError
                If 'step' is negative or 'struct_step_ratio' is not positive.
                The offending value is not stored.
            AttributeError
                If the attributes are frozen and 'name' is not an existing attribute.
        """
        # Check the constrains BEFORE storing the value, so that a rejected
        # value never ends up in the object.
        # (AssertionError is kept as exception type for backward compatibility)
        if name == "step":
            assert value >= 0, "Error, the step must be positive, value = {}".format(value)
        if name == "struct_step_ratio":
            assert value > 0, "Error, {} must be positive, value = {}".format(name, value)

        # Until 'fixed_attributes' is created (end of __init__) everything is accepted
        if "fixed_attributes" in self.__dict__:
            # The two bookkeeping attributes are not listed in __total_attributes__,
            # but they must stay assignable (otherwise the lock can never be released)
            is_control = name in ("fixed_attributes", "__total_attributes__")

            if not is_control and name not in self.__total_attributes__:
                if self.fixed_attributes:
                    similar_objects = str( difflib.get_close_matches(name, self.__total_attributes__))
                    ERROR_MSG = """
        Error, the attribute '{}' is not a member of '{}'.
        Suggested similar attributes: {} ?
        """.format(name, type(self).__name__,  similar_objects)

                    raise AttributeError(ERROR_MSG)

                # The lock is released: register the new attribute, so that it
                # remains assignable if the lock is activated again
                self.__total_attributes__.append(name)

        # The class is named explicitly: super(self.__class__, self) recurses
        # forever as soon as the method is inherited by a subclass.
        super(Minimizer, self).__setattr__(name, value)

    def init(self, dyn, kl_ratio):
        """
        Initialize the minimizer with the current dynamical matrix and structure.

        Parameters
        ----------
            dyn : CC.Phonons.Phonons
                The dynamical matrix that identifies the starting point for the minimization.
            kl_ratio : float
                The initial Kong-Liu effective sample size
        """
        self.step_index = 0

        self.nq = len(dyn.q_tot)
        self.n_modes = dyn.structure.N_atoms * 3
        self.dyn = dyn

        # Collect the dynamical matrices of all the q points
        dynq = np.zeros( (self.nq, self.n_modes, self.n_modes), dtype = np.complex128)
        for iq in range(self.nq):
            dynq[iq, :, :] = dyn.dynmats[iq]

        # Transform in root space if needed.
        if self.root_representation != "normal":
            dynq, _ = get_root_dyn_grad(dynq, np.zeros(dynq.shape, dtype = np.complex128), self.root_representation)

        # Flattened copy: q point first, then row and column of the matrix
        x_dyn = dynq.flatten()

        if self.minim_struct:
            # The assignment also checks that the structure has n_modes coordinates
            x_struct = np.zeros(self.n_modes, dtype = np.complex128)
            x_struct[:] = dyn.structure.coords.ravel()
            self.current_x = np.concatenate((x_dyn, x_struct))
        else:
            self.current_x = x_dyn

        self.old_x = self.current_x.copy()
        self.old_kl = kl_ratio
        self.new_direction = True

    def transform_gradients(self, dyn_gradient, structure_gradient = None):
        """
        Transform the gradients from dynamical matrix and structure
        to a single vector.
        The result of this function is what is needed by the run_step method.

        Parameters
        ----------
            dyn_gradient : ndarray( nq, nmodes, nmodes)
                The gradient of the dynamical matrix
            structure_gradient : ndarray(nmodes), optional
                The gradient of the structure (only needed if self.minim_struct = True)

        Results
        -------
            gradient : ndarray
                1D array where the gradients are collapsed all togheter.
                The structure part is multiplied by self.struct_step_ratio.

        Raises
        ------
            ValueError
                If self.minim_struct is True and structure_gradient is not given.
        """

        if not self.minim_struct:
            return dyn_gradient.ravel()

        if structure_gradient is None:
            raise ValueError("Error, the structure gradient is required when minim_struct is True.")

        return np.concatenate( (dyn_gradient.ravel(), structure_gradient.ravel() * self.struct_step_ratio) )

    def get_dyn_struct(self):
        """
        From the current position of the minimization,
        get back the dynamical matrix and the structure

        Results
        -------
            dynq : ndarray( nq, nmodes, nmodes)
                The dynamical matrices (converted back from the root representation)
            struct : ndarray
                The atomic coordinates, with the shape of self.dyn.structure.coords.
                If self.minim_struct is True they are read from the tail of self.current_x
                (with its complex dtype), otherwise they are a copy of the original ones.
        """
        block_size = self.n_modes**2
        dynq = np.zeros( (self.nq, self.n_modes, self.n_modes), dtype = np.complex128)

        for iq in range(self.nq):
            dynq[iq, :, :] = self.current_x[iq * block_size : (iq + 1) * block_size].reshape( (self.n_modes, self.n_modes))

        # Revert the dynamical matrix if we are in the root representation
        dynq = get_standard_dyn(dynq, self.root_representation)

        if self.minim_struct:
            struct = self.current_x[self.nq * block_size :].reshape(self.dyn.structure.coords.shape)
        else:
            struct = self.dyn.structure.coords.copy()
        return dynq, struct

    def is_new_direction(self):
        """
        Return if a new direction must be chosen.
        (Always True when the step is fixed, as no line minimization is performed)
        """

        if self.fixed_step:
            return True
        return self.new_direction

    def run_step(self, gradient, kl_new):
        """
        Perform the minimization step with the line minimization

        If a new direction is required, the gradient becomes the direction and
        a (enlarged) step is performed. Otherwise the last trial step is judged:
        it is reduced and repeated from the old position if it was too large,
        or accepted (the next call will then start a new direction).

        Parameters
        ----------
            gradient : ndarray
                The gradient at the current position (see transform_gradients)
            kl_new : float
                The Kong-Liu effective sample size ratio at the current position
        """
        # Check consistency
        ERR="""
Error, increment must be bigger than 1 and decrement lower than 1.
       If you want to fix the step set fixed_step = True.
"""
        assert self.increment_step > 1 and self.decrement_step < 1, ERR

        # With a fixed step there is no line minimization: always a new direction
        if self.fixed_step:
            self.new_direction = True

        if self.new_direction:
            # A new direction, update the position with the last one
            self.old_kl = kl_new
            if self.algorithm.lower() in ["sdes", "sd", "steepest descend"]:
                self.direction = gradient.copy()
            else:
                raise NotImplementedError("Error, algorithm '{}' not implemented".format(self.algorithm))

            self.old_x = self.current_x.copy()
            self.new_direction = False

            # Enlarge the step
            if not self.fixed_step:
                self.step *= self.increment_step

            # Perform the minimization step for new direction
            self.current_x = self.old_x - self.step * self.direction
            return

        # Proceed with the line minimization

        # Compute the scalar product between the gradient and the direction
        # (Considering real and imaginary part as independent)
        scalar = np.dot(np.real(self.direction), np.real(gradient))
        scalar += np.dot(np.imag(self.direction), np.imag(gradient))

        # NOTE(review): old_kl is 0 if the line minimization started from a NaN
        # Kong-Liu ratio (update_dyn maps NaN to 0); this division is then ill defined.
        kl_ratio = kl_new / self.old_kl

        # The step was too big if we passed the minimum along the direction
        # (scalar is negative) or the kl_ratio dropped below the threshold
        if (scalar < 0) or (kl_ratio < self.kl_ratio_thr):
            self.step *= self.decrement_step

            if self.verbose:
                print("Step too large (scalar = {} | kl_ratio = {}), reducing to {}".format(scalar, kl_ratio, self.step))

            # Try again with reduced step
            self.current_x = self.old_x - self.step * self.direction
        else:
            # The step is good, therefore next step perform a new direction.
            # current_x is NOT touched: the current position is accepted.
            self.new_direction = True
            if self.verbose:
                print("Good step found with {}, try increment".format(self.step))

    def update_dyn(self, new_kl_ratio, dyn_gradient, structure_gradient = None):
        """
        Update the dynamical matrix.

        The gradient is converted in the root representation and one step of
        the minimization is performed (see run_step). Nothing is returned:
        use get_dyn_struct to get the updated dynamical matrix and structure.

        Parameters
        ----------
            new_kl_ratio : float
                Kong Liu effective sample size ratio of the current dynamical matrix
            dyn_gradient : ndarray( nq, nmodes, nmodes)
                The gradient of the dynamical matrix
            structure_gradient : ndarray(nmodes), optional
                The gradient of the structure (only needed if self.minim_struct = True)
        """
        # Get things properly if the KL ratio is null
        if np.isnan(new_kl_ratio):
            new_kl_ratio = 0

        assert new_kl_ratio - 1 < __ERROR_THR__, "Error, the kl_ratio is defined between (0, 1], {} given.".format(new_kl_ratio)

        current_dyn, _  = self.get_dyn_struct()

        # Now we can obtain the gradient in the root representation
        _, root_grad = get_root_dyn_grad(current_dyn, dyn_gradient, self.root_representation)

        grad_vector = self.transform_gradients(root_grad, structure_gradient)
        self.run_step(grad_vector, new_kl_ratio)


def get_root_dyn_grad(dyn_q, grad_q, root_representation = "sqrt"):
    """
    ROOT REPRESENTATION OF DYNAMICAL MATRIX AND GRADIENT
    ====================================================

    As for the [Monacelli, Errea, Calandra, Mauri, PRB 2017], a nonlinear
    change of variable is used to perform the minimization: the variable is
    the x-th root of the dynamical matrix

    .. math::

        \\Phi \\rightarrow \\sqrt[x]{\\Phi}

        \\frac{\\partial F}{\\partial \\Phi} \\rightarrow \\frac{\\partial F}{\\partial \\sqrt[x]{\\Phi}}

    For the square root :math:`R` (:math:`\\Phi = R^2`) the gradient is

    .. math::

        \\frac{\\partial F}{\\partial R} = R \\frac{\\partial F}{\\partial \\Phi} + \\frac{\\partial F}{\\partial \\Phi} R

    and the same rule is applied a second time for the fourth root.
    The order :math:`x` of the root is determined by the root_representation argument.

    Parameters
    ----------
        dyn_q : ndarray( NQ x 3nat x 3nat )
            The dynamical matrix in q space. The Nq are the total number of q.
        grad_q : ndarray( NQ x 3nat x 3nat )
            The gradient of the dynamical matrix.
        root_representation : string
            choice between "normal", "sqrt" (or "root2") and "root4" (case insensitive).
            The value of :math:`x` will be, respectively, 1, 2, 4.

    Result
    ------
        new_dyn : ndarray( NQ x 3nat x 3nat ), complex
            The dynamical matrix in the root representation
        new_grad : ndarray( NQ x 3nat x 3nat ), complex
            The gradient with respect to the root of the dynamical matrix

    Raises
    ------
        ValueError
            If root_representation is not recognized or the number of q points
            of dyn_q and grad_q differ.
    """
    known_representations = ["normal", "root4", "sqrt", "root2"]

    def anticommutator(mat_a, mat_b):
        # A B + B A
        return mat_a.dot(mat_b) + mat_b.dot(mat_a)

    # The keyword is matched without case sensitiveness
    representation = root_representation.lower()
    if representation not in known_representations:
        raise ValueError("Error, root_representation is %s must be one of '%s'." % (representation,
                                                                                  ", ".join(known_representations)))

    # "root2" is just another name for "sqrt": only two flags are needed
    take_root = representation != "normal"
    take_fourth_root = representation == "root4"

    # Gradient and dynamical matrix must be defined on the same q points
    n_q = np.shape(dyn_q)[0]
    n_q_grad = np.shape(grad_q)[0]
    if n_q != n_q_grad:
        raise ValueError("Error, the number of q point of the dynamical matrix %d and gradient %d does not match!" % (n_q, n_q_grad))

    # Start from a complex copy of the input
    new_dyn = np.zeros(np.shape(dyn_q), dtype = np.complex128)
    new_grad = np.zeros(np.shape(dyn_q), dtype = np.complex128)
    new_dyn[:, :, :] = dyn_q
    new_grad[:, :, :] = grad_q

    if not take_root:
        return new_dyn, new_grad

    for iq in range(n_q):
        # Spectral decomposition of the dynamical matrix at this q point
        w2, pols = np.linalg.eigh(dyn_q[iq, :, :])
        pols_conj = np.conj(pols)

        # Regularize acustic modes (only the first q point)
        if iq == 0:
            w2[w2 < 0] = 0.

        # Square root of the matrix, and gradient with respect to it
        new_dyn[iq, :, :] = np.einsum("a, ba, ca", np.sqrt(w2), pols, pols_conj)
        new_grad[iq, :, :] = anticommutator(new_dyn[iq, :, :], grad_q[iq, :, :])

        if take_fourth_root:
            # One more application of the chain rule, starting from the sqrt gradient
            new_dyn[iq, :, :] = np.einsum("a, ba, ca", np.sqrt(np.sqrt(w2)), pols, pols_conj)
            new_grad[iq, :, :] = anticommutator(new_dyn[iq, :, :], new_grad[iq, :, :])

    return new_dyn, new_grad

def get_standard_dyn(root_dyn, root_representation):
    """
    Get the standard dynamical matrix from the root representation

    The matrix at each q point is squared once for the "sqrt" (or "root2")
    representation and twice for "root4"; it is just copied for "normal".

    Parameters
    ----------
        root_dyn : ndarray (nq x 3nats x 3nats)
            The dynamical matrix in the root representation
        root_representation : string
            The kind of root representation: one between "normal", "sqrt"
            (or "root2") and "root4" (case insensitive).

    Results
    -------
        new_dyn : ndarray (nq x 3nats x 3nats)
            The dynamical matrix in the standard representation (always a new array).

    Raises
    ------
        ValueError
            If root_representation is not recognized, or root_dyn is not a 3D array.
    """
    allowed_representation = ("normal", "root4", "sqrt", "root2")

    # Avoid case sensitiveness: the keyword must be interpreted in the same
    # way as when the matrix is converted into the root representation
    # (otherwise "Normal" would be squared as if it was "sqrt").
    representation = root_representation.lower()
    if representation not in allowed_representation:
        raise ValueError("Error, root_representation is %s must be one of '%s'." % (representation,
                                                                                  ", ".join(allowed_representation)))

    if len(root_dyn.shape) != 3:
        raise ValueError("Error, root_dyn must be a 3D array (nq, 3nat, 3nat), shape %s given." % str(root_dyn.shape))

    new_dyn = root_dyn.copy()
    if representation == "normal":
        return new_dyn

    # The square root conversion (matrix product at each q point)
    new_dyn = np.matmul(new_dyn, new_dyn)

    # The root4 conversion
    if representation == "root4":
        new_dyn = np.matmul(new_dyn, new_dyn)

    return new_dyn