# opencl_fdtd/opencl_fdtd/simulation.py

"""
Class for constructing and holding the basic FDTD operations and fields
"""

from typing import List, Dict, Callable
from collections import OrderedDict
import numpy
import jinja2
import warnings

import pyopencl
import pyopencl.array
from pyopencl.elementwise import ElementwiseKernel

from fdfd_tools import vec


__author__ = 'Jan Petykiewicz'


# Create the jinja2 environment once, on module load. Templates are located by
#  jinja2.PackageLoader using this module's __name__ and the 'kernels' path; the
#  Simulation class renders its OpenCL sources (common.cl, update_e.cl,
#  update_h.cl, update_s.cl) through this environment.
jinja_env = jinja2.Environment(loader=jinja2.PackageLoader(__name__, 'kernels'))


class Simulation(object):
    """
    Constructs and holds the basic FDTD operations and related fields

    After constructing this object, call the (update_E, update_H, update_S) members
     to perform FDTD updates on the stored (E, H, S) fields:

        pmls = [{'axis': a, 'polarity': p} for a in 'xyz' for p in 'np']
        sim = Simulation(grid.grids, do_poynting=True, pmls=pmls)
        with open('sources.c', 'w') as f:
            f.write('{}'.format(sim.sources))

        for t in range(max_t):
            sim.update_E([]).wait()

            # Find the linear index for the center point, for Ey
            ind = numpy.ravel_multi_index(tuple(grid.shape//2), dims=grid.shape, order='C') + \
                    numpy.prod(grid.shape) * 1
            # Perturb the field (i.e., add a soft current source)
            sim.E[ind] += numpy.sin(omega * t * sim.dt)
            event = sim.update_H([])
            if sim.update_S:
                event = sim.update_S([event])
            event.wait()

            with lzma.open('saved_simulation', 'wb') as f:
                dill.dump(fdfd_tools.unvec(sim.E.get(), grid.shape), f)

    Code in the form
        event2 = sim.update_H([event0, event1])
     indicates that the update_H operation should be prepared immediately, but wait for
     event0 and event1 to occur (i.e. previous operations to finish) before starting execution.
     event2 can then be used to prepare further operations to be run after update_H.

    update_S and S are only created when do_poynting is true; otherwise they remain None.
    """
    # Fields are stored as single vectorized (see fdfd_tools.vec) device arrays.
    E = None    # type: pyopencl.array.Array
    H = None    # type: pyopencl.array.Array
    S = None    # type: pyopencl.array.Array
    eps = None  # type: pyopencl.array.Array
    dt = None   # type: float

    arg_type = None     # type: numpy.float32 or numpy.float64

    context = None      # type: pyopencl.Context
    queue = None        # type: pyopencl.CommandQueue

    update_E = None     # type: Callable[[List[pyopencl.Event]], pyopencl.Event]
    update_H = None     # type: Callable[[List[pyopencl.Event]], pyopencl.Event]
    update_S = None     # type: Callable[[List[pyopencl.Event]], pyopencl.Event]
    sources = None      # type: Dict[str, str]

    def __init__(self,
                 epsilon: List[numpy.ndarray],
                 pmls: List[Dict[str, int or float]],
                 dt: float = .99/numpy.sqrt(3),
                 initial_fields: Dict[str, List[numpy.ndarray]] = None,
                 context: pyopencl.Context = None,
                 queue: pyopencl.CommandQueue = None,
                 float_type: numpy.float32 or numpy.float64 = numpy.float32,
                 do_poynting: bool = True):
        """
        Initialize the simulation.

        :param epsilon: List containing [eps_r,xx, eps_r,yy, eps_r,zz], where each element is a Yee-shifted ndarray
                spanning the simulation domain. Relative epsilon is used.
        :param pmls: List of dicts with keys:
            'axis': One of 'x', 'y', 'z'.
            'polarity': One of 'n', 'p'.
            'thickness': Number of layers, default 8.
            'epsilon_eff': Effective epsilon to match to. Default 1.0.
            'mu_eff': Effective mu to match to. Default 1.0.
            'ln_R_per_layer': Desired (ln(R) / thickness) value. Default -1.6.
            'm': Polynomial grading exponent. Default 3.5.
            'ma': Exponent for alpha. Default 1.
            Note that missing optional keys are filled in with their defaults in-place,
            i.e. the dicts passed in by the caller are modified.
        :param dt: Time step. Default is .99/sqrt(3). Larger values trigger a warning
                but are still used; values <= 0 are rejected.
        :param initial_fields: Dict with optional keys 'E' and 'H', each holding the initial
                value for that field in the same format as epsilon. A missing key means the
                field starts at 0 everywhere.
        :param context: pyOpenCL context. If not given, the context of `queue` is used if a
                queue was given; otherwise pyopencl.create_some_context() is called.
        :param queue: pyOpenCL command queue. If not given, pyopencl.CommandQueue(context) is called.
        :param float_type: numpy.float32 or numpy.float64. Default numpy.float32.
        :param do_poynting: If true, enables calculation of the poynting vector, S.
                Poynting vector calculation adds the following computational burdens:
                    * During update_H, ~6 extra additions/cell are performed in order to spatially
                        average E and temporally average H. These quantities are multiplied
                        (6 multiplications/cell) and then stored (6 writes/cell, cache-friendly).
                    * update_S performs a discrete cross product using the precalculated products
                        from update_H. This is not nice to the cache and similar to e.g. update_E
                        in complexity.
                    * GPU memory requirements are approximately doubled, since S and the intermediate
                        products must be stored.
        :raises Exception: If dt <= 0, or if epsilon, the initial fields or the pmls are malformed.
        """
        if initial_fields is None:
            initial_fields = {}

        self.shape = epsilon[0].shape
        self.arg_type = float_type
        self.sources = {}
        self._create_context(context, queue)
        self._create_eps(epsilon)

        if dt <= 0:
            raise Exception('Invalid dt: {}'.format(dt))
        if dt > .99/numpy.sqrt(3):
            warnings.warn('Warning: unstable dt: {}'.format(dt))
        # Store dt even when it is above the stability limit: the caller has been warned,
        #  and everything below (PML coefficients, kernel arguments) needs a numeric value.
        self.dt = dt

        self.E = self._create_field(initial_fields.get('E', None))
        self.H = self._create_field(initial_fields.get('H', None))

        pml_defaults = (
            ('thickness', 8),
            ('epsilon_eff', 1.0),
            ('mu_eff', 1.0),
            ('ln_R_per_layer', -1.6),
            ('m', 3.5),
            ('ma', 1),
            )
        for pml in pmls:
            for key, value in pml_defaults:
                pml.setdefault(key, value)

        ctype = type_to_C(self.arg_type)

        def ptr(arg: str) -> str:
            return ctype + ' *' + arg

        # Each OrderedDict maps a C argument declaration to the value passed for it.
        # Insertion order matters: it defines the kernel's argument order.
        base_fields = OrderedDict()
        base_fields[ptr('E')] = self.E
        base_fields[ptr('H')] = self.H
        base_fields[ctype + ' dt'] = self.dt

        eps_field = OrderedDict()
        eps_field[ptr('eps')] = self.eps

        common_source = jinja_env.get_template('common.cl').render(
                ftype=ctype,
                shape=self.shape,
                )
        jinja_args = {
                'common_header': common_source,
                'pmls': pmls,
                'do_poynting': do_poynting,
                }
        E_source = jinja_env.get_template('update_e.cl').render(**jinja_args)
        H_source = jinja_env.get_template('update_h.cl').render(**jinja_args)

        self.sources['E'] = E_source
        self.sources['H'] = H_source

        # S_fields stays empty when the Poynting vector is disabled, so update_H
        #  then receives no S-related arguments.
        S_fields = OrderedDict()
        if do_poynting:
            S_source = jinja_env.get_template('update_s.cl').render(**jinja_args)
            self.sources['S'] = S_source

            self.oS = pyopencl.array.zeros(self.queue, self.E.shape + (2,), dtype=self.arg_type)
            self.S = pyopencl.array.zeros_like(self.E)
            S_fields[ptr('oS')] = self.oS
            S_fields[ptr('S')] = self.S

        # PML
        pml_e_fields, pml_h_fields = self._create_pmls(pmls)

        # Create operations
        self.update_E = self._create_operation(E_source, (base_fields, eps_field, pml_e_fields))
        self.update_H = self._create_operation(H_source, (base_fields, pml_h_fields, S_fields))
        if do_poynting:
            self.update_S = self._create_operation(S_source, (base_fields, S_fields))

    def _create_pmls(self, pmls):
        """
        Create the device arrays needed by the PMLs.

        For every pml, three coefficient arrays (p0, p1, p2) of length 'thickness' are
         computed for E and for H and uploaded, and zero-initialized Psi arrays are allocated
         for the two field components other than the pml axis. Psi arrays have the shape of
         the simulation domain with the pml axis replaced by 'thickness'.

        Argument names have the form 'p<axis><0|1|2><e|h><polarity>' (e.g. 'px0en') and
         'Psi_<axis><polarity>_<E|H><component>' (e.g. 'Psi_xn_Ey').

        :param pmls: List of pml dicts with all keys present (see __init__).
        :return: (pml_e_fields, pml_h_fields), two OrderedDicts mapping C argument
                declarations to device arrays, for use in the E and H updates respectively.
        :raises Exception: If a pml has an unknown 'axis' or 'polarity'.
        """
        ctype = type_to_C(self.arg_type)

        def ptr(arg: str) -> str:
            return ctype + ' *' + arg

        pml_e_fields = OrderedDict()
        pml_h_fields = OrderedDict()
        for pml in pmls:
            axis = pml['axis']
            polarity = pml['polarity']
            # Reject bad values here; otherwise 'xyz'.find() returns -1 and the last
            #  axis gets resized silently, and an unknown polarity skips the half-cell shift.
            if axis not in ('x', 'y', 'z'):
                raise Exception('Invalid pml axis: {}'.format(axis))
            if polarity not in ('n', 'p'):
                raise Exception('Invalid pml polarity: {}'.format(polarity))

            a = 'xyz'.find(axis)

            sigma_max = -pml['ln_R_per_layer'] / 2 * (pml['m'] + 1)
            kappa_max = numpy.sqrt(pml['mu_eff'] * pml['epsilon_eff'])
            alpha_max = 0           # TODO: Nonzero alpha?

            def par(x):
                # x is the (possibly half-integer) depth into the pml, in cells.
                scaling = ((x / (pml['thickness'])) ** pml['m'])
                sigma = scaling * sigma_max
                kappa = 1 + scaling * (kappa_max - 1)
                alpha = ((1 - x / pml['thickness']) ** pml['ma']) * alpha_max
                p0 = numpy.exp(-(sigma / kappa + alpha) * self.dt)
                p1 = sigma / (sigma + kappa * alpha) * (p0 - 1)
                p2 = 1/kappa
                return p0, p1, p2

            # Depths thickness, thickness-1, ..., 1; one independent array each for E and H.
            xe, xh = (numpy.arange(1, pml['thickness'] + 1, dtype=self.arg_type)[::-1] for _ in range(2))
            # One of the two fields is offset by half a cell, depending on the pml side.
            if polarity == 'p':
                xe -= 0.5
            elif polarity == 'n':
                xh -= 0.5

            pml_p_names = [['p' + axis + i + eh + polarity for i in '012'] for eh in 'eh']
            for name_e, name_h, pe, ph in zip(pml_p_names[0], pml_p_names[1], par(xe), par(xh)):
                # Cast explicitly: mixing the arg_type arrays with float64 scalars (dt, kappa_max)
                #  may promote the result to float64 depending on numpy's promotion rules,
                #  while the kernel arguments are declared with the C type of arg_type.
                pe = numpy.asarray(pe, dtype=self.arg_type)
                ph = numpy.asarray(ph, dtype=self.arg_type)
                pml_e_fields[ptr(name_e)] = pyopencl.array.to_device(self.queue, pe)
                pml_h_fields[ptr(name_h)] = pyopencl.array.to_device(self.queue, ph)

            # The two components perpendicular to the pml axis
            uv = 'xyz'.replace(axis, '')
            psi_base = 'Psi_' + axis + polarity + '_'
            psi_names = [[psi_base + eh + c for c in uv] for eh in 'EH']

            psi_shape = list(self.shape)
            psi_shape[a] = pml['thickness']

            for ne, nh in zip(*psi_names):
                pml_e_fields[ptr(ne)] = pyopencl.array.zeros(self.queue, tuple(psi_shape), dtype=self.arg_type)
                pml_h_fields[ptr(nh)] = pyopencl.array.zeros(self.queue, tuple(psi_shape), dtype=self.arg_type)
        return pml_e_fields, pml_h_fields

    def _create_operation(self, source, args_fields):
        """
        Build an ElementwiseKernel from source and wrap it in an update function.

        :param source: Kernel source, used as the ElementwiseKernel's operation.
        :param args_fields: Iterable of ordered dicts, each mapping a C argument declaration
                to the value passed for that argument. The dicts are merged in order; the
                merged order defines the kernel's argument order.
        :return: Function which takes a list of events to wait for, launches the kernel
                with the stored arguments, and returns whatever the kernel call returns.
        """
        args = OrderedDict()
        for fields in args_fields:
            args.update(fields)
        update = ElementwiseKernel(self.context, operation=source,
                                   arguments=', '.join(args.keys()))
        return lambda e: update(*args.values(), wait_for=e)

    def _create_context(self, context: pyopencl.Context = None,
                        queue: pyopencl.CommandQueue = None):
        """
        Set self.context and self.queue, creating whichever was not supplied.

        :param context: pyOpenCL context to use. If None, the context of `queue` is used
                when a queue is given; otherwise pyopencl.create_some_context() is called.
        :param queue: pyOpenCL command queue to use. If None, a new
                pyopencl.CommandQueue is created on self.context.
        """
        if context is not None:
            self.context = context
        elif queue is not None:
            # Reuse the queue's own context so that context and queue always match.
            self.context = queue.context
        else:
            self.context = pyopencl.create_some_context()

        if queue is None:
            self.queue = pyopencl.CommandQueue(self.context)
        else:
            self.queue = queue

    def _create_eps(self, epsilon: List[numpy.ndarray]):
        """
        Validate epsilon and upload it (vectorized, cast to self.arg_type) as self.eps.

        :param epsilon: List of three equally-shaped ndarrays, whose shape equals self.shape.
        :raises Exception: If the list length or any of the shapes is wrong.
        """
        if len(epsilon) != 3:
            raise Exception('Epsilon must be a list with length of 3')
        if not all((e.shape == epsilon[0].shape for e in epsilon[1:])):
            raise Exception('All epsilon grids must have the same shape. Shapes are {}'.format(
                            [e.shape for e in epsilon]))
        if not epsilon[0].shape == self.shape:
            raise Exception('Epsilon shape mismatch. Expected {}, got {}'.format(self.shape, epsilon[0].shape))
        self.eps = pyopencl.array.to_device(self.queue, vec(epsilon).astype(self.arg_type))

    def _create_field(self, initial_value: List[numpy.ndarray] = None):
        """
        Create a device array for a field (E or H).

        :param initial_value: List of three ndarrays, each with shape self.shape, giving the
                initial field. If None, the field is zero everywhere (same size and dtype as self.eps).
        :return: The device array holding the vectorized field.
        :raises Exception: If initial_value does not have length 3, or an element has the wrong shape.
        """
        if initial_value is None:
            return pyopencl.array.zeros_like(self.eps)

        if len(initial_value) != 3:
            raise Exception('Initial field value must be a list of length 3')
        if not all((f.shape == self.shape for f in initial_value)):
            raise Exception('Initial field list elements must have same shape as epsilon elements')
        return pyopencl.array.to_device(self.queue, vec(initial_value).astype(self.arg_type))

def type_to_C(float_type) -> str:
    """
    Look up the name of the C type matching a numpy floating-point type.
    Only float16, float32 and float64 are recognized.

    :param float_type: numpy type to translate, e.g. numpy.float32
    :return: Name of the equivalent C type: 'half', 'float' or 'double'
    :raises Exception: If float_type is not one of the recognized types.
    """
    c_names = (
        (numpy.float16, 'half'),
        (numpy.float32, 'float'),
        (numpy.float64, 'double'),
    )
    # Compare with == (rather than a dict lookup) so that anything which compares
    #  equal to the numpy type is matched as well.
    for numpy_type, c_name in c_names:
        if float_type == numpy_type:
            return c_name
    raise Exception('Unsupported type')
Initial commit 8 years ago			`"""`
			`Class for constructing and holding the basic FDTD operations and fields`
			`"""`

			`from typing import List, Dict, Callable`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`from collections import OrderedDict`
Initial commit 8 years ago			`import numpy`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`import jinja2`
Initial commit 8 years ago			`import warnings`

			`import pyopencl`
			`import pyopencl.array`
			`from pyopencl.elementwise import ElementwiseKernel`

Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`from fdfd_tools import vec`


			`__author__ = 'Jan Petykiewicz'`


			`# Create jinja2 env on module load`
			`jinja_env = jinja2.Environment(loader=jinja2.PackageLoader(__name__, 'kernels'))`
Initial commit 8 years ago

			`class Simulation(object):`
			`"""`
			`Constructs and holds the basic FDTD operations and related fields`
doc updates 7 years ago
			`After constructing this object, call the (update_E, update_H, update_S) members`
			`to perform FDTD updates on the stored (E, H, S) fields:`

improve pml specification 7 years ago			`pmls = [{'axis': a, 'polarity': p} for a in 'xyz' for p in 'np']`
			`sim = Simulation(grid.grids, do_poynting=True, pmls=pmls)`
doc updates 7 years ago			`with open('sources.c', 'w') as f:`
			`f.write('{}'.format(sim.sources))`

			`for t in range(max_t):`
			`sim.update_E([]).wait()`

			`# Find the linear index for the center point, for Ey`
			`ind = numpy.ravel_multi_index(tuple(grid.shape//2), dims=grid.shape, order='C') + \`
			`numpy.prod(grid.shape) * 1`
			`# Perturb the field (i.e., add a soft current source)`
			`sim.E[ind] += numpy.sin(omega * t * sim.dt)`
			`event = sim.update_H([])`
			`if sim.update_S:`
			`event = sim.update_S([event])`
			`event.wait()`

			`with lzma.open('saved_simulation', 'wb') as f:`
			`dill.dump(fdfd_tools.unvec(sim.E.get(), grid.shape), f)`

			`Code in the form`
			`event2 = sim.update_H([event0, event1])`
			`indicates that the update_H operation should be prepared immediately, but wait for`
			`event0 and event1 to occur (i.e. previous operations to finish) before starting execution.`
			`event2 can then be used to prepare further operations to be run after update_H.`
Initial commit 8 years ago			`"""`
			`E = None # type: List[pyopencl.array.Array]`
			`H = None # type: List[pyopencl.array.Array]`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`S = None # type: List[pyopencl.array.Array]`
Initial commit 8 years ago			`eps = None # type: List[pyopencl.array.Array]`
			`dt = None # type: float`

			`arg_type = None # type: numpy.float32 or numpy.float64`

			`context = None # type: pyopencl.Context`
			`queue = None # type: pyopencl.CommandQueue`

doc updates 7 years ago			`update_E = None # type: Callable[[List[pyopencl.Event]], pyopencl.Event]`
			`update_H = None # type: Callable[[List[pyopencl.Event]], pyopencl.Event]`
			`update_S = None # type: Callable[[List[pyopencl.Event]], pyopencl.Event]`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`sources = None # type: Dict[str, str]`
Initial commit 8 years ago
			`def __init__(self,`
			`epsilon: List[numpy.ndarray],`
improve pml specification 7 years ago			`pmls: List[Dict[str, int or float]],`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`dt: float = .99/numpy.sqrt(3),`
Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`initial_fields: Dict[str, List[numpy.ndarray]] = None,`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`context: pyopencl.Context = None,`
			`queue: pyopencl.CommandQueue = None,`
			`float_type: numpy.float32 or numpy.float64 = numpy.float32,`
			`do_poynting: bool = True):`
Initial commit 8 years ago			`"""`
			`Initialize the simulation.`

			`:param epsilon: List containing [eps_r,xx, eps_r,yy, eps_r,zz], where each element is a Yee-shifted ndarray`
			`spanning the simulation domain. Relative epsilon is used.`
improve pml specification 7 years ago			`:param pmls: List of dicts with keys:`
			`'axis': One of 'x', 'y', 'z'.`
			`'direction': One of 'n', 'p'.`
			`'thickness': Number of layers, default 8.`
			`'epsilon_eff': Effective epsilon to match to. Default 1.0.`
			`'mu_eff': Effective mu to match to. Default 1.0.`
			`'ln_R_per_layer': Desired (ln(R) / thickness) value. Default -1.6.`
			`'m': Polynomial grading exponent. Default 3.5.`
			`'ma': Exponent for alpha. Default 1.`
			`:param dt: Time step. Default is .99/sqrt(3).`
Initial commit 8 years ago			`:param initial_E: Initial E-field (default is 0 everywhere). Same format as epsilon.`
			`:param initial_H: Initial H-field (default is 0 everywhere). Same format as epsilon.`
			`:param context: pyOpenCL context. If not given, pyopencl.create_some_context(False) is called.`
			`:param queue: pyOpenCL command queue. If not given, pyopencl.CommandQueue(context) is called.`
			`:param float_type: numpy.float32 or numpy.float64. Default numpy.float32.`
doc updates 7 years ago			`:param do_poynting: If true, enables calculation of the poynting vector, S.`
			`Poynting vector calculation adds the following computational burdens:`
			`* During update_H, ~6 extra additions/cell are performed in order to spatially`
			`average E and temporally average H. These quantities are multiplied`
			`(6 multiplications/cell) and then stored (6 writes/cell, cache-friendly).`
			`* update_S performs a discrete cross product using the precalculated products`
			`from update_H. This is not nice to the cache and similar to e.g. update_E`
			`in complexity.`
			`* GPU memory requirements are approximately doubled, since S and the intermediate`
			`products must be stored.`
Initial commit 8 years ago			`"""`
Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`if initial_fields is None:`
			`initial_fields = {}`
Initial commit 8 years ago
Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`self.shape = epsilon[0].shape`
			`self.arg_type = float_type`
			`self.sources = {}`
			`self._create_context(context, queue)`
			`self._create_eps(epsilon)`
Initial commit 8 years ago
			`if dt > .99/numpy.sqrt(3):`
			`warnings.warn('Warning: unstable dt: {}'.format(dt))`
			`elif dt <= 0:`
			`raise Exception('Invalid dt: {}'.format(dt))`
			`else:`
			`self.dt = dt`

Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`self.E = self._create_field(initial_fields.get('E', None))`
			`self.H = self._create_field(initial_fields.get('H', None))`
Initial commit 8 years ago
improve pml specification 7 years ago			`for pml in pmls:`
			`pml.setdefault('thickness', 8)`
			`pml.setdefault('epsilon_eff', 1.0)`
			`pml.setdefault('mu_eff', 1.0)`
			`pml.setdefault('ln_R_per_layer', -1.6)`
			`pml.setdefault('m', 3.5)`
			`pml.setdefault('ma', 1)`
Initial commit 8 years ago
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`ctype = type_to_C(self.arg_type)`
Initial commit 8 years ago
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`def ptr(arg: str) -> str:`
			`return ctype + ' *' + arg`

			`base_fields = OrderedDict()`
			`base_fields[ptr('E')] = self.E`
			`base_fields[ptr('H')] = self.H`
			`base_fields[ctype + ' dt'] = self.dt`

			`eps_field = OrderedDict()`
			`eps_field[ptr('eps')] = self.eps`

			`common_source = jinja_env.get_template('common.cl').render(`
			`ftype=ctype,`
Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`shape=self.shape,`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`)`
			`jinja_args = {`
			`'common_header': common_source,`
			`'pmls': pmls,`
			`'do_poynting': do_poynting,`
			`}`
			`E_source = jinja_env.get_template('update_e.cl').render(**jinja_args)`
			`H_source = jinja_env.get_template('update_h.cl').render(**jinja_args)`

			`self.sources['E'] = E_source`
			`self.sources['H'] = H_source`

Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago

			`S_fields = OrderedDict()`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`if do_poynting:`
			`S_source = jinja_env.get_template('update_s.cl').render(**jinja_args)`
			`self.sources['S'] = S_source`

Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`self.oS = pyopencl.array.zeros(self.queue, self.E.shape + (2,), dtype=self.arg_type)`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`self.S = pyopencl.array.zeros_like(self.E)`
			`S_fields[ptr('oS')] = self.oS`
			`S_fields[ptr('S')] = self.S`

			`'''`
			`PML`
			`'''`
Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`pml_e_fields, pml_h_fields = self._create_pmls(pmls)`

			`'''`
			`Create operations`
			`'''`
			`self.update_E = self._create_operation(E_source, (base_fields, eps_field, pml_e_fields))`
			`self.update_H = self._create_operation(H_source, (base_fields, pml_h_fields, S_fields))`
			`if do_poynting:`
			`self.update_S = self._create_operation(S_source, (base_fields, S_fields))`


			`def _create_pmls(self, pmls):`
			`ctype = type_to_C(self.arg_type)`
			`def ptr(arg: str) -> str:`
			`return ctype + ' *' + arg`

Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`pml_e_fields = OrderedDict()`
			`pml_h_fields = OrderedDict()`
			`for pml in pmls:`
improve pml specification 7 years ago			`a = 'xyz'.find(pml['axis'])`

Implement proper kappa for PML 6 years ago			`sigma_max = -pml['ln_R_per_layer'] / 2 * (pml['m'] + 1)`
			`kappa_max = numpy.sqrt(pml['mu_eff'] * pml['epsilon_eff'])`
			`alpha_max = 0 # TODO: Nonzero alpha?`
improve pml specification 7 years ago
			`def par(x):`
Implement proper kappa for PML 6 years ago			`scaling = ((x / (pml['thickness'])) ** pml['m'])`
			`sigma = scaling * sigma_max`
			`kappa = 1 + scaling * (kappa_max - 1)`
improve pml specification 7 years ago			`alpha = ((1 - x / pml['thickness']) ** pml['ma']) * alpha_max`
Implement proper kappa for PML 6 years ago			`p0 = numpy.exp(-(sigma / kappa + alpha) * self.dt)`
			`p1 = sigma / (sigma + kappa * alpha) * (p0 - 1)`
			`p2 = 1/kappa`
			`return p0, p1, p2`
improve pml specification 7 years ago
Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`xe, xh = (numpy.arange(1, pml['thickness'] + 1, dtype=self.arg_type)[::-1] for _ in range(2))`
improve pml specification 7 years ago			`if pml['polarity'] == 'p':`
			`xe -= 0.5`
			`elif pml['polarity'] == 'n':`
			`xh -= 0.5`

Implement proper kappa for PML 6 years ago			`pml_p_names = [['p' + pml['axis'] + i + eh + pml['polarity'] for i in '012'] for eh in 'eh']`
improve pml specification 7 years ago			`for name_e, name_h, pe, ph in zip(pml_p_names[0], pml_p_names[1], par(xe), par(xh)):`
			`pml_e_fields[ptr(name_e)] = pyopencl.array.to_device(self.queue, pe)`
			`pml_h_fields[ptr(name_h)] = pyopencl.array.to_device(self.queue, ph)`

			`uv = 'xyz'.replace(pml['axis'], '')`
			`psi_base = 'Psi_' + pml['axis'] + pml['polarity'] + '_'`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`psi_names = [[psi_base + eh + c for c in uv] for eh in 'EH']`

Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`psi_shape = list(self.shape)`
improve pml specification 7 years ago			`psi_shape[a] = pml['thickness']`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago
			`for ne, nh in zip(*psi_names):`
			`pml_e_fields[ptr(ne)] = pyopencl.array.zeros(self.queue, tuple(psi_shape), dtype=self.arg_type)`
			`pml_h_fields[ptr(nh)] = pyopencl.array.zeros(self.queue, tuple(psi_shape), dtype=self.arg_type)`
Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`return pml_e_fields, pml_h_fields`
rename lib 7 years ago
Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`def _create_operation(self, source, args_fields):`
			`args = OrderedDict()`
			`[args.update(d) for d in args_fields]`
			`update = ElementwiseKernel(self.context, operation=source,`
			`arguments=', '.join(args.keys()))`
			`return lambda e: update(*args.values(), wait_for=e)`
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago

Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`def _create_context(self, context: pyopencl.Context = None,`
			`queue: pyopencl.CommandQueue = None):`
			`if context is None:`
			`self.context = pyopencl.create_some_context()`
			`else:`
			`self.context = context`
Initial commit 8 years ago
Add _create_context(), _create_operation(), and _create_pmls(), and generalize initial field value args 6 years ago			`if queue is None:`
			`self.queue = pyopencl.CommandQueue(self.context)`
			`else:`
			`self.queue = queue`
Initial commit 8 years ago
Add _create_field() and _create_eps() 6 years ago			`def _create_eps(self, epsilon: List[numpy.ndarray]):`
			`if len(epsilon) != 3:`
			`raise Exception('Epsilon must be a list with length of 3')`
			`if not all((e.shape == epsilon[0].shape for e in epsilon[1:])):`
			`raise Exception('All epsilon grids must have the same shape. Shapes are {}', [e.shape for e in epsilon])`
			`if not epsilon[0].shape == self.shape:`
			`raise Exception('Epsilon shape mismatch. Expected {}, got {}'.format(self.shape, epsilon[0].shape))`
			`self.eps = pyopencl.array.to_device(self.queue, vec(epsilon).astype(self.arg_type))`

			`def _create_field(self, initial_value: List[numpy.ndarray] = None):`
			`if initial_value is None:`
			`return pyopencl.array.zeros_like(self.eps)`
			`else:`
			`if len(initial_value) != 3:`
			`Exception('Initial field value must be a list of length 3')`
			`if not all((f.shape == self.shape for f in initial_value)):`
			`Exception('Initial field list elements must have same shape as epsilon elements')`
			`return pyopencl.array.to_device(self.queue, vec(initial_value).astype(self.arg_type))`
Initial commit 8 years ago
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`def type_to_C(float_type) -> str:`
			`"""`
			`Returns a string corresponding to the C equivalent of a numpy type.`
			`Only works for float16, float32, float64.`
Initial commit 8 years ago
Rewrite, with the following features: - Move to jinja2 templates for the opencl code - Combine PML code into the E, H updates for speed - Add Poynting vector calculation code, including precalculation during H update - Use arrays for PML parameters (p0, p1) - Switch to linearized, C-ordered fields (~50% performance boost??) - Added jinja2 and fdfd_tools dependencies 8 years ago			`:param float_type: e.g. numpy.float32`
			`:return: string containing the corresponding C type (eg. 'double')`
			`"""`
			`if float_type == numpy.float16:`
			`arg_type = 'half'`
			`elif float_type == numpy.float32:`
			`arg_type = 'float'`
			`elif float_type == numpy.float64:`
			`arg_type = 'double'`
			`else:`
			`raise Exception('Unsupported type')`
			`return arg_type`