#!/usr/local/bin/env python

#=============================================================================================
# MODULE DOCSTRING
#=============================================================================================

"""
Implicit Ligand Theory

Stage 1: Sampling receptor conformations.

@author John D. Chodera <jchodera@gmail.com>
@author David D. L. Minh <daveminh@gmail.com>

All code in this repository is released under the GNU General Public License.

This program is free software: you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free Software
Foundation, either version 3 of the License, or (at your option) any later
version.

This program is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A
PARTICULAR PURPOSE.  See the GNU General Public License for more details.
 
You should have received a copy of the GNU General Public License along with
this program.  If not, see <http://www.gnu.org/licenses/>.

TODO

"""

#=============================================================================================
# GLOBAL IMPORTS
#=============================================================================================

import os
import os.path
import sys
import copy
import time

import numpy
import numpy.random 

import simtk.unit as units
import simtk.openmm as openmm

from alchemy import AbsoluteAlchemicalFactory
from thermodynamics import ThermodynamicState
from repex import HamiltonianExchange

#=============================================================================================
# MAIN
#=============================================================================================

if __name__ == '__main__':    
    # Initialize command-line argument parser.

    usage = """
    USAGE

    python %prog --sourcedir source-directory [-v | --verbose] [-i | --iterations ITERATIONS] [--restraints restraint-type] --output output-netcdf

    EXAMPLES

    # Specify directory containing prmtop and crd files (complex, ligand, receptor) ending in .prmtop and .crd
    python %prog --sourcedir ../../src/examples/benzene-toluene --iterations 1000 --output output.nc --verbose

    NOTES

    In atom ordering, receptor comes before ligand atoms.

    """

    # Parse command-line arguments.
    from optparse import OptionParser
    parser = OptionParser(usage=usage)
    parser.add_option("--sourcedir", dest="source_directory", default=None, help="source directory containing complex, ligand, and receptor prmtop and crd files", metavar="SOURCE_DIRECTORY")
    parser.add_option("-v", "--verbose", action="store_true", dest="verbose", default=False, help="verbosity flag")
    parser.add_option("-i", "--iterations", dest="niterations", type="int", default=None, help="number of iterations", metavar="ITERATIONS")
    parser.add_option("--restraints", dest="restraint_type", default=None, help="specify ligand restraint type: 'harmonic' or 'flat-bottom' (default: 'flat-bottom')")
    parser.add_option("--output", dest="store_filename", default=None, help="specify output NetCDF file---must be unique for each calculation (default: 'output.nc')")

    # Parse command-line arguments.
    (options, args) = parser.parse_args()

    # Check arguments for validity.
    if not options.source_directory:
        parser.error("source directory containing ligand, receptor, and complex crd and prmtop files must be specified")
    if not os.path.exists(options.source_directory):
        parser.error("source directory '%s' does not exist" % options.source_directory)

    # Create System objects from AMBER prmtop files and load coordinates.
    if options.verbose: print "Reading AMBER prmtop and inpcrd files from directory '%s'..." % options.source_directory
    # NOTE: Hard-coded options for now.
    # TODO: Handle explicit solvent systems and different kinds of GB / nonbonded / constraint treatments.
    # TODO: Can add constraints to hydrogens in ligand only later.
    import simtk.openmm.app as app
    nonbondedMethod = app.NoCutoff
    implicitSolvent = app.OBC2
    constraints = None
    removeCMMotion = False
    systems = dict()
    initial_positions = dict()
    for name in ['complex', 'receptor', 'ligand']:
        # Read prmtop.
        prmtop_filename = os.path.join(options.source_directory, '%s.prmtop' % name)
        if options.verbose: print "Reading %s..." % prmtop_filename
        systems[name] = app.AmberPrmtopFile(prmtop_filename).createSystem(nonbondedMethod=nonbondedMethod, implicitSolvent=implicitSolvent, constraints=constraints, removeCMMotion=removeCMMotion)
        # Read coordinates.
        inpcrd_filename = os.path.join(options.source_directory, '%s.crd' % name)
        if options.verbose: print "Reading %s..." % inpcrd_filename
        initial_positions[name] = app.AmberInpcrdFile(inpcrd_filename).getPositions(asNumpy=True)

    #
    # Initialize NetCDF file.
    #

    # TODO: If NetCDF file already exists, we should append rather than overwrite.
    
    # Create NetCDF file.
    import netCDF4 as netcdf # netcdf4-python
    ncfile = netcdf.Dataset(options.store_filename, 'w', version='NETCDF4')
    
    # Create dimensions.
    ncfile.createDimension('iteration', 0) # unlimited number of iterations
    ncfile.createDimension('complex_atoms', systems['complex'].getNumParticles()) # number of atoms in system
    ncfile.createDimension('receptor_atoms', systems['receptor'].getNumParticles()) # number of atoms in system
    ncfile.createDimension('ligand_atoms', systems['ligand'].getNumParticles()) # number of atoms in system
    ncfile.createDimension('spatial', 3) # number of spatial dimensions

    # Create a group to store receptor trajectory.
    ncgrp = ncfile.createGroup('receptor')

    # Create variables.
    ncvar_positions = ncgrp.createVariable('positions', 'f', ('iteration','receptor_atoms','spatial'))
    ncvar_energies  = ncgrp.createVariable('potential', 'f', ('iteration',))        
    
    # Define units for variables.
    setattr(ncvar_positions, 'units', 'nanometers')
    setattr(ncvar_energies,  'units', 'kilojoules_per_mole')

    # Define long (human-readable) names for variables.
    setattr(ncvar_positions, "long_name", "positions[iteration][atom][spatial] is position of coordinate 'spatial' of atom 'atom' from replica 'replica' for iteration 'iteration'.")
    setattr(ncvar_energies,  "long_name", "potential[iteration] is the energy from iteration 'iteration'.")
    
    # Force sync to disk to avoid data loss.
    ncfile.sync()

    #
    # Run simulation of receptor, storing coordinates and potential energies.
    #

    # Create an integrator.
    # TODO: Allow user to set integrator options.
    temperature = 300.0 * units.kelvin
    collision_rate = 5.0 / units.picosecond
    timestep = 1.0 * units.femtosecond
    nsteps_per_iteration = 1000 # number of timesteps per iteration
    integrator = openmm.LangevinIntegrator(temperature, collision_rate, timestep)

    # Create a Context.
    context = openmm.Context(systems['receptor'], integrator)

    # Set positions.
    context.setPositions(initial_positions['receptor'])

    # Minimize energy.
    if options.verbose: print "Minimizing..."
    openmm.LocalEnergyMinimizer.minimize(context)

    # Collect snapshots.
    for iteration in range(options.niterations):
        if options.verbose: print "iteration %8d / %8d" % (iteration, options.niterations)
        # Run integration.
        integrator.step(nsteps_per_iteration)
        # Get positions and energies.
        state = context.getState(getPositions=True, getEnergy=True)
        positions = state.getPositions(asNumpy=True)
        potential = state.getPotentialEnergy()
        # Store snapshot.
        ncgrp.variables['positions'][iteration,:,:] = positions[:,:] / units.angstroms
        ncgrp.variables['potential'][iteration] = potential / units.kilojoules_per_mole
        ncfile.sync()

    # Close.
    ncfile.close()