# Copyright (C) 2010 Ion Torrent Systems, Inc. All Rights Reserved

"""
Tasks
=====

The ``publishers`` module contains Django views and their helper functions
related to the processing of publisher uploads.

Not all functions contained in ``publishers`` are actual Django views, only
those that take ``request`` as their first argument and appear in a ``urls``
module are in fact Django views.
"""

from __future__ import absolute_import
import datetime
import subprocess
import logging
import traceback
import os
import os.path
import time
import httplib
import mimetypes
import shutil
import time
import dateutil
from django.utils.encoding import force_unicode
from django.utils.translation import ugettext_lazy
from iondb.utils import validation, i18n_errors

from tastypie.bundle import Bundle

from django.core.exceptions import ObjectDoesNotExist
from django.shortcuts import render_to_response
from django.http import (
    HttpResponse,
    StreamingHttpResponse,
    HttpResponseRedirect,
    HttpResponseBadRequest,
)
from django import forms
from django.contrib.auth.decorators import login_required
from django.template import RequestContext, Context
from django.conf import settings

from iondb.rundb import models, labels
from iondb.rundb import publisher_types
from iondb.celery import app
from iondb.utils import validation

import json
from iondb.rundb.ajax import render_to_json
from celery.utils.log import get_task_logger


import httplib2
import urllib
from iondb.rundb.json_field import JSONEncoder
from iondb.utils.verify_types import RepresentsJSON

logger = logging.getLogger(__name__)


# ============================================================================
# Publisher Management
# ============================================================================


def search_for_publishers(pub_dir="/results/publishers/"):
    """
    Searches for new publishers, reads their publisher_meta.json, and makes any
    necessary updates to the publisher's record.

    Every sub-folder of ``pub_dir`` except ``scratch`` is treated as a
    publisher.  A ``Publisher`` record is created for folders that have none,
    and the stored version is updated when it differs from the one found in
    ``publisher_meta.json``.  Folders whose meta file is missing, unreadable
    or malformed are logged and skipped.

    :param pub_dir: directory whose sub-folders are publishers.  Nothing is
        done when this is not an existing directory.
    """
    # Function-scope import: errno is only needed to classify IOErrors here.
    import errno

    # isdir (rather than exists) so that a plain file does not reach listdir
    if not os.path.isdir(pub_dir):
        return

    for pname in os.listdir(pub_dir):
        full_path = os.path.join(pub_dir, pname)
        # only consider entries in the 'publishers' directory that are folders
        if pname == "scratch" or not os.path.isdir(full_path):
            continue

        pub_meta_path = os.path.join(full_path, "publisher_meta.json")
        try:
            with open(pub_meta_path) as pub_meta_file:
                publisher_meta = json.load(pub_meta_file)
            version = str(publisher_meta["version"])
        except IOError as error:
            # A missing file surfaces as IOError/ENOENT; report it distinctly
            # from other read failures (permissions, I/O errors, ...).
            if error.errno == errno.ENOENT:
                logger.error("Publisher %s is missing publisher_meta.json" % pname)
            else:
                logger.error(
                    "Publisher %s failed to read publisher_meta.json with %s"
                    % (pname, error)
                )
            continue
        except (ValueError, KeyError, TypeError) as error:
            # ValueError: invalid JSON; KeyError: no "version" key;
            # TypeError: the JSON document is not an object (e.g. a list).
            logger.error(
                "Publisher %s has an improperly formatted publisher_meta.json with %s"
                % (pname, error)
            )
            continue

        try:
            existing = models.Publisher.objects.get(name=pname.strip())
        except ObjectDoesNotExist:
            pub = models.Publisher()
            pub.name = pname
            pub.version = version
            pub.date = datetime.datetime.now()
            pub.path = full_path
            pub.save()
            logger.info("Publisher %s version %s added" % (pname, version))
        else:
            if existing.version != version:
                existing.version = version
                existing.save()
                logger.info("Publisher %s updated to version %s" % (pname, version))


def purge_publishers():
    """Delete every Publisher record whose folder is gone from the file system.

    A publisher cannot be executed once its folder has been removed, so a
    record whose ``path`` is not an existing directory is treated as a
    deleted publisher and dropped from the table.
    """
    for record in models.Publisher.objects.all():
        if os.path.isdir(record.path):
            # folder is still there, keep the record
            continue
        record.delete()
        logger.info(
            "Deleting publisher %s which no longer exists at %s"
            % (record.name, record.path)
        )


# ============================================================================
# Content Upload Publication
# ============================================================================


class PublisherContentUploadValidator(forms.Form):
    """Form validating a publisher content upload: one file plus its metadata.

    Used by ``publisher_api_upload`` to validate ``request.POST`` and
    ``request.FILES`` before the upload is handed to ``edit_upload``.
    """

    # The uploaded file itself.
    file = forms.FileField()
    # Metadata accompanying the file, rendered as a hidden input.  It is
    # eventually parsed with json.loads in new_upload, so it must be JSON text.
    meta = forms.CharField(widget=forms.HiddenInput)


def write_file(file_data, destination):
    """Write Django uploaded file object to disk incrementally in order to
    avoid sucking up all of the system's RAM by reading the whole thing in to
    memory at once.

    :param file_data: object exposing ``chunks()``, an iterable of byte strings.
    :param destination: path of the file to create (or truncate) and fill.
    """
    # The context manager closes the handle even if chunks() or write() raises.
    with open(destination, "wb+") as out:
        for chunk in file_data.chunks():
            out.write(chunk)


def validate_plupload(request, pub_name, file_name, labelsContent):
    """Normalise an uploaded file name and, for the BED publisher, validate it.

    The name is reduced to its base name, stripped of surrounding whitespace
    and has spaces replaced by underscores.  For the ``BED`` publisher the
    normalised name must not match the tail of any existing ``Content.file``
    and must pass ``validation.is_valid_chars``; otherwise an ``Exception``
    carrying the validation message is raised.

    :param request: the current request (not used by the checks).
    :param pub_name: name of the publisher receiving the upload.
    :param file_name: file name as supplied by the client.
    :param labelsContent: label set used to word the uniqueness error.
    :returns: the normalised file name.
    """
    cleaned = os.path.basename(file_name).strip().replace(" ", "_")

    # Only BED uploads are subject to the extra checks.
    if pub_name != "BED":
        return cleaned

    # validate bed file name is unique
    same_name = models.Content.objects.filter(file__endswith="/" + cleaned)
    if same_name.count() > 0:
        message = validation.invalid_entity_field_unique_value(
            labelsContent.verbose_name,
            labelsContent.pickfile.verbose_name,
            cleaned,
        )
        raise Exception(message)

    # validate file name
    if not validation.is_valid_chars(cleaned):
        raise Exception(validation.invalid_chars_error("BED file name"))

    return cleaned


def write_plupload(request, pub_name):
    """file upload for plupload

    Receives one chunk of a (possibly multi-chunk) plupload POST and appends
    it to a temporary file under ``/results/referenceLibrary/temp``.  The
    ``chunk`` and ``chunks`` request parameters give the chunk index and the
    total number of chunks; chunk ``0`` truncates the file, later chunks are
    appended.  Once the last chunk has arrived the file is moved into a new
    ContentUpload and the publisher's scripts are queued.

    :param request: the Django request; non-POST requests get a JSON message
        describing the unsupported method.
    :param pub_name: name of the Publisher receiving the upload.
    :returns: a JSON response with the chunk counters and, after the final
        chunk, the id of the created ContentUpload (``None`` otherwise or if
        creating the upload failed); ``HttpResponseBadRequest`` when the file
        name fails validation.
    """
    logger.info("Starting write plupload")

    pub = models.Publisher.objects.get(name=pub_name)
    meta = request.POST.get("meta", "{}")
    logger.debug("%s" % meta)

    if request.method != "POST":
        return render_to_json(
            {
                "method": i18n_errors.fatal_unsupported_http_method_expected(
                    request.method, "POST"
                )
            }
        )

    name = request.REQUEST.get("name", "")
    uploaded_file = request.FILES["file"]
    if not name:
        name = uploaded_file.name
    logger.debug("plupload name = '%s'" % name)

    try:
        labelsContent = labels.TargetRegionsContent  # default case
        if RepresentsJSON(meta):
            metaJson = json.loads(meta)
            # "hotspot" is optional metadata: a missing key means target
            # regions rather than an invalid upload, hence .get().
            if metaJson and metaJson.get("hotspot"):
                labelsContent = labels.HotspotsContent

        file_name = validate_plupload(request, pub_name, name, labelsContent)
    except Exception as err:
        return HttpResponseBadRequest(unicode(err))

    upload_dir = "/results/referenceLibrary/temp"
    if not os.path.exists(upload_dir):
        return render_to_json({"error": validation.missing_error(upload_dir)})

    dest_path = os.path.join(upload_dir, file_name)

    logger.debug("plupload destination = '%s'" % dest_path)

    chunk = request.REQUEST.get("chunk", "0")
    chunks = request.REQUEST.get("chunks", "0")

    logger.debug(
        "plupload chunk %s %s of %s" % (str(type(chunk)), str(chunk), str(chunks))
    )

    debug = [chunk, chunks]

    # The first chunk starts a fresh file; subsequent chunks are appended.
    with open(dest_path, ("wb" if chunk == "0" else "ab")) as f:
        for content in uploaded_file.chunks():
            logger.debug("content chunk = '%d'" % len(content))
            f.write(content)

    my_contentupload_id = None
    # Last chunk received (also true for un-chunked uploads, where both are 0)
    if int(chunk) + 1 >= int(chunks):
        try:
            meta = json.loads(meta)
            meta["username"] = request.user.username
            upload = move_upload(pub, dest_path, file_name, json.dumps(meta))
            run_pub_scripts.delay(pub, upload)
            my_contentupload_id = upload.id
        except Exception:
            # Best effort: the failure is logged and the client receives a
            # null contentupload_id.
            logger.exception(
                "There was a problem during upload of a file for a publisher."
            )
        else:
            logger.info("Successfully pluploaded %s" % name)

    logger.debug("plupload done")
    return render_to_json(
        {"chunk posted": debug, "contentupload_id": my_contentupload_id}
    )


def new_upload(pub, file_name, meta_data=None):
    """Create a ContentUpload record and its upload folder with ``meta.json``.

    :param pub: the Publisher the upload belongs to.
    :param file_name: name the uploaded file will have inside the folder.
    :param meta_data: JSON text describing the upload; ``None`` is treated as
        an empty JSON object.  An ``upload_date`` entry is added to it.
    :returns: the saved ContentUpload in status ``Saving``; its ``file_path``
        points inside ``/results/uploads/<publisher name>/<upload pk>``.
    :raises EnvironmentError: if the folder or ``meta.json`` cannot be
        written; the upload's status is set to an error message first.
    """
    # "import dateutil" alone does not guarantee that the parser submodule is
    # loaded, so import it explicitly before use.
    import dateutil.parser

    upload_date = dateutil.parser.parse(time.asctime()).isoformat()

    # set up meta.json
    if meta_data is None:
        meta_data = "{}"
    meta_data_dict = json.loads(meta_data)
    meta_data_dict["upload_date"] = upload_date
    meta_data = json.dumps(meta_data_dict)

    # create ContentUpload
    upload = models.ContentUpload()
    upload.status = "Saving"
    upload.publisher = pub
    upload.meta = meta_data
    upload.username = meta_data_dict.get("username", "")
    upload.source = meta_data_dict.get("source") or meta_data_dict.get("url", "")
    upload.upload_date = upload_date

    if "upload_type" in meta_data_dict:
        upload.upload_type = meta_data_dict["upload_type"]
    elif pub.name == "BED" and "hotspot" in meta_data_dict:
        upload.upload_type = (
            publisher_types.HOTSPOT
            if meta_data_dict["hotspot"]
            else publisher_types.TARGET
        )
    else:
        upload.upload_type = pub.name

    # First save assigns the primary key, which names the upload folder.
    upload.save()

    upload_dir = os.path.join("/results/uploads", pub.name, str(upload.pk))
    upload.file_path = os.path.join(upload_dir, file_name)
    upload.save()

    meta_path = os.path.join(upload_dir, "meta.json")
    # set both the user and group to read/write to allow the celery tasks to write to this directory
    original_umask = os.umask(0)
    try:
        os.makedirs(upload_dir, 0o0775)
        with open(meta_path, "w") as meta_file:
            meta_file.write(meta_data)
    except EnvironmentError as err:
        # EnvironmentError covers both OSError (makedirs) and IOError
        # (open/write), which are distinct classes on Python 2.
        logger.exception("File error while saving new %s upload" % pub)
        upload.status = "Error: %s" % err
        upload.save()
        raise
    finally:
        os.umask(original_umask)
    return upload


def move_upload(pub, file_path, file_name, meta_data=None):
    """Register a new upload for ``pub`` and move an existing file into it.

    The file at ``file_path`` is moved to the ``file_path`` of the freshly
    created ContentUpload, which is then marked as queued and returned.
    """
    record = new_upload(pub, file_name, meta_data)
    destination = record.file_path
    shutil.move(file_path, destination)
    record.status = "Queued for processing"
    record.save()
    return record


def store_upload(pub, file_data, file_name, meta_data=None):
    """Register a new upload for ``pub`` and write the uploaded data into it.

    ``file_data`` is streamed with ``write_file`` to the ``file_path`` of the
    freshly created ContentUpload, which is then marked as queued and
    returned.
    """
    record = new_upload(pub, file_name, meta_data)
    destination = record.file_path
    write_file(file_data, destination)
    record.status = "Queued for processing"
    record.save()
    return record


@app.task
def run_pub_scripts(pub, upload):
    """Spawn subshells in which the Publisher's editing scripts are run, with
    the upload's folder and the script's output folder as command line args.

    Each script returned by ``pub.get_editing_scripts()`` is run in turn from
    the publisher's folder with the arguments ``upload id, upload dir, upload
    path, meta.json path``; its output is appended to ``publisher.log`` in the
    upload folder.  Processing stops as soon as the upload's status starts
    with ``Error`` or ``Waiting``; otherwise the upload ends up
    ``Successfully Completed``.  Any exception is logged and recorded in the
    upload's status rather than propagated.

    :param pub: the Publisher whose scripts are run.
    :param upload: the ContentUpload being processed.
    """
    task_logger = get_task_logger(__name__)
    # Bound before the try block so the error handler below can always name a
    # stage, even when the failure happens before the first script runs.
    stage_name = "setup"
    try:
        # TODO: Handle unique file upload instance particulars
        task_logger.info("Editing upload for %s" % pub.name)
        previous_status = upload.status
        upload_path = upload.file_path
        upload_dir = os.path.dirname(upload_path)
        meta_path = os.path.join(upload_dir, "meta.json")
        logpath = os.path.join(upload_dir, "publisher.log")
        pub_dir = pub.path
        for script_path, stage_name in pub.get_editing_scripts():
            # If at some point in the loop, one of the scripts changes the status,
            # then we cease updating it automatically.
            if upload.status == previous_status:
                previous_status = stage_name
                upload.status = stage_name
                upload.save()

            cmd = [script_path, str(upload.id), upload_dir, upload_path, meta_path]
            # Run the script and wait for it to complete.
            with open(logpath, "a") as log_out:
                exit_code = subprocess.call(
                    cmd, stdout=log_out, stderr=subprocess.STDOUT, cwd=pub_dir
                )
            success = exit_code == 0

            # The script may have updated the upload during execution, so we reload
            upload = models.ContentUpload.objects.get(pk=upload.pk)
            if success:
                task_logger.info(
                    "Editing upload for %s finished %s" % (pub.name, script_path)
                )
            else:
                task_logger.error(
                    "Editing for %s died during %s." % (pub.name, script_path)
                )
                upload.status = "Error: %s" % stage_name
                upload.save()
            # If either the script itself or we set the status to anything starting
            # with "Error" (or "Waiting") then we abort further processing here.
            if upload.status.startswith("Error") or upload.status.startswith("Waiting"):
                return
        # At this point every script has finished running and we have not returned
        # early due to an error, alright!
        upload.status = "Successfully Completed"
        upload.save()
    except Exception:
        tb = "\n".join("    " + s for s in traceback.format_exc().split("\n"))
        # %s for the id so that formatting cannot fail on an unsaved upload
        task_logger.error(
            "Exception in %s upload %s during %s\n%s"
            % (pub.name, upload.id, stage_name, tb)
        )
        upload.status = "Error: processing failed."
        upload.save()


def edit_upload(pub, upload, meta=None):
    """Store an uploaded file and queue the publisher's editing scripts.

    Editing is the process which converts an uploaded file into one or more
    files of published content.

    :returns: ``(content_upload, async_result)`` - the stored ContentUpload
        and the handle returned by ``run_pub_scripts.delay``.
    """
    stored = store_upload(pub, upload, upload.name, meta)
    pending = run_pub_scripts.delay(pub, stored)
    return stored, pending


def publisher_upload(request, pub_name):
    """Serve the publisher's upload form, or accept a file POSTed to it.

    On POST the first uploaded file and the POSTed fields (plus the current
    username) are handed to ``edit_upload`` and a JSON status is returned; any
    failure is reported as a JSON ``error``.  For every other method the
    publisher's ``upload.html`` is rendered inside the upload modal template.
    """
    pub = models.Publisher.objects.get(name=pub_name)

    if request.method != "POST":
        action = request.get_full_path()
        error = ""
        contents = ""
        try:
            path = os.path.join(pub.path, "upload.html")
            with open(path, "r") as template_file:
                contents = template_file.read()
        except Exception:
            error = "Error: Unable to read %s" % path

        template_values = {"contents": contents, "action": action, "error": error}
        ctx = RequestContext(request, template_values)
        return render_to_response(
            "rundb/configure/modal_publisher_upload.html", context_instance=ctx
        )

    meta = request.POST.dict()
    files = list(request.FILES.values())
    if not files:
        return render_to_json({"error": "Error: No file selected for upload"})

    try:
        meta["username"] = request.user.username
        upload, async_task = edit_upload(pub, files[0], json.dumps(meta))
        return render_to_json({"status": upload.status, "id": upload.id})
    except Exception as e:
        return render_to_json({"error": str(e)})


def publisher_api_upload(request, pub_name):
    """TastyPie does not support file uploads, so for now, this is handled
    outside of the normal API space.

    A POST carrying a valid ``file`` and ``meta`` is stored via
    ``edit_upload`` and answered with the JSON serialization of the new
    ContentUpload.  An invalid POST is answered with HTTP 400 and the form
    errors as text.  Any other method is redirected to the publisher's
    publish page.
    """
    if request.method != "POST":
        return HttpResponseRedirect("/rundb/publish/%s/" % pub_name)

    pub = models.Publisher.objects.get(name=pub_name)
    form = PublisherContentUploadValidator(request.POST, request.FILES)
    if not form.is_valid():
        logger.warning(form.errors)
        # A view must always return a response; report the validation errors
        # instead of falling through and returning None.
        return HttpResponseBadRequest(form.errors.as_text())

    upload, async_task = edit_upload(
        pub, form.cleaned_data["file"], form.cleaned_data["meta"]
    )
    # Imported here rather than at module level, as in the original code
    # (presumably to avoid a circular import - confirm before moving it).
    from iondb.rundb.api import ContentUploadResource

    resource = ContentUploadResource()
    bundle = Bundle(upload)
    serialized_upload = resource.serialize(
        None, resource.full_dehydrate(bundle), "application/json"
    )
    # content_type replaces the deprecated mimetype keyword
    return HttpResponse(serialized_upload, content_type="application/json")


def _file_size_string(path):
    """Return ``"(<size with thousands separators> bytes)"`` or ``""`` if the size cannot be read."""
    try:
        return "(%s bytes)" % "{:,}".format(os.stat(path).st_size)
    except Exception:
        return ""


def _bonus_fields(meta, label_class, count_keys):
    """Build label/value rows for the ``reference`` and numeric entries present in ``meta``."""
    fields = []
    if "reference" in meta:
        fields.append(
            {"label": label_class.reference.verbose_name, "value": meta["reference"]}
        )
    for key in count_keys:
        if key in meta:
            fields.append(
                {
                    "label": getattr(label_class, key).verbose_name,
                    # counts are shown with thousands separators
                    "value": "{:,}".format(meta[key]),
                }
            )
    return fields


def upload_status(request, contentupload_id, frame=False):
    """Render the status page of a content upload.

    If we're in an iframe (``frame`` is true), we can skip basically
    everything, and tell the template to redirect the parent window to the
    normal page.

    Otherwise the page shows the upload itself, its log entries ordered by
    time stamp, the contents of ``publisher.log`` from the upload folder (if
    readable), and one entry per ``target``/``hotspot`` content whose file
    path contains ``unmerged/detail``.

    :param request: the Django request.
    :param contentupload_id: primary key of the ContentUpload to display.
    :param frame: whether the view is being rendered inside an iframe.
    """
    if frame:
        return render_to_response(
            "rundb/ion_jailbreak.html",
            dictionary={
                "go": "/rundb/uploadstatus/%s/" % contentupload_id,
                "contentupload_id": contentupload_id,
            },
            context_instance=RequestContext(request),
        )
    upload = models.ContentUpload.objects.get(pk=contentupload_id)

    # A completed FileMonitor for the upload's source is optional.
    filemonitor = None
    try:
        filemonitor = models.FileMonitor.objects.get(
            url=upload.source, status="Complete"
        )
    except Exception as err:
        logger.error(err)

    logs = sorted(upload.logs.all(), key=lambda x: x.timeStamp)

    # The publisher log is best effort: the page is rendered without it when
    # the file is missing or unreadable.
    file_log = ""
    try:
        with open(os.path.dirname(upload.file_path) + "/publisher.log", "r") as f:
            file_log = f.read()
    except Exception as err:
        logger.debug("Unable to read publisher.log for upload %s: %s", upload.pk, err)

    file_size_string = _file_size_string(upload.file_path)

    processed_uploads = []
    for content in upload.contents.filter(type__in=["target", "hotspot"]):
        if "unmerged/detail" not in content.file:
            continue

        content_file_size_string = _file_size_string(content.file)
        content_type = publisher_types.BED_TYPES.get(content.type) or content.type

        if content.type == "hotspot":
            bonus_fields = _bonus_fields(
                content.meta, labels.HotspotsContent, ("num_loci",)
            )
            content_type_hash = "hotspots"
        else:
            bonus_fields = _bonus_fields(
                content.meta,
                labels.TargetRegionsContent,
                ("num_targets", "num_genes", "num_bases"),
            )
            content_type_hash = "target-regions"

        content_name = content.get_file_name()
        processed_uploads.append(
            {
                "file_name": content.file,
                "file_size_string": content_file_size_string,
                "file_name_label": labels.Content.file_name.verbose_name,  # 'Processed File'
                "content_type_hash": content_type_hash,
                "description": content.description,
                "description_label": labels.Content.description.verbose_name,  # 'Description'
                "notes": content.notes,
                "notes_label": labels.Content.notes.verbose_name,  # 'Notes'
                "enabled": content.enabled,
                "enabled_label": labels.Content.enabled.verbose_name,  # 'Enabled',
                "bonus_fields": bonus_fields,
                "content_id": content.id,
                "title": ugettext_lazy("Content.details.title").format(
                    content_type=content_type, content_name=content_name
                ),  #  u'{content_type} Details - {content_name}'
                "action_back_label": ugettext_lazy("global.action.backto").format(
                    name=content_type
                ),
                "action_back": "/configure/references/#{hash}".format(
                    hash=content_type_hash
                ),
            }
        )

    return render_to_response(
        "rundb/ion_publisher_upload_status.html",
        {
            "contentupload": upload,
            "upload_name": upload.get_file_name(),
            "logs": logs,
            "file_log": file_log,
            "file_path_label": labels.ContentUpload.file_path.verbose_name,
            "upload_type": publisher_types.BED_TYPES.get(upload.upload_type)
            or upload.upload_type,
            "upload_type_label": labels.ContentUpload.upload_type.verbose_name,
            "upload_date": upload.upload_date,
            "upload_date_label": labels.ContentUpload.upload_date.verbose_name,
            "file_size_string": file_size_string,
            "status_line": upload.status,
            "status_line_label": labels.ContentUpload.status.verbose_name,
            "processed_uploads": processed_uploads,
            "filemonitor": filemonitor,
        },
        context_instance=RequestContext(request),
    )


def content_download(request, content_id):
    """Stream the file of a Content record back as an attachment.

    :param request: the Django request (unused).
    :param content_id: primary key of the Content whose ``file`` is served.
    :returns: a StreamingHttpResponse of type ``application/octet-stream``
        named after the file's base name.
    """
    content = models.Content.objects.get(pk=content_id)
    # Binary mode: the payload is served as an opaque octet stream and must
    # not go through newline translation or text decoding.
    response = StreamingHttpResponse(open(content.file, "rb"))
    response["Content-Type"] = "application/octet-stream"
    response["Content-Disposition"] = 'attachment; filename="%s"' % os.path.basename(
        content.file
    )
    return response


def upload_download(request, contentupload_id):
    """Stream the originally uploaded file of a ContentUpload as an attachment.

    :param request: the Django request (unused).
    :param contentupload_id: primary key of the ContentUpload whose
        ``file_path`` is served.
    :returns: a StreamingHttpResponse of type ``application/octet-stream``
        named after the file's base name.
    """
    upload = models.ContentUpload.objects.get(pk=contentupload_id)
    # Binary mode: the payload is served as an opaque octet stream and must
    # not go through newline translation or text decoding.
    response = StreamingHttpResponse(open(upload.file_path, "rb"))
    response["Content-Type"] = "application/octet-stream"
    response["Content-Disposition"] = 'attachment; filename="%s"' % os.path.basename(
        upload.file_path
    )
    return response


def content_add(request, hotspot=False):
    """Render the form for adding target-region or hotspot content.

    The template receives the reference genomes whose ``index_version``
    matches ``settings.TMAP_VERSION``; on a GET request the one named by the
    ``reference`` query parameter is flagged as selected.

    :param request: the Django request.
    :param hotspot: true when adding hotspots, false for target regions.
    """
    if request.method == "GET":
        active_ref = request.GET.get("reference", None)
    else:
        active_ref = None

    matching_genomes = models.ReferenceGenome.objects.filter(
        index_version=settings.TMAP_VERSION
    )
    references = [
        {
            "long_name": genome.short_name + " - " + genome.name,
            "short_name": genome.short_name,
            "selected": genome.short_name == active_ref,
        }
        for genome in matching_genomes
    ]

    # NOTE(review): the title is computed but never handed to the template.
    title = ugettext_lazy(
        "content_add_hotspots.title" if hotspot else "content_add_targetregions.title"
    )

    template_values = {
        "hotspot": hotspot,
        "references": references,
        "Content": labels.Content,
        "HotspotsContent": labels.HotspotsContent,
        "TargetRegionsContent": labels.TargetRegionsContent,
    }
    return render_to_response(
        "rundb/ion_publisher_content_add.html",
        template_values,
        context_instance=RequestContext(request),
    )


def list_content(request):
    """Render the content upload history page.

    The template receives all publishers and the value of the ``from`` query
    parameter (empty string when absent) as ``selected``.
    """
    template_values = {
        "publishers": models.Publisher.objects.all(),
        "selected": request.GET.get("from", ""),
    }
    return render_to_response(
        "rundb/configure/contentupload_history.html",
        dictionary=template_values,
        context_instance=RequestContext(request),
    )


def post_multipart(host, selector, fields, files):
    """POST form fields and files to ``host`` as multipart/form-data.

    :param host: host to connect to.
    :param selector: request path of the POST.
    :param fields: sequence of ``(name, value)`` pairs for regular form fields.
    :param files: sequence of ``(name, filename, value)`` triples for data to
        be uploaded as files.
    :returns: the body of the server's response.
    """
    content_type, body = encode_multipart_formdata(fields, files)
    connection = httplib.HTTP(host)
    connection.putrequest("POST", selector)
    request_headers = (
        ("content-type", content_type),
        ("content-length", str(len(body))),
    )
    for header_name, header_value in request_headers:
        connection.putheader(header_name, header_value)
    connection.endheaders()
    connection.send(body)
    # The reply status and headers are read but not used; only the body is returned.
    connection.getreply()
    return connection.file.read()


def encode_multipart_formdata(fields, files):
    """Encode form fields and files as a multipart/form-data request body.

    :param fields: sequence of ``(name, value)`` pairs for regular form fields.
    :param files: sequence of ``(name, filename, value)`` triples for data to
        be uploaded as files.
    :returns: ``(content_type, body)`` ready for an httplib.HTTP instance.
    """
    BOUNDARY = "GlobalNumberOfPiratesDecreasing-GlobalTemperatureIncreasing"
    delimiter = "--" + BOUNDARY

    lines = []
    for field_name, field_value in fields:
        lines += [
            delimiter,
            'Content-Disposition: form-data; name="%s"' % field_name,
            "",
            field_value,
        ]
    for field_name, filename, file_value in files:
        lines += [
            delimiter,
            'Content-Disposition: form-data; name="%s"; filename="%s"'
            % (field_name, filename),
            "Content-Type: %s" % get_content_type(filename),
            "",
            file_value,
        ]
    # closing delimiter, followed by an empty line so the body ends with CRLF
    lines += [delimiter + "--", ""]

    return "multipart/form-data; boundary=%s" % BOUNDARY, "\r\n".join(lines)


def get_content_type(filename):
    """Guess the MIME type of ``filename``, defaulting to ``application/octet-stream``."""
    guessed_type, _encoding = mimetypes.guess_type(filename)
    if guessed_type:
        return guessed_type
    return "application/octet-stream"


@app.task
def publish_file(args, pub_name, meta):
    """Process a file downloaded via FileMonitor.

    :param args: ``(full_path, monitor_id)`` - path of the downloaded file and
        id of the FileMonitor that fetched it.  Nothing is published when the
        path is empty.
    :param pub_name: name of the Publisher that should process the file.
    :param meta: JSON text with the upload's metadata.
    """
    pub = models.Publisher.objects.get(name=pub_name)
    full_path, monitor_id = args
    if not full_path:
        return
    monitor = models.FileMonitor.objects.get(id=monitor_id)
    upload = move_upload(pub, full_path, monitor.name, meta)
    # Called directly (not via .delay), so the scripts run within this task.
    run_pub_scripts(pub, upload)


class call_api:
    """Minimal JSON client for the local rundb REST API (``/rundb/api/v1/``).

    ``post``, ``patch`` and ``delete`` return ``(ok, response, content)``
    where ``ok`` tells whether the expected HTTP status was received;
    ``get`` returns ``(parsed_json, response, content)``.
    """

    def __init__(self):
        # collection URL and single-item URI templates
        self.url = "http://localhost/rundb/api/v1/%s/"
        self.uri = "http://localhost/rundb/api/v1/%s/%s/"
        self.headers = {"Content-type": "application/json"}

    def _request(self, target, method, body=None):
        """Send one request with the JSON headers; returns ``(response, content)``."""
        return httplib2.Http().request(
            target, method=method, body=body, headers=self.headers
        )

    def post(self, where, **query):
        """Create an item in resource ``where``; ``ok`` means HTTP 201.

        The response carries the API URI for the newly created item.
        """
        body = json.dumps(query, cls=JSONEncoder)
        response, content = self._request(self.url % where, "POST", body)
        return response["status"] == "201", response, content

    def patch(self, where, item_id, **update):
        """Update item ``item_id`` of resource ``where``; ``ok`` means HTTP 202."""
        body = json.dumps(update, cls=JSONEncoder)
        item_uri = self.uri % (where, str(item_id))
        response, content = self._request(item_uri, "PATCH", body)
        return response["status"] == "202", response, content

    def update_meta(self, meta, args):
        """Write ``meta`` to ``args.meta_file`` and patch it onto the content upload ``args.upload_id``."""
        print("Updating Meta")
        # The context manager closes the file even if serialization fails.
        with open(args.meta_file, "w") as meta_file_handle:
            json.dump(
                meta, meta_file_handle, cls=JSONEncoder, sort_keys=True, indent=4
            )
        self.patch("contentupload", args.upload_id, meta=meta)

    def get(self, where, **query):
        """Returns a JSON API result object."""
        body = urllib.urlencode(query)
        query_string = "%s?%s" % (self.url % where, body)
        # The encoded query is sent both in the URL and as the request body,
        # as the original implementation did.
        response, content = self._request(query_string, "GET", body)
        return json.loads(content), response, content

    def delete(self, where, item_id):
        """Delete item ``item_id`` of resource ``where``; ``ok`` means HTTP 204."""
        item_uri = self.uri % (where, str(item_id))
        response, content = self._request(item_uri, "DELETE")
        return response["status"] == "204", response, content