import logging
import boto3
from app.config import Config
from app.metrics.pennsieve import get_pennseive_download_metrics
from scripts.monthly_downloads_html_template import create_html_template
from scripts.email_sender import EmailSender
from scripts.monthly_db import MonthlyStatsTable
from operator import itemgetter
import requests
import datetime
import json
from dateutil.relativedelta import relativedelta

def remove_duplicates(d_array):
    """Return the unique dicts of ``d_array``, newest dataset/version first.

    Each dict is serialised to JSON to make it hashable. Keys are sorted during
    serialisation so that two dicts with equal content but different key
    insertion order collapse into a single entry.

    :param d_array: iterable of JSON-serialisable dicts, each containing the
        keys ``datasetId`` and ``version``.
    :return: list of unique dicts sorted by ``(datasetId, version)`` descending.
    """
    unique_json = {json.dumps(d, sort_keys=True) for d in d_array}
    # Sort the serialised form first: set iteration order is arbitrary, and the
    # stable sort below would otherwise leave ties in a run-dependent order.
    unique_list = [json.loads(s) for s in sorted(unique_json)]
    unique_list.sort(key=itemgetter("datasetId", "version"), reverse=True)
    return unique_list


class MonthlyStats(object):
    """Collects one month of Pennsieve download metrics and emails them out.

    The download metrics are grouped per contributor (keyed by ORCID iD),
    matched to the email addresses of the Pennsieve organization members, and
    sent through ``EmailSender``. A summary (or the error) is additionally sent
    to a logging address.
    """

    # Seconds to wait on any single Pennsieve HTTP request before giving up, so
    # an unresponsive API cannot hang the job indefinitely.
    REQUEST_TIMEOUT = 60

    def __init__(self, debug_mode=False, debug_email=''):
        """
        :param debug_mode: when True, no per-user emails are sent by
            ``send_stats``; logging emails go to ``debug_email`` instead.
        :param debug_email: address used for all mail while in debug mode.
        """
        self.send_grid = EmailSender()
        self.user_stats = {}
        self.pennsieve_user_details = []
        self.organization = Config.PENNSIEVE_ORGANIZATION
        self._pennsieve_temp_api_key = ''
        self.created_at = datetime.datetime.now()
        self.run_day = 1  # This is the day of the month emails will be sent
        self.debug_email = debug_email
        self.debug_mode = debug_mode
        if debug_mode:
            self.logging_address = debug_email
        else:
            self.logging_address = Config.METRICS_EMAIL_ADDRESS
        # Always define the attribute so monthly_stats_required_check() can
        # test it even when no database is configured.
        self.monthlytable = None
        if Config.DATABASE_URL is not None:
            try:
                self.monthlytable = MonthlyStatsTable(Config.DATABASE_URL)
            except AttributeError:
                logging.exception('Could not set up the monthly stats table')
                self.monthlytable = None

    def monthly_stats_required_check(self, timeNow=None, commit=True):
        """Run the monthly send if the database table says one is due.

        :param timeNow: date to check against; defaults to today's date.
        :param commit: forwarded to ``MonthlyStatsTable.pushState``.
        :return: the list returned by ``run()``, or an empty list when no
            action is taken (keeps the return type consistent for testing).
        """
        if timeNow is None:
            timeNow = datetime.datetime.now().date()
        if self.monthlytable and self.monthlytable.sendingRequired(timeNow):
            sendgrid_responses = self.run()
            # Store the date and stats
            self.monthlytable.pushState(timeNow, self.user_stats, commit)
            return sendgrid_responses
        return []

    def run(self):
        """Gather the stats, send them, and email a success/failure summary.

        Errors are logged and reported to the logging address rather than
        raised, so a failed run returns whatever responses were collected.

        :return: list of responses from ``send_stats`` (empty on failure).
        """
        sendgrid_responses = []
        try:
            self.get_stats()
            sendgrid_responses = self.send_stats(self.user_stats)
        # Exception, not BaseException: KeyboardInterrupt / SystemExit must
        # still be able to stop the process.
        except Exception as error:
            logging.exception(f'Hit error while running monthly stats. {error}')
            self.send_logging_email(f'Hit error while running monthly stats. {error}')
        else:
            recipients = [stats['email'] for stats in self.user_stats.values() if 'email' in stats]
            self.send_logging_email(f'Monthly stats sent successfully \n'
                                    f'Sent to: {recipients} \n'
                                    f'Send grid Responses: {sendgrid_responses}')
        return sendgrid_responses

    def get_stats(self):
        """Build ``self.user_stats`` from Pennsieve and return it.

        Logs in, fetches one month of download metrics, looks up the datasets
        concerned, groups downloads per ORCID iD and attaches member emails.
        """
        self._pennsieve_temp_api_key = self.pennsieve_login()
        metrics = self.get_download_metrics_one_month()
        dataset_details_for_downloaded_datasets = self.get_dataset_details_from_pennsieve(metrics)
        self.user_stats = self.create_user_download_object(dataset_details_for_downloaded_datasets, metrics)
        self.pennsieve_user_details = self.get_emails_orcid_id_map_from_pennsieve()
        self.user_stats_object_post_processing()
        return self.user_stats

    def send_stats(self, user_stats):
        """Email each user that has an ``email`` entry their download summary.

        In debug mode no per-user email is sent; instead the last generated
        email body is sent once to the logging address.

        :param user_stats: dict keyed by ORCID iD, each value holding a
            ``datasets`` list and optionally an ``email``.
        :return: list of whatever ``send_email`` returned per user (this can
            include ``None`` when sending is disabled by configuration), or a
            single-item list with the logging response in debug mode.
        """
        responses = []
        email_body = ''
        for stats in user_stats.values():
            if 'email' not in stats:
                continue
            email_body = create_html_template(remove_duplicates(stats['datasets']))
            if not self.debug_mode:  # don't want to max out our sendgrid account in testing
                responses.append(self.send_email(stats['email'], email_body))
        if self.debug_mode:
            responses = [self.send_logging_email(email_body)]  # send last email as log if in debug mode
        return responses

    def get_download_metrics_one_month(self):
        """Get 1 month's download metrics from Pennsieve."""
        return get_pennseive_download_metrics(relativedelta(months=1))

    def pennsieve_login(self):
        """Log in through Pennsieve's Cognito pool and return an access token.

        The original comment states the token is valid for 24 hours; that is
        not verifiable from this code.

        :raises requests.HTTPError: if the Cognito config request fails.
        """
        r = requests.get(f"{Config.PENNSIEVE_API_HOST}/authentication/cognito-config",
                         timeout=self.REQUEST_TIMEOUT)
        r.raise_for_status()

        cognito_config = r.json()  # parse the body once
        cognito_app_client_id = cognito_config["tokenPool"]["appClientId"]
        cognito_region = cognito_config["region"]

        cognito_idp_client = boto3.client(
            "cognito-idp",
            region_name=cognito_region,
            aws_access_key_id="",
            aws_secret_access_key="",
        )

        login_response = cognito_idp_client.initiate_auth(
            AuthFlow="USER_PASSWORD_AUTH",
            AuthParameters={"USERNAME": Config.PENNSIEVE_API_TOKEN, "PASSWORD": Config.PENNSIEVE_API_SECRET},
            ClientId=cognito_app_client_id,
        )

        return login_response["AuthenticationResult"]["AccessToken"]

    def get_emails_orcid_id_map_from_pennsieve(self):
        """Fetch the member list of the configured Pennsieve organization.

        :return: the decoded JSON response; ``user_stats_object_post_processing``
            treats it as a list of dicts with ``email`` and a nested ``orcid``.
        :raises requests.HTTPError: if the request fails.
        """
        r = requests.get(f"{Config.PENNSIEVE_API_HOST}/organizations/{self.organization}/members",
                         headers={"Authorization": f"Bearer {self._pennsieve_temp_api_key}"},
                         timeout=self.REQUEST_TIMEOUT)
        r.raise_for_status()
        return r.json()

    def user_stats_object_post_processing(self):
        """Add an ``email`` field to each user stats entry with a known member.

        Members without an ORCID iD or without an email are skipped, as are
        members whose ORCID iD has no entry in ``self.user_stats``.
        """
        for user in self.pennsieve_user_details:
            orcid_id = (user.get('orcid') or {}).get('orcid')
            email = user.get('email')
            if orcid_id is None or email is None:
                continue
            if orcid_id in self.user_stats:
                self.user_stats[orcid_id]['email'] = email

    def get_dataset_details_from_pennsieve(self, metrics):
        """Get the dataset details for every dataset present in ``metrics``.

        :param metrics: iterable of dicts each holding a ``datasetId``.
        :return: the ``datasets`` list of the discover response; an empty list
            when ``metrics`` holds no datasets.
        :raises requests.HTTPError: if the request fails.
        """
        unique_ids = {d['datasetId'] for d in metrics}
        if not unique_ids:
            # Without any id the request would carry no 'ids' filter at all and
            # return datasets unrelated to this month's downloads.
            return []
        # NOTE: a single page of at most 1000 datasets is requested.
        r = requests.get(f'{Config.PENNSIEVE_API_HOST}/discover/datasets',
                         params={'limit': 1000, 'ids': list(unique_ids)},
                         timeout=self.REQUEST_TIMEOUT)
        r.raise_for_status()
        return r.json()['datasets']

    def create_user_download_object(self, dataset_details_object, download_stats):
        """Create a dict keyed by ORCID iD listing each contributor's downloads.

        :param dataset_details_object: iterable of dataset dicts with ``id``,
            ``name`` and ``contributors`` (each contributor may carry ``orcid``).
        :param download_stats: iterable of download dicts with ``datasetId``;
            matching entries get a ``name`` key added in place.
        :return: ``{orcid_id: {'datasets': [download dict, ...]}}``; datasets
            without any download and contributors without an ORCID iD are
            left out.
        """
        users = {}
        for dataset in dataset_details_object:
            download_info = [d for d in download_stats if dataset['id'] == d['datasetId']]
            if not download_info:
                # Only datasets with downloads are reported; otherwise their
                # contributors would be emailed an empty summary.
                continue
            download_info = self.add_dataset_name_to_download_info(dataset, download_info)
            for contributor in dataset.get('contributors') or []:
                orcid_id = contributor.get('orcid')
                if orcid_id is None:
                    continue
                # Every user owns a separate list, so extending it never
                # touches the list built for another contributor.
                users.setdefault(orcid_id, {'datasets': []})['datasets'].extend(download_info)
        return users

    def add_dataset_name_to_download_info(self, dataset, downloadInfo):
        """Set ``name`` on every download entry to the dataset's name (in place).

        :return: the same ``downloadInfo`` list that was passed in.
        """
        for entry in downloadInfo:
            entry['name'] = dataset['name']
        return downloadInfo

    def send_email(self, email_address, email_body):
        """Send one download summary email using sendgrid.

        In debug mode the mail goes to ``self.debug_email``; otherwise it goes
        to ``email_address``, but only when ``Config.SEND_MONTHLY_STATS`` is
        ``'TRUE'``.

        :return: the sendgrid response, or ``None`` when nothing was sent.
        """
        if self.debug_mode:
            email_destination = self.debug_email
        elif Config.SEND_MONTHLY_STATS == 'TRUE':
            email_destination = email_address
        else:
            return None
        return self.send_grid.sendgrid_email_with_unsubscribe_group(Config.METRICS_EMAIL_ADDRESS,
                                                                    email_destination,
                                                                    'SPARC monthly dataset download summary',
                                                                    email_body)

    def send_logging_email(self, message):
        """Send ``message`` to the logging address and log the outcome.

        Failures are logged, never raised.

        :return: the sendgrid response, or ``None`` if sending raised.
        """
        # Bound up front so the final return is valid when the send raises.
        response = None
        try:
            response = self.send_grid.sendgrid_email_with_unsubscribe_group(Config.METRICS_EMAIL_ADDRESS,
                                                                            self.logging_address,
                                                                            'SPARC monthly dataset download summary',
                                                                            message)
            if response.status_code == 202:
                logging.info(f'Logging email sent successfully to {self.logging_address} (202)')
            elif response.status_code == 403:
                logging.error('Could not send sendgrid email because rate limit is hit (403)')
            elif response.status_code == 401:
                logging.error('Could not send sendgrid email. Sendgrid keys are likely incorrect (401)')
            else:
                logging.error(f'Unknown error. Status code: {response.status_code}')
        except Exception as err:
            logging.error(err)

        return response