Source code for oasislmf.platform_api.client

__all__ = [
    'APIClient',
    'ApiEndpoint',
    'FileEndpoint',
    'JsonEndpoint',
    'API_analyses',
    'API_models',
    'API_portfolios',
]

import io
import json
import logging
import os
import tarfile
import time
import pathlib

from posixpath import join as urljoin

import pandas as pd

from tqdm import tqdm
from requests_toolbelt import MultipartEncoder
from requests.exceptions import (
    HTTPError,
)
from .session import APISession
from ..utils.exceptions import OasisException


class ApiEndpoint(object):
    """
    Used to implement the default requests common to all Oasis API endpoints.
    """

    def __init__(self, session, url_endpoint, logger=None):
        self.logger = logger or logging.getLogger(__name__)
        self.session = session
        self.url_endpoint = str(url_endpoint)

    def create(self, data):
        return self.session.post(self.url_endpoint, json=data)

    def get(self, ID=None):
        if ID:
            return self.session.get(urljoin(self.url_endpoint, f'{ID}/'))
        return self.session.get(self.url_endpoint)

    def delete(self, ID):
        return self.session.delete(urljoin(self.url_endpoint, f'{ID}/'))

    def search(self, metadata={}):
        search_string = ""
        for key in metadata:
            if not search_string:
                search_string = f'?{key}={metadata[key]}'
            else:
                search_string += f'&{key}={metadata[key]}'
        return self.session.get(f'{self.url_endpoint}{search_string}')

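# Illustrative sketch (not part of this module): how ApiEndpoint.search builds a
# query string from its metadata dict. The endpoint URL, ID and filter values are
# placeholders; `session` is assumed to be an authenticated APISession.
def _example_endpoint_search(session):
    analyses = ApiEndpoint(session, 'http://localhost:8000/v2/analyses/')
    # GET http://localhost:8000/v2/analyses/?status=RUN_COMPLETED&model=1
    return analyses.search({'status': 'RUN_COMPLETED', 'model': 1}).json()
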
class JsonEndpoint(object):
    """
    Used for JSON data endpoints.
    """

    def __init__(self, session, url_endpoint, url_resource, logger=None):
        self.logger = logger or logging.getLogger(__name__)
        self.session = session
        self.url_endpoint = str(url_endpoint)
        self.url_resource = str(url_resource)

    def _build_url(self, ID):
        return urljoin(self.url_endpoint, str(ID), self.url_resource)

    def get(self, ID):
        return self.session.get(self._build_url(ID))

    def post(self, ID, data):
        return self.session.post(self._build_url(ID), json=data)

    def delete(self, ID):
        return self.session.delete(self._build_url(ID))

    def download(self, ID, file_path, overwrite=True):
        abs_fp = os.path.realpath(os.path.expanduser(file_path))
        dir_fp = os.path.dirname(abs_fp)

        # Check and create base dir
        if not os.path.exists(dir_fp):
            os.makedirs(dir_fp)

        # Check if file exists
        if os.path.exists(abs_fp) and not overwrite:
            error_message = 'Local file already exists: {}'.format(abs_fp)
            raise IOError(error_message)

        with io.open(abs_fp, 'w', encoding='utf-8') as f:
            r = self.get(ID)
            f.write(json.dumps(r.json(), ensure_ascii=False, indent=4))
        return r

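# Illustrative sketch (not part of this module): a JsonEndpoint addressing a nested
# JSON resource such as /analyses/{id}/settings/. The URL, ID, payload and local
# path are placeholders; `session` is assumed to be an authenticated APISession.
def _example_json_endpoint(session):
    settings = JsonEndpoint(session, 'http://localhost:8000/v2/analyses/', 'settings/')
    settings.post(1, {'model_settings': {}})              # POST .../analyses/1/settings/
    settings.download(1, './analysis_1_settings.json')    # write the JSON response to disk
    return settings.get(1).json()
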
class FileEndpoint(object):
    """
    File resources endpoint for uploading / downloading.
    """

    def __init__(self, session, url_endpoint, url_resource, logger=None):
        self.logger = logger or logging.getLogger(__name__)
        self.session = session
        self.url_endpoint = str(url_endpoint)
        self.url_resource = str(url_resource)

    def _build_url(self, ID):
        return urljoin(self.url_endpoint, str(ID), self.url_resource)

    def _set_content_type(self, file_path):
        content_type_map = {
            'parquet': 'application/octet-stream',
            'pq': 'application/octet-stream',
            'csv': 'text/csv',
            'gz': 'application/gzip',
            'zip': 'application/zip',
            'bz2': 'application/x-bzip2',
        }
        file_ext = pathlib.Path(file_path).suffix[1:].lower()
        return content_type_map[file_ext] if file_ext in content_type_map else 'text/csv'

    def upload(self, ID, file_path, content_type=None):
        if not content_type:
            content_type = self._set_content_type(file_path)
        return self.session.upload(self._build_url(ID), file_path, content_type)

    def download(self, ID, file_path, overwrite=True, chuck_size=1024):
        abs_fp = os.path.realpath(os.path.expanduser(file_path))
        dir_fp = os.path.dirname(abs_fp)

        # Check and create base dir
        if not os.path.exists(dir_fp):
            os.makedirs(dir_fp)

        # Check if file exists
        if os.path.exists(abs_fp) and not overwrite:
            error_message = 'Local file already exists: {}'.format(abs_fp)
            raise IOError(error_message)

        with io.open(abs_fp, 'wb') as f:
            r = self.session.get(self._build_url(ID), stream=True)
            for chunk in r.iter_content(chunk_size=chuck_size):
                f.write(chunk)
        return r

    def get(self, ID):
        return self.session.get(self._build_url(ID))

    def get_dataframe(self, ID):
        '''
        Return the file endpoint's content as pandas DataFrame(s):
            'text/csv' / 'application/octet-stream': a single DataFrame
            'application/gzip': a dict of DataFrames, one per csv/parquet member
        '''
        supported_content = [
            'text/csv',
            'application/gzip',
            'application/octet-stream',
        ]
        r = self.get(ID)
        file_type = r.headers['Content-Type']
        if file_type not in supported_content:
            raise OasisException(f'Unsupported filetype for Dataframe conversion: {file_type}')

        if file_type == 'text/csv':
            return pd.read_csv(io.StringIO(r.content.decode('utf-8')))

        if file_type == 'application/octet-stream':
            return pd.read_parquet(io.BytesIO(r.content))

        if file_type == 'application/gzip':
            dataframes_list = {}
            tar = tarfile.open(fileobj=io.BytesIO(r.content))
            for member in [f for f in tar.getmembers() if '.csv' in f.name]:
                csv = tar.extractfile(member)
                dataframes_list[os.path.basename(member.name)] = pd.read_csv(csv)
            for member in [f for f in tar.getmembers() if '.parquet' in f.name]:
                pq = tar.extractfile(member)
                dataframes_list[os.path.basename(member.name)] = pd.read_parquet(pq)
            return dataframes_list

    def post(self, ID, data_object, content_type='application/json'):
        m = MultipartEncoder(fields={'file': ('data', data_object, content_type)})
        return self.session.post(
            self._build_url(ID),
            data=m,
            headers={'Content-Type': m.content_type}
        )

    def post_dataframe(self, ID, data_frame):
        csv_buffer = io.StringIO()
        data_frame.to_csv(csv_buffer, index=False)
        return self.post(ID, data_object=csv_buffer, content_type='text/csv')

    def delete(self, ID):
        return self.session.delete(self._build_url(ID))

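# Illustrative sketch (not part of this module): round-tripping a file resource
# such as /portfolios/{id}/location_file/ through pandas. The URL, ID and file
# paths are placeholders; `session` is assumed to be an authenticated APISession.
def _example_file_endpoint(session):
    location = FileEndpoint(session, 'http://localhost:8000/v2/portfolios/', 'location_file/')
    location.upload(1, './location.csv')   # content type inferred from the file extension
    df = location.get_dataframe(1)         # DataFrame for csv/parquet, dict of DataFrames for tar.gz
    location.post_dataframe(1, df)         # re-upload an edited DataFrame as CSV
    return df
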
class API_models(ApiEndpoint):
    def __init__(self, session, url_endpoint):
        super(API_models, self).__init__(session, url_endpoint)
        self.resource_file = FileEndpoint(self.session, self.url_endpoint, 'resource_file/')
        self.settings = JsonEndpoint(self.session, self.url_endpoint, 'settings/')
        self.versions = JsonEndpoint(self.session, self.url_endpoint, 'versions/')

        # Platform 2.0 only (check might be needed here)
        self.chunking_configuration = JsonEndpoint(self.session, self.url_endpoint, 'chunking_configuration/')
        self.scaling_configuration = JsonEndpoint(self.session, self.url_endpoint, 'scaling_configuration/')

    def data_files(self, ID):
        return self.session.get('{}{}/data_files'.format(self.url_endpoint, ID))

    def create(self, supplier_id, model_id, version_id, data_files=[]):
        data = {
            "supplier_id": supplier_id,
            "model_id": model_id,
            "version_id": version_id,
            "data_files": data_files
        }
        return self.session.post(self.url_endpoint, json=data)

    def update(self, ID, supplier_id, model_id, version_id, data_files=[]):
        data = {
            "supplier_id": supplier_id,
            "model_id": model_id,
            "version_id": version_id,
            "data_files": data_files
        }
        return self.session.put('{}{}/'.format(self.url_endpoint, ID), json=data)

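# Illustrative sketch (not part of this module): registering a model and attaching a
# settings document. The supplier/model/version values and the settings payload are
# placeholders; `session` is assumed to be an authenticated APISession.
def _example_register_model(session):
    models = API_models(session, 'http://localhost:8000/v2/models/')
    r = models.create(supplier_id='OasisLMF', model_id='PiWind', version_id='1')
    model_id = r.json()['id']
    models.settings.post(model_id, {'model_settings': {}})  # placeholder payload
    return models.versions.get(model_id).json()
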
class API_portfolios(ApiEndpoint):
    def __init__(self, session, url_endpoint):
        super(API_portfolios, self).__init__(session, url_endpoint)
        self.accounts_file = FileEndpoint(self.session, self.url_endpoint, 'accounts_file/')
        self.location_file = FileEndpoint(self.session, self.url_endpoint, 'location_file/')
        self.reinsurance_info_file = FileEndpoint(self.session, self.url_endpoint, 'reinsurance_info_file/')
        self.reinsurance_scope_file = FileEndpoint(self.session, self.url_endpoint, 'reinsurance_scope_file/')

    def create(self, name):
        data = {"name": name}
        return self.session.post(self.url_endpoint, json=data)

    def update(self, ID, name):
        data = {"name": name}
        return self.session.put('{}{}/'.format(self.url_endpoint, ID), json=data)

    def create_analyses(self, ID, name, model_id):
        """ Create a new analysis from an existing portfolio """
        data = {"name": name, "model": model_id}
        return self.session.post('{}{}/create_analysis/'.format(self.url_endpoint, ID), json=data)

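# Illustrative sketch (not part of this module): creating a portfolio, attaching an
# OED location file and spinning up an analysis from it. Names, paths and the model
# id are placeholders; `session` is assumed to be an authenticated APISession.
def _example_build_portfolio(session):
    portfolios = API_portfolios(session, 'http://localhost:8000/v2/portfolios/')
    portfolio_id = portfolios.create('example_portfolio').json()['id']
    portfolios.location_file.upload(portfolio_id, './location.csv')
    analysis = portfolios.create_analyses(portfolio_id, 'example_analysis', model_id=1)
    return analysis.json()
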
class API_datafiles(ApiEndpoint):
    def __init__(self, session, url_endpoint):
        super(API_datafiles, self).__init__(session, url_endpoint)
        self.content = FileEndpoint(self.session, self.url_endpoint, 'content/')

    def create(self, file_description, file_category=None):
        data = {"file_description": file_description}
        if file_category is not None:
            data["file_category"] = file_category
        return self.session.post(self.url_endpoint, json=data)

    def update(self, ID, file_description, file_category=None):
        data = {"file_description": file_description}
        if file_category is not None:
            data["file_category"] = file_category
        return self.session.put('{}{}/'.format(self.url_endpoint, ID), json=data)


class API_task_status(ApiEndpoint):
    def __init__(self, session, url_endpoint):
        super(API_task_status, self).__init__(session, url_endpoint)
        self.output_log = FileEndpoint(self.session, self.url_endpoint, 'output_log/')
        self.error_log = FileEndpoint(self.session, self.url_endpoint, 'error_log/')

class API_analyses(ApiEndpoint):
    def __init__(self, session, url_endpoint):
        super(API_analyses, self).__init__(session, url_endpoint)
        self.lookup_errors_file = FileEndpoint(self.session, self.url_endpoint, 'lookup_errors_file/')
        self.lookup_success_file = FileEndpoint(self.session, self.url_endpoint, 'lookup_success_file/')
        self.lookup_validation_file = FileEndpoint(self.session, self.url_endpoint, 'lookup_validation_file/')
        self.summary_levels_file = FileEndpoint(self.session, self.url_endpoint, 'summary_levels_file/')
        self.input_file = FileEndpoint(self.session, self.url_endpoint, 'input_file/')
        self.input_generation_traceback_file = FileEndpoint(self.session, self.url_endpoint, 'input_generation_traceback_file/')
        self.output_file = FileEndpoint(self.session, self.url_endpoint, 'output_file/')
        self.run_traceback_file = FileEndpoint(self.session, self.url_endpoint, 'run_traceback_file/')
        self.run_log_file = FileEndpoint(self.session, self.url_endpoint, 'run_log_file/')
        self.settings_file = FileEndpoint(self.session, self.url_endpoint, 'settings_file/')
        self.settings = JsonEndpoint(self.session, self.url_endpoint, 'settings/')

    def create(self, name, portfolio_id, model_id, data_files=[]):
        data = {
            "name": name,
            "portfolio": portfolio_id,
            "model": model_id,
            "complex_model_data_files": data_files
        }
        return self.session.post(self.url_endpoint, json=data)

    def update(self, ID, name, portfolio_id, model_id, data_files=[]):
        data = {
            "name": name,
            "portfolio": portfolio_id,
            "model": model_id,
            "complex_model_data_files": data_files
        }
        return self.session.put('{}{}/'.format(self.url_endpoint, ID), json=data)

    def status(self, ID):
        return self.get(ID).json()['status']

    def generate(self, ID):
        return self.session.post('{}{}/generate_inputs/'.format(self.url_endpoint, ID), json={})

    def run(self, ID):
        return self.session.post('{}{}/run/'.format(self.url_endpoint, ID), json={})

    def generate_and_run(self, ID):
        return self.session.post('{}{}/generate_and_run/'.format(self.url_endpoint, ID), json={})

    def cancel_analysis_run(self, ID):
        return self.session.post('{}{}/cancel_analysis_run/'.format(self.url_endpoint, ID), json={})

    def cancel_generate_inputs(self, ID):
        return self.session.post('{}{}/cancel_generate_inputs/'.format(self.url_endpoint, ID), json={})

    def cancel(self, ID):
        return self.session.post('{}{}/cancel/'.format(self.url_endpoint, ID), json={})

    def copy(self, ID):
        return self.session.post('{}{}/copy/'.format(self.url_endpoint, ID), json={})

    def data_files(self, ID):
        return self.session.get('{}{}/data_files/'.format(self.url_endpoint, ID))

    def sub_task_list(self, ID):
        return self.session.get('{}{}/sub_task_list/'.format(self.url_endpoint, ID))

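# Illustrative sketch (not part of this module): driving an analysis directly through
# API_analyses and polling its status. The URL, analysis id and poll interval are
# placeholders; APIClient.run_generate / run_analysis below wrap this pattern with
# logging and sub-task progress reporting.
def _example_poll_inputs_generation(session, analysis_id):
    analyses = API_analyses(session, 'http://localhost:8000/v2/analyses/')
    analyses.generate(analysis_id)
    while analyses.status(analysis_id) not in ('READY', 'INPUTS_GENERATION_ERROR', 'INPUTS_GENERATION_CANCELLED'):
        time.sleep(5)
    return analyses.status(analysis_id)
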
# --- API Main Client ------------------------------------------------------- #
class APIClient(object):
    def __init__(self, api_url='http://localhost:8000', api_ver='V2', username='admin',
                 password='password', timeout=25, logger=None, **kwargs):
        self.logger = logger or logging.getLogger(__name__)

        self.api = APISession(api_url, username, password, timeout, **kwargs)
        self.api_ver = api_ver.lower()
        self.models = API_models(self.api, '{}{}/models/'.format(self.api.url_base, self.api_ver))
        self.portfolios = API_portfolios(self.api, '{}{}/portfolios/'.format(self.api.url_base, self.api_ver))
        self.analyses = API_analyses(self.api, '{}{}/analyses/'.format(self.api.url_base, self.api_ver))
        self.data_files = API_datafiles(self.api, '{}{}/data_files/'.format(self.api.url_base, self.api_ver))
        self.task_status = API_task_status(self.api, '{}{}/analysis-task-statuses/'.format(self.api.url_base, self.api_ver))

    def oed_peril_codes(self):
        return self.api.get('{}oed_peril_codes/'.format(self.api.url_base))

    def server_info(self):
        return self.api.get('{}server_info/'.format(self.api.url_base))

    def healthcheck(self):
        return self.api.get('{}healthcheck/'.format(self.api.url_base))
    def upload_inputs(self, portfolio_name=None, portfolio_id=None,
                      location_fp=None, accounts_fp=None, ri_info_fp=None, ri_scope_fp=None):
        if not portfolio_name:
            portfolio_name = time.strftime("Portfolio_%d%m%Y-%H%M%S")

        try:
            if portfolio_id:
                self.logger.info('Updating existing portfolio')
                portfolio = self.portfolios.update(portfolio_id, portfolio_name)
            else:
                self.logger.info('Creating portfolio')
                portfolio = self.portfolios.create(portfolio_name)
                portfolio_id = portfolio.json()['id']

            # Upload exposure
            if location_fp:
                self.portfolios.location_file.upload(portfolio_id, location_fp)
                self.logger.info("File uploaded: {}".format(location_fp))
            if accounts_fp:
                self.portfolios.accounts_file.upload(portfolio_id, accounts_fp)
                self.logger.info("File uploaded: {}".format(accounts_fp))
            if ri_info_fp:
                self.portfolios.reinsurance_info_file.upload(portfolio_id, ri_info_fp)
                self.logger.info("File uploaded: {}".format(ri_info_fp))
            if ri_scope_fp:
                self.portfolios.reinsurance_scope_file.upload(portfolio_id, ri_scope_fp)
                self.logger.info("File uploaded: {}".format(ri_scope_fp))

            return portfolio.json()
        except HTTPError as e:
            self.api.unrecoverable_error(e, 'upload_inputs: failed')
    def upload_settings(self, analyses_id, settings):
        """ Upload analysis run settings to the API.

        Posts JSON data directly, or uploads a settings file containing JSON data.

        :param analyses_id: Analysis {id} from `v1/analyses/{id}/settings`
        :type analyses_id: int

        :param settings: Either a valid filepath or a dictionary holding the settings
        :type settings: [str, dict]

        :return: None
        :rtype: None
        """
        if isinstance(settings, dict):
            self.analyses.settings.post(analyses_id, settings)
            self.logger.info("Settings JSON uploaded: {}".format(settings))
        elif os.path.isfile(str(settings)):
            with io.open(settings, 'r', encoding='utf-8') as f:
                data = json.load(f)
            self.analyses.settings.post(analyses_id, data)
            self.logger.info("Settings JSON uploaded: {}".format(settings))
        else:
            raise TypeError("'settings': not a valid filepath or dictionary")
    def create_analysis(self, portfolio_id, model_id, analysis_name=None, analysis_settings_fp=None):
        try:
            if not analysis_name:
                analysis_name = time.strftime("Analysis_%d%m%Y-%H%M%S")

            analyses = self.analyses.create(analysis_name, portfolio_id, model_id).json()
            if analysis_settings_fp:
                self.upload_settings(analyses['id'], analysis_settings_fp)
            return analyses
        except HTTPError as e:
            self.api.unrecoverable_error(e, 'create_analysis: failed')
    def run_generate(self, analysis_id, poll_interval=5):
        """
        Generates the inputs for the analysis based on the portfolio.
        The analysis must have one of the following statuses: `NEW`,
        `INPUTS_GENERATION_ERROR`, `INPUTS_GENERATION_CANCELLED`, `READY`,
        `RUN_COMPLETED`, `RUN_CANCELLED` or `RUN_ERROR`.
        """
        try:
            r = self.analyses.generate(analysis_id)
            analysis = r.json()
            self.logger.info('Inputs Generation: Starting (id={})'.format(analysis_id))

            logged_queued = None
            logged_running = None
            while True:
                if analysis['status'] in ['READY']:
                    self.logger.info('Inputs Generation: Complete (id={})'.format(analysis_id))
                    return True

                elif analysis['status'] in ['INPUTS_GENERATION_CANCELLED']:
                    self.logger.info('Input Generation: Cancelled (id={})'.format(analysis_id))
                    return False

                elif analysis['status'] in ['INPUTS_GENERATION_ERROR']:
                    self.logger.info('Input Generation: Failed (id={})'.format(analysis_id))
                    error_trace = self.analyses.input_generation_traceback_file.get(analysis_id).text
                    self.logger.error("\nServer logs:")
                    self.logger.error(error_trace)
                    return False

                elif analysis['status'] in ['INPUTS_GENERATION_QUEUED']:
                    if not logged_queued:
                        logged_queued = True
                        self.logger.info('Input Generation: Queued (id={})'.format(analysis_id))
                    time.sleep(poll_interval)
                    r = self.analyses.get(analysis_id)
                    analysis = r.json()
                    continue

                elif analysis['status'] in ['INPUTS_GENERATION_STARTED']:
                    if not logged_running:
                        logged_running = True
                        self.logger.info('Input Generation: Executing (id={})'.format(analysis_id))

                    if analysis.get('run_mode', '') == 'V2':
                        sub_tasks_list = self.analyses.sub_task_list(analysis_id).json()
                        with tqdm(total=len(sub_tasks_list), unit=' sub_task', desc='Input Generation') as pbar:
                            completed = []
                            while len(completed) < len(sub_tasks_list):
                                sub_tasks_list = self.analyses.sub_task_list(analysis_id).json()
                                analysis = self.analyses.get(analysis_id).json()
                                completed = [tsk for tsk in sub_tasks_list if tsk['status'] == 'COMPLETED']
                                pbar.update(len(completed) - pbar.n)
                                time.sleep(poll_interval)

                                # Exit conditions
                                if ('_CANCELLED' in analysis['status']) or ('_ERROR' in analysis['status']):
                                    break
                                elif 'READY' in analysis['status']:
                                    pbar.update(pbar.total - pbar.n)
                                    break
                    else:
                        time.sleep(poll_interval)
                        analysis = self.analyses.get(analysis_id).json()
                    continue

                else:
                    err_msg = "Input Generation: Unknown state '{}'".format(analysis['status'])
                    raise OasisException(err_msg)

        except HTTPError as e:
            self.api.unrecoverable_error(e, 'run_generate: failed')
    def run_analysis(self, analysis_id, analysis_settings_fp=None, poll_interval=5):
        """
        Runs the analysis. The analysis must have one of the following
        statuses: `NEW`, `RUN_COMPLETED`, `RUN_CANCELLED` or `RUN_ERROR`.
        """
        try:
            if analysis_settings_fp:
                self.upload_settings(analysis_id, analysis_settings_fp)

            analysis = self.analyses.run(analysis_id).json()
            self.logger.info('Analysis Run: Starting (id={})'.format(analysis_id))

            logged_queued = None
            logged_running = None
            while True:
                if analysis['status'] in ['RUN_COMPLETED']:
                    self.logger.info('Analysis Run: Complete (id={})'.format(analysis_id))
                    return True

                elif analysis['status'] in ['RUN_CANCELLED']:
                    self.logger.info('Analysis Run: Cancelled (id={})'.format(analysis_id))
                    return False

                elif analysis['status'] in ['RUN_ERROR']:
                    self.logger.error('Analysis Run: Failed (id={})'.format(analysis_id))
                    error_trace = self.analyses.run_traceback_file.get(analysis_id).text
                    self.logger.error("\nServer logs:")
                    self.logger.error(error_trace)
                    return False

                elif analysis['status'] in ['RUN_QUEUED']:
                    if not logged_queued:
                        logged_queued = True
                        self.logger.info('Analysis Run: Queued (id={})'.format(analysis_id))
                    time.sleep(poll_interval)
                    r = self.analyses.get(analysis_id)
                    analysis = r.json()
                    continue

                elif analysis['status'] in ['RUN_STARTED']:
                    if not logged_running:
                        logged_running = True
                        self.logger.info('Analysis Run: Executing (id={})'.format(analysis_id))

                    if analysis.get('run_mode', '') == 'V2':
                        sub_tasks_list = self.analyses.sub_task_list(analysis_id).json()
                        with tqdm(total=len(sub_tasks_list), unit=' sub_task', desc='Analysis Run') as pbar:
                            completed = []
                            while len(completed) < len(sub_tasks_list):
                                sub_tasks_list = self.analyses.sub_task_list(analysis_id).json()
                                analysis = self.analyses.get(analysis_id).json()
                                completed = [tsk for tsk in sub_tasks_list if tsk['status'] == 'COMPLETED']
                                pbar.update(len(completed) - pbar.n)
                                time.sleep(poll_interval)

                                # Exit conditions
                                if ('_CANCELLED' in analysis['status']) or ('_ERROR' in analysis['status']):
                                    break
                                elif 'COMPLETED' in analysis['status']:
                                    pbar.update(pbar.total - pbar.n)
                                    break
                    else:
                        time.sleep(poll_interval)
                        analysis = self.analyses.get(analysis_id).json()
                    continue

                else:
                    err_msg = "Execution status in unknown state: '{}'".format(analysis['status'])
                    self.logger.error(err_msg)
                    raise OasisException(err_msg)

        except HTTPError as e:
            self.api.unrecoverable_error(e, 'run_analysis: failed')
    def download_output(self, analysis_id, download_path='', filename=None, clean_up=False, overwrite=True):
        if not filename:
            filename = 'analysis_{}_output.tar.gz'.format(analysis_id)

        try:
            output_file = os.path.join(download_path, filename)
            self.analyses.output_file.download(ID=analysis_id, file_path=output_file, overwrite=overwrite)
            self.logger.info('Analysis Download output: filename={}, (id={})'.format(output_file, analysis_id))
            if clean_up:
                self.analyses.delete(analysis_id)
        except HTTPError as e:
            err_msg = 'Analysis Download output: Failed (id={})'.format(analysis_id)
            self.api.unrecoverable_error(e, err_msg)
    def cancel_generate(self, analysis_id):
        """
        Cancels an in-progress inputs generation. The analysis status must be
        `GENERATING_INPUTS`.
        """
        try:
            self.analyses.cancel_generate_inputs(analysis_id)
            self.logger.info('Cancelled Input generation: (Id={})'.format(analysis_id))
        except HTTPError as e:
            self.api.unrecoverable_error(e, 'cancel_generate: Failed')
    def cancel_analysis(self, analysis_id):
        """
        Cancels a currently running analysis. The analysis must have one of the
        following statuses: `PENDING` or `STARTED`.
        """
        try:
            self.analyses.cancel_analysis_run(analysis_id)
            self.logger.info('Cancelled analysis run: (Id={})'.format(analysis_id))
        except HTTPError as e:
            self.api.unrecoverable_error(e, 'cancel_analysis: Failed')
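
# Illustrative end-to-end sketch (not part of this module): the typical APIClient
# workflow of uploading exposure, creating an analysis, generating inputs, running,
# and downloading outputs. The URL, credentials, file paths and model id are
# placeholders and would be replaced with values for a real Oasis Platform server.
def _example_end_to_end():
    client = APIClient(api_url='http://localhost:8000', username='admin', password='password')
    portfolio = client.upload_inputs(location_fp='./location.csv', accounts_fp='./account.csv')
    analysis = client.create_analysis(portfolio_id=portfolio['id'], model_id=1,
                                      analysis_settings_fp='./analysis_settings.json')
    if client.run_generate(analysis['id']) and client.run_analysis(analysis['id']):
        client.download_output(analysis['id'], download_path='./outputs')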