# Source code for overture_song.client

# Copyright (c) 2018 The Ontario Institute for Cancer Research. All rights
# reserved.
#
# This program and the accompanying materials are made available under the
# terms of the GNU Public License v3.0. You should have received a copy of
# the GNU General Public License along with
# this program. If not, see <http://www.gnu.org/licenses/>.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
# ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
# CONSEQUENTIAL DAMAGES (INCLUDING,BUT NOT LIMITED TO, PROCUREMENT OF
# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,OR PROFITS; OR BUSINESS
# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
# IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
# POSSIBILITY OF SUCH DAMAGE.
#

import json
import logging
import os

from urllib3.exceptions import NewConnectionError

from overture_song.entities import Study
from overture_song.model import ManifestEntry, Manifest, SongError, ServerErrors
from overture_song.rest import ObjectRest
from overture_song.utils import SongClientException, convert_to_url_param_list, \
    check_type, write_object, check_state, check_song_state

# Module-level logger shared by the client classes in this file.
log = logging.getLogger("song.client")
# Importing this module also requests INFO-level configuration of the root
# logger.
logging.basicConfig(level=logging.INFO)



class Api(object):
    """Client for the SONG server REST API.

    Each public method builds its URL through ``Endpoints``, sends the request
    through ``ObjectRest`` and returns whatever the REST layer returns. Every
    request method except :meth:`is_alive` calls :meth:`check_is_alive` first.
    """

    def __init__(self, config):
        """Create the REST helper and the endpoint builder from ``config``.

        :param config: object exposing ``access_token``, ``debug`` and
            ``server_url``; study-scoped methods additionally read
            ``study_id`` from it.
        """
        self.__config = config
        self.__rest = ObjectRest(access_token=config.access_token, debug=config.debug)
        self.__endpoints = Endpoints(config.server_url)

    @property
    def config(self):
        """The configuration object this client was created with."""
        return self.__config

    def upload(self, json_payload, is_async_validation=False):
        """POST ``json_payload`` to the upload endpoint of the configured study.

        :param json_payload: data passed to the REST layer as ``dict_data``
        :param is_async_validation: forwarded to the endpoint builder to
            select the asynchronous upload endpoint
        :return: the REST layer's response
        """
        self.check_is_alive()
        endpoint = self.__endpoints.upload(
            self.config.study_id, is_async_validation=is_async_validation)
        return self.__rest.post(endpoint, dict_data=json_payload)

    def status(self, upload_id):
        """GET the status of the upload ``upload_id`` in the configured study."""
        self.check_is_alive()
        endpoint = self.__endpoints.status(self.config.study_id, upload_id)
        return self.__rest.get(endpoint)

    def save(self, upload_id, ignore_analysis_id_collisions=False):
        """POST to the save endpoint for ``upload_id`` in the configured study.

        :param upload_id: id of the upload to save
        :param ignore_analysis_id_collisions: forwarded to the endpoint
            builder as the ``ignoreAnalysisIdCollisions`` query value
        :return: the REST layer's response
        """
        self.check_is_alive()
        endpoint = self.__endpoints.save_by_id(
            self.config.study_id, upload_id,
            ignore_analysis_id_collisions=ignore_analysis_id_collisions)
        return self.__rest.post(endpoint)

    def get_analysis_files(self, analysis_id):
        """GET the files of ``analysis_id`` in the configured study."""
        self.check_is_alive()
        endpoint = self.__endpoints.get_analysis_files(self.config.study_id, analysis_id)
        return self.__rest.get(endpoint)

    def get_analysis(self, analysis_id):
        """GET the analysis ``analysis_id`` of the configured study."""
        self.check_is_alive()
        endpoint = self.__endpoints.get_analysis(self.config.study_id, analysis_id)
        return self.__rest.get(endpoint)

    def is_alive(self):
        """Return whether the server answered the ``isAlive`` request.

        :return: ``True`` when the GET returned something other than ``None``;
            ``False`` when it returned ``None`` or a ``NewConnectionError``
            was raised (the error is logged only when ``config.debug`` is set).
        """
        endpoint = self.__endpoints.is_alive()
        try:
            return self.__rest.get(endpoint) is not None
        except NewConnectionError as error:
            if self.config.debug:
                log.error(error)
            return False

    def publish(self, analysis_id):
        """PUT to the publish endpoint for ``analysis_id`` in the configured study."""
        self.check_is_alive()
        endpoint = self.__endpoints.publish(self.config.study_id, analysis_id)
        return self.__rest.put(endpoint)

    def unpublish(self, analysis_id):
        """PUT to the unpublish endpoint for ``analysis_id`` in the configured study."""
        self.check_is_alive()
        endpoint = self.__endpoints.unpublish(self.config.study_id, analysis_id)
        return self.__rest.put(endpoint)

    def suppress(self, analysis_id):
        """PUT to the suppress endpoint for ``analysis_id`` in the configured study."""
        self.check_is_alive()
        endpoint = self.__endpoints.suppress(self.config.study_id, analysis_id)
        return self.__rest.put(endpoint)

    def id_search(self, sample_id=None, specimen_id=None, donor_id=None, file_id=None):
        """GET the id-search endpoint of the configured study.

        The four ids are passed through to the endpoint builder unchanged.
        """
        self.check_is_alive()
        endpoint = self.__endpoints.id_search(
            self.config.study_id,
            sample_id=sample_id,
            specimen_id=specimen_id,
            donor_id=donor_id,
            file_id=file_id)
        return self.__rest.get(endpoint)

    def info_search(self, is_include_info, **search_terms):
        """GET the info-search endpoint of the configured study.

        :param is_include_info: forwarded as the ``includeInfo`` query value
        :param search_terms: forwarded to the endpoint builder as extra
            query parameters
        """
        self.check_is_alive()
        endpoint = self.__endpoints.info_search(
            self.config.study_id, is_include_info, **search_terms)
        return self.__rest.get(endpoint)

    def get_study(self, study_id):
        """GET the study ``study_id``."""
        self.check_is_alive()
        endpoint = self.__endpoints.get_study(study_id)
        return self.__rest.get(endpoint)

    def get_schema(self, schema_id):
        """GET the schema ``schema_id``."""
        self.check_is_alive()
        endpoint = self.__endpoints.get_schema(schema_id)
        return self.__rest.get(endpoint)

    def list_schemas(self):
        """GET the schema list endpoint."""
        self.check_is_alive()
        endpoint = self.__endpoints.list_schemas()
        return self.__rest.get(endpoint)

    def get_entire_study(self, study_id):
        """GET the ``all`` endpoint of the study ``study_id``."""
        self.check_is_alive()
        endpoint = self.__endpoints.get_entire_study(study_id)
        return self.__rest.get(endpoint)

    def get_all_studies(self):
        """GET the endpoint listing all studies."""
        self.check_is_alive()
        endpoint = self.__endpoints.get_all_studies()
        return self.__rest.get(endpoint)

    def save_study(self, study):
        """POST ``study.__dict__`` to the save endpoint for ``study.studyId``."""
        self.check_is_alive()
        endpoint = self.__endpoints.save_study(study.studyId)
        return self.__rest.post(endpoint, dict_data=study.__dict__)

    def update_file(self, object_id, file_update_request):
        """PUT an update for the file ``object_id`` of the configured study.

        :param object_id: id of the file to update
        :param file_update_request: object whose ``to_dict()`` result is sent
            as the request body; entries whose value is ``None`` are dropped
            before sending
        :return: the REST layer's response
        """
        self.check_is_alive()
        endpoint = self.__endpoints.update_file(self.config.study_id, object_id)
        payload = Api.__remove_null_keys(file_update_request.to_dict())
        return self.__rest.put(endpoint, dict_data=payload)

    def check_is_alive(self):
        """Pass the result of :meth:`is_alive` to ``check_state``.

        NOTE(review): ``check_state`` is presumably what raises when the
        server is unreachable -- confirm in ``overture_song.utils``.
        """
        check_state(
            self.is_alive(),
            "The SONG server may not be running on '{}'".format(self.config.server_url))

    @classmethod
    def __remove_null_keys(cls, d):
        """Return a new dict holding only the entries of ``d`` whose value is not ``None``."""
        return {key: value for key, value in d.items() if value is not None}


class StudyClient(object):
    """Study-level operations built on top of an ``Api`` instance."""

    def __init__(self, api):
        """
        :param api: the ``Api`` instance used for all requests; validated
            with ``check_type``
        """
        check_type(api, Api)
        self.__api = api

    def create(self, study):
        """Save ``study`` through the API. The API response is not returned."""
        self.__api.save_study(study)

    def has(self, study_id):
        """Return whether the server knows the study ``study_id``.

        :return: ``True`` when the API returned something other than ``None``;
            ``False`` when it returned ``None`` or raised a ``SongError``
            whose ``errorId`` is the ``STUDY_ID_DOES_NOT_EXIST`` server error.
        :raises SongError: any other ``SongError`` is propagated unchanged
        """
        try:
            return self.__api.get_study(study_id) is not None
        except SongError as error:
            if error.errorId == ServerErrors.STUDY_ID_DOES_NOT_EXIST.get_error_id():
                return False
            # Bare raise re-raises the active exception with its original traceback.
            raise

    def read(self, study_id):
        """Fetch the study ``study_id`` and convert it with ``Study.create_from_raw``."""
        response = self.__api.get_study(study_id)
        return Study.create_from_raw(response)


class UploadClient(object):
    """Upload-related operations built on top of an ``Api`` instance."""

    def __init__(self, api):
        """
        :param api: the ``Api`` instance used for all requests
        :raises SongClientException: when ``api`` is not an ``Api`` instance
        """
        if not isinstance(api, Api):
            raise SongClientException('upload.client', "The argument must be an instance of Api")
        self.__api = api

    def upload_file(self, file_path, is_async_validation=False):
        """Parse the JSON file at ``file_path`` and upload its content.

        :param file_path: path of the JSON payload file
        :param is_async_validation: forwarded to ``Api.upload``
        :return: the result of ``Api.upload``
        :raises SongClientException: when ``file_path`` does not exist
        """
        if not os.path.exists(file_path):
            raise SongClientException('upload.client', "The file {} does not exist".format(file_path))

        # JSON is read as UTF-8 so decoding does not depend on the platform's
        # default encoding. Parsing both validates the file and produces the
        # payload that is uploaded.
        with open(file_path, 'r', encoding='utf-8') as file_content:
            json_data = json.load(file_content)

        # The file is closed before the network request is made.
        return self.__api.upload(json_data, is_async_validation=is_async_validation)

    def check_upload_status(self, upload_id):
        """Return the result of ``Api.status`` for ``upload_id``."""
        return self.__api.status(upload_id)

    def save(self, upload_id, ignore_analysis_id_collisions=False):
        """Return the result of ``Api.save`` for ``upload_id``.

        :param ignore_analysis_id_collisions: forwarded to ``Api.save``
        """
        return self.__api.save(upload_id, ignore_analysis_id_collisions=ignore_analysis_id_collisions)

    def publish(self, analysis_id):
        """Return the result of ``Api.publish`` for ``analysis_id``."""
        return self.__api.publish(analysis_id)


class ManifestClient(object):
    """Builds and writes manifests for the files of an analysis."""

    def __init__(self, api):
        """
        :param api: the ``Api`` instance used to look up analysis files
        :raises SongClientException: when ``api`` is not an ``Api`` instance
        """
        if not isinstance(api, Api):
            raise SongClientException("manifest.service", "The argument must be an instance of Api")
        self.__api = api

    def create_manifest(self, source_dir, analysis_id):
        """Build a ``Manifest`` with one entry per file of ``analysis_id``.

        :param source_dir: passed to ``ManifestEntry.create_manifest_entry``
            together with each file object returned by the API
        :param analysis_id: analysis whose files are listed
        :return: the populated ``Manifest``
        """
        manifest = Manifest(analysis_id)
        for file_object in self.__api.get_analysis_files(analysis_id):
            manifest.add_entry(ManifestEntry.create_manifest_entry(source_dir, file_object))
        return manifest

    def write_manifest(self, analysis_id, source_dir, output_file_path):
        """Create the manifest for ``analysis_id`` and write it to ``output_file_path``.

        Two conditions are handed to ``check_song_state`` before writing:
        that ``source_dir`` exists, and that every entry's ``fileName``
        exists on disk. The manifest is written with ``overwrite=True``.

        NOTE(review): ``check_song_state`` presumably raises when the
        condition is false -- confirm in ``overture_song.utils``.
        """
        check_song_state(os.path.exists(source_dir), "manifest.service",
                         "The source directory '{}' does not exist", source_dir)
        manifest = self.create_manifest(source_dir, analysis_id)
        missing_files = [
            entry.fileName for entry in manifest.entries
            if not os.path.exists(entry.fileName)
        ]

        check_song_state(not missing_files, "manifest.service",
                         "The following files do not exist: \n '{}'",
                         "',\n'".join(missing_files))

        write_object(manifest, output_file_path, overwrite=True)


class Endpoints(object):
    """Builds the URLs of the SONG server REST endpoints.

    Every method returns a string that starts with the ``server_url`` given
    to the constructor; no request is made here.
    """

    def __init__(self, server_url):
        """
        :param server_url: base URL prepended verbatim to every endpoint path
        """
        self.__server_url = server_url

    def upload(self, study_id, is_async_validation=False):
        """URL of the upload endpoint; the ``/async`` variant when ``is_async_validation`` is true."""
        if is_async_validation:
            return "{}/upload/{}/async".format(self.__server_url, study_id)
        return "{}/upload/{}".format(self.__server_url, study_id)

    def save_by_id(self, study_id, upload_id, ignore_analysis_id_collisions=False):
        """URL of the save endpoint for an upload.

        :param ignore_analysis_id_collisions: formatted as-is into the
            ``ignoreAnalysisIdCollisions`` query parameter; defaults to
            ``False``
        """
        return "{}/upload/{}/save/{}?ignoreAnalysisIdCollisions={}".format(
            self.__server_url, study_id, upload_id, ignore_analysis_id_collisions)

    def status(self, study_id, upload_id):
        """URL of the status endpoint for an upload."""
        return "{}/upload/{}/status/{}".format(self.__server_url, study_id, upload_id)

    def get_analysis_files(self, study_id, analysis_id):
        """URL listing the files of an analysis."""
        return "{}/studies/{}/analysis/{}/files".format(self.__server_url, study_id, analysis_id)

    def get_analysis(self, study_id, analysis_id):
        """URL of a single analysis."""
        return "{}/studies/{}/analysis/{}".format(self.__server_url, study_id, analysis_id)

    def is_alive(self):
        """URL of the ``isAlive`` endpoint."""
        return "{}/isAlive".format(self.__server_url)

    def update_file(self, study_id, object_id):
        """URL of a single file of a study."""
        return "{}/studies/{}/files/{}".format(self.__server_url, study_id, object_id)

    def publish(self, study_id, analysis_id):
        """URL of the publish endpoint for an analysis."""
        return "{}/studies/{}/analysis/publish/{}".format(self.__server_url, study_id, analysis_id)

    def unpublish(self, study_id, analysis_id):
        """URL of the unpublish endpoint for an analysis."""
        return "{}/studies/{}/analysis/unpublish/{}".format(self.__server_url, study_id, analysis_id)

    def suppress(self, study_id, analysis_id):
        """URL of the suppress endpoint for an analysis."""
        return "{}/studies/{}/analysis/suppress/{}".format(self.__server_url, study_id, analysis_id)

    def list_schemas(self):
        """URL of the schema list endpoint."""
        return "{}/schema/list".format(self.__server_url)

    def get_schema(self, schema_id):
        """URL of a single schema."""
        return "{}/schema/{}".format(self.__server_url, schema_id)

    def id_search(self, study_id, sample_id=None, specimen_id=None, donor_id=None, file_id=None):
        """URL of the id-search endpoint.

        Each id that is not ``None`` becomes a query parameter named
        ``sampleId``, ``specimenId``, ``donorId`` or ``fileId`` respectively.
        """
        return self.__id_search(
            study_id,
            sampleId=sample_id,
            specimenId=specimen_id,
            donorId=donor_id,
            fileId=file_id)

    def __id_search(self, study_id, **kwargs):
        """Join the non-``None`` keyword arguments into the id-search query string."""
        # str.format accepts any value type, so ids given as ints also work;
        # values are inserted as-is, without URL encoding.
        params = '&'.join(
            "{}={}".format(key, value)
            for key, value in kwargs.items()
            if value is not None)
        return "{}/studies/{}/analysis/search/id?{}".format(self.__server_url, study_id, params)

    def info_search(self, study_id, is_include_info, **search_terms):
        """URL of the info-search endpoint.

        :param is_include_info: formatted as-is into the ``includeInfo``
            query parameter
        :param search_terms: converted by ``convert_to_url_param_list`` and
            appended, joined with ``&``
        """
        params = '&'.join(convert_to_url_param_list(**search_terms))
        return "{}/studies/{}/analysis/search/info?includeInfo={}&{}".format(
            self.__server_url, study_id, is_include_info, params)

    def get_entire_study(self, study_id):
        """URL of the ``all`` endpoint of a study."""
        return "{}/studies/{}/all".format(self.__server_url, study_id)

    def get_all_studies(self):
        """URL listing all studies."""
        return "{}/studies/all".format(self.__server_url)

    def get_study(self, study_id):
        """URL of a single study."""
        return "{}/studies/{}".format(self.__server_url, study_id)

    def save_study(self, study_id):
        """URL used to save a study (note the trailing slash)."""
        return "{}/studies/{}/".format(self.__server_url, study_id)