Source code for sampledb.searchresult

import pandas as pd
from pprint import pformat
from functools import reduce


class SearchResult(object):
    """
    An object containing the matching results of a search on the database.

    The matches are stored in ``self.results``, a pandas DataFrame built from
    the constructor argument. Non-empty results are sorted by every column
    (in column order) and re-indexed from 0.
    """

    def __init__(self, results):
        """
        Create a SearchResult.

        :param results: any value accepted by ``pandas.DataFrame`` (for
            example a list of dicts or another DataFrame).
        """
        frame = pd.DataFrame(results)
        if frame.size:
            # Put rows in a canonical order so that __eq__ does not depend
            # on the order in which the rows were supplied.
            frame = frame.sort_values(list(frame.columns))
            frame = frame.reset_index(drop=True)
        self.results = frame

    def __repr__(self):
        """Return the results pretty-printed as ``{row_index: {column: value}}``."""
        return pformat(self.results.T.to_dict())

    def __str__(self):
        """Return the same text as ``__repr__``."""
        return pformat(self.results.T.to_dict())

    def __eq__(self, other):
        """
        Two SearchResults are equal when they are of exactly the same type
        and their DataFrames compare equal with ``DataFrame.equals``.
        """
        if type(other) is type(self):
            return self.results.equals(other.results)
        return False

    def __ne__(self, other):
        """Return the negation of ``__eq__``."""
        return not self.__eq__(other)

    @staticmethod
    def _titleize(name):
        """Turn a column name such as ``sample_id`` into ``Sample Id``."""
        return name.replace('_', ' ').title()

    def count(self):
        """
        Returns the number of samples that match the search.
        """
        return len(self.results)

    def filter(self, indices):
        """
        Filter the search results.
        Returns new SearchResult with only the filtered results.

        :param indices: row index labels to keep; labels that are not
            present in the results are ignored.
        """
        df = self.results.filter(items=indices, axis=0)
        return SearchResult(df.reset_index(drop=True))

    def download(self, filename, schema=None):
        """
        Download the search results as a spreadsheet.

        Column names are converted to title case with underscores replaced
        by spaces. Columns listed in ``schema['order']`` come first, in that
        order; the remaining columns follow in their existing order. Each
        spreadsheet column is sized to fit its widest value or its header.

        :param filename: path of the ``.xlsx`` file to write.
        :param schema: optional dict; only its ``'order'`` key (a list of
            column names) is read here.
        :raises ValueError: if two columns end up with the same title.
        """
        if len(self.results) == 0:
            print('You cannot download an empty spreadsheet.')
            return
        if schema is None:
            schema = {}

        titles = [self._titleize(name) for name in self.results.columns]
        if len(set(titles)) != len(titles):
            # Duplicate headers would make df[name] return a DataFrame and
            # silently break the width computation below.
            raise ValueError('columns overlap after converting to titles')
        df = self.results.rename(columns=self._titleize)

        # dict.fromkeys drops repeated entries while keeping first-seen order.
        wanted = (self._titleize(o) for o in schema.get('order', []))
        order = list(dict.fromkeys(t for t in wanted if t in titles))
        order += [t for t in titles if t not in order]
        df = df[order]

        sheet_name = 'Sheet1'
        # The context manager saves and closes the workbook, even when
        # writing fails part-way through.
        with pd.ExcelWriter(filename, engine='xlsxwriter') as writer:
            df.to_excel(writer, sheet_name=sheet_name, index=False)
            sheet = writer.sheets[sheet_name]
            for i, name in enumerate(df):
                width = max(len(str(val)) for val in df[name])
                width = max(width, len(name)) + 1
                sheet.set_column(i, i, width)