aboutsummaryrefslogtreecommitdiff
path: root/wqflask/base/species.py
blob: 0ee046302e43e51069a69d4d4cd6c4c0a720f4ef (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
from collections import OrderedDict
from dataclasses import dataclass
from dataclasses import InitVar
from typing import Optional, Dict, Any, Union
from wqflask.database import database_connection


@dataclass
class TheSpecies:
    """Species record that exposes the species' chromosomes.

    Attributes set by the constructor:
        dataset: optional dataset, forwarded unchanged to ``Chromosomes``.
        species_name: optional species name, forwarded to ``Chromosomes``
            as its ``species`` argument.

    Attributes set in ``__post_init__``:
        name: alias of ``species_name``.
        chromosomes: a ``Chromosomes`` instance built from the two
            fields above.
    """
    dataset: Optional[Dict] = None
    species_name: Optional[str] = None

    def __post_init__(self) -> None:
        """Populate the ``name`` alias and the ``chromosomes`` helper."""
        # ``name`` simply mirrors ``species_name``; None is acceptable here.
        self.name = self.species_name
        # NOTE(review): the connection is handed to Chromosomes inside this
        # ``with`` block, but Chromosomes.chromosomes obtains its own
        # connection when queried -- confirm whether ``conn`` is still needed.
        with database_connection() as db_conn:
            self.chromosomes = Chromosomes(
                conn=db_conn,
                species=self.species_name,
                dataset=self.dataset,
            )


@dataclass
class IndChromosome:
    """A single chromosome, identified by name, with its length.

    NOTE(review): ``length`` is presumably expressed in bases, since
    ``mb_length`` divides it by one million to obtain mega-bases --
    confirm against the source of the values.
    """
    name: str
    length: int

    @property
    def mb_length(self) -> Union[int, float]:
        """Return the chromosome length in mega-bases (length / 1,000,000)."""
        bases_per_megabase = 1_000_000
        return self.length / bases_per_megabase


@dataclass
class Chromosomes:
    """Chromosome lookup for a species, or for the group of a dataset.

    The chromosomes are selected by ``species`` when it is given;
    otherwise they are selected through the dataset's group name.

    Constructor arguments:
        conn: stored on the instance; not read by any code in this class.
        dataset: init-only value, kept as ``self.dataset`` only when
            ``species`` is None.
        species: optional species name.
    """
    conn: Any
    # NOTE(review): annotated as Dict, yet the ``chromosomes`` property
    # reads ``self.dataset.group.name`` (attribute access) -- confirm type.
    dataset: InitVar[Dict] = None
    species: Optional[str] = None

    def __post_init__(self, dataset) -> None:
        """Keep ``dataset`` on the instance when no species was supplied."""
        if self.species is not None:
            # Lookup goes by species name; the dataset is not stored.
            return
        self.dataset = dataset

    @property
    def chromosomes(self) -> OrderedDict:
        """Query the database and return the chromosomes keyed by name.

        Every access opens a connection via ``database_connection()`` and
        runs the query again; the result is not cached on the instance.

        Returns:
            An ``OrderedDict`` mapping chromosome name to ``IndChromosome``,
            filled in the order the rows come back (``ORDER BY OrderId``).
        """
        by_name = OrderedDict()
        with database_connection() as db_conn, db_conn.cursor() as cursor:
            if self.species is None:
                # No species: resolve the species through the dataset's group.
                query = (
                    "SELECT Chr_Length.Name, Chr_Length.OrderId, "
                    "Length FROM Chr_Length, InbredSet WHERE "
                    "Chr_Length.SpeciesId = InbredSet.SpeciesId AND "
                    "InbredSet.Name = "
                    "%s ORDER BY OrderId")
                params = (self.dataset.group.name,)
            else:
                # The species name is capitalized before the lookup.
                query = (
                    "SELECT Chr_Length.Name, Chr_Length.OrderId, Length "
                    "FROM Chr_Length, Species WHERE "
                    "Chr_Length.SpeciesId = Species.SpeciesId AND "
                    "Species.Name = %s "
                    "ORDER BY OrderId")
                params = (self.species.capitalize(),)
            cursor.execute(query, params)
            for row in cursor.fetchall():
                # OrderId is selected only for sorting; it is not stored.
                chr_name, _order_id, chr_length = row
                by_name[chr_name] = IndChromosome(
                    name=chr_name, length=chr_length)
            return by_name