aboutsummaryrefslogtreecommitdiff
path: root/uploader/datautils.py
blob: 2ee079d30a6485f405bc123b6e6f0d890b7251a4 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
"""Generic data utilities: Rename module."""
import math
from typing import Sequence
from functools import reduce

def enumerate_sequence(seq: Sequence[dict], start:int = 1) -> Sequence[dict]:
    """Enumerate sequence beginning at 1"""
    return tuple({**item, "sequence_number": seqno}
                 for seqno, item in enumerate(seq, start=start))


def order_by_family(items: tuple[dict, ...],
                    family_key: str = "Family",
                    order_key: str = "FamilyOrderId") -> list:
    """Order the populations by their families."""
    def __family_order__(item):
        orderval = item[order_key]
        return math.inf if orderval is None else orderval

    def __order__(ordered, current):
        _key = (__family_order__(current), current[family_key])
        return {
            **ordered,
            _key: ordered.get(_key, tuple()) + (current,)
        }

    return sorted(tuple(reduce(__order__, items, {}).items()),
                  key=lambda item: item[0][0])


def safe_int(val: str) -> int:
    """
    Convert val into an integer: if val cannot be converted, return a zero.
    """
    try:
        return int(val)
    except ValueError:
        return 0