Source code for orm.measurement

import csv
from io import StringIO
from decimal import Decimal

import sqlalchemy as sql
from sqlalchemy.orm import (
    Mapped,
    mapped_column,
    relationship,
)
from sqlalchemy.ext.hybrid import hybrid_property

from app.model.orm.orm_base import OrmBase
from app.model.lib.conversion import convert_time
from app.model.lib.util import group_by_unique_name



[docs]
class Measurement(OrmBase):
    """
    ORM model for a single measured value at one time point.

    Rows are stored in the ``Measurements`` table. Every measurement points
    at a study and at a measurement context; the bioreplicate, compartment
    and technique are exposed as view-only relationships that go through the
    ``MeasurementContexts`` table.
    """

    __tablename__ = "Measurements"

    # A relationship that goes through the parent measurement context:
    context_relationship = lambda: relationship(
        secondary='MeasurementContexts',
        viewonly=True,
    )

    id: Mapped[int] = mapped_column(primary_key=True)

    # Owning study:
    studyId: Mapped[str] = mapped_column(sql.ForeignKey('Studies.studyId'), nullable=False)
    study: Mapped['Study'] = relationship(back_populates='measurements')

    # Parent measurement context:
    contextId: Mapped[int] = mapped_column(sql.ForeignKey('MeasurementContexts.id'))
    context: Mapped['MeasurementContext'] = relationship(back_populates='measurements')

    # Read-only shortcuts to records reachable via the context:
    bioreplicate: Mapped['Bioreplicate']         = context_relationship()
    compartment:  Mapped['Compartment']          = context_relationship()
    technique:    Mapped['MeasurementTechnique'] = context_relationship()

    timeInSeconds: Mapped[int] = mapped_column(sql.Integer, nullable=False)

    # Both columns are nullable, so either attribute may be None on an instance:
    value: Mapped[Decimal] = mapped_column(sql.Numeric(20, 2), nullable=True)
    std:   Mapped[Decimal] = mapped_column(sql.Numeric(20, 2), nullable=True)

    @hybrid_property
    def timeInHours(self):
        """Return ``timeInSeconds`` divided by 3600."""
        return self.timeInSeconds / 3600

    @hybrid_property
    def subjectId(self):
        """
        Return the ``subjectId`` of the parent context.

        NOTE(review): no separate SQL expression is defined for this hybrid,
        so it is presumably only usable on loaded instances -- confirm.
        """
        return self.context.subjectId

    @hybrid_property
    def subjectType(self):
        """
        Return the ``subjectType`` of the parent context.

        NOTE(review): no separate SQL expression is defined for this hybrid,
        so it is presumably only usable on loaded instances -- confirm.
        """
        return self.context.subjectType

    @classmethod
    def insert_from_csv_string(cls, db_session, study, csv_string, subject_type):
        """
        Create measurements (and their contexts) from CSV text and commit them.

        Each CSV row is matched to one of the study's bioreplicates and
        compartments through its ``Biological Replicate`` and ``Compartment``
        columns; rows that name an unknown bioreplicate or compartment are
        skipped. The ``Time`` column is converted from ``study.timeUnits`` to
        seconds. For every technique of the study whose ``subjectType`` equals
        ``subject_type``, and for every subject of that type, the value is
        read from the column named ``technique.csv_column_name(subject.name)``
        and the optional standard deviation from ``"<that column> STD"``.
        Empty value cells produce no measurement.

        One ``MeasurementContext`` is created per distinct combination of
        bioreplicate, compartment, technique and subject, and shared by all
        measurements of that combination.

        :param db_session: session that receives the new objects; it is
            committed before returning.
        :param study: study providing ``bioreplicates``, ``compartments``,
            ``measurementTechniques``, ``timeUnits`` and, depending on
            ``subject_type``, ``strains`` or ``metabolites``.
        :param csv_string: CSV text with a header row.
        :param subject_type: ``'bioreplicate'``, ``'strain'`` or
            ``'metabolite'``.
        :returns: list of the created measurements.
        :raises KeyError: if ``subject_type`` is not one of the values above
            (raised once a row and a matching technique are processed), or if
            an expected column is absent from the CSV header.
        """
        # Imported locally rather than at module level, presumably to avoid a
        # circular import with the ORM package -- confirm before moving it.
        from app.model.orm import MeasurementContext

        reader = csv.DictReader(StringIO(csv_string), dialect='unix')

        bioreplicates_by_name = group_by_unique_name(study.bioreplicates)
        compartments_by_name = group_by_unique_name(study.compartments)

        # The technique filter does not depend on the row, so apply it once:
        techniques = [
            technique
            for technique in study.measurementTechniques
            if technique.subjectType == subject_type
        ]

        context_cache = {}
        measurements = []

        for row in reader:
            # `.get()` so that an unknown name yields None and the row is
            # skipped, instead of a KeyError aborting the whole import:
            bioreplicate = bioreplicates_by_name.get(row['Biological Replicate'].strip())
            compartment = compartments_by_name.get(row['Compartment'].strip())

            if bioreplicate is None or compartment is None:
                # Missing entry, skip
                continue

            time_in_seconds = convert_time(row['Time'], source=study.timeUnits, target='s')

            for technique in techniques:
                if subject_type == 'bioreplicate':
                    subjects = [bioreplicate]
                elif subject_type == 'strain':
                    subjects = study.strains
                elif subject_type == 'metabolite':
                    subjects = study.metabolites
                else:
                    raise KeyError(f"Unexpected subject type: {subject_type}")

                for subject in subjects:
                    value_column_name = technique.csv_column_name(subject.name)

                    value = row[value_column_name]
                    if value == '':
                        continue

                    # The STD column is optional; a blank cell means "no value":
                    std = row.get(f"{value_column_name} STD", None)
                    if std == '':
                        std = None

                    # Create a measurement context only if it doesn't already exist:
                    context_key = (bioreplicate.id, compartment.id, technique.id, subject.id, subject_type)
                    if context_key not in context_cache:
                        # Metabolites are referenced by their ChEBI id, other
                        # subjects by their primary key:
                        if subject_type == 'metabolite':
                            subjectId = subject.chebiId
                        else:
                            subjectId = subject.id

                        context = MeasurementContext(
                            # Relationships:
                            study=study,
                            bioreplicate=bioreplicate,
                            compartment=compartment,
                            # Subject:
                            subjectId=subjectId,
                            subjectType=subject_type,
                            # Technique:
                            techniqueId=technique.id,
                        )
                        context_cache[context_key] = context
                        db_session.add(context)

                    measurements.append(cls(
                        study=study,
                        context=context_cache[context_key],
                        timeInSeconds=time_in_seconds,
                        value=value,
                        std=std,
                    ))

        db_session.add_all(measurements)
        db_session.commit()

        return measurements