Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Update Tools API openAPI contract and regenerate VCF results pydantic model #50

Open
wants to merge 3 commits into
base: dev
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Empty file added app/tests/models/__init__.py
Empty file.
164 changes: 164 additions & 0 deletions app/tests/models/test_vcf_results_model.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,164 @@
import unittest
from pydantic import ValidationError

from vep.models.vcf_results_model import (
PaginationMetadata,
PredictedIntergenicConsequence,
PredictedTranscriptConsequence,
FeatureType,
Strand,
ReferenceVariantAllele,
Location,
AlternativeVariantAllele,
Variant,
Metadata,
VepResultsResponse,
)


class TestVCFResultModel(unittest.TestCase):

def test_predicted_intergenic_consequence(self):
consequence = PredictedIntergenicConsequence(
feature_type=None,
consequences=["intergenic_variant"]
)
Copy link
Contributor

@azangru azangru Oct 7, 2024

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Seeing now for the first time how the PredictedIntergenicConsequence class is instantiated, I think passing both these arguments to it is redundant (it must be the result of it being auto-generated from the schema). If the contract is that the PredictedIntergenicConsequence class will always serialise to:

{
  "feature_type": null,
  "consequences": ["intergenic_variant"]
}

and if the caller of the class always knows that it is calling the PredictedIntergenicConsequence class, then there shouldn't be any need to pass any data into it. This class can have the feature_type field set always to None, and the consequences field set always to ["intergenic_variant"].

self.assertIsNone(consequence.feature_type)
self.assertEqual(consequence.consequences, ["intergenic_variant"])

# Missing consequences should raise a ValidationError
with self.assertRaises(ValidationError):
PredictedIntergenicConsequence(feature_type=None)

def test_predicted_transcript_consequence(self):
consequence = PredictedTranscriptConsequence(
feature_type=FeatureType.transcript,
stable_id="ENST00000367770.8",
gene_stable_id="ENSG00000157764.13",
gene_symbol=None,
biotype="protein_coding",
is_canonical=True,
consequences=["missense_variant"],
strand=Strand.forward,
)
self.assertIsNone(consequence.gene_symbol)

# Valid instance without explicitly setting gene_symbol (default=None)
consequence_no_symbol = PredictedTranscriptConsequence(
feature_type=FeatureType.transcript,
stable_id="ENST00000367770.8",
gene_stable_id="ENSG00000157764.13",
biotype="protein_coding",
is_canonical=True,
consequences=["missense_variant"],
strand=Strand.forward,
)
self.assertIsNone(consequence_no_symbol.gene_symbol)

def test_alternative_variant_allele(self):
alternative_allele = AlternativeVariantAllele(
allele_sequence="A",
allele_type="insertion",
representative_population_allele_frequency=None,
predicted_molecular_consequences=[
PredictedIntergenicConsequence(
feature_type=None,
consequences=["intergenic_variant"],
)
],
)
self.assertIsNone(alternative_allele.representative_population_allele_frequency)

# Valid instance without explicitly setting representative_population_allele_frequency (default=None)
alternative_allele_no_freq = AlternativeVariantAllele(
allele_sequence="A",
allele_type="insertion",
predicted_molecular_consequences=[
PredictedIntergenicConsequence(
feature_type=None,
consequences=["intergenic_variant"],
)
],
)
self.assertIsNone(alternative_allele_no_freq.representative_population_allele_frequency)

def test_variant(self):
variant = Variant(
name=None,
allele_type="SNP",
location=Location(region_name="1", start=10000, end=10001),
reference_allele=ReferenceVariantAllele(allele_sequence="C"),
alternative_alleles=[
AlternativeVariantAllele(
allele_sequence="T",
allele_type="SNP",
predicted_molecular_consequences=[
PredictedIntergenicConsequence(
feature_type=None,
consequences=["intergenic_variant"]
)
]
)
]
)
self.assertIsNone(variant.name)

# Valid instance without explicitly setting name (default=None)
variant_no_name = Variant(
allele_type="SNP",
location=Location(region_name="1", start=10000, end=10001),
reference_allele=ReferenceVariantAllele(allele_sequence="C"),
alternative_alleles=[
AlternativeVariantAllele(
allele_sequence="T",
allele_type="SNP",
predicted_molecular_consequences=[
PredictedIntergenicConsequence(
feature_type=None,
consequences=["intergenic_variant"]
)
]
)
]
)
self.assertIsNone(variant_no_name.name)

def test_metadata_required(self):
metadata = Metadata(
pagination=PaginationMetadata(page=1, per_page=10, total=100)
)
self.assertEqual(metadata.pagination.page, 1)

# Invalid instance without pagination - should raise ValidationError
with self.assertRaises(ValidationError):
Metadata()

def test_vep_results_response(self):
metadata = Metadata(
pagination=PaginationMetadata(page=1, per_page=10, total=100)
)
variant = Variant(
name=None,
allele_type="SNV",
location=Location(region_name="1", start=10000, end=10001),
reference_allele=ReferenceVariantAllele(allele_sequence="A"),
alternative_alleles=[
AlternativeVariantAllele(
allele_sequence="T",
allele_type="SNP",
predicted_molecular_consequences=[
PredictedIntergenicConsequence(
feature_type=None,
consequences=["intergenic_variant"],
)
]
)
],
)
response = VepResultsResponse(metadata=metadata, variants=[variant])
self.assertEqual(response.metadata.pagination.page, 1)
self.assertEqual(len(response.variants), 1)

# Invalid instance without metadata - should raise ValidationError
with self.assertRaises(ValidationError):
VepResultsResponse(variants=[variant])
19 changes: 8 additions & 11 deletions app/vep/models/vcf_results_model.py
Original file line number Diff line number Diff line change
@@ -1,24 +1,18 @@
# generated by datamodel-codegen:
# filename: APISpecification.yaml
# timestamp: 2024-06-10T15:52:34+00:00

from __future__ import annotations

from enum import Enum
from typing import Any, List, Optional, Union

from pydantic import BaseModel, Field


class PaginationMetadata(BaseModel):
page: int
per_page: int
total: int


class PredictedIntergenicConsequence(BaseModel):
feature_type: Any = Field(
...,
feature_type: Optional[Any] = Field(
default=None,
description="The value of this field is always null. The presence of null in this field will serve as a marker that this is a consequence of an intergenic variant.",
)
consequences: List[str] = Field(
Expand All @@ -40,7 +34,7 @@ class PredictedTranscriptConsequence(BaseModel):
feature_type: FeatureType
stable_id: str = Field(..., description="transcript stable id, versioned")
gene_stable_id: str = Field(..., description="gene stable id, versioned")
gene_symbol: str
gene_symbol: Optional[str] = None
biotype: str
is_canonical: bool
consequences: List[str]
Expand All @@ -56,11 +50,11 @@ class Location(BaseModel):
start: int
end: int


class Metadata(BaseModel):
pagination: PaginationMetadata



class AlternativeVariantAllele(BaseModel):
allele_sequence: str
allele_type: str
Expand All @@ -71,7 +65,10 @@ class AlternativeVariantAllele(BaseModel):


class Variant(BaseModel):
name: str = Field(..., description="User's name for the variant; optional")
name: Optional[str] = Field(
default=None,
description="User's name for the variant; optional"
)
allele_type: str
location: Location
reference_allele: ReferenceVariantAllele
Expand Down