Feat: test consume_flux

This commit is contained in:
Bertrand Benjamin 2024-08-14 07:41:36 +02:00
parent 959b53e6a0
commit 08c7fbe4c5
2 changed files with 45 additions and 2 deletions

View File

@ -25,7 +25,7 @@ class Flux(BaseModel):
class State(BaseModel): class State(BaseModel):
statuses: dict[str, str] statuses: dict[str, dict]
qty_out: int qty_out: int
failed_lines: list[str] failed_lines: list[str]
start: datetime start: datetime

View File

@ -1,6 +1,7 @@
import pandas as pd import pandas as pd
import pytest import pytest
from dashboard.libs.flux.flux import Flux, consume_flux
from dashboard.libs.repository.repository import AbstractRepository from dashboard.libs.repository.repository import AbstractRepository
FakeTable = pd.DataFrame FakeTable = pd.DataFrame
@ -43,7 +44,17 @@ class FakeRepository(AbstractRepository):
def write(self, content, table, schema) -> dict[str, str]:
    """Write content into the table, registering the table on first write.

    Args:
        content: Object stored under the table's ``"df"`` key.
        table: Name of the table inside ``schema``.
        schema: Name of the schema; it must already be a key of
            ``self._schemas``.

    Returns:
        Whatever ``self.infos(table, schema)`` returns after the write.
        NOTE(review): the annotation says ``dict[str, str]`` but the
        metadata created here holds int counters -- confirm against
        ``infos`` and the abstract signature.

    Raises:
        KeyError: If ``schema`` is not present in ``self._schemas``
            (assuming it is a plain mapping).
    """
    # Resolve the schema outside the try block so that an unknown schema
    # fails with a single, direct KeyError instead of one raised from
    # inside the "table is missing" handler.
    tables = self._schemas[schema]
    try:
        entry = tables[table]
    except KeyError:
        # First write to this table: create it with fresh counters.
        entry = tables[table] = {
            "df": content,
            "metadata": {
                "status": "new",
                "qty_read": 0,
                "qty_write": 0,
            },
        }
    else:
        entry["df"] = content
    # Every write, including the one that creates the table, is counted
    # and marks the table as modified.
    entry["metadata"]["status"] = "modified"
    entry["metadata"]["qty_write"] += 1
    return self.infos(table, schema)
@ -86,3 +97,35 @@ def test_fakerepository():
"qty_read": 1, "qty_read": 1,
"qty_write": 1, "qty_write": 1,
} }
def test_consume_flux():
    """Check the state and the stored table after consuming a one-source flux.

    The flux doubles the single source frame; the test asserts the status
    reported for the "dest" destination and the frame read back from the
    destination repository.
    """
    src_repo = FakeRepository(
        {"source": {"table1": pd.DataFrame({"A": [1, 2, 3]})}}
    )
    # The destination schema exists but holds no table before the flux runs.
    dst_repo = FakeRepository({"destination": {}})

    flux = Flux(
        sources=[{"repository": "source", "schema": "source", "table": "table1"}],
        destinations={
            "dest": {"repository": "dest", "schema": "destination", "table": "table1"},
        },
        transformation=lambda dfs: {"dest": dfs[0] * 2},
    )

    state = consume_flux(flux, {"source": src_repo, "dest": dst_repo})

    expected_status = {"status": "modified", "qty_read": 0, "qty_write": 1}
    assert state.statuses["dest"] == expected_status

    stored = dst_repo.read("table1", "destination")
    expected_table = pd.DataFrame({"A": [2, 4, 6]})
    assert stored.equals(expected_table)