Paolo Léonard PaoloLeonard

## Dockerfile
# app/Dockerfile

FROM python:3.11-slim

WORKDIR /app

RUN apt-get update && apt-get install -y \
    build-essential \
    curl \
    software-properties-common \

## dq_app.py
import streamlit as st
import yaml, json
import matplotlib.pyplot as plt

dq_score, dashboards = st.tabs(['Data quality score', 'Dashboards'])

with dq_score:
    st.title(f"""Data quality score""")

    schema, checks = {}, {}

## expectation_implementation.py
from copy import deepcopy
from typing import Dict, Tuple, Any, Optional, Callable, List

from great_expectations.core import ExpectationConfiguration
from great_expectations.execution_engine import (
    ExecutionEngine
)
from great_expectations.expectations.expectation import TableExpectation
from great_expectations.exceptions.exceptions import InvalidExpectationKwargsError

## table_metric.py
from typing import Dict, Tuple, Any

from great_expectations.core.batch_spec import PathBatchSpec
from great_expectations.execution_engine import (
    SparkDFExecutionEngine,
    PandasExecutionEngine
)
from great_expectations.expectations.metrics.metric_provider import metric_value
from great_expectations.expectations.metrics.table_metric_provider import (
    TableMetricProvider,

## comparator.py
from enum import Enum, auto
from statistics import mean


class SupportedComparisonEnum(Enum):
    """Enum class with the currently supported comparison types."""

    # Member values are generated by `auto()` in declaration order, so
    # reordering or inserting members changes their underlying values.
    # NOTE(review): presumably ABSOLUTE compares against each individual value
    # and MEAN against the average of the values -- confirm against the callers.
    ABSOLUTE = auto()
    MEAN = auto()

## expect_table_row_count_to_be_more_than_others.py
"""
Custom table expectation which checks whether the row count is greater than the row count of other tables.

There are different ways to compare the row counts:
    * With absolute values, if the row count of any of the other tables is greater than the current row count then the
    validation fails,
    * With mean values, if the mean of the other tables' row counts is greater than the current row count then
    the validation fails.
"""
from copy import deepcopy
	# app/Dockerfile

	FROM python:3.11-slim

	WORKDIR /app

	RUN apt-get update && apt-get install -y \
	build-essential \
	curl \
	software-properties-common \
	import streamlit as st
	import yaml, json
	import matplotlib.pyplot as plt

	dq_score, dashboards = st.tabs(['Data quality score', 'Dashboards'])

	with dq_score:
	st.title(f"""Data quality score""")

	schema, checks = {}, {}
	from copy import deepcopy
	from typing import Dict, Tuple, Any, Optional, Callable, List

	from great_expectations.core import ExpectationConfiguration
	from great_expectations.execution_engine import (
	ExecutionEngine
	)
	from great_expectations.expectations.expectation import TableExpectation
	from great_expectations.exceptions.exceptions import InvalidExpectationKwargsError
	from typing import Dict, Tuple, Any

	from great_expectations.core.batch_spec import PathBatchSpec
	from great_expectations.execution_engine import (
	SparkDFExecutionEngine,
	PandasExecutionEngine
	)
	from great_expectations.expectations.metrics.metric_provider import metric_value
	from great_expectations.expectations.metrics.table_metric_provider import (
	TableMetricProvider,
	from enum import Enum, auto
	from statistics import mean


	class SupportedComparisonEnum(Enum):
	"""Enum class with the currently supported comparison type."""

	ABSOLUTE = auto()
	MEAN = auto()
	"""
	Custom table expectation which checks whether the row count is greater than the row count of other tables.

	There are different ways to compare the row counts:
	* With absolute values, if the row count of any of the other tables is greater than the current row count then the
	validation fails,
	* With mean values, if the mean of the other tables' row counts is greater than the current row count then
	the validation fails.
	"""
	from copy import deepcopy