Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
21 changes: 21 additions & 0 deletions Dockerfile
Original file line number Diff line number Diff line change
@@ -0,0 +1,21 @@
# Image that installs this project and serves it through a Jupyter Notebook
# server on port 8888.

# Base image: the slim variant of the Python 3.10 image.
FROM python:3.10-slim

# All following instructions (COPY, RUN, CMD) are executed relative to /app.
WORKDIR /app

# Install the build-essential toolchain without recommended extras; presumably
# needed to compile native extensions of the Python dependencies -- TODO
# confirm. The apt package lists are deleted in the same RUN so they are not
# kept in the resulting layer.
RUN apt-get update && apt-get install -y --no-install-recommends \
build-essential \
&& rm -rf /var/lib/apt/lists/*

# Copy the entire build context into /app so the project can be installed from
# the working directory below.
COPY . .

# Single RUN that, in order: upgrades pip; installs wheel and setuptools pinned
# to >=72.0.0,<80.0.0; installs the project found in /app; re-applies the same
# setuptools pin; installs Jupyter. --no-cache-dir keeps pip's download cache
# out of the image.
# NOTE(review): the second setuptools install presumably restores the pin in
# case installing the project changed the setuptools version -- confirm.
RUN pip install --no-cache-dir --upgrade pip && \
pip install --no-cache-dir "setuptools>=72.0.0,<80.0.0" wheel && \
pip install --no-cache-dir . && \
pip install --no-cache-dir "setuptools>=72.0.0,<80.0.0" && \
pip install --no-cache-dir jupyter

# Declare the port the notebook server is started on by CMD.
EXPOSE 8888

# Default command: start Jupyter Notebook bound to all interfaces on port 8888
# without trying to open a browser. No USER instruction appears in this file,
# so the server presumably runs as root, which is why --allow-root is passed.
CMD ["jupyter", "notebook", "--ip=0.0.0.0", "--port=8888", "--no-browser", "--allow-root"]


18 changes: 0 additions & 18 deletions src/ydata_profiling/model/handler.py
Original file line number Diff line number Diff line change
Expand Up @@ -60,22 +60,4 @@ def handle(self, dtype: str, *args, **kwargs) -> dict:
return summary


def get_render_map() -> Dict[str, Callable]:
    """Return the mapping from variable type name to its render function.

    The render package is imported inside the function body rather than at
    module level (presumably to avoid a circular import -- TODO confirm).

    Returns:
        A newly built dict whose keys are type names such as ``"Boolean"`` or
        ``"Numeric"`` and whose values are the matching ``render_*`` callables
        from ``ydata_profiling.report.structure.variables``.
    """
    import ydata_profiling.report.structure.variables as renderers

    return {
        "Boolean": renderers.render_boolean,
        "Numeric": renderers.render_real,
        "Complex": renderers.render_complex,
        "Text": renderers.render_text,
        "DateTime": renderers.render_date,
        "Categorical": renderers.render_categorical,
        "URL": renderers.render_url,
        "Path": renderers.render_path,
        "File": renderers.render_file,
        "Image": renderers.render_image,
        "Unsupported": renderers.render_generic,
        "TimeSeries": renderers.render_timeseries,
    }
5 changes: 2 additions & 3 deletions src/ydata_profiling/model/summarizer.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@
from ydata_profiling.model.pandas.describe_supported_pandas import (
pandas_describe_supported,
)
from ydata_profiling.model.summary_algorithms import ( # Check what this method is used for
from ydata_profiling.model.summary_algorithms import (
describe_file_1d,
describe_image_1d,
describe_path_1d,
Expand All @@ -50,9 +50,8 @@ def summarize(
return self.handle(str(dtype), config, series, {"type": str(dtype)})


# Revisit this with the correct support for Spark as well.
class ProfilingSummarizer(BaseSummarizer):
"""A summarizer for Pandas DataFrames."""
"""A summarizer supporting both Pandas and Spark DataFrames."""

def __init__(self, typeset: VisionsTypeset, use_spark: bool = False):
self.use_spark = use_spark and is_pyspark_installed()
Expand Down
2 changes: 1 addition & 1 deletion src/ydata_profiling/report/structure/report.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@
from ydata_profiling.config import Settings
from ydata_profiling.model import BaseDescription
from ydata_profiling.model.alerts import AlertType
from ydata_profiling.model.handler import get_render_map
from ydata_profiling.report.structure.variables import get_render_map
from ydata_profiling.report.presentation.core import (
HTML,
Collapse,
Expand Down
23 changes: 23 additions & 0 deletions src/ydata_profiling/report/structure/variables/__init__.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,5 @@
from typing import Callable, Dict

from ydata_profiling.report.structure.variables.render_boolean import render_boolean
from ydata_profiling.report.structure.variables.render_categorical import (
render_categorical,
Expand All @@ -17,6 +19,26 @@
)
from ydata_profiling.report.structure.variables.render_url import render_url


def get_render_map() -> Dict[str, Callable]:
    """Return the mapping from variable type name to its render function.

    Returns:
        A newly built dict keyed by type name (``"Boolean"``, ``"Numeric"``,
        ...) whose values are the ``render_*`` callables imported at the top
        of this module. A fresh dict is created on every call.
    """
    # Ordered (type name, renderer) pairs; dict() preserves this order.
    type_renderers = (
        ("Boolean", render_boolean),
        ("Numeric", render_real),
        ("Complex", render_complex),
        ("Text", render_text),
        ("DateTime", render_date),
        ("Categorical", render_categorical),
        ("URL", render_url),
        ("Path", render_path),
        ("File", render_file),
        ("Image", render_image),
        ("Unsupported", render_generic),
        ("TimeSeries", render_timeseries),
    )
    return dict(type_renderers)


__all__ = [
"render_boolean",
"render_categorical",
Expand All @@ -32,4 +54,5 @@
"render_text",
"render_timeseries",
"render_url",
"get_render_map",
]