From 05c1b8bf2cb81916c1d95aa8abae6cf7fcab4821 Mon Sep 17 00:00:00 2001
From: Fabiana <30911746+fabclmnt@users.noreply.github.com>
Date: Tue, 25 Mar 2025 16:35:17 -0700
Subject: [PATCH 1/6] chore: add more unit tests for better code coverage
---
tests/unit/test_report_options.py | 169 +++++++++++++++++-------------
tests/unit/test_time_series.py | 60 +++++++++++
2 files changed, 158 insertions(+), 71 deletions(-)
diff --git a/tests/unit/test_report_options.py b/tests/unit/test_report_options.py
index 4e4555eb7..3d09ddeee 100644
--- a/tests/unit/test_report_options.py
+++ b/tests/unit/test_report_options.py
@@ -1,112 +1,139 @@
import pandas as pd
+import numpy as np
import pytest
from ydata_profiling import ProfileReport
+from ydata_profiling.config import Settings
+
+
+# Enhanced fixture with more diverse data types
+@pytest.fixture
+def sample_categorical_data():
+ return pd.DataFrame({
+ "dummy_cat": [
+ "Amadeou_plus", "Amadeou_plus", "Beta_front", "Calciumus",
+ "Dimitrius", "esperagus_anonymoliumus", "FrigaTTTBrigde_Writap",
+ "galgarartiy", "He", "I", "JimISGODDOT"
+ ] * 10
+ })
+
+@pytest.fixture
+def sample_boolean_data():
+ return pd.DataFrame({
+ "dummy_bool": [True] * 82 + [False] * 36
+ })
-
-# Generating dummy data
def generate_cat_data_series(categories):
+ """Helper function to generate categorical data"""
dummy_data = []
for cat, i in categories.items():
- dummy_data.extend([cat, ] * i) # fmt: skip
+ dummy_data.extend([cat] * i)
return pd.DataFrame({"dummy_cat": dummy_data})
-
-dummy_bool_data = generate_cat_data_series(pd.Series({True: 82, False: 36}))
-dummy_cat_data = generate_cat_data_series(
- pd.Series(
- {
- "Amadeou_plus": 75,
- "Beta_front": 50,
- "Calciumus": 20,
- "Dimitrius": 1,
- "esperagus_anonymoliumus": 75,
- "FrigaTTTBrigde_Writap": 50,
- "galgarartiy": 30,
- "He": 1,
- "I": 10,
- "JimISGODDOT": 1,
- }
- )
+def generate_report(data, **kwargs):
+ """Helper function to generate report with common settings"""
+ default_settings = {
+ "progress_bar": False,
+ "samples": None,
+ "correlations": None,
+ "missing_diagrams": None,
+ "duplicates": None,
+ "interactions": None
+ }
+ default_settings.update(kwargs)
+ return ProfileReport(df=data, **default_settings)
+
+# Test category frequency plots general options
+@pytest.mark.parametrize(
+ "data_fixture", ["sample_boolean_data", "sample_categorical_data"],
+ ids=["boolean", "categorical"]
)
-
-
-def generate_report(data):
- return ProfileReport(
- df=data,
- progress_bar=False,
- samples=None,
- correlations=None,
- missing_diagrams=None,
- duplicates=None,
- interactions=None,
- )
-
-
-# Unit tests
-# - Test category frequency plots general options
-@pytest.mark.parametrize("data", [dummy_bool_data, dummy_cat_data], ids=["bool", "cat"])
@pytest.mark.parametrize("plot_type", ["bar", "pie"])
-def test_deactivated_cat_frequency_plot(data, plot_type):
+def test_deactivated_cat_frequency_plot(data_fixture, plot_type, request):
+ data = request.getfixturevalue(data_fixture)
profile = generate_report(data)
profile.config.plot.cat_freq.show = False
profile.config.plot.cat_freq.type = plot_type
html_report = profile.to_html()
assert "Common Values (Plot)" not in html_report
-
-@pytest.mark.parametrize("data", [dummy_bool_data, dummy_cat_data], ids=["bool", "cat"])
-def test_cat_frequency_default_barh_plot(data):
+@pytest.mark.parametrize(
+ "data_fixture", ["sample_boolean_data", "sample_categorical_data"],
+ ids=["boolean", "categorical"]
+)
+def test_cat_frequency_default_barh_plot(data_fixture, request):
+ data = request.getfixturevalue(data_fixture)
profile = generate_report(data)
html_report = profile.to_html()
assert "Common Values (Plot)" in html_report
-
-@pytest.mark.parametrize("data", [dummy_bool_data, dummy_cat_data], ids=["bool", "cat"])
-def test_cat_frequency_pie_plot(data):
+@pytest.mark.parametrize(
+ "data_fixture", ["sample_boolean_data", "sample_categorical_data"],
+ ids=["boolean", "categorical"]
+)
+def test_cat_frequency_pie_plot(data_fixture, request):
+ data = request.getfixturevalue(data_fixture)
profile = generate_report(data)
profile.config.plot.cat_freq.type = "pie"
html_report = profile.to_html()
assert "pie" in html_report
-
@pytest.mark.parametrize("plot_type", ["bar", "pie"])
-def test_max_nuique_smaller_than_unique_cats(plot_type):
- profile = generate_report(dummy_cat_data)
- profile.config.plot.cat_freq.max_unique = 2 # smaller than the number of categories
+def test_max_unique_categories(plot_type):
+ # Test with different numbers of unique categories
+ categories = {f"cat_{i}": 5 for i in range(10)}
+ data = generate_cat_data_series(categories)
+
+ profile = generate_report(data)
+ profile.config.plot.cat_freq.max_unique = 5
profile.config.plot.cat_freq.type = plot_type
html_report = profile.to_html()
+
+ # Should not show plot when unique categories exceed max_unique
assert "Common Values (Plot)" not in html_report
-# - Test category frequency plots color options
-@pytest.mark.parametrize("plot_type", ["bar", "pie"])
-def test_cat_frequency_with_custom_colors(plot_type):
- test_data = generate_cat_data_series(pd.Series({"A": 10, "B": 10, "C": 10}))
- custom_colors = {"gold": "#ffd700", "b": "#0000ff", "#FF796C": "#ff796c"}
+def test_more_categories_than_colors():
+ # Test handling when there are more categories than defined colors
+ test_data = generate_cat_data_series({f"cat_{i}": 10 for i in range(5)})
+ custom_colors = ["gold", "blue", "coral"]
+
profile = generate_report(test_data)
- profile.config.plot.cat_freq.colors = list(custom_colors.keys())
- profile.config.plot.cat_freq.type = plot_type
+ profile.config.plot.cat_freq.colors = custom_colors
html_report = profile.to_html()
- for c, hex_code in custom_colors.items():
- assert f"fill: {hex_code}" in html_report, f"Missing color code of {c}"
-
+
+ # Should still generate plot without errors
+ assert "Common Values (Plot)" in html_report
-def test_more_cats_than_colors():
- test_data = generate_cat_data_series(
- pd.Series({"A": 10, "B": 10, "C": 10, "D": 10})
- )
- custom_colors = {"gold": "#ffd700", "b": "#0000ff", "#FF796C": "#ff796c"}
+@pytest.mark.skip("Skipping empty color list test. Code needs to be updated.")
+def test_empty_color_list():
+ # Test behavior with empty color list
+ test_data = generate_cat_data_series({"A": 10, "B": 10})
profile = generate_report(test_data)
- profile.config.plot.cat_freq.colors = list(custom_colors.keys())
+ profile.config.plot.cat_freq.colors = []
html_report = profile.to_html()
- assert "Common Values (Plot)" in html_report # just check that it worked
-
+
+ # Should use default colors
+ assert "Common Values (Plot)" in html_report
-# - Test exceptions
-@pytest.mark.parametrize("data", [dummy_bool_data, dummy_cat_data], ids=["bool", "cat"])
-def test_exception_with_invalid_cat_freq_type(data):
- profile = generate_report(data)
- profile.config.plot.cat_freq.type = "box"
+@pytest.mark.parametrize("invalid_type", ["scatter", "box", "invalid"])
+def test_invalid_plot_types(invalid_type):
+ test_data = generate_cat_data_series({"A": 10, "B": 10})
+
with pytest.raises(ValueError):
+ profile = generate_report(test_data)
+ profile.config.plot.cat_freq.type = invalid_type
profile.to_html()
+
+def test_config_persistence():
+ # Test that plot configuration persists after cache invalidation
+ test_data = generate_cat_data_series({"A": 10, "B": 10})
+ profile = generate_report(test_data)
+ profile.config.plot.cat_freq.type = "pie"
+ profile.config.plot.cat_freq.colors = ["gold", "blue"]
+
+ # Cache invalidation shouldn't affect config
+ profile.invalidate_cache()
+ html_report = profile.to_html()
+ assert "pie" in html_report
+ assert "fill: #ffd700" in html_report
diff --git a/tests/unit/test_time_series.py b/tests/unit/test_time_series.py
index 9a87da274..e1ac3fd2b 100644
--- a/tests/unit/test_time_series.py
+++ b/tests/unit/test_time_series.py
@@ -33,6 +33,15 @@ def html_profile() -> str:
profile = ProfileReport(df, tsmode=True)
return profile.to_html()
+@pytest.fixture
+def sample_ts_df():
+ dates = pd.date_range(start='2023-01-01', periods=100, freq='D')
+ return pd.DataFrame({
+ 'date': dates,
+ 'value': np.sin(np.arange(100) * np.pi / 180) + np.random.normal(0, 0.1, 100),
+ 'trend': np.arange(100) * 0.1,
+ 'category': ['A', 'B'] * 50
+ })
def test_timeseries_identification(html_profile: str):
assert "
TimeSeries | " in html_profile, "TimeSeries not detected"
@@ -54,3 +63,54 @@ def test_timeseries_seasonality(html_profile: str):
assert (
html_profile.count(">Seasonal<") == 4
), "Seasonality warning incorrectly identified"
+
+
+def test_timeseries_with_sortby(sample_ts_df):
+ # Test time series with explicit sort column
+ profile = ProfileReport(sample_ts_df, tsmode=True, sortby='date')
+ html = profile.to_html()
+ assert 'date' in html
+ assert profile.config.vars.timeseries.sortby == 'date'
+
+def test_timeseries_without_sortby(sample_ts_df):
+ # Test time series without explicit sort column
+ profile = ProfileReport(sample_ts_df, tsmode=True)
+ html = profile.to_html()
+ assert profile.config.vars.timeseries.sortby is None
+ assert 'TimeSeries' in html
+
+def test_invalid_sortby(sample_ts_df):
+ # Test with non-existent sort column
+ with pytest.raises(KeyError):
+ profile = ProfileReport(sample_ts_df, tsmode=True, sortby='nonexistent')
+ profile.to_html()
+
+def test_timeseries_with_missing_values(sample_ts_df):
+ # Introduce missing values
+ df_with_missing = sample_ts_df.copy()
+ df_with_missing.loc[10:20, 'value'] = np.nan
+ profile = ProfileReport(df_with_missing, tsmode=True)
+ html = profile.to_html()
+ assert 'Missing values' in html
+
+def test_non_numeric_timeseries():
+ # Test handling of non-numeric time series
+ dates = pd.date_range(start='2023-01-01', periods=100, freq='D')
+ df = pd.DataFrame({
+ 'date': dates,
+ 'category': ['A', 'B', 'C'] * 33 + ['A']
+ })
+ profile = ProfileReport(df, tsmode=True)
+ html = profile.to_html()
+ # Should not identify categorical column as time series
+ assert html.count(">Autocorrelation<") == 0
+
+def test_timeseries_config_persistence():
+ # Test that time series configuration persists
+ df = pd.DataFrame({'value': range(100)})
+ profile = ProfileReport(df, tsmode=True)
+ assert profile.config.vars.timeseries.active is True
+
+ # Test config after invalidating cache
+ profile.invalidate_cache()
+ assert profile.config.vars.timeseries.active is True
From dd891b4290bf96a885eb2ad5ca7171e791c1d717 Mon Sep 17 00:00:00 2001
From: Fabiana <30911746+fabclmnt@users.noreply.github.com>
Date: Tue, 25 Mar 2025 16:39:03 -0700
Subject: [PATCH 2/6] chore: remove unused code from tests
---
tests/unit/test_report_options.py | 2 --
1 file changed, 2 deletions(-)
diff --git a/tests/unit/test_report_options.py b/tests/unit/test_report_options.py
index 3d09ddeee..b0f4e0ee4 100644
--- a/tests/unit/test_report_options.py
+++ b/tests/unit/test_report_options.py
@@ -1,9 +1,7 @@
import pandas as pd
-import numpy as np
import pytest
from ydata_profiling import ProfileReport
-from ydata_profiling.config import Settings
# Enhanced fixture with more diverse data types
From 6c3618fa215e53bee8591557b1e1e8726e0542b4 Mon Sep 17 00:00:00 2001
From: Azory YData Bot
Date: Tue, 25 Mar 2025 23:42:03 +0000
Subject: [PATCH 3/6] fix(linting): code formatting
---
tests/unit/test_report_options.py | 70 ++++++++++++++++++++-----------
tests/unit/test_time_series.py | 49 ++++++++++++----------
2 files changed, 74 insertions(+), 45 deletions(-)
diff --git a/tests/unit/test_report_options.py b/tests/unit/test_report_options.py
index b0f4e0ee4..924e503b4 100644
--- a/tests/unit/test_report_options.py
+++ b/tests/unit/test_report_options.py
@@ -7,19 +7,30 @@
# Enhanced fixture with more diverse data types
@pytest.fixture
def sample_categorical_data():
- return pd.DataFrame({
- "dummy_cat": [
- "Amadeou_plus", "Amadeou_plus", "Beta_front", "Calciumus",
- "Dimitrius", "esperagus_anonymoliumus", "FrigaTTTBrigde_Writap",
- "galgarartiy", "He", "I", "JimISGODDOT"
- ] * 10
- })
+ return pd.DataFrame(
+ {
+ "dummy_cat": [
+ "Amadeou_plus",
+ "Amadeou_plus",
+ "Beta_front",
+ "Calciumus",
+ "Dimitrius",
+ "esperagus_anonymoliumus",
+ "FrigaTTTBrigde_Writap",
+ "galgarartiy",
+ "He",
+ "I",
+ "JimISGODDOT",
+ ]
+ * 10
+ }
+ )
+
@pytest.fixture
def sample_boolean_data():
- return pd.DataFrame({
- "dummy_bool": [True] * 82 + [False] * 36
- })
+ return pd.DataFrame({"dummy_bool": [True] * 82 + [False] * 36})
+
def generate_cat_data_series(categories):
"""Helper function to generate categorical data"""
@@ -28,6 +39,7 @@ def generate_cat_data_series(categories):
dummy_data.extend([cat] * i)
return pd.DataFrame({"dummy_cat": dummy_data})
+
def generate_report(data, **kwargs):
"""Helper function to generate report with common settings"""
default_settings = {
@@ -36,15 +48,17 @@ def generate_report(data, **kwargs):
"correlations": None,
"missing_diagrams": None,
"duplicates": None,
- "interactions": None
+ "interactions": None,
}
default_settings.update(kwargs)
return ProfileReport(df=data, **default_settings)
+
# Test category frequency plots general options
@pytest.mark.parametrize(
- "data_fixture", ["sample_boolean_data", "sample_categorical_data"],
- ids=["boolean", "categorical"]
+ "data_fixture",
+ ["sample_boolean_data", "sample_categorical_data"],
+ ids=["boolean", "categorical"],
)
@pytest.mark.parametrize("plot_type", ["bar", "pie"])
def test_deactivated_cat_frequency_plot(data_fixture, plot_type, request):
@@ -55,9 +69,11 @@ def test_deactivated_cat_frequency_plot(data_fixture, plot_type, request):
html_report = profile.to_html()
assert "Common Values (Plot)" not in html_report
+
@pytest.mark.parametrize(
- "data_fixture", ["sample_boolean_data", "sample_categorical_data"],
- ids=["boolean", "categorical"]
+ "data_fixture",
+ ["sample_boolean_data", "sample_categorical_data"],
+ ids=["boolean", "categorical"],
)
def test_cat_frequency_default_barh_plot(data_fixture, request):
data = request.getfixturevalue(data_fixture)
@@ -65,9 +81,11 @@ def test_cat_frequency_default_barh_plot(data_fixture, request):
html_report = profile.to_html()
assert "Common Values (Plot)" in html_report
+
@pytest.mark.parametrize(
- "data_fixture", ["sample_boolean_data", "sample_categorical_data"],
- ids=["boolean", "categorical"]
+ "data_fixture",
+ ["sample_boolean_data", "sample_categorical_data"],
+ ids=["boolean", "categorical"],
)
def test_cat_frequency_pie_plot(data_fixture, request):
data = request.getfixturevalue(data_fixture)
@@ -76,17 +94,18 @@ def test_cat_frequency_pie_plot(data_fixture, request):
html_report = profile.to_html()
assert "pie" in html_report
+
@pytest.mark.parametrize("plot_type", ["bar", "pie"])
def test_max_unique_categories(plot_type):
# Test with different numbers of unique categories
categories = {f"cat_{i}": 5 for i in range(10)}
data = generate_cat_data_series(categories)
-
+
profile = generate_report(data)
profile.config.plot.cat_freq.max_unique = 5
profile.config.plot.cat_freq.type = plot_type
html_report = profile.to_html()
-
+
# Should not show plot when unique categories exceed max_unique
assert "Common Values (Plot)" not in html_report
@@ -95,14 +114,15 @@ def test_more_categories_than_colors():
# Test handling when there are more categories than defined colors
test_data = generate_cat_data_series({f"cat_{i}": 10 for i in range(5)})
custom_colors = ["gold", "blue", "coral"]
-
+
profile = generate_report(test_data)
profile.config.plot.cat_freq.colors = custom_colors
html_report = profile.to_html()
-
+
# Should still generate plot without errors
assert "Common Values (Plot)" in html_report
+
@pytest.mark.skip("Skipping empty color list test. Code needs to be updated.")
def test_empty_color_list():
# Test behavior with empty color list
@@ -110,26 +130,28 @@ def test_empty_color_list():
profile = generate_report(test_data)
profile.config.plot.cat_freq.colors = []
html_report = profile.to_html()
-
+
# Should use default colors
assert "Common Values (Plot)" in html_report
+
@pytest.mark.parametrize("invalid_type", ["scatter", "box", "invalid"])
def test_invalid_plot_types(invalid_type):
test_data = generate_cat_data_series({"A": 10, "B": 10})
-
+
with pytest.raises(ValueError):
profile = generate_report(test_data)
profile.config.plot.cat_freq.type = invalid_type
profile.to_html()
+
def test_config_persistence():
# Test that plot configuration persists after cache invalidation
test_data = generate_cat_data_series({"A": 10, "B": 10})
profile = generate_report(test_data)
profile.config.plot.cat_freq.type = "pie"
profile.config.plot.cat_freq.colors = ["gold", "blue"]
-
+
# Cache invalidation shouldn't affect config
profile.invalidate_cache()
html_report = profile.to_html()
diff --git a/tests/unit/test_time_series.py b/tests/unit/test_time_series.py
index e1ac3fd2b..be283f88d 100644
--- a/tests/unit/test_time_series.py
+++ b/tests/unit/test_time_series.py
@@ -33,15 +33,20 @@ def html_profile() -> str:
profile = ProfileReport(df, tsmode=True)
return profile.to_html()
+
@pytest.fixture
def sample_ts_df():
- dates = pd.date_range(start='2023-01-01', periods=100, freq='D')
- return pd.DataFrame({
- 'date': dates,
- 'value': np.sin(np.arange(100) * np.pi / 180) + np.random.normal(0, 0.1, 100),
- 'trend': np.arange(100) * 0.1,
- 'category': ['A', 'B'] * 50
- })
+ dates = pd.date_range(start="2023-01-01", periods=100, freq="D")
+ return pd.DataFrame(
+ {
+ "date": dates,
+ "value": np.sin(np.arange(100) * np.pi / 180)
+ + np.random.normal(0, 0.1, 100),
+ "trend": np.arange(100) * 0.1,
+ "category": ["A", "B"] * 50,
+ }
+ )
+
def test_timeseries_identification(html_profile: str):
assert "TimeSeries | " in html_profile, "TimeSeries not detected"
@@ -67,50 +72,52 @@ def test_timeseries_seasonality(html_profile: str):
def test_timeseries_with_sortby(sample_ts_df):
# Test time series with explicit sort column
- profile = ProfileReport(sample_ts_df, tsmode=True, sortby='date')
+ profile = ProfileReport(sample_ts_df, tsmode=True, sortby="date")
html = profile.to_html()
- assert 'date' in html
- assert profile.config.vars.timeseries.sortby == 'date'
+ assert "date" in html
+ assert profile.config.vars.timeseries.sortby == "date"
+
def test_timeseries_without_sortby(sample_ts_df):
# Test time series without explicit sort column
profile = ProfileReport(sample_ts_df, tsmode=True)
html = profile.to_html()
assert profile.config.vars.timeseries.sortby is None
- assert 'TimeSeries' in html
+ assert "TimeSeries" in html
+
def test_invalid_sortby(sample_ts_df):
# Test with non-existent sort column
with pytest.raises(KeyError):
- profile = ProfileReport(sample_ts_df, tsmode=True, sortby='nonexistent')
+ profile = ProfileReport(sample_ts_df, tsmode=True, sortby="nonexistent")
profile.to_html()
+
def test_timeseries_with_missing_values(sample_ts_df):
# Introduce missing values
df_with_missing = sample_ts_df.copy()
- df_with_missing.loc[10:20, 'value'] = np.nan
+ df_with_missing.loc[10:20, "value"] = np.nan
profile = ProfileReport(df_with_missing, tsmode=True)
html = profile.to_html()
- assert 'Missing values' in html
+ assert "Missing values" in html
+
def test_non_numeric_timeseries():
# Test handling of non-numeric time series
- dates = pd.date_range(start='2023-01-01', periods=100, freq='D')
- df = pd.DataFrame({
- 'date': dates,
- 'category': ['A', 'B', 'C'] * 33 + ['A']
- })
+ dates = pd.date_range(start="2023-01-01", periods=100, freq="D")
+ df = pd.DataFrame({"date": dates, "category": ["A", "B", "C"] * 33 + ["A"]})
profile = ProfileReport(df, tsmode=True)
html = profile.to_html()
# Should not identify categorical column as time series
assert html.count(">Autocorrelation<") == 0
+
def test_timeseries_config_persistence():
# Test that time series configuration persists
- df = pd.DataFrame({'value': range(100)})
+ df = pd.DataFrame({"value": range(100)})
profile = ProfileReport(df, tsmode=True)
assert profile.config.vars.timeseries.active is True
-
+
# Test config after invalidating cache
profile.invalidate_cache()
assert profile.config.vars.timeseries.active is True
From b31ff979651261fec36ea426c59e51979f1a5803 Mon Sep 17 00:00:00 2001
From: Fabiana <30911746+fabclmnt@users.noreply.github.com>
Date: Tue, 25 Mar 2025 16:42:28 -0700
Subject: [PATCH 4/6] chore: fix whitespaces
---
tests/unit/test_report_options.py | 1 -
tests/unit/test_time_series.py | 1 -
2 files changed, 2 deletions(-)
diff --git a/tests/unit/test_report_options.py b/tests/unit/test_report_options.py
index b0f4e0ee4..6e4a804f0 100644
--- a/tests/unit/test_report_options.py
+++ b/tests/unit/test_report_options.py
@@ -81,7 +81,6 @@ def test_max_unique_categories(plot_type):
# Test with different numbers of unique categories
categories = {f"cat_{i}": 5 for i in range(10)}
data = generate_cat_data_series(categories)
-
profile = generate_report(data)
profile.config.plot.cat_freq.max_unique = 5
profile.config.plot.cat_freq.type = plot_type
diff --git a/tests/unit/test_time_series.py b/tests/unit/test_time_series.py
index e1ac3fd2b..571e0619d 100644
--- a/tests/unit/test_time_series.py
+++ b/tests/unit/test_time_series.py
@@ -110,7 +110,6 @@ def test_timeseries_config_persistence():
df = pd.DataFrame({'value': range(100)})
profile = ProfileReport(df, tsmode=True)
assert profile.config.vars.timeseries.active is True
-
# Test config after invalidating cache
profile.invalidate_cache()
assert profile.config.vars.timeseries.active is True
From 2965fc5b97281c3d07987644be935c00582cfe69 Mon Sep 17 00:00:00 2001
From: Fabiana <30911746+fabclmnt@users.noreply.github.com>
Date: Tue, 25 Mar 2025 17:05:11 -0700
Subject: [PATCH 5/6] chore: test no longer valid
---
tests/issues/test_issue537.py | 4 +++-
1 file changed, 3 insertions(+), 1 deletion(-)
diff --git a/tests/issues/test_issue537.py b/tests/issues/test_issue537.py
index f0a2c9f0a..227394f9e 100644
--- a/tests/issues/test_issue537.py
+++ b/tests/issues/test_issue537.py
@@ -1,3 +1,5 @@
+import pytest
+
import concurrent.futures
from functools import partial
from gzip import decompress
@@ -25,7 +27,7 @@ def mock_multiprocess_1d(args, config, summarizer, typeset) -> Tuple[str, dict]:
column, series = args
return column, describe_1d(config, series, summarizer, typeset)
-
+@pytest.mark.skip("This test is no longer valid")
def test_multiprocessing_describe1d(config, summarizer, typeset):
"""
This test ensures that parallelized describe1d operations do not cause a ValueError due to
From 74d07e8a8bcfb7f5d84832d7a73655488fe14997 Mon Sep 17 00:00:00 2001
From: Azory YData Bot
Date: Wed, 26 Mar 2025 00:08:12 +0000
Subject: [PATCH 6/6] fix(linting): code formatting
---
tests/issues/test_issue537.py | 4 ++--
1 file changed, 2 insertions(+), 2 deletions(-)
diff --git a/tests/issues/test_issue537.py b/tests/issues/test_issue537.py
index 227394f9e..a62b4a513 100644
--- a/tests/issues/test_issue537.py
+++ b/tests/issues/test_issue537.py
@@ -1,5 +1,3 @@
-import pytest
-
import concurrent.futures
from functools import partial
from gzip import decompress
@@ -7,6 +5,7 @@
import numpy as np
import pandas as pd
+import pytest
import requests
from ydata_profiling.model.summary import describe_1d
@@ -27,6 +26,7 @@ def mock_multiprocess_1d(args, config, summarizer, typeset) -> Tuple[str, dict]:
column, series = args
return column, describe_1d(config, series, summarizer, typeset)
+
@pytest.mark.skip("This test is no longer valid")
def test_multiprocessing_describe1d(config, summarizer, typeset):
"""