11# Title of the document
2- title : " Pandas Profiling Report"
2+ title : YData Profiling Report
33
44# Metadata
55dataset :
@@ -27,93 +27,97 @@ progress_bar: true
2727
2828# Per variable type description settings
2929vars :
30- num :
31- quantiles :
32- - 0.05
33- - 0.25
34- - 0.5
35- - 0.75
36- - 0.95
37- skewness_threshold : 20
38- low_categorical_threshold : 5
39- # Set to zero to disable
40- chi_squared_threshold : 0.999
41- cat :
42- length : true
43- characters : true
44- words : true
45- cardinality_threshold : 50
46- n_obs : 5
47- # Set to zero to disable
48- chi_squared_threshold : 0.999
49- coerce_str_to_date : false
50- redact : false
51- histogram_largest : 50
52- stop_words : []
53- bool :
54- n_obs : 3
55- # string to boolean mapping dict
56- mappings :
57- t : true
58- f : false
59- yes : true
60- no : false
61- y : true
62- n : false
63- true : true
64- false : false
65- file :
66- active : false
67- image :
68- active : false
69- exif : true
70- hash : true
71- path :
72- active : false
73- url :
74- active : false
75- timeseries :
76- active : false
77- autocorrelation : 0.7
78- lags : [1, 7, 12, 24, 30]
79- significance : 0.05
80- pacf_acf_lag : 100
30+ num :
31+ quantiles :
32+ - 0.05
33+ - 0.25
34+ - 0.5
35+ - 0.75
36+ - 0.95
37+ skewness_threshold : 20
38+ low_categorical_threshold : 5
39+ # Set to zero to disable
40+ chi_squared_threshold : 0.999
41+ cat :
42+ length : true
43+ characters : true
44+ words : true
45+ cardinality_threshold : 50
46+ n_obs : 5
47+ # Set to zero to disable
48+ chi_squared_threshold : 0.999
49+ coerce_str_to_date : false
50+ redact : false
51+ histogram_largest : 50
52+ stop_words : []
53+ bool :
54+ n_obs : 3
55+ # string to boolean mapping dict
56+ mappings :
57+ t : true
58+ f : false
59+ yes : true
60+ no : false
61+ y : true
62+ n : false
63+ " true " : true
64+ " false " : false
65+ file :
66+ active : false
67+ image :
68+ active : false
69+ exif : true
70+ hash : true
71+ path :
72+ active : false
73+ url :
74+ active : false
75+ timeseries :
76+ active : false
77+ autocorrelation : 0.7
78+ lags :
79+ - 1
80+ - 7
81+ - 12
82+ - 24
83+ - 30
84+ significance : 0.05
85+ pacf_acf_lag : 100
8186
8287# Sort the variables. Possible values: "ascending", "descending" or null (leaves original sorting)
8388sort : null
8489
8590# which diagrams to show
8691missing_diagrams :
87- bar : true
88- matrix : true
89- heatmap : true
92+ bar : true
93+ matrix : true
94+ heatmap : true
9095
9196correlations :
92- pearson :
93- calculate : false
94- warn_high_correlations : true
95- threshold : 0.9
96- spearman :
97- calculate : false
98- warn_high_correlations : false
99- threshold : 0.9
100- kendall :
101- calculate : false
102- warn_high_correlations : false
103- threshold : 0.9
104- phi_k :
105- calculate : false
106- warn_high_correlations : false
107- threshold : 0.9
108- cramers :
109- calculate : false
110- warn_high_correlations : true
111- threshold : 0.9
112- auto :
113- calculate : true
114- warn_high_correlations : true
115- threshold : 0.9
116-
97+ pearson :
98+ calculate : false
99+ warn_high_correlations : true
100+ threshold : 0.9
101+ spearman :
102+ calculate : false
103+ warn_high_correlations : false
104+ threshold : 0.9
105+ kendall :
106+ calculate : false
107+ warn_high_correlations : false
108+ threshold : 0.9
109+ phi_k :
110+ calculate : false
111+ warn_high_correlations : false
112+ threshold : 0.9
113+ cramers :
114+ calculate : false
115+ warn_high_correlations : true
116+ threshold : 0.9
117+ auto :
118+ calculate : true
119+ warn_high_correlations : true
120+ threshold : 0.9
117121
118122# Bivariate / Pairwise relations
119123interactions :
@@ -128,38 +132,38 @@ report:
128132
129133# Plot-specific settings
130134plot :
131- # Image format (svg or png)
132- image_format : " svg"
133- dpi : 800
135+ # Image format (svg or png)
136+ image_format : svg
137+ dpi : 800
134138
135- scatter_threshold : 1000
139+ scatter_threshold : 1000
136140
137- correlation :
138- cmap : ' RdBu'
139- bad : ' #000000'
141+ correlation :
142+ cmap : RdBu
143+ bad : " #000000"
140144
141- missing :
142- cmap : ' RdBu'
143- # Force labels when there are > 50 variables
144- # https://github.com/ResidentMario/missingno/issues/93#issuecomment-513322615
145- force_labels : true
145+ missing :
146+ cmap : RdBu
147+ # Force labels when there are > 50 variables
148+ # https://github.com/ResidentMario/missingno/issues/93#issuecomment-513322615
149+ force_labels : true
146150
147- cat_frequency :
148- show : true # if false, the category frequency plot is turned off
149- type : ' bar' # options: 'bar', 'pie'
150- max_unique : 10
151- colors : null # use null for default or give a list of matplotlib recognised strings
151+ cat_frequency :
152+ show : true # if false, the category frequency plot is turned off
153+ type : bar # options: 'bar', 'pie'
154+ max_unique : 10
155+ colors : null # use null for default or give a list of matplotlib recognized strings
152156
153- histogram :
154- x_axis_labels : true
157+ histogram :
158+ x_axis_labels : true
155159
156- # Number of bins (set to 0 to automatically detect the bin size)
157- bins : 50
160+ # Number of bins (set to 0 to automatically detect the bin size)
161+ bins : 50
158162
159- # Maximum number of bins (when bins=0)
160- max_bins : 250
163+ # Maximum number of bins (when bins=0)
164+ max_bins : 250
161165
162- font_path : null
166+ font_path : null
163167
164168# The number of observations to show
165169n_obs_unique : 5
@@ -171,49 +175,49 @@ memory_deep: false
171175
172176# Configuration related to the duplicates
173177duplicates :
174- head : 10
175- key : " # duplicates"
178+ head : 10
179+ key : " # duplicates"
176180
177181# Configuration related to the samples area
178182samples :
179- head : 10
180- tail : 10
181- random : 0
183+ head : 10
184+ tail : 10
185+ random : 0
182186
183187# Configuration related to the rejection of variables
184188reject_variables : true
185189
186190# When in a Jupyter notebook
187191notebook :
188- iframe :
189- height : ' 800px'
190- width : ' 100%'
191- # or 'src'
192- attribute : ' srcdoc'
192+ iframe :
193+ height : 800px
194+ width : 100%
195+ # or 'src'
196+ attribute : srcdoc
193197
194198html :
195- # Minify the html
196- minify_html : true
199+ # Minify the html
200+ minify_html : true
197201
198- # Offline support
199- use_local_assets : true
202+ # Offline support
203+ use_local_assets : true
200204
201- # If true, single file, else directory with assets
202- inline : true
205+ # If true, single file, else directory with assets
206+ inline : true
203207
204- # Show navbar
205- navbar_show : true
208+ # Show navbar
209+ navbar_show : true
206210
207- # Assets prefix if inline = true
208- assets_prefix : null
211+ # Assets prefix if inline = true
212+ assets_prefix : null
209213
210- # Styling options for the HTML report
211- style :
212- theme : null
213- logo : " "
214- primary_colors :
215- - " #377eb8 "
216- - " #e41a1c "
217- - " #4daf4a "
214+ # Styling options for the HTML report
215+ style :
216+ theme : null
217+ logo : " "
218+ primary_colors :
219+ - " #0d6efd "
220+ - " #dc3545 "
221+ - " #198754 "
218222
219- full_width : false
223+ full_width : false
0 commit comments