---
# Default configuration.
#
# NOTE(review): the block structure below was reconstructed from a copy of
# this file whose line breaks and indentation had been lost; nesting follows
# the key order and the section comments. Confirm against the consumer's
# expected schema.

# Title of the document
title: ""

# Metadata about the dataset
dataset:
  description: ""
  creator: ""
  author: ""
  copyright_holder: ""
  copyright_year: ""
  url: ""

# Number of workers (0=multiprocessing.cpu_count())
pool_size: 0

# Show the progress bar
progress_bar: true

variables:
  descriptions: {}

# Per variable type description settings
vars:
  num:
    quantiles:
      - 0.05
      - 0.25
      - 0.5
      - 0.75
      - 0.95
    skewness_threshold: 20
    low_categorical_threshold: 5
    # Set to zero to disable
    chi_squared_threshold: 0.999
  cat:
    length: true
    unicode: false
    cardinality_threshold: 50
    n_obs: 5
    # Set to zero to disable
    chi_squared_threshold: 0.999
    coerce_str_to_date: false
    redact: false
  bool:
    n_obs: 3
  file:
    active: false
  image:
    active: false
    exif: true
    hash: true

# Sort the variables. Possible values: ascending, descending or None
# (leaves original sorting).
# The value is the *string* "None" (a plain `None` is not YAML null); it is
# quoted here only to make that explicit.
sort: "None"

# Which missing-value diagrams to show
missing_diagrams:
  bar: true
  matrix: true
  heatmap: true
  dendrogram: true

correlations:
  pearson:
    calculate: true
    warn_high_correlations: true
    threshold: 0.9
  spearman:
    calculate: true
    warn_high_correlations: false
  kendall:
    calculate: true
    warn_high_correlations: false
  phi_k:
    calculate: true
    warn_high_correlations: false
  cramers:
    calculate: true
    warn_high_correlations: true
    threshold: 0.9
  # Deprecated: do not use
  recoded:
    calculate: false
    warn_high_correlations: false
    threshold: 0.0

# Bivariate / Pairwise relations
interactions:
  targets: []
  continuous: true

# For categorical
categorical_maximum_correlation_distinct: 100

# Plot-specific settings
plot:
  # Image format (svg or png)
  image_format: "svg"
  dpi: 800

  scatter_threshold: 1000

  correlation:
    cmap: 'RdBu'
    bad: '#000000'

  missing:
    cmap: 'RdBu'
    # Force labels when there are > 50 variables
    # https://github.com/ResidentMario/missingno/issues/93#issuecomment-513322615
    force_labels: true

  pie:
    # Display a pie chart if the number of distinct values is smaller or
    # equal (set to 0 to disable)
    max_unique: 10

  histogram:
    x_axis_labels: true

    # Number of bins (set to 0 to automatically detect the bin size)
    bins: 50

    # Maximum number of bins (when bins=0)
    max_bins: 250

# The number of observations to show
n_obs_unique: 10
n_extreme_obs: 10
n_freq_table_max: 25

# Use `deep` flag for memory_usage
memory_deep: false

# Configuration related to the duplicates
duplicates:
  head: 10

# Configuration related to the samples area
samples:
  head: 10
  tail: 10

# Configuration related to the rejection of variables
reject_variables: true

# When in a Jupyter notebook
notebook:
  iframe:
    height: '800px'
    width: '100%'
    # or 'src'
    attribute: 'srcdoc'

html:
  # Minify the html
  minify_html: true

  # Offline support
  use_local_assets: true

  # If True, single file, else directory with assets
  inline: true

  # Show navbar
  navbar_show: true

  # For internal use. String "None", not YAML null (see `sort`-style values).
  file_name: "None"

  # Styling options for the HTML report
  style:
    # String "None", not YAML null.
    theme: "None"
    logo: ""
    primary_color: "#337ab7"
    full_width: false