Total variation distance similarity score per categorical column
Source: R/quality_metrics.R
tvd_similarity.Rd
Total variation distance similarity score per categorical column
Examples
# \donttest{
syn <- gaussian_copula_synthesizer(metadata(adult_income)) |> fit(adult_income)
synth <- sample(syn, n = 500)
tvd_similarity(adult_income, synth, metadata(adult_income))
#> # A tibble: 9 × 2
#> column score
#> <chr> <dbl>
#> 1 workclass 0.975
#> 2 education 0.958
#> 3 marital_status 0.98
#> 4 occupation 0.936
#> 5 relationship 0.948
#> 6 race 0.99
#> 7 sex 0.998
#> 8 native_country 0.971
#> 9 income 0.99
# }