Implements probabilistic decoupling for U-statistics using independent copies of the input sequences.
Examples
# Build a reproducible toy data set: five random DNA sequences of 20 bases each.
# The seed is fixed so the draws (and the printed output below) are repeatable.
set.seed(123)
bases <- c("A", "C", "G", "T")
sequences <- replicate(
  5,
  sample(bases, size = 20, replace = TRUE),
  simplify = FALSE
)
# Wrap the Hamming distance function as a labelled kernel, then run the
# decoupling procedure with B = 100
kernel <- create_kernel(hamming_distance_kernel, "Hamming Distance")
result <- decouple_u_stat(sequences, kernel, B = 100)
# Auto-print the returned object to display its summary
result
#> DecoupleResult object:
#> Original U-statistic: 15.4000
#> Decoupled mean: 12.0850
#> Decoupled SD: 1.8846
#> Kernel: Hamming Distance
#> Method: Friedman-de la Pena Decoupling
#> P-value: 0.0786
#> Z-score: 1.7590
#> Significance: (p = 0.0786)