sub_criteria(
...,
match_funcs = c(exact = diyar::exact_match),
equal_funcs = c(exact = diyar::exact_match),
operator = "or"
)
attrs(..., .obj = NULL)
eval_sub_criteria(x, ...)
# S3 method for sub_criteria
print(x, ...)
# S3 method for sub_criteria
format(x, show_levels = FALSE, ...)
# S3 method for sub_criteria
eval_sub_criteria(
x,
x_pos = seq_len(max(attr_eval(x))),
y_pos = rep(1L, length(x_pos)),
check_duplicates = TRUE,
depth = 0,
...
)
[atomic]
Attributes passed to sub_criteria()
or attrs().
Arguments passed to methods for eval_sub_criteria()
[function]
. User defined logical test for matches.
[function]
. User defined logical test for identical record sets (all attributes of the same record).
[character]
. Options are "and"
or "or"
.
[data.frame|list]
. Attributes.
[sub_criteria]
. A sub_criteria object (the attributes and tests to print, format or evaluate).
[logical]
. If TRUE
, show recursive depth for each logic statement of the match criteria.
[integer]
. Index of one half of a record pair.
[integer]
. Index of the other half of a record pair.
[logical]
. If FALSE
, does not check duplicate values. The result of the initial check will be recycled.
[integer]
. First order of recursion.
sub_criteria
sub_criteria()
- Create a match criteria as a sub_criteria
object.
A sub_criteria
object contains attributes to be compared,
logical tests for the comparisons (see predefined_tests
for examples) and
another set of logical tests to determine identical records.
attrs()
- Create a d_attribute
object - a collection of atomic objects that can be passed to sub_criteria()
as a single attribute.
eval_sub_criteria()
- Evaluates a sub_criteria
object.
At each iteration of links
or episodes
, record-pairs are created from each attribute of a sub_criteria
object.
eval_sub_criteria()
evaluates each record-pair using the match_funcs
and equal_funcs
functions of a sub_criteria
object.
See predefined_tests
for examples of match_funcs
and equal_funcs
.
User-defined functions are also permitted as match_funcs
and equal_funcs
.
Each such function must meet three requirements:
It must be able to compare the attributes.
It must have two arguments named `x`
and `y`
, where `y`
is the value for one observation being compared against all other observations (`x`
).
It must return a logical
object i.e. TRUE
or FALSE
.
attrs()
is useful when the match criteria requires an interaction between multiple attributes. For example, attribute 1 + attribute 2 > attribute 3.
Every attribute, including those in attrs()
, must have the same length or a length of 1.
predefined_tests
; links
; episodes
; eval_sub_criteria
# Attributes
# Two example attributes of equal length (7 records): one numeric, one character.
attr_1 <- c(30, 28, 40, 25, 25, 29, 27)
attr_2 <- c("M", "F", "U", "M", "F", "U", "M")
# A match criteria
## Example 1 - A maximum difference of 10 in attribute 1
# NOTE(review): in the evaluation output below, 40 is reported as a non-match
# for 30 although they differ by exactly 10 - `range_match()` may be
# one-directional or exclusive at the boundary; confirm against `predefined_tests`.
s_cri1 <- sub_criteria(attr_1, match_funcs = range_match)
# Printing the object shows the leading attribute values given to the match function.
s_cri1
#> {
#> match_func(30,28,40 ...)
#> }
# Evaluate the match criteria
## Compare the first element of 'attr_1' against all other elements
# No `x_pos`/`y_pos` supplied, so the defaults apply: `y_pos` is all 1, i.e.
# every record is paired with record 1.
eval_sub_criteria(s_cri1)
#> $logical_test
#> [1] 1 1 0 1 1 1 1
#>
## Compare the second element of 'attr_1' against all other elements
# `x_pos` indexes every record; `y_pos` repeats the index of the single record
# (here the second) that each of them is paired with.
x_pos_val <- seq_len(max(attr_eval(s_cri1)))
# Use an integer literal (`2L`): `y_pos` is documented as [integer] and its
# default is `rep(1L, length(x_pos))`.
eval_sub_criteria(
  s_cri1,
  x_pos = x_pos_val,
  y_pos = rep(2L, length(x_pos_val))
)
#> $logical_test
#> [1] 0 1 0 1 1 0 1
#>
## Example 2 - `s_cri1` AND an exact match on attribute 2
# A sub_criteria can itself be passed as an attribute of another sub_criteria.
# Here `s_cri1` and a new exact-match criteria on `attr_2` are nested and
# combined with `operator = "and"`.
s_cri2 <- sub_criteria(
s_cri1,
sub_criteria(attr_2, match_funcs = exact_match),
operator = "and")
# The printed form shows one `{ }` group per nested sub_criteria, joined by AND.
s_cri2
#> {
#> {
#> match_func(30,28,40 ...)
#> } AND
#> {
#> match_func(M,F,U ...)
#> }
#> }
## Example 3 - `s_cri1` OR an exact match on attribute 2
# Same nested structure as Example 2, but the two nested sub_criteria are
# combined with `operator = "or"`.
s_cri3 <- sub_criteria(
s_cri1,
sub_criteria(attr_2, match_funcs = exact_match),
operator = "or")
# The printed form shows one `{ }` group per nested sub_criteria, joined by OR.
s_cri3
#> {
#> {
#> match_func(30,28,40 ...)
#> } OR
#> {
#> match_func(M,F,U ...)
#> }
#> }
# Evaluate the match criteria
# Both calls rely on the default `x_pos`/`y_pos`, so every record is paired
# with record 1.
# "and" version: 1 only where both nested tests pass.
eval_sub_criteria(s_cri2)
#> $logical_test
#> [1] 1 0 0 1 0 0 1
#>
# "or" version: 1 where at least one nested test passes.
eval_sub_criteria(s_cri3)
#> $logical_test
#> [1] 1 1 0 1 1 1 1
#>
# Alternatively, using `attrs()`
# Custom match function: TRUE where the `a1` elements pass `range_match()`
# and the `a2` elements are equal. `x` and `y` are accessed by element name
# (`$a1`, `$a2`) and the result is an element-wise logical vector.
AND_func <- function(x, y) {
  a1_in_range <- range_match(x$a1, y$a1)
  a2_equal <- x$a2 == y$a2
  a1_in_range & a2_equal
}
# Custom match function: TRUE where the `a1` elements pass `range_match()`
# or the `a2` elements are equal (or both). `x` and `y` are accessed by element
# name (`$a1`, `$a2`) and the result is an element-wise logical vector.
OR_func <- function(x, y) {
  a1_in_range <- range_match(x$a1, y$a1)
  a2_equal <- x$a2 == y$a2
  a1_in_range | a2_equal
}
## Create a match criteria
# Both attributes are bundled into a single `attrs()` object (named `a1` and
# `a2`), so one user-defined function can test them together via `x$a1`, `x$a2`.
s_cri2b <- sub_criteria(attrs(.obj = list(a1 = attr_1, a2 = attr_2)),
match_funcs = AND_func)
s_cri3b <- sub_criteria(attrs(.obj = list(a1 = attr_1, a2 = attr_2)),
match_funcs = OR_func)
# Evaluate the match criteria
# The results below are the same as those shown for `s_cri2` and `s_cri3`.
eval_sub_criteria(s_cri2b)
#> $logical_test
#> [1] 1 0 0 1 0 0 1
#>
eval_sub_criteria(s_cri3b)
#> $logical_test
#> [1] 1 1 0 1 1 1 1
#>