Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
0 parents
commit 4823331
Showing
46 changed files
with
5,422 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,25 @@ | ||
Package: multilink | ||
Title: Multifile Record Linkage and Duplicate Detection | ||
Version: 0.1.0 | ||
Authors@R: | ||
person(given = "Serge", | ||
family = "Aleshin-Guendel", | ||
role = c("aut", "cre"), | ||
email = "saleshinguendel@gmail.com") | ||
Description: Implementation of the methodology of Aleshin-Guendel & Sadinle (2022) <doi:10.1080/01621459.2021.2013242>. It handles the general problem of multifile record linkage and duplicate detection, where any number of files are to be linked, and any of the files may have duplicates. | ||
Depends: R (>= 3.5.0) | ||
License: GPL-3 | ||
Encoding: UTF-8 | ||
LazyData: true | ||
RoxygenNote: 7.1.2 | ||
URL: https://github.com/aleshing/multilink | ||
BugReports: https://github.com/aleshing/multilink/issues | ||
Imports: igraph, RecordLinkage, Rcpp, utils, mcclust, geosphere, | ||
stringr | ||
LinkingTo: Rcpp, RcppArmadillo | ||
NeedsCompilation: yes | ||
Packaged: 2023-01-20 18:23:16 UTC; sergealeshin-guendel | ||
Author: Serge Aleshin-Guendel [aut, cre] | ||
Maintainer: Serge Aleshin-Guendel <saleshinguendel@gmail.com> | ||
Repository: CRAN | ||
Date/Publication: 2023-01-23 09:20:02 UTC |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,45 @@ | ||
082fd32a4a4f99e7a7de2a0f303a4945 *DESCRIPTION | ||
167a4a71836c058ae3b32276c19a9b16 *NAMESPACE | ||
bf74c10eb64ee4419c0b108246b985cf *NEWS.md | ||
40cea04bfdd247602a4c9acddd71615d *R/RcppExports.R | ||
be0f77776c60e5196be45a4e3c986bb3 *R/create_comparison_data.R | ||
dc2de3e57b157774a0205e02371b137b *R/dup_data.R | ||
75213b21f0d7da630fccfce3928e95b0 *R/dup_data_small.R | ||
5e62f366fa2ed21bc8caf02d4e849770 *R/find_bayes_estimate.R | ||
75fa938d0923fd50df50eb293adc19c7 *R/gibbs_sampler.R | ||
cc7489616d255bc710cf0a7b5a01ba8e *R/initialize_partition.R | ||
82a173cafb14bfd13365f55ecf243701 *R/multilink-package.R | ||
6f35bedbca8bb45fc6e30885daac65c8 *R/no_dup_data.R | ||
fbd58f87f73849dcdbca07a548a8c409 *R/no_dup_data_small.R | ||
098c423aacd1842a79b098313c5bbeeb *R/reduce_comparison_data.R | ||
2cabf21e735054d3924f60001a0fb59c *R/relabel_bayes_estimate.R | ||
598752bd6f47863066c05bd48d9b7a03 *R/specify_prior.R | ||
64fe2a41861b6948c25a3ea5e40250d7 *README.md | ||
f8f34c698a71fc622589928c3deb09c0 *build/partial.rdb | ||
c8a4743b32c54e75a7a390256ac9a972 *data/dup_data.RData | ||
e27525ecbce3a850ae71f10ac6f45198 *data/dup_data_small.RData | ||
3320fdaf5f3eb3b3a5c0853db0c9f57c *data/no_dup_data.RData | ||
bc4c9ed78886ef847f5b5d4f0b2fc8bf *data/no_dup_data_small.RData | ||
00bb927cb2bf9bfca69c1fa9f241f032 *man/create_comparison_data.Rd | ||
5643e350c1f1a7ca1c9cb24aafd72f2c *man/dup_data.Rd | ||
3c875d40e31a4dc076e29a65d636309e *man/dup_data_small.Rd | ||
0fc71e92ce87782c62ffe7f2daa86c70 *man/find_bayes_estimate.Rd | ||
e04a0891ae859d6b2535f0767cdef926 *man/gibbs_sampler.Rd | ||
83441cfbeebeedbb37491dc51203f098 *man/initialize_partition.Rd | ||
5179159a7e4ea07e073704739a29e165 *man/multilink.Rd | ||
189cabd54c8a66b75f5e4981d3dd9a34 *man/no_dup_data.Rd | ||
7b51a40eb8381527d6ee0a3533f900e8 *man/no_dup_data_small.Rd | ||
b0eee4a899b36e6cb2139192aec636eb *man/reduce_comparison_data.Rd | ||
af431f87cd1553311c433c8b4c2813c8 *man/relabel_bayes_estimate.Rd | ||
542513337dae28a0074a467be872a6f2 *man/specify_prior.Rd | ||
e4a9a47c4a3aca98677ab8b16336e5de *src/Makevars | ||
e4a9a47c4a3aca98677ab8b16336e5de *src/Makevars.win | ||
de5455bc8a796f53e69b319cfec59ff4 *src/RcppExports.cpp | ||
bc6edea1f09b1943ceff6ec6c5ecd2bc *src/compute_log_like.cpp | ||
456bae76305e37084395039d75612971 *src/compute_log_like.h | ||
868162b41961aeab8c0de27bd9046750 *src/get_posterior_loss.cpp | ||
1df156c84997736b49e25da079f39176 *src/gibbs_loop.cpp | ||
abae8708a694058f28964f3b00f433ea *src/sample_Z.cpp | ||
d44e33514e9b227cdbf835f0a56e5da6 *src/sample_Z.h | ||
223d60586964bc0d2511b492bd756697 *src/sample_phi.cpp | ||
eec9f8e14b05130bc67b21542cd6dc30 *src/sample_phi.h |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,11 @@ | ||
# Generated by roxygen2: do not edit by hand | ||
|
||
# Functions exported from the package namespace. | ||
export(create_comparison_data) | ||
export(find_bayes_estimate) | ||
export(gibbs_sampler) | ||
export(initialize_partition) | ||
export(reduce_comparison_data) | ||
export(relabel_bayes_estimate) | ||
export(specify_prior) | ||
# Import `sourceCpp` from Rcpp into this package's namespace. | ||
importFrom(Rcpp,sourceCpp) | ||
# Load the package's compiled shared library; `.registration = TRUE` makes the | ||
# natively registered routines available to the `.Call()` wrappers. | ||
useDynLib(multilink, .registration = TRUE) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,3 @@ | ||
# multilink 0.1.0 | ||
|
||
* Updated package for submission to CRAN. |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,15 @@ | ||
# Generated by using Rcpp::compileAttributes() -> do not edit by hand | ||
# Generator token: 10BE3573-1514-4C36-9D1C-5A225CD40393 | ||
|
||
# R-level wrapper around the native routine | ||
# `_multilink_get_posterior_loss_allcpp`. | ||
# Forwards TT, r, partitions, L_FNM, L_FM1 and L_FM2 to `.Call()` unchanged | ||
# and in the same order, and returns whatever the native routine returns. | ||
# This file is generated by Rcpp::compileAttributes(); hand edits are | ||
# overwritten on regeneration. | ||
# NOTE(review): argument meanings (e.g. the L_* values being loss weights) | ||
# are not visible here -- confirm against the C++ source. | ||
get_posterior_loss_allcpp <- function(TT, r, partitions, L_FNM, L_FM1, L_FM2) { | ||
.Call(`_multilink_get_posterior_loss_allcpp`, TT, r, partitions, L_FNM, L_FM1, L_FM2) | ||
} | ||
|
||
# R-level wrapper around the native routine | ||
# `_multilink_get_posterior_loss_abstain_cpp`. | ||
# Takes the same six leading arguments as get_posterior_loss_allcpp plus | ||
# L_A and power, and forwards all eight to `.Call()` unchanged and in order; | ||
# returns whatever the native routine returns. | ||
# This file is generated by Rcpp::compileAttributes(); hand edits are | ||
# overwritten on regeneration. | ||
# NOTE(review): presumably L_A relates to an "abstain" option, judging by the | ||
# function name -- confirm against the C++ source. | ||
get_posterior_loss_abstain_cpp <- function(TT, r, partitions, L_FNM, L_FM1, L_FM2, L_A, power) { | ||
.Call(`_multilink_get_posterior_loss_abstain_cpp`, TT, r, partitions, L_FNM, L_FM1, L_FM2, L_A, power) | ||
} | ||
|
||
# R-level wrapper around the native routine `_multilink_gibbs_loop_rcpp`. | ||
# Every argument is forwarded to `.Call()` positionally, unchanged and in the | ||
# same order as the R signature, so the order here must stay in sync with the | ||
# native routine's parameter list. Returns whatever the native routine returns. | ||
# This file is generated by Rcpp::compileAttributes(); hand edits are | ||
# overwritten on regeneration. | ||
# NOTE(review): the types and shapes of the individual arguments are not | ||
# visible in this wrapper -- confirm against the C++ source before relying on | ||
# any of them. | ||
gibbs_loop_rcpp <- function(n_iter, Z_samp, clust_sizes_samp, cont_samp, m_samp, u_samp, mus, nus, alphas, alpha_0, dup_upper_bound, dup_count_prior, n_prior, cont, clust_sizes, n, ab, obs_mat, record_pairs, flat, r, r_1, valid_rp, singleton_ind, rp_ind, file_labels, powers, L, num_fp, num_rp, num_field, rp_to_fp, level_cum, no_dups, valid_fp, cc, Z_members, clust_sizes_collapsed, indexing_used, single_likelihood, single_nus, single_ab, num_chap_iter, chap_type, file_size_cum, valid_fp_matrix, fp_probs, comparison_rps, comparison_rps_length, extra_gibbs, num_restrict, comparisons_chap, comparison_rps_probs, verbose) { | ||
.Call(`_multilink_gibbs_loop_rcpp`, n_iter, Z_samp, clust_sizes_samp, cont_samp, m_samp, u_samp, mus, nus, alphas, alpha_0, dup_upper_bound, dup_count_prior, n_prior, cont, clust_sizes, n, ab, obs_mat, record_pairs, flat, r, r_1, valid_rp, singleton_ind, rp_ind, file_labels, powers, L, num_fp, num_rp, num_field, rp_to_fp, level_cum, no_dups, valid_fp, cc, Z_members, clust_sizes_collapsed, indexing_used, single_likelihood, single_nus, single_ab, num_chap_iter, chap_type, file_size_cum, valid_fp_matrix, fp_probs, comparison_rps, comparison_rps_length, extra_gibbs, num_restrict, comparisons_chap, comparison_rps_probs, verbose) | ||
} |
|
Oops, something went wrong.