gibasaの速さについて (1/2)
# Tokenize elements 5..800 of `audubon::polano` with RMeCab, one document at a
# time, and row-bind the per-document results into a single data frame with
# the columns `doc_id`, `POS1` and `token`.
#
# `doc_id` is whatever `purrr::imap_dfr()` passes as its second argument for
# each element (its name, or its position when the input is unnamed).
rmecab <- function() {
  docs <- audubon::polano[5:800]
  purrr::imap_dfr(docs, function(text, id) {
    # Flatten the RMeCabC() result into one named vector; enframe() then puts
    # the names into `POS1` and the values into `token`.
    tagged <- unlist(RMeCab::RMeCabC(text))
    data.frame(
      doc_id = id,
      tibble::enframe(tagged, "POS1", "token")
    )
  })
}
# Tokenize elements 5..800 of `audubon::polano` with
# `RcppMeCab::posParallel(join = FALSE)`, then turn each per-document named
# vector into a data frame (`doc_id`, `token`, `POS1`) and row-bind them.
#
# `token` takes the vector's values and `POS1` its names; `doc_id` is the
# second argument supplied by `purrr::imap_dfr()` for each element.
rcppmecab1 <- function() {
  tagged <- RcppMeCab::posParallel(audubon::polano[5:800], join = FALSE)
  purrr::imap_dfr(tagged, function(morphs, id) {
    data.frame(
      doc_id = id,
      token = unname(morphs),
      POS1 = names(morphs)
    )
  })
}
# Tokenize elements 5..800 of `audubon::polano` with RcppMeCab, letting
# `posParallel()` build the result itself via `format = "data.frame"`.
rcppmecab2 <- function() {
  docs <- audubon::polano[5:800]
  RcppMeCab::posParallel(docs, format = "data.frame")
}
# Tokenize elements 5..800 of `audubon::polano` with gibasa and pass the
# result to `gibasa::prettify()`, requesting only the "POS1" column through
# `col_select`.
gibasa <- function() {
  tokens <- gibasa::gbs_tokenize(audubon::polano[5:800])
  gibasa::prettify(tokens, col_select = "POS1")
}