2024-04-14 21:30:16 +00:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#' Ping peer nodes for latency measurement
|
|
|
|
|
#'
|
|
|
|
|
#' @param bitmonero.dir .bitmonero directory where the monero.log file is.
|
|
|
|
|
#' @param output.file Name of the output file. The file will be created in `bitmonero.dir`.
|
|
|
|
|
#' @param sleep Number of seconds to sleep between each round of collecting new peer IPs.
|
|
|
|
|
#' @param ping.count Number of times to ping each peer.
|
2024-04-15 16:31:20 +00:00
|
|
|
|
#' @param threads Override default number of threads for sending pings.
|
2024-04-14 21:30:16 +00:00
|
|
|
|
#'
|
|
|
|
|
#' @return No return value. Executes in a loop until interrupted.
|
|
|
|
|
#' @export
|
|
|
|
|
#'
|
|
|
|
|
#' @examples
|
2024-04-15 12:46:16 +00:00
|
|
|
|
#' \dontrun{
|
2024-04-14 21:30:16 +00:00
|
|
|
|
#' ping.peers()
|
2024-04-15 12:46:16 +00:00
|
|
|
|
#' }
|
2024-04-15 23:14:12 +00:00
|
|
|
|
ping.peers <- function(bitmonero.dir = "~/.bitmonero", output.file = "monero_peer_pings.csv", sleep = 10, ping.count = 5, threads = NULL) {
|
2024-04-14 21:30:16 +00:00
|
|
|
|
|
2024-04-17 12:44:32 +00:00
|
|
|
|
Sys.setenv(VROOM_CONNECTION_SIZE = formatC(131072 * 100, format = "fg"))
|
|
|
|
|
# Fixes occasional issues with https://github.com/tidyverse/vroom/issues/364
|
|
|
|
|
# formatC() is used since VROOM_CONNECTION_SIZE cannot interpret scientific notation
|
|
|
|
|
|
2024-04-14 21:30:16 +00:00
|
|
|
|
bitmonero.dir <- path.expand(bitmonero.dir)
|
|
|
|
|
bitmonero.dir <- gsub("/+$", "", bitmonero.dir)
|
|
|
|
|
# Remove trailing slash(es) if they exist
|
|
|
|
|
|
2024-04-15 23:14:12 +00:00
|
|
|
|
output.file <- paste0(bitmonero.dir, "/", output.file)
|
2024-04-14 21:30:16 +00:00
|
|
|
|
|
2024-04-15 23:14:12 +00:00
|
|
|
|
files.in.dir <- list.files(bitmonero.dir)
|
|
|
|
|
log.file.name <- files.in.dir[grepl("(^bitmonero[.]log$)|(^monero[.]log$)", files.in.dir, ignore.case = TRUE)]
|
|
|
|
|
if (length(log.file.name) == 0) {
|
|
|
|
|
stop("Cannot find log file in bitmonero.dir")
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (length(log.file.name) > 1) {
|
|
|
|
|
stop("Files named 'bitmonero.log' _and_ 'monero.log' exist in bitmonero.dir")
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
log.file <- paste0(bitmonero.dir, "/", log.file.name)
|
2024-04-14 21:30:16 +00:00
|
|
|
|
|
|
|
|
|
first.file.line <- readr::read_lines(log.file, n_max = 1)
|
|
|
|
|
# Get the first file line so we know when the log file rolls over
|
|
|
|
|
# to the next file.
|
|
|
|
|
# Better to do this than file.info() because file.info() is OS-dependent:
|
|
|
|
|
# > What is meant by the three file times depends on the OS and file system.
|
|
|
|
|
# > On Windows native file systems ctime is the file creation time
|
|
|
|
|
# > (something which is not recorded on most Unix-alike file systems).
|
|
|
|
|
# > What is meant by ‘file access’ and hence the ‘last access time’ is system-dependent.
|
|
|
|
|
|
2024-04-15 16:31:20 +00:00
|
|
|
|
while (length(first.file.line) == 0) {
|
|
|
|
|
Sys.sleep(sleep)
|
|
|
|
|
first.file.line <- readr::read_lines(log.file, n_max = 1)
|
|
|
|
|
# If the log file is empty, sleep until it has at least one line.
|
|
|
|
|
}
|
2024-04-14 21:30:16 +00:00
|
|
|
|
|
|
|
|
|
lines.already.read <- 0
|
|
|
|
|
|
|
|
|
|
while (TRUE) {
|
|
|
|
|
|
|
|
|
|
check.first.file.line <- readr::read_lines(log.file, n_max = 1)
|
|
|
|
|
|
2024-04-15 16:31:20 +00:00
|
|
|
|
if (length(check.first.file.line) == 0) {
|
|
|
|
|
lines.already.read <- 0
|
|
|
|
|
Sys.sleep(sleep)
|
|
|
|
|
next
|
|
|
|
|
# If the log file is empty, sleep until it has at least one line.
|
|
|
|
|
}
|
|
|
|
|
|
2024-04-14 21:30:16 +00:00
|
|
|
|
if (first.file.line != check.first.file.line) {
|
|
|
|
|
first.file.line <- check.first.file.line
|
|
|
|
|
lines.already.read <- 0
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (file.exists(output.file)) {
|
|
|
|
|
old.ping.data <- read.csv(output.file, header = FALSE)
|
|
|
|
|
old.ip.ports <- paste0(old.ping.data[, 1], ":", old.ping.data[, 2])
|
|
|
|
|
} else {
|
|
|
|
|
old.ip.ports <- ""
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
tail.file <- readr::read_lines(log.file, skip = lines.already.read)
|
|
|
|
|
|
2024-04-15 12:46:16 +00:00
|
|
|
|
n.lines.file <- length(tail.file) + lines.already.read
|
|
|
|
|
|
2024-04-14 21:30:16 +00:00
|
|
|
|
ip.lines <- grep("Received NOTIFY_NEW_TRANSACTIONS", tail.file, fixed = TRUE)
|
|
|
|
|
|
|
|
|
|
if (length(ip.lines) == 0) {
|
2024-04-15 12:46:16 +00:00
|
|
|
|
Sys.sleep(sleep)
|
2024-04-14 21:30:16 +00:00
|
|
|
|
cat(base::date(), " Peers pinged: 0\n", sep = "")
|
|
|
|
|
next
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
get.peer.ip.port.direction <- function(x) {
|
2024-04-16 20:13:14 +00:00
|
|
|
|
x <- stringr::str_extract(x,
|
|
|
|
|
"\t\\[+([^\\[\\]]+)\\]*:([0-9]+) ([INCOUT]{3})\\] Received NOTIFY_NEW_TRANSACTIONS",
|
|
|
|
|
group = c(1, 2, 3))
|
|
|
|
|
if (!is.matrix(x)) {
|
|
|
|
|
x <- matrix(x, ncol = 3, byrow = TRUE)
|
|
|
|
|
# stringr::str_extract() creates an atomic vector instaed of a matrix
|
|
|
|
|
# if the x has only one element
|
|
|
|
|
}
|
|
|
|
|
x <- as.data.frame(x)
|
2024-04-14 21:30:16 +00:00
|
|
|
|
colnames(x) <- c("ip", "port", "direction")
|
|
|
|
|
x
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
peers <- get.peer.ip.port.direction(tail.file[ip.lines])
|
|
|
|
|
peers <- unique(peers)
|
2024-04-16 20:13:14 +00:00
|
|
|
|
missed.parsing <- (! complete.cases(peers))
|
|
|
|
|
if (any(missed.parsing)) {
|
|
|
|
|
cat("Unable to parse ", sum(missed.parsing), " IPs of peers\n", sep = "")
|
|
|
|
|
}
|
|
|
|
|
peers <- peers[! missed.parsing, , drop = FALSE] # Drops any NAs in case the parsing doesn't work
|
2024-04-14 21:30:16 +00:00
|
|
|
|
peers <- peers[! paste0(peers$ip, ":", peers$port) %in% old.ip.ports, , drop = FALSE]
|
|
|
|
|
|
|
|
|
|
if (nrow(peers) == 0) {
|
2024-04-15 12:46:16 +00:00
|
|
|
|
Sys.sleep(sleep)
|
2024-04-14 21:30:16 +00:00
|
|
|
|
cat(base::date(), " Peers pinged: 0\n", sep = "")
|
|
|
|
|
next
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
get.ping.data <- function(x) {
|
|
|
|
|
ip <- x[[1]]
|
2024-04-16 20:13:14 +00:00
|
|
|
|
ip.type <- IP::ip(ip)@.Data
|
|
|
|
|
|
|
|
|
|
if (is.na(ip.type) || (! ip.type %in% c(4, 6))) {
|
|
|
|
|
cat("Could not determine ipv4/ipv6 type of peer\n")
|
|
|
|
|
return(paste("UNPARSEABLE", "UNPARSEABLE", "UNPARSEABLE",
|
|
|
|
|
paste(rep(NA, ping.count), collapse = ","), sep = ","))
|
|
|
|
|
}
|
|
|
|
|
|
2024-04-14 21:30:16 +00:00
|
|
|
|
port <- x[[2]]
|
|
|
|
|
direction <- x[[3]]
|
|
|
|
|
if (paste0(ip, ":", port) %in% old.ip.ports) {
|
|
|
|
|
return("")
|
|
|
|
|
}
|
2024-04-16 20:13:14 +00:00
|
|
|
|
|
|
|
|
|
if (ip.type == 4) {
|
|
|
|
|
pings <- pingr::ping_port(ip, port = port, count = ping.count)
|
|
|
|
|
if (all(is.na(pings))) {
|
|
|
|
|
# This may happen if it is an incoming connection and the peer's port is closed
|
|
|
|
|
pings <- pingr::ping(ip, count = ping.count)
|
|
|
|
|
}
|
2024-04-14 21:30:16 +00:00
|
|
|
|
}
|
2024-04-16 20:13:14 +00:00
|
|
|
|
|
|
|
|
|
if (ip.type == 6) {
|
|
|
|
|
# pingr::ping() doesn't seem to work with ipv6, so switch to
|
|
|
|
|
# the pingers package
|
|
|
|
|
# pingers::ping_capture() output format makes it difficult to get the
|
|
|
|
|
# ping latency for each ping, so we will just loop ping.count times
|
|
|
|
|
ping.ipv6 <- function() {
|
|
|
|
|
y <- pingers::ping_capture(paste0(ip, ":", port), count = 1)$ping_min
|
|
|
|
|
if (is.na(y)) {
|
|
|
|
|
# This may happen if it is an incoming connection and the peer's port is closed
|
|
|
|
|
y <- pingers::ping_capture(ip, count = 1)$ping_min
|
|
|
|
|
}
|
|
|
|
|
y
|
|
|
|
|
}
|
|
|
|
|
pings <- replicate(ping.count, ping.ipv6())
|
|
|
|
|
}
|
|
|
|
|
|
2024-04-14 21:30:16 +00:00
|
|
|
|
paste(ip, port, direction, paste(pings, collapse = ","), sep = ",")
|
|
|
|
|
}
|
|
|
|
|
|
2024-04-16 20:13:14 +00:00
|
|
|
|
get.ping.data.errors.handled <- function(x) {
|
|
|
|
|
tryCatch(get.ping.data(x), error = function(e) {""})
|
|
|
|
|
}
|
|
|
|
|
|
2024-04-14 21:30:16 +00:00
|
|
|
|
if (nrow(peers) * ping.count > 5) {
|
|
|
|
|
|
2024-04-15 16:31:20 +00:00
|
|
|
|
if (is.null(threads)) {
|
2024-04-16 00:25:43 +00:00
|
|
|
|
n.workers <- min(c(floor(nrow(peers) * ping.count / 5), parallelly::availableCores()*4, 100))
|
2024-04-16 00:24:07 +00:00
|
|
|
|
} else {
|
|
|
|
|
n.workers <- threads
|
2024-04-15 16:31:20 +00:00
|
|
|
|
}
|
2024-04-14 21:30:16 +00:00
|
|
|
|
options(parallelly.maxWorkers.localhost = 4) # This means number of CPU cores times 4
|
|
|
|
|
# Most time in thread is waiting for ping to return, so can have
|
|
|
|
|
# high number of workers
|
|
|
|
|
|
2024-04-15 16:31:20 +00:00
|
|
|
|
future::plan(future::multisession, workers = n.workers)
|
|
|
|
|
# Must have this instead of
|
|
|
|
|
# future::plan(future::multisession(workers = n.workers))
|
|
|
|
|
# since the latter fails with" object 'n.workers' not found"
|
|
|
|
|
# because of a strange scoping reason.
|
2024-04-14 21:30:16 +00:00
|
|
|
|
|
2024-04-16 20:13:14 +00:00
|
|
|
|
ping.data <- future.apply::future_apply(peers, MARGIN = 1, get.ping.data.errors.handled, future.seed = TRUE)
|
2024-04-14 21:30:16 +00:00
|
|
|
|
|
|
|
|
|
future::plan(future::sequential)
|
|
|
|
|
# Shut down workers
|
|
|
|
|
|
|
|
|
|
} else {
|
2024-04-16 20:13:14 +00:00
|
|
|
|
ping.data <- apply(peers, MARGIN = 1, get.ping.data.errors.handled)
|
2024-04-14 21:30:16 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
ping.data <- unname(ping.data)
|
|
|
|
|
|
|
|
|
|
ping.data <- ping.data[ping.data != ""]
|
|
|
|
|
|
|
|
|
|
if (length(ping.data) > 0) {
|
|
|
|
|
cat(ping.data, file = output.file, sep = "\n", append = TRUE)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
lines.already.read <- n.lines.file
|
|
|
|
|
|
2024-04-15 12:46:16 +00:00
|
|
|
|
Sys.sleep(sleep)
|
2024-04-14 21:30:16 +00:00
|
|
|
|
|
|
|
|
|
cat(base::date(), " Peers pinged: ", length(ping.data), "\n", sep = "")
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|