library(htm2txt)
library(hgr)
library(htmltools)
library(reticulate)
library(httr)
library(magrittr)
library(xml2)
# Article whose text is extracted; the same URL is passed to every call that
# follows so the results can be compared side by side.
URL <- "https://medium.com/starts-with-a-bang/science-knows-if-a-nation-is-testing-nuclear-bombs-ec5db88f4526"
# Result of crawltxt() on the article URL. NOTE(review): crawltxt() is not
# defined in this script -- presumably it comes from one of the packages
# attached above and returns the page text; confirm which package provides it.
res <- crawltxt(URL = URL)
# Result of just_the_facts() on the same URL (presumably from hgr -- TODO
# confirm). Note the argument is lower-case `url` here, unlike `URL` above.
jtf <- just_the_facts(url = URL)
# Extract the article text with Python's readability-lxml, called through
# reticulate. After this section `doc` holds the extracted text as a single
# character string.

# Download the raw page. Warn on an HTTP error status so that an error page is
# not silently summarised as if it were the article.
pg <- httr::GET(URL)
httr::warn_for_status(pg)

# Decode the response body as UTF-8 text. The argument has to be spelled
# `encoding`; a misspelt name is ignored and the encoding is guessed instead.
page_html <- httr::content(pg, as = "text", encoding = "UTF-8")

readability <- import("readability") # pip install readability-lxml
article <- readability$Document(page_html)

# summary() yields an HTML fragment, so parse it with the lenient HTML parser
# (the strict XML parser rejects unclosed void tags and HTML entities), then
# flatten the parsed tree to plain text.
doc <- article$summary() %>%
  read_html() %>%
  xml_text()