diff --git a/inst/doc/monkeylearn_intro.R b/inst/doc/monkeylearn_intro.R
new file mode 100644
index 0000000..f8083b2
--- /dev/null
+++ b/inst/doc/monkeylearn_intro.R
@@ -0,0 +1,146 @@
+## ---- echo = FALSE, warning=FALSE, message=FALSE-------------------------
+NOT_CRAN <- identical(tolower(Sys.getenv("NOT_CRAN")), "true")  # TRUE only when the NOT_CRAN env var is "true" (any case)
+pat <- Sys.getenv("MONKEYLEARN_KEY")  # "" when the variable is unset
+IS_THERE_KEY <- (pat != "")
+NOT_CRAN <- IS_THERE_KEY && NOT_CRAN  # scalar AND: chunks are evaluated only when a key is set and NOT_CRAN is "true"
+knitr::opts_chunk$set(
+  collapse = TRUE,
+  comment = "#>",
+  purl = NOT_CRAN,
+  eval = NOT_CRAN
+)
+
+## ---- message = FALSE----------------------------------------------------
+library(monkeylearn)
+library(magrittr)
+
+text <- "In the 19th century, the major European powers had gone to great lengths to maintain a balance of power throughout Europe, resulting in the existence of a complex network of political and military alliances throughout the continent by 1900.[7] These had started in 1815, with the Holy Alliance between Prussia, Russia, and Austria. Then, in October 1873, German Chancellor Otto von Bismarck negotiated the League of the Three Emperors (German: Dreikaiserbund) between the monarchs of Austria-Hungary, Russia and Germany."
+output <- monkey_extract(input = text,
+                         extractor_id = "ex_isnnZRbS")
+output
+attr(output, "headers")
+
+## ------------------------------------------------------------------------
+text <- "A panel of Goldman Sachs employees spent a recent Tuesday night at the
+Columbia University faculty club trying to convince a packed room of potential
+recruits that Wall Street, not Silicon Valley, was the place to be for computer
+scientists.\n\n The Goldman employees knew they had an uphill battle. They were
+fighting against perceptions of Wall Street as boring and regulation-bound and
+Silicon Valley as the promised land of flip-flops, beanbag chairs and million-dollar
+stock options.\n\n Their argument to the room of technologically inclined students
+was that Wall Street was where they could find far more challenging, diverse and,
+yes, lucrative jobs working on some of the worlds most difficult technical problems."
+
+output <- monkey_extract(text,
+                        extractor_id = "ex_y7BPYzNG",
+                        params = list(max_keywords = 3))
+output
+output2 <- monkey_extract(text,
+                          extractor_id = "ex_y7BPYzNG",
+                          params = list(max_keywords = 1))
+output2
+attr(output2, "headers")
+
+## ---- message = FALSE----------------------------------------------------
+text <- "A panel of Goldman Sachs employees spent a recent Tuesday night at the Columbia University faculty club trying to convince a packed room of potential recruits that Wall Street, not Silicon Valley, was the place to be for computer scientists.
+
+The Goldman employees knew they had an uphill battle. They were fighting against perceptions of Wall Street as boring and regulation-bound and Silicon Valley as the promised land of flip-flops, beanbag chairs and million-dollar stock options.
+
+Their argument to the room of technologically inclined students was that Wall Street was where they could find far more challenging, diverse and, yes, lucrative jobs working on some of the world’s most difficult technical problems.
+
+“Whereas in other opportunities you might be considering, it is working one type of data or one type of application, we deal in hundreds of products in hundreds of markets, with thousands or tens of thousands of clients, every day, millions of times of day worldwide,” Afsheen Afshar, a managing director at Goldman Sachs, told the students."
+
+monkey_extract(text, extractor_id = "ex_y7BPYzNG")  # no `params` passed; text above restored to its UTF-8 quotes/apostrophe
+
+## ---- message = FALSE----------------------------------------------------
+text <- "Hi, my email is john@example.com and my credit card is 4242-4242-4242-4242 so you can charge me with $10. My phone number is 15555 9876. We can get in touch on April 16, at 10:00am"
+text2 <- "Hi, my email is mary@example.com and my credit card is 4242-4232-4242-4242. My phone number is 16655 9876. We can get in touch on April 16, at 10:00am"
+
+monkey_extract(c(text, text2), extractor_id = "ex_dqRio5sG", unnest = TRUE)
+
+## ---- message = FALSE----------------------------------------------------
+text1 <- "my dog is an avid rice eater"
+text2 <- "i want to buy an iphone"
+request <- c(text1, text2)
+
+monkey_classify(request, classifier_id = "cl_oFKL5wft")
+
+## ------------------------------------------------------------------------
+monkeylearn_classifiers(private = FALSE)
+
+## ---- message = FALSE----------------------------------------------------
+text1 <- "Hauràs de dirigir-te al punt de trobada del grup al que et vulguis unir."  # accented characters restored (UTF-8)
+text2 <- "i want to buy an iphone"
+text3 <- "Je déteste ne plus avoir de dentifrice."  # accented characters restored (UTF-8)
+request <- c(text1, text2, text3)  # three texts sent as one character vector
+
+monkey_classify(request, classifier_id = "cl_oJNMkt2V")
+
+## ---- message = FALSE----------------------------------------------------
+text1 <- "I think this is awesome."
+text2 <- "Holy shit! You did great!"
+request <- c(text1, text2)
+
+monkey_classify(request, classifier_id = "cl_KFXhoTdt")
+
+## ---- message = FALSE----------------------------------------------------
+text1 <- "Let me tell you about my dog and my cat. They are really friendly and like going on walks. They both like chasing mice."
+text2 <- "My first R package was probably a disaster but I keep learning how to program."
+request <- c(text1, text2)
+monkey_classify(request, classifier_id = "cl_5icAVzKR")
+
+
+## ----monkey_input--------------------------------------------------------
+input <- c("Emma Woodhouse, handsome, clever, and rich, with a comfortable home",     
+ "and happy disposition, seemed to unite some of the best blessings of",  
+ "existence; and had lived nearly twenty-one years in the world with very", 
+ "little to distress or vex her.",                                          
+ "",                   # <--- note the empty string!                                                   
+ "She was the youngest of the two daughters of a most affectionate,",       
+ "indulgent father; and had, in consequence of her sister's marriage, been",
+ "mistress of his house from a very early period. Her mother had died",     
+ "too long ago for her to have more than an indistinct remembrance of",     
+ "her caresses; and her place had been supplied by an excellent woman as",  
+ "governess, who had fallen little short of a mother in affection.")
+
+## ----monkey_output-------------------------------------------------------
+(output <- monkey_classify(input, unnest = FALSE))
+
+## ----very_empty_input----------------------------------------------------
+(very_empty_input <- rep("", 25) %>% c(input) %>% sample())
+
+## ------------------------------------------------------------------------
+monkey_classify(very_empty_input, unnest = FALSE)
+
+## ------------------------------------------------------------------------
+output$res
+
+## ----unnest_true---------------------------------------------------------
+(output_unnested <- monkey_classify(input, verbose = FALSE, unnest = TRUE))
+
+## ----compare_df----------------------------------------------------------
+input_df <- tibble::tibble(text = input) 
+output_df_unnested <- monkey_classify(input_df, text, unnest = TRUE, verbose = FALSE) %>% 
+    dplyr::rename(req = text)
+
+testthat::expect_equal(output_unnested, output_df_unnested)
+
+## ----keep_all------------------------------------------------------------
+sw <- dplyr::starwars %>% 
+  dplyr::select(name, height) %>% 
+  dplyr::sample_n(nrow(input_df))
+
+sw_input_df <- input_df %>% 
+  dplyr::bind_cols(sw)
+
+sw_input_df %>% monkey_classify(text, unnest = FALSE, verbose = FALSE)
+
+## ----one_by_one, warning=FALSE-------------------------------------------
+one_by_one <- system.time(output <- monkey_classify(input, texts_per_req = 1))
+
+## ----batch_of_five, warning=FALSE----------------------------------------
+batch_of_five <- system.time(output <- monkey_classify(input, texts_per_req = 5))
+
+## ----speedup-------------------------------------------------------------
+(speedup <- one_by_one[["elapsed"]] / batch_of_five[["elapsed"]])  # wall-clock ratio; element [1] of system.time() is user CPU time, which excludes time spent waiting on the API
+
diff --git a/inst/doc/monkeylearn_intro.Rmd b/inst/doc/monkeylearn_intro.Rmd
new file mode 100644
index 0000000..84ebfc3
--- /dev/null
+++ b/inst/doc/monkeylearn_intro.Rmd
@@ -0,0 +1,323 @@
+---
+title: "monkeylearn, an R Package for Natural Language Processing Using Monkeylearn Existing Modules"
+author: "M. Salmon, A. Dobbyn"
+date: "`r Sys.Date()`"
+output: rmarkdown::html_vignette
+vignette: >
+  %\VignetteIndexEntry{intro}
+  %\VignetteEngine{knitr::rmarkdown}
+  %\VignetteEncoding{UTF-8}
+---
+
+```{r, echo = FALSE, warning=FALSE, message=FALSE}
+NOT_CRAN <- identical(tolower(Sys.getenv("NOT_CRAN")), "true")  # TRUE only when the NOT_CRAN env var is "true" (any case)
+pat <- Sys.getenv("MONKEYLEARN_KEY")  # "" when the variable is unset
+IS_THERE_KEY <- (pat != "")
+NOT_CRAN <- IS_THERE_KEY && NOT_CRAN  # scalar AND: chunks are evaluated only when a key is set and NOT_CRAN is "true"
+knitr::opts_chunk$set(
+  collapse = TRUE,
+  comment = "#>",
+  purl = NOT_CRAN,
+  eval = NOT_CRAN
+)
+```
+
+# Intro
+
+This package is an interface to the [MonkeyLearn API](http://docs.monkeylearn.com/article/api-reference/). MonkeyLearn is a Machine Learning platform on the cloud that allows software companies and developers to easily extract actionable data from text.
+
+The goal of the package is not to support machine learning algorithms development with R or the API, but only to *reap the benefits of the existing modules on Monkeylearn*. Therefore, there are only two functions, one for using *extractors*, and one for using *classifiers*. The difference between extractors and classifiers is that extractors output information about words, whereas classifiers output information about each text as a whole. Named entity recognition is an extraction task, whereas assigning a topic to a text is a classification task.
+
+## Setup
+
+To get an API key for MonkeyLearn, register at http://monkeylearn.com/. Note that MonkeyLearn supports registration through GitHub, which makes the registration process really easy. For ease of use, save your API key as an environment variable as described at http://stat545.com/bit003_api-key-env-var.html. You might also want to use the `usethis::edit_r_environ()` function to modify .Renviron.
+
+All functions of the package will conveniently look for your API key using `Sys.getenv("MONKEYLEARN_KEY")` so if your API key is an environment variable called "MONKEYLEARN\_KEY" you don't need to input it manually.
+
+Please also create a "MONKEYLEARN\_PLAN" environment variable indicating whether your [Monkeylearn plan](https://app.monkeylearn.com/main/my-account/tab/change-plan/) is "free", "team", "business" or "custom". If you do not set it, the plan defaults to "free" and a message is shown. If your plan is "custom" you'll need a third environment variable "MONKEYLEARN\_RATE" indicating the maximum number of requests per minute that you can make to the API. If you do not set it, the rate defaults to 120 and a message is shown.
+
+## So many monkeys/functions
+
+The package exports `monkeylearn_classify`, `monkey_classify`, `monkeylearn_extract`, `monkey_extract`. The `monkey_` functions are the newer and better ones, so if you don't have legacy code, just start using those!
+
+For inspiration beyond this vignette, you can see external examples of the package in action [on this page](http://ropensci.github.io/monkeylearn/). In particular you'll find examples using the older set of functions but we now recommend using `monkey_extract` and `monkey_classify`, see more later in the vignette. 
+
+# Extract
+
+## A first example 
+
+```{r, message = FALSE}
+library(monkeylearn)
+library(magrittr)
+
+text <- "In the 19th century, the major European powers had gone to great lengths to maintain a balance of power throughout Europe, resulting in the existence of a complex network of political and military alliances throughout the continent by 1900.[7] These had started in 1815, with the Holy Alliance between Prussia, Russia, and Austria. Then, in October 1873, German Chancellor Otto von Bismarck negotiated the League of the Three Emperors (German: Dreikaiserbund) between the monarchs of Austria-Hungary, Russia and Germany."
+output <- monkey_extract(input = text,
+                         extractor_id = "ex_isnnZRbS")
+output
+attr(output, "headers")
+```
+
+## Parameters
+
+If the documentation of the extractor you use states it has parameters, you can pass them as a named list, see below.
+
+```{r}
+text <- "A panel of Goldman Sachs employees spent a recent Tuesday night at the
+Columbia University faculty club trying to convince a packed room of potential
+recruits that Wall Street, not Silicon Valley, was the place to be for computer
+scientists.\n\n The Goldman employees knew they had an uphill battle. They were
+fighting against perceptions of Wall Street as boring and regulation-bound and
+Silicon Valley as the promised land of flip-flops, beanbag chairs and million-dollar
+stock options.\n\n Their argument to the room of technologically inclined students
+was that Wall Street was where they could find far more challenging, diverse and,
+yes, lucrative jobs working on some of the worlds most difficult technical problems."
+
+output <- monkey_extract(text,
+                        extractor_id = "ex_y7BPYzNG",
+                        params = list(max_keywords = 3))
+output
+output2 <- monkey_extract(text,
+                          extractor_id = "ex_y7BPYzNG",
+                          params = list(max_keywords = 1))
+output2
+attr(output2, "headers")
+```
+
+## How to find extractors?
+
+You can find extractors and their IDs, including extractors for text in Spanish, at https://app.monkeylearn.com/main/explore 
+
+There is no endpoint for automatically finding all extractors, but if you find one in the website you particularly like and use a lot in your language and application, you could choose to save its id as an environment variable as explained [here]( http://stat545.com/bit003_api-key-env-var.html). Reading about extractors on the website will give you a good overview of their characteristics and original application.
+
+Here are a few for text in English:
+
+* [Entity extractor](https://app.monkeylearn.com/extraction/extractors/ex_isnnZRbS/tab/description-tab), `extractor_id = "ex_isnnZRbS"` (used in the first example). Extract Entities from text using Named Entity Recognition (NER). NER labels sequences of words in a text which are the names of things, such as person and company names. This implementation labels 3 classes: PERSON, ORGANIZATION and LOCATION. This NER tagger is implemented using Conditional Random Field (CRF) sequence models.
+
+* [Keyword extractor](https://app.monkeylearn.com/extraction/extractors/ex_y7BPYzNG/tab/description-tab), `extractor_id = "ex_y7BPYzNG"`. Extract keywords from text in English. Keywords can be compounded by one or more words and are defined as the important topics in your content and can be used to index data, generate tag clouds or for searching. This keyword extraction algorithm employs statistical algorithms and natural language processing technology to analyze your content and identify the relevant keywords.
+
+```{r, message = FALSE}
+text <- "A panel of Goldman Sachs employees spent a recent Tuesday night at the Columbia University faculty club trying to convince a packed room of potential recruits that Wall Street, not Silicon Valley, was the place to be for computer scientists.
+
+The Goldman employees knew they had an uphill battle. They were fighting against perceptions of Wall Street as boring and regulation-bound and Silicon Valley as the promised land of flip-flops, beanbag chairs and million-dollar stock options.
+
+Their argument to the room of technologically inclined students was that Wall Street was where they could find far more challenging, diverse and, yes, lucrative jobs working on some of the world’s most difficult technical problems.
+
+“Whereas in other opportunities you might be considering, it is working one type of data or one type of application, we deal in hundreds of products in hundreds of markets, with thousands or tens of thousands of clients, every day, millions of times of day worldwide,” Afsheen Afshar, a managing director at Goldman Sachs, told the students."
+
+monkey_extract(text, extractor_id = "ex_y7BPYzNG")
+```
+
+* [Useful data extractor](https://app.monkeylearn.com/extraction/extractors/ex_dqRio5sG/tab/description-tab), `extractor_id = "ex_dqRio5sG"`. Extract useful data from text. This algorithm can be used to detect many different useful data: links, phones, ips, prices, times, emails, bitcoin addresses, dates, ipv6s, hex colors and credit cards.
+
+When using this extractor, the format of the API output is a bit different from that of other extractors; see below what the output looks like.
+
+```{r, message = FALSE}
+text <- "Hi, my email is john@example.com and my credit card is 4242-4242-4242-4242 so you can charge me with $10. My phone number is 15555 9876. We can get in touch on April 16, at 10:00am"
+text2 <- "Hi, my email is mary@example.com and my credit card is 4242-4232-4242-4242. My phone number is 16655 9876. We can get in touch on April 16, at 10:00am"
+
+monkey_extract(c(text, text2), extractor_id = "ex_dqRio5sG", unnest = TRUE)
+```
+
+
+# Classify
+
+## A first example
+
+```{r, message = FALSE}
+text1 <- "my dog is an avid rice eater"
+text2 <- "i want to buy an iphone"
+request <- c(text1, text2)
+
+monkey_classify(request, classifier_id = "cl_oFKL5wft")
+```
+## How to find classifiers?
+
+You can find classifiers and their IDs at https://app.monkeylearn.com/main/explore or you can use the `monkeylearn_classifiers` function, choosing to show all classifiers or only the private ones with `private = TRUE`. The first column of the resulting data.frame is the `classifier_id` to be used in `monkeylearn_classify`.
+
+```{r}
+monkeylearn_classifiers(private = FALSE)
+```
+
+Here are a few other examples:
+
+* [Language detection](https://app.monkeylearn.com/categorizer/projects/cl_oJNMkt2V/tab/main-tab), `classifier_id = "cl_oJNMkt2V"`. Detect language in text. New languages were added for a total of 48 different languages arranged in language families.
+
+```{r, message = FALSE}
+text1 <- "Hauràs de dirigir-te al punt de trobada del grup al que et vulguis unir."
+text2 <- "i want to buy an iphone"
+text3 <- "Je déteste ne plus avoir de dentifrice."
+request <- c(text1, text2, text3)
+
+monkey_classify(request, classifier_id = "cl_oJNMkt2V")
+```
+
+* [Profanity and abuse detection](https://app.monkeylearn.com/categorizer/projects/cl_KFXhoTdt/tab/main-tab), `classifier_id = "cl_KFXhoTdt"`.
+
+```{r, message = FALSE}
+text1 <- "I think this is awesome."
+text2 <- "Holy shit! You did great!"
+request <- c(text1, text2)
+
+monkey_classify(request, classifier_id = "cl_KFXhoTdt")
+```
+
+* [General topic classifier](https://app.monkeylearn.com/categorizer/projects/cl_5icAVzKR/tab/), `classifier_id = "cl_5icAVzKR"`.
+
+```{r, message = FALSE}
+text1 <- "Let me tell you about my dog and my cat. They are really friendly and like going on walks. They both like chasing mice."
+text2 <- "My first R package was probably a disaster but I keep learning how to program."
+request <- c(text1, text2)
+monkey_classify(request, classifier_id = "cl_5icAVzKR")
+
+```
+
+
+# Get what you paid for
+
+Monkeylearn offers a different service based on your current plan, that is, "free", "team" or "business". These plans influence both your _rate limiting_ (how fast?) and your _query limiting_ (how many queries?). See https://monkeylearn.com/pricing/. Based on your MONKEYLEARN_PLAN environment variable, the rate is handled automatically thanks to [`ratelimitr`](https://github.com/tarakc02/ratelimitr).
+
+## Check the number of remaining calls
+
+After each call to a function you can check how many calls to the API you can still make using `attr(output, "headers")$x.query.limit.remaining` and `attr(output, "headers")$x.query.limit.limit`. The period after which `attr(output, "headers")$x.query.limit.remaining` is reset depends on your subscription and is not included in the output.
+
+
+
+# Fit `monkeylearn` into your pipeline!
+
+You can:
+
+* Send a vector of texts *or* a dataframe and a named column (unquoted)
+* Output either a nested or unnested dataframe
+    * Nested = 1 row per input; unnested = 1 row per output
+* This output
+    * Relates each input text to its (usually) multiple classifications/extractions
+    * Retains a record of inputs that could not be classified/extracted (e.g., empty strings)
+* Batch requests
+
+
+## In a bit more detail
+
+You can classify or extract a vector or dataframe of texts while relating the original input text to its classifications. This is important, because the input:output relationship may not always (and in fact, is not usually) 1:1. These functions retain the tie between each `input`[^1] element and all of its output elements.
+
+```{r monkey_input}
+input <- c("Emma Woodhouse, handsome, clever, and rich, with a comfortable home",     
+ "and happy disposition, seemed to unite some of the best blessings of",  
+ "existence; and had lived nearly twenty-one years in the world with very", 
+ "little to distress or vex her.",                                          
+ "",                   # <--- note the empty string!                                                   
+ "She was the youngest of the two daughters of a most affectionate,",       
+ "indulgent father; and had, in consequence of her sister's marriage, been",
+ "mistress of his house from a very early period. Her mother had died",     
+ "too long ago for her to have more than an indistinct remembrance of",     
+ "her caresses; and her place had been supplied by an excellent woman as",  
+ "governess, who had fallen little short of a mother in affection.")
+```
+
+That is true even if you have inputs that cannot be processed. For instance, empty string and `NA` input elements are not sent to the API for classification/extraction. (You'll get a warning of this if `verbose = TRUE`.) The input above contains one empty string to illustrate this: elements that returned no classifications/extractions are still included in the resulting dataframe. This way you'll know which inputs could not be processed.
+
+```{r monkey_output}
+(output <- monkey_classify(input, unnest = FALSE))
+```
+
+<br>
+
+If there are more than 20 empty inputs, we save your console by messaging only the first 20 indices.
+
+```{r very_empty_input}
+(very_empty_input <- rep("", 25) %>% c(input) %>% sample())
+```
+
+
+Since the entire original input is represented in the output, if you need to find all of the empty inputs you can easily filter the output to all of the rows containing empty strings.
+```{r}
+monkey_classify(very_empty_input, unnest = FALSE)
+```
+
+
+### Configuring the Output
+
+With `unnest = FALSE`, the output is a nested dataframe with the same number of rows as your input dataframe or the same length as your input vector, depending on which one you sent in. 
+
+Let's take a look at the `res` output column. 
+```{r}
+output$res
+```
+
+You can easily choose an unnested output by setting the **unnest flag** to TRUE (which it is by default) to get one row per classification/extraction. 
+
+```{r unnest_true}
+(output_unnested <- monkey_classify(input, verbose = FALSE, unnest = TRUE))
+```
+
+We could have gotten the same result by sending in a dataframe and a named column. If a dataframe is supplied, the input column is not renamed to `req` as it is when the input is a vector; the original column name is retained.
+
+```{r compare_df}
+input_df <- tibble::tibble(text = input) 
+output_df_unnested <- monkey_classify(input_df, text, unnest = TRUE, verbose = FALSE) %>% 
+    dplyr::rename(req = text)
+
+testthat::expect_equal(output_unnested, output_df_unnested)
+```
+
+<br>
+
+If the input is a dataframe, setting the `.keep_all` option to TRUE allows you to retain all input columns. If FALSE, only the column you specify for classification will be retained. 
+
+```{r keep_all}
+sw <- dplyr::starwars %>% 
+  dplyr::select(name, height) %>% 
+  dplyr::sample_n(nrow(input_df))
+
+sw_input_df <- input_df %>% 
+  dplyr::bind_cols(sw)
+
+sw_input_df %>% monkey_classify(text, unnest = FALSE, verbose = FALSE)
+```
+
+
+### Batching
+
+Retaining the relationship between input and output doesn't mean you'll need to send requests one-by-one. **Batch requests** by setting the `texts_per_req` value which governs the number of texts that are sent per request. Per the [MonkeyLearn documentation](http://help.monkeylearn.com/frequently-asked-questions/queries/can-i-classify-or-extract-more-than-one-text-with-one-api-request), the maximum we recommend sending at once is 200 texts. 
+
+If `texts_per_req` is NULL, the default, we try to optimize the response time from the API by setting `texts_per_req` to 200 when your input has more than 200 texts or to the length of the `input` if you've got fewer. You'll see a significant speedup by batching your requests this way. However, batching doesn't save you on queries; a batch of 150 texts still uses up 150 queries. 
+
+These functions also include some more verbose **progress reporting**, letting you know what batch you're on out of the total, and which texts are set to be processed in that batch.
+
+```{r one_by_one, warning=FALSE}
+one_by_one <- system.time(output <- monkey_classify(input, texts_per_req = 1))
+```
+
+```{r batch_of_five, warning=FALSE}
+batch_of_five <- system.time(output <- monkey_classify(input, texts_per_req = 5))
+```
+
+How much does sending 5 texts in a batch vs. 1 text improve our processing time?
+```{r speedup}
+(speedup <- one_by_one[["elapsed"]] / batch_of_five[["elapsed"]])  # wall-clock ratio; element [1] of system.time() is user CPU time, which excludes time spent waiting on the API
+```
+
+
+A 3-4x speedup isn't so bad! Worth keeping in mind that if you need the blazing fast speeds you might consider upgrading to a higher MonkeyLearn price tier. 
+
+<br>
+
+
+
+
+
+***
+
+<br>
+
+
+# Meta
+
+* Please [report any issues or bugs](https://github.com/ropensci/monkeylearn/issues).
+* License: GPL
+* Get citation information for `monkeylearn` in R by running `citation(package = 'monkeylearn')`
+* Please note that this project is released with a [Contributor Code of Conduct](CONDUCT.md). By participating in this project you agree to abide by its terms.
+* This package is part of the [rOpenSci project](https://ropensci.org/).
+
+
+[^1]: Thanks to [Julia Silge](https://juliasilge.com/)'s fantastic [`janeaustenr`](https://github.com/juliasilge/janeaustenr) package for this text!
+
diff --git a/inst/doc/monkeylearn_intro.html b/inst/doc/monkeylearn_intro.html
new file mode 100644
index 0000000..0bc3366
--- /dev/null
+++ b/inst/doc/monkeylearn_intro.html
@@ -0,0 +1,833 @@
+<!DOCTYPE html>
+
+<html xmlns="http://www.w3.org/1999/xhtml">
+
+<head>
+
+<meta charset="utf-8" />
+<meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+<meta name="generator" content="pandoc" />
+
+<meta name="viewport" content="width=device-width, initial-scale=1">
+
+<meta name="author" content="M. Salmon, A. Dobbyn" />
+
+<meta name="date" content="2018-04-11" />
+
+<title>monkeylearn, an R Package for Natural Language Processing Using Monkeylearn Existing Modules</title>
+
+
+
+<style type="text/css">code{white-space: pre;}</style>
+<style type="text/css">
+a.sourceLine { display: inline-block; line-height: 1.25; }
+a.sourceLine { pointer-events: none; color: inherit; text-decoration: inherit; }
+a.sourceLine:empty { height: 1.2em; position: absolute; }
+.sourceCode { overflow: visible; }
+code.sourceCode { white-space: pre; position: relative; }
+div.sourceCode { margin: 1em 0; }
+pre.sourceCode { margin: 0; }
+@media screen {
+div.sourceCode { overflow: auto; }
+}
+@media print {
+code.sourceCode { white-space: pre-wrap; }
+a.sourceLine { text-indent: -1em; padding-left: 1em; }
+}
+pre.numberSource a.sourceLine
+  { position: relative; }
+pre.numberSource a.sourceLine:empty
+  { position: absolute; }
+pre.numberSource a.sourceLine::before
+  { content: attr(data-line-number);
+    position: absolute; left: -5em; text-align: right; vertical-align: baseline;
+    border: none; pointer-events: all;
+    -webkit-touch-callout: none; -webkit-user-select: none;
+    -khtml-user-select: none; -moz-user-select: none;
+    -ms-user-select: none; user-select: none;
+    padding: 0 4px; width: 4em;
+    color: #aaaaaa;
+  }
+pre.numberSource { margin-left: 3em; border-left: 1px solid #aaaaaa;  padding-left: 4px; }
+div.sourceCode
+  {  }
+@media screen {
+a.sourceLine::before { text-decoration: underline; }
+}
+code span.al { color: #ff0000; font-weight: bold; } /* Alert */
+code span.an { color: #60a0b0; font-weight: bold; font-style: italic; } /* Annotation */
+code span.at { color: #7d9029; } /* Attribute */
+code span.bn { color: #40a070; } /* BaseN */
+code span.bu { } /* BuiltIn */
+code span.cf { color: #007020; font-weight: bold; } /* ControlFlow */
+code span.ch { color: #4070a0; } /* Char */
+code span.cn { color: #880000; } /* Constant */
+code span.co { color: #60a0b0; font-style: italic; } /* Comment */
+code span.cv { color: #60a0b0; font-weight: bold; font-style: italic; } /* CommentVar */
+code span.do { color: #ba2121; font-style: italic; } /* Documentation */
+code span.dt { color: #902000; } /* DataType */
+code span.dv { color: #40a070; } /* DecVal */
+code span.er { color: #ff0000; font-weight: bold; } /* Error */
+code span.ex { } /* Extension */
+code span.fl { color: #40a070; } /* Float */
+code span.fu { color: #06287e; } /* Function */
+code span.im { } /* Import */
+code span.in { color: #60a0b0; font-weight: bold; font-style: italic; } /* Information */
+code span.kw { color: #007020; font-weight: bold; } /* Keyword */
+code span.op { color: #666666; } /* Operator */
+code span.ot { color: #007020; } /* Other */
+code span.pp { color: #bc7a00; } /* Preprocessor */
+code span.sc { color: #4070a0; } /* SpecialChar */
+code span.ss { color: #bb6688; } /* SpecialString */
+code span.st { color: #4070a0; } /* String */
+code span.va { color: #19177c; } /* Variable */
+code span.vs { color: #4070a0; } /* VerbatimString */
+code span.wa { color: #60a0b0; font-weight: bold; font-style: italic; } /* Warning */
+</style>
+
+
+
+<style type="text/css">body {
+background-color: #fff;
+margin: 1em auto;
+max-width: 700px;
+overflow: visible;
+padding-left: 2em;
+padding-right: 2em;
+font-family: "Open Sans", "Helvetica Neue", Helvetica, Arial, sans-serif;
+font-size: 14px;
+line-height: 1.35;
+}
+#header {
+text-align: center;
+}
+#TOC {
+clear: both;
+margin: 0 0 10px 10px;
+padding: 4px;
+width: 400px;
+border: 1px solid #CCCCCC;
+border-radius: 5px;
+background-color: #f6f6f6;
+font-size: 13px;
+line-height: 1.3;
+}
+#TOC .toctitle {
+font-weight: bold;
+font-size: 15px;
+margin-left: 5px;
+}
+#TOC ul {
+padding-left: 40px;
+margin-left: -1.5em;
+margin-top: 5px;
+margin-bottom: 5px;
+}
+#TOC ul ul {
+margin-left: -2em;
+}
+#TOC li {
+line-height: 16px;
+}
+table {
+margin: 1em auto;
+border-width: 1px;
+border-color: #DDDDDD;
+border-style: outset;
+border-collapse: collapse;
+}
+table th {
+border-width: 2px;
+padding: 5px;
+border-style: inset;
+}
+table td {
+border-width: 1px;
+border-style: inset;
+line-height: 18px;
+padding: 5px 5px;
+}
+table, table th, table td {
+border-left-style: none;
+border-right-style: none;
+}
+table thead, table tr.even {
+background-color: #f7f7f7;
+}
+p {
+margin: 0.5em 0;
+}
+blockquote {
+background-color: #f6f6f6;
+padding: 0.25em 0.75em;
+}
+hr {
+border-style: solid;
+border: none;
+border-top: 1px solid #777;
+margin: 28px 0;
+}
+dl {
+margin-left: 0;
+}
+dl dd {
+margin-bottom: 13px;
+margin-left: 13px;
+}
+dl dt {
+font-weight: bold;
+}
+ul {
+margin-top: 0;
+}
+ul li {
+list-style: circle outside;
+}
+ul ul {
+margin-bottom: 0;
+}
+pre, code {
+background-color: #f7f7f7;
+border-radius: 3px;
+color: #333;
+white-space: pre-wrap; 
+}
+pre {
+border-radius: 3px;
+margin: 5px 0px 10px 0px;
+padding: 10px;
+}
+pre:not([class]) {
+background-color: #f7f7f7;
+}
+code {
+font-family: Consolas, Monaco, 'Courier New', monospace;
+font-size: 85%;
+}
+p > code, li > code {
+padding: 2px 0px;
+}
+div.figure {
+text-align: center;
+}
+img {
+background-color: #FFFFFF;
+padding: 2px;
+border: 1px solid #DDDDDD;
+border-radius: 3px;
+border: 1px solid #CCCCCC;
+margin: 0 5px;
+}
+h1 {
+margin-top: 0;
+font-size: 35px;
+line-height: 40px;
+}
+h2 {
+border-bottom: 4px solid #f7f7f7;
+padding-top: 10px;
+padding-bottom: 2px;
+font-size: 145%;
+}
+h3 {
+border-bottom: 2px solid #f7f7f7;
+padding-top: 10px;
+font-size: 120%;
+}
+h4 {
+border-bottom: 1px solid #f7f7f7;
+margin-left: 8px;
+font-size: 105%;
+}
+h5, h6 {
+border-bottom: 1px solid #ccc;
+font-size: 105%;
+}
+a {
+color: #0033dd;
+text-decoration: none;
+}
+a:hover {
+color: #6666ff; }
+a:visited {
+color: #800080; }
+a:visited:hover {
+color: #BB00BB; }
+a[href^="http:"] {
+text-decoration: underline; }
+a[href^="https:"] {
+text-decoration: underline; }
+
+code > span.kw { color: #555; font-weight: bold; } 
+code > span.dt { color: #902000; } 
+code > span.dv { color: #40a070; } 
+code > span.bn { color: #d14; } 
+code > span.fl { color: #d14; } 
+code > span.ch { color: #d14; } 
+code > span.st { color: #d14; } 
+code > span.co { color: #888888; font-style: italic; } 
+code > span.ot { color: #007020; } 
+code > span.al { color: #ff0000; font-weight: bold; } 
+code > span.fu { color: #900; font-weight: bold; }  code > span.er { color: #a61717; background-color: #e3d2d2; } 
+</style>
+
+</head>
+
+<body>
+
+
+
+
+<h1 class="title toc-ignore">monkeylearn, an R Package for Natural Language Processing Using Monkeylearn Existing Modules</h1>
+<h4 class="author"><em>M. Salmon, A. Dobbyn</em></h4>
+<h4 class="date"><em>2018-04-11</em></h4>
+
+
+
+<div id="intro" class="section level1">
+<h1>Intro</h1>
+<p>This package is an interface to the <a href="http://docs.monkeylearn.com/article/api-reference/">MonkeyLearn API</a>. MonkeyLearn is a Machine Learning platform on the cloud that allows software companies and developers to easily extract actionable data from text.</p>
+<p>The goal of the package is not to support the development of machine learning algorithms with R or the API, but only to <em>reap the benefits of the existing modules on Monkeylearn</em>. Therefore, there are only two functions, one for using <em>extractors</em>, and one for using <em>classifiers</em>. The difference between extractors and classifiers is that extractors output information about words, whereas classifiers output information about each text as a whole. Named entity recognition is an extraction task, whereas assigning a topic to a text is a classification task.</p>
+<div id="setup" class="section level2">
+<h2>Setup</h2>
+<p>To get an API key for MonkeyLearn, register at <a href="http://monkeylearn.com/" class="uri">http://monkeylearn.com/</a>. Note that MonkeyLearn supports registration through GitHub, which makes the registration process really easy. For ease of use, save your API key as an environment variable as described at <a href="http://stat545.com/bit003_api-key-env-var.html" class="uri">http://stat545.com/bit003_api-key-env-var.html</a>. You might also want to use the <code>usethis::edit_r_environ()</code> function to modify .Renviron.</p>
+<p>All functions of the package will conveniently look for your API key using <code>Sys.getenv(&quot;MONKEYLEARN_KEY&quot;)</code> so if your API key is an environment variable called “MONKEYLEARN_KEY” you don’t need to input it manually.</p>
+<p>Please also create a “MONKEYLEARN_PLAN” environment variable indicating whether your <a href="https://app.monkeylearn.com/main/my-account/tab/change-plan/">Monkeylearn plan</a> is “free”, “team”, “business” or “custom”. If you do not indicate it, by default it will be “free” with a message. If your plan is “custom” you’ll need a third environment variable “MONKEYLEARN_RATE” indicating the maximum number of requests per minute that you can make to the API. If you do not indicate it, by default it will be 120 with a message.</p>
+</div>
+<div id="so-many-monkeysfunctions" class="section level2">
+<h2>So many monkeys/functions</h2>
+<p>The package exports <code>monkeylearn_classify</code>, <code>monkey_classify</code>, <code>monkeylearn_extract</code>, <code>monkey_extract</code>. The <code>monkey_</code> functions are the newer and better ones, so if you don’t have legacy code, just start using those!</p>
+<p>For inspiration beyond this vignette, you can see external examples of the package in action <a href="http://ropensci.github.io/monkeylearn/">on this page</a>. In particular you’ll find examples using the older set of functions but we now recommend using <code>monkey_extract</code> and <code>monkey_classify</code>, see more later in the vignette.</p>
+</div>
+</div>
+<div id="extract" class="section level1">
+<h1>Extract</h1>
+<div id="a-first-example" class="section level2">
+<h2>A first example</h2>
+<div class="sourceCode" id="cb1"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb1-1" data-line-number="1"><span class="kw">library</span>(monkeylearn)</a>
+<a class="sourceLine" id="cb1-2" data-line-number="2"><span class="kw">library</span>(magrittr)</a>
+<a class="sourceLine" id="cb1-3" data-line-number="3"></a>
+<a class="sourceLine" id="cb1-4" data-line-number="4">text &lt;-<span class="st"> &quot;In the 19th century, the major European powers had gone to great lengths to maintain a balance of power throughout Europe, resulting in the existence of a complex network of political and military alliances throughout the continent by 1900.[7] These had started in 1815, with the Holy Alliance between Prussia, Russia, and Austria. Then, in October 1873, German Chancellor Otto von Bismarck negotiated the League of the Three Emperors (German: Dreikaiserbund) between the monarchs of Austria-Hungary, Russia and Germany.&quot;</span></a>
+<a class="sourceLine" id="cb1-5" data-line-number="5">output &lt;-<span class="st"> </span><span class="kw">monkey_extract</span>(<span class="dt">input =</span> text,</a>
+<a class="sourceLine" id="cb1-6" data-line-number="6">                         <span class="dt">extractor_id =</span> <span class="st">&quot;ex_isnnZRbS&quot;</span>)</a>
+<a class="sourceLine" id="cb1-7" data-line-number="7">output</a>
+<a class="sourceLine" id="cb1-8" data-line-number="8"><span class="co">#&gt; # A tibble: 7 x 4</span></a>
+<a class="sourceLine" id="cb1-9" data-line-number="9"><span class="co">#&gt;   req                                                  count tag    entity</span></a>
+<a class="sourceLine" id="cb1-10" data-line-number="10"><span class="co">#&gt;   &lt;chr&gt;                                                &lt;int&gt; &lt;chr&gt;  &lt;chr&gt; </span></a>
+<a class="sourceLine" id="cb1-11" data-line-number="11"><span class="co">#&gt; 1 In the 19th century, the major European powers had ~     1 LOCAT~ Europe</span></a>
+<a class="sourceLine" id="cb1-12" data-line-number="12"><span class="co">#&gt; 2 In the 19th century, the major European powers had ~     1 LOCAT~ Pruss~</span></a>
+<a class="sourceLine" id="cb1-13" data-line-number="13"><span class="co">#&gt; 3 In the 19th century, the major European powers had ~     1 LOCAT~ Austr~</span></a>
+<a class="sourceLine" id="cb1-14" data-line-number="14"><span class="co">#&gt; 4 In the 19th century, the major European powers had ~     1 LOCAT~ Austr~</span></a>
+<a class="sourceLine" id="cb1-15" data-line-number="15"><span class="co">#&gt; 5 In the 19th century, the major European powers had ~     1 LOCAT~ Germa~</span></a>
+<a class="sourceLine" id="cb1-16" data-line-number="16"><span class="co">#&gt; 6 In the 19th century, the major European powers had ~     1 PERSON Otto ~</span></a>
+<a class="sourceLine" id="cb1-17" data-line-number="17"><span class="co">#&gt; 7 In the 19th century, the major European powers had ~     2 LOCAT~ Russia</span></a>
+<a class="sourceLine" id="cb1-18" data-line-number="18"><span class="kw">attr</span>(output, <span class="st">&quot;headers&quot;</span>)</a>
+<a class="sourceLine" id="cb1-19" data-line-number="19"><span class="co">#&gt; # A tibble: 1 x 11</span></a>
+<a class="sourceLine" id="cb1-20" data-line-number="20"><span class="co">#&gt;   server  date   content.type transfer.encodi~ connection x.query.limit.l~</span></a>
+<a class="sourceLine" id="cb1-21" data-line-number="21"><span class="co">#&gt;   &lt;chr&gt;   &lt;chr&gt;  &lt;chr&gt;        &lt;chr&gt;            &lt;chr&gt;      &lt;chr&gt;           </span></a>
+<a class="sourceLine" id="cb1-22" data-line-number="22"><span class="co">#&gt; 1 nginx/~ Wed, ~ application~ chunked          keep-alive 5000000         </span></a>
+<a class="sourceLine" id="cb1-23" data-line-number="23"><span class="co">#&gt; # ... with 5 more variables: x.query.limit.remaining &lt;chr&gt;,</span></a>
+<a class="sourceLine" id="cb1-24" data-line-number="24"><span class="co">#&gt; #   x.query.limit.request.queries &lt;chr&gt;, allow &lt;chr&gt;,</span></a>
+<a class="sourceLine" id="cb1-25" data-line-number="25"><span class="co">#&gt; #   content.encoding &lt;chr&gt;, text_md5 &lt;chr&gt;</span></a></code></pre></div>
+</div>
+<div id="parameters" class="section level2">
+<h2>Parameters</h2>
+<p>If the documentation of the extractor you use states it has parameters, you can pass them as a named list, see below.</p>
+<div class="sourceCode" id="cb2"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb2-1" data-line-number="1">text &lt;-<span class="st"> &quot;A panel of Goldman Sachs employees spent a recent Tuesday night at the</span></a>
+<a class="sourceLine" id="cb2-2" data-line-number="2"><span class="st">Columbia University faculty club trying to convince a packed room of potential</span></a>
+<a class="sourceLine" id="cb2-3" data-line-number="3"><span class="st">recruits that Wall Street, not Silicon Valley, was the place to be for computer</span></a>
+<a class="sourceLine" id="cb2-4" data-line-number="4"><span class="st">scientists.</span><span class="ch">\n\n</span><span class="st"> The Goldman employees knew they had an uphill battle. They were</span></a>
+<a class="sourceLine" id="cb2-5" data-line-number="5"><span class="st">fighting against perceptions of Wall Street as boring and regulation-bound and</span></a>
+<a class="sourceLine" id="cb2-6" data-line-number="6"><span class="st">Silicon Valley as the promised land of flip-flops, beanbag chairs and million-dollar</span></a>
+<a class="sourceLine" id="cb2-7" data-line-number="7"><span class="st">stock options.</span><span class="ch">\n\n</span><span class="st"> Their argument to the room of technologically inclined students</span></a>
+<a class="sourceLine" id="cb2-8" data-line-number="8"><span class="st">was that Wall Street was where they could find far more challenging, diverse and,</span></a>
+<a class="sourceLine" id="cb2-9" data-line-number="9"><span class="st">yes, lucrative jobs working on some of the worlds most difficult technical problems.&quot;</span></a>
+<a class="sourceLine" id="cb2-10" data-line-number="10"></a>
+<a class="sourceLine" id="cb2-11" data-line-number="11">output &lt;-<span class="st"> </span><span class="kw">monkey_extract</span>(text,</a>
+<a class="sourceLine" id="cb2-12" data-line-number="12">                        <span class="dt">extractor_id =</span> <span class="st">&quot;ex_y7BPYzNG&quot;</span>,</a>
+<a class="sourceLine" id="cb2-13" data-line-number="13">                        <span class="dt">params =</span> <span class="kw">list</span>(<span class="dt">max_keywords =</span> <span class="dv">3</span>))</a>
+<a class="sourceLine" id="cb2-14" data-line-number="14"><span class="co">#&gt; Processing batch 1 of 1 batches: texts 1 to 1</span></a>
+<a class="sourceLine" id="cb2-15" data-line-number="15">output</a>
+<a class="sourceLine" id="cb2-16" data-line-number="16"><span class="co">#&gt; # A tibble: 3 x 5</span></a>
+<a class="sourceLine" id="cb2-17" data-line-number="17"><span class="co">#&gt;   req                             count relevance positions_in_te~ keyword</span></a>
+<a class="sourceLine" id="cb2-18" data-line-number="18"><span class="co">#&gt;   &lt;chr&gt;                           &lt;int&gt; &lt;chr&gt;     &lt;list&gt;           &lt;chr&gt;  </span></a>
+<a class="sourceLine" id="cb2-19" data-line-number="19"><span class="co">#&gt; 1 &quot;A panel of Goldman Sachs empl~     3 0.978     &lt;int [3]&gt;        Wall S~</span></a>
+<a class="sourceLine" id="cb2-20" data-line-number="20"><span class="co">#&gt; 2 &quot;A panel of Goldman Sachs empl~     2 0.652     &lt;int [2]&gt;        Silico~</span></a>
+<a class="sourceLine" id="cb2-21" data-line-number="21"><span class="co">#&gt; 3 &quot;A panel of Goldman Sachs empl~     1 0.543     &lt;int [1]&gt;        millio~</span></a>
+<a class="sourceLine" id="cb2-22" data-line-number="22">output2 &lt;-<span class="st"> </span><span class="kw">monkey_extract</span>(text,</a>
+<a class="sourceLine" id="cb2-23" data-line-number="23">                          <span class="dt">extractor_id =</span> <span class="st">&quot;ex_y7BPYzNG&quot;</span>,</a>
+<a class="sourceLine" id="cb2-24" data-line-number="24">                          <span class="dt">params =</span> <span class="kw">list</span>(<span class="dt">max_keywords =</span> <span class="dv">1</span>))</a>
+<a class="sourceLine" id="cb2-25" data-line-number="25"><span class="co">#&gt; Processing batch 1 of 1 batches: texts 1 to 1</span></a>
+<a class="sourceLine" id="cb2-26" data-line-number="26">output2</a>
+<a class="sourceLine" id="cb2-27" data-line-number="27"><span class="co">#&gt; # A tibble: 1 x 5</span></a>
+<a class="sourceLine" id="cb2-28" data-line-number="28"><span class="co">#&gt;   req                             count relevance positions_in_te~ keyword</span></a>
+<a class="sourceLine" id="cb2-29" data-line-number="29"><span class="co">#&gt;   &lt;chr&gt;                           &lt;int&gt; &lt;chr&gt;     &lt;list&gt;           &lt;chr&gt;  </span></a>
+<a class="sourceLine" id="cb2-30" data-line-number="30"><span class="co">#&gt; 1 &quot;A panel of Goldman Sachs empl~     3 0.978     &lt;int [3]&gt;        Wall S~</span></a>
+<a class="sourceLine" id="cb2-31" data-line-number="31"><span class="kw">attr</span>(output2, <span class="st">&quot;headers&quot;</span>)</a>
+<a class="sourceLine" id="cb2-32" data-line-number="32"><span class="co">#&gt; # A tibble: 1 x 11</span></a>
+<a class="sourceLine" id="cb2-33" data-line-number="33"><span class="co">#&gt;   server  date   content.type transfer.encodi~ connection x.query.limit.l~</span></a>
+<a class="sourceLine" id="cb2-34" data-line-number="34"><span class="co">#&gt;   &lt;chr&gt;   &lt;chr&gt;  &lt;chr&gt;        &lt;chr&gt;            &lt;chr&gt;      &lt;chr&gt;           </span></a>
+<a class="sourceLine" id="cb2-35" data-line-number="35"><span class="co">#&gt; 1 nginx/~ Wed, ~ application~ chunked          keep-alive 5000000         </span></a>
+<a class="sourceLine" id="cb2-36" data-line-number="36"><span class="co">#&gt; # ... with 5 more variables: x.query.limit.remaining &lt;chr&gt;,</span></a>
+<a class="sourceLine" id="cb2-37" data-line-number="37"><span class="co">#&gt; #   x.query.limit.request.queries &lt;chr&gt;, allow &lt;chr&gt;,</span></a>
+<a class="sourceLine" id="cb2-38" data-line-number="38"><span class="co">#&gt; #   content.encoding &lt;chr&gt;, text_md5 &lt;chr&gt;</span></a></code></pre></div>
+</div>
+<div id="how-to-find-extractors" class="section level2">
+<h2>How to find extractors?</h2>
+<p>You can find extractors and their IDs, including extractors for text in Spanish, at <a href="https://app.monkeylearn.com/main/explore" class="uri">https://app.monkeylearn.com/main/explore</a></p>
+<p>There is no endpoint for automatically finding all extractors, but if you find one on the website you particularly like and use a lot in your language and application, you could choose to save its id as an environment variable as explained <a href="http://stat545.com/bit003_api-key-env-var.html">here</a>. Reading about extractors on the website will give you a good overview of their characteristics and original application.</p>
+<p>Here are a few for text in English:</p>
+<ul>
+<li><p><a href="https://app.monkeylearn.com/extraction/extractors/ex_isnnZRbS/tab/description-tab">Entity extractor</a>, <code>extractor_id = &quot;ex_isnnZRbS&quot;</code> (used in the first example). Extract Entities from text using Named Entity Recognition (NER). NER labels sequences of words in a text which are the names of things, such as person and company names. This implementation labels 3 classes: PERSON, ORGANIZATION and LOCATION. This NER tagger is implemented using Conditional Random Field (CRF) sequence models.</p></li>
+<li><p><a href="https://app.monkeylearn.com/extraction/extractors/ex_y7BPYzNG/tab/description-tab">Keyword extractor</a>, <code>extractor_id = &quot;ex_y7BPYzNG&quot;</code>. Extract keywords from text in English. Keywords can be compounded by one or more words and are defined as the important topics in your content and can be used to index data, generate tag clouds or for searching. This keyword extraction algorithm employs statistical algorithms and natural language processing technology to analyze your content and identify the relevant keywords.</p></li>
+</ul>
+<div class="sourceCode" id="cb3"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb3-1" data-line-number="1">text &lt;-<span class="st"> &quot;A panel of Goldman Sachs employees spent a recent Tuesday night at the Columbia University faculty club trying to convince a packed room of potential recruits that Wall Street, not Silicon Valley, was the place to be for computer scientists.</span></a>
+<a class="sourceLine" id="cb3-2" data-line-number="2"></a>
+<a class="sourceLine" id="cb3-3" data-line-number="3"><span class="st">The Goldman employees knew they had an uphill battle. They were fighting against perceptions of Wall Street as boring and regulation-bound and Silicon Valley as the promised land of flip-flops, beanbag chairs and million-dollar stock options.</span></a>
+<a class="sourceLine" id="cb3-4" data-line-number="4"></a>
+<a class="sourceLine" id="cb3-5" data-line-number="5"><span class="st">Their argument to the room of technologically inclined students was that Wall Street was where they could find far more challenging, diverse and, yes, lucrative jobs working on some of the world’s most difficult technical problems.</span></a>
+<a class="sourceLine" id="cb3-6" data-line-number="6"></a>
+<a class="sourceLine" id="cb3-7" data-line-number="7"><span class="st">“Whereas in other opportunities you might be considering, it is working one type of data or one type of application, we deal in hundreds of products in hundreds of markets, with thousands or tens of thousands of clients, every day, millions of times of day worldwide,” Afsheen Afshar, a managing director at Goldman Sachs, told the students.&quot;</span></a>
+<a class="sourceLine" id="cb3-8" data-line-number="8"></a>
+<a class="sourceLine" id="cb3-9" data-line-number="9"><span class="kw">monkey_extract</span>(text, <span class="dt">extractor_id =</span> <span class="st">&quot;ex_y7BPYzNG&quot;</span>)</a>
+<a class="sourceLine" id="cb3-10" data-line-number="10"><span class="co">#&gt; # A tibble: 10 x 5</span></a>
+<a class="sourceLine" id="cb3-11" data-line-number="11"><span class="co">#&gt;    req                            count relevance positions_in_te~ keyword</span></a>
+<a class="sourceLine" id="cb3-12" data-line-number="12"><span class="co">#&gt;    &lt;chr&gt;                          &lt;int&gt; &lt;chr&gt;     &lt;list&gt;           &lt;chr&gt;  </span></a>
+<a class="sourceLine" id="cb3-13" data-line-number="13"><span class="co">#&gt;  1 &quot;A panel of Goldman Sachs emp~     3 0.978     &lt;int [3]&gt;        Wall S~</span></a>
+<a class="sourceLine" id="cb3-14" data-line-number="14"><span class="co">#&gt;  2 &quot;A panel of Goldman Sachs emp~     2 0.652     &lt;int [2]&gt;        Silico~</span></a>
+<a class="sourceLine" id="cb3-15" data-line-number="15"><span class="co">#&gt;  3 &quot;A panel of Goldman Sachs emp~     1 0.543     &lt;int [1]&gt;        millio~</span></a>
+<a class="sourceLine" id="cb3-16" data-line-number="16"><span class="co">#&gt;  4 &quot;A panel of Goldman Sachs emp~     1 0.543     &lt;int [1]&gt;        Goldma~</span></a>
+<a class="sourceLine" id="cb3-17" data-line-number="17"><span class="co">#&gt;  5 &quot;A panel of Goldman Sachs emp~     1 0.543     &lt;int [1]&gt;        Univer~</span></a>
+<a class="sourceLine" id="cb3-18" data-line-number="18"><span class="co">#&gt;  6 &quot;A panel of Goldman Sachs emp~     1 0.543     &lt;int [1]&gt;        recent~</span></a>
+<a class="sourceLine" id="cb3-19" data-line-number="19"><span class="co">#&gt;  7 &quot;A panel of Goldman Sachs emp~     1 0.543     &lt;int [1]&gt;        diffic~</span></a>
+<a class="sourceLine" id="cb3-20" data-line-number="20"><span class="co">#&gt;  8 &quot;A panel of Goldman Sachs emp~     2 0.435     &lt;int [2]&gt;        thousa~</span></a>
+<a class="sourceLine" id="cb3-21" data-line-number="21"><span class="co">#&gt;  9 &quot;A panel of Goldman Sachs emp~     2 0.435     &lt;int [2]&gt;        type   </span></a>
+<a class="sourceLine" id="cb3-22" data-line-number="22"><span class="co">#&gt; 10 &quot;A panel of Goldman Sachs emp~     2 0.435     &lt;int [2]&gt;        hundre~</span></a></code></pre></div>
+<ul>
+<li><a href="https://app.monkeylearn.com/extraction/extractors/ex_dqRio5sG/tab/description-tab">Useful data extractor</a>, <code>extractor_id = &quot;ex_dqRio5sG&quot;</code>. Extract useful data from text. This algorithm can be used to detect many different useful data: links, phones, ips, prices, times, emails, bitcoin addresses, dates, ipv6s, hex colors and credit cards.</li>
+</ul>
+<p>When using this extractor, the format of the API output is a bit different from that of other extractors; see below what the output looks like.</p>
+<div class="sourceCode" id="cb4"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb4-1" data-line-number="1">text &lt;-<span class="st"> &quot;Hi, my email is john@example.com and my credit card is 4242-4242-4242-4242 so you can charge me with $10. My phone number is 15555 9876. We can get in touch on April 16, at 10:00am&quot;</span></a>
+<a class="sourceLine" id="cb4-2" data-line-number="2">text2 &lt;-<span class="st"> &quot;Hi, my email is mary@example.com and my credit card is 4242-4232-4242-4242. My phone number is 16655 9876. We can get in touch on April 16, at 10:00am&quot;</span></a>
+<a class="sourceLine" id="cb4-3" data-line-number="3"></a>
+<a class="sourceLine" id="cb4-4" data-line-number="4"><span class="kw">monkey_extract</span>(<span class="kw">c</span>(text, text2), <span class="dt">extractor_id =</span> <span class="st">&quot;ex_dqRio5sG&quot;</span>, <span class="dt">unnest =</span> <span class="ot">TRUE</span>)</a>
+<a class="sourceLine" id="cb4-5" data-line-number="5"><span class="co">#&gt; # A tibble: 2 x 12</span></a>
+<a class="sourceLine" id="cb4-6" data-line-number="6"><span class="co">#&gt;   req        dates links phones ipv6s hex_colors ips   credit_cards prices</span></a>
+<a class="sourceLine" id="cb4-7" data-line-number="7"><span class="co">#&gt;   &lt;chr&gt;      &lt;chr&gt; &lt;chr&gt; &lt;chr&gt;  &lt;chr&gt; &lt;chr&gt;      &lt;chr&gt; &lt;chr&gt;        &lt;chr&gt; </span></a>
+<a class="sourceLine" id="cb4-8" data-line-number="8"><span class="co">#&gt; 1 Hi, my em~ Apri~ exam~ 15555~ &lt;NA&gt;  &lt;NA&gt;       &lt;NA&gt;  4242-4242-4~ $10   </span></a>
+<a class="sourceLine" id="cb4-9" data-line-number="9"><span class="co">#&gt; 2 Hi, my em~ Apri~ exam~ 16655~ &lt;NA&gt;  &lt;NA&gt;       &lt;NA&gt;  4242-4232-4~ &lt;NA&gt;  </span></a>
+<a class="sourceLine" id="cb4-10" data-line-number="10"><span class="co">#&gt; # ... with 3 more variables: times &lt;chr&gt;, emails &lt;chr&gt;,</span></a>
+<a class="sourceLine" id="cb4-11" data-line-number="11"><span class="co">#&gt; #   bitcoin_addresses &lt;chr&gt;</span></a></code></pre></div>
+</div>
+</div>
+<div id="classify" class="section level1">
+<h1>Classify</h1>
+<div id="a-first-example-1" class="section level2">
+<h2>A first example</h2>
+<div class="sourceCode" id="cb5"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb5-1" data-line-number="1">text1 &lt;-<span class="st"> &quot;my dog is an avid rice eater&quot;</span></a>
+<a class="sourceLine" id="cb5-2" data-line-number="2">text2 &lt;-<span class="st"> &quot;i want to buy an iphone&quot;</span></a>
+<a class="sourceLine" id="cb5-3" data-line-number="3">request &lt;-<span class="st"> </span><span class="kw">c</span>(text1, text2)</a>
+<a class="sourceLine" id="cb5-4" data-line-number="4"></a>
+<a class="sourceLine" id="cb5-5" data-line-number="5"><span class="kw">monkey_classify</span>(request, <span class="dt">classifier_id =</span> <span class="st">&quot;cl_oFKL5wft&quot;</span>)</a>
+<a class="sourceLine" id="cb5-6" data-line-number="6"><span class="co">#&gt; # A tibble: 6 x 4</span></a>
+<a class="sourceLine" id="cb5-7" data-line-number="7"><span class="co">#&gt;   req                          category_id probability label             </span></a>
+<a class="sourceLine" id="cb5-8" data-line-number="8"><span class="co">#&gt;   &lt;chr&gt;                              &lt;int&gt;       &lt;dbl&gt; &lt;chr&gt;             </span></a>
+<a class="sourceLine" id="cb5-9" data-line-number="9"><span class="co">#&gt; 1 my dog is an avid rice eater    18313097      0.130  Pets              </span></a>
+<a class="sourceLine" id="cb5-10" data-line-number="10"><span class="co">#&gt; 2 my dog is an avid rice eater    18313108      0.239  Dogs              </span></a>
+<a class="sourceLine" id="cb5-11" data-line-number="11"><span class="co">#&gt; 3 my dog is an avid rice eater    18313113      0.0820 Dog Food          </span></a>
+<a class="sourceLine" id="cb5-12" data-line-number="12"><span class="co">#&gt; 4 i want to buy an iphone         18314739      0.113  Cell Phones       </span></a>
+<a class="sourceLine" id="cb5-13" data-line-number="13"><span class="co">#&gt; 5 i want to buy an iphone         18314740      0.186  Accessories       </span></a>
+<a class="sourceLine" id="cb5-14" data-line-number="14"><span class="co">#&gt; 6 i want to buy an iphone         18314741      0.0940 Cases &amp; Protectors</span></a></code></pre></div>
+</div>
+<div id="how-to-find-classifiers" class="section level2">
+<h2>How to find classifiers?</h2>
+<p>You can find classifiers and their IDs at <a href="https://app.monkeylearn.com/main/explore" class="uri">https://app.monkeylearn.com/main/explore</a> or you can use the <code>monkeylearn_classifiers</code> function, choosing to show all classifiers or only the private ones with <code>private = TRUE</code>. The first column of the resulting data.frame is the <code>classifier_id</code> to be used in <code>monkeylearn_classify</code>.</p>
+<div class="sourceCode" id="cb6"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb6-1" data-line-number="1"><span class="kw">monkeylearn_classifiers</span>(<span class="dt">private =</span> <span class="ot">FALSE</span>)</a>
+<a class="sourceLine" id="cb6-2" data-line-number="2"><span class="co">#&gt; # A tibble: 45 x 19</span></a>
+<a class="sourceLine" id="cb6-3" data-line-number="3"><span class="co">#&gt;    classifier_id name   description      train_state train_job_id language</span></a>
+<a class="sourceLine" id="cb6-4" data-line-number="4"><span class="co">#&gt;    &lt;chr&gt;         &lt;chr&gt;  &lt;chr&gt;            &lt;chr&gt;       &lt;lgl&gt;        &lt;chr&gt;   </span></a>
+<a class="sourceLine" id="cb6-5" data-line-number="5"><span class="co">#&gt;  1 cl_Aiu8dfYF   Custo~ &quot;Classifies cus~ TRAINED     NA           en      </span></a>
+<a class="sourceLine" id="cb6-6" data-line-number="6"><span class="co">#&gt;  2 cl_gBhyCMCs   Custo~ Detects if huma~ TRAINED     NA           en      </span></a>
+<a class="sourceLine" id="cb6-7" data-line-number="7"><span class="co">#&gt;  3 cl_N3VzxNLN   Custo~ Differentiates ~ TRAINED     NA           en      </span></a>
+<a class="sourceLine" id="cb6-8" data-line-number="8"><span class="co">#&gt;  4 cl_csyzaevo   Role ~ &quot;Classifies job~ DIRTY       NA           en      </span></a>
+<a class="sourceLine" id="cb6-9" data-line-number="9"><span class="co">#&gt;  5 cl_pX4g5EEF   Custo~ Helps to detect~ TRAINED     NA           en      </span></a>
+<a class="sourceLine" id="cb6-10" data-line-number="10"><span class="co">#&gt;  6 cl_Jx8qzYJh   Senti~ Detect sentimen~ TRAINED     NA           en      </span></a>
+<a class="sourceLine" id="cb6-11" data-line-number="11"><span class="co">#&gt;  7 cl_sGdE8hD9   NPS S~ Classify NPS re~ DIRTY       NA           en      </span></a>
+<a class="sourceLine" id="cb6-12" data-line-number="12"><span class="co">#&gt;  8 cl_T7XMb74S   IAB T~ Classifies text~ TRAINED     NA           en      </span></a>
+<a class="sourceLine" id="cb6-13" data-line-number="13"><span class="co">#&gt;  9 cl_nLW3yR6m   Telco~ Classify custom~ TRAINED     NA           en      </span></a>
+<a class="sourceLine" id="cb6-14" data-line-number="14"><span class="co">#&gt; 10 cl_4LqLD7cN   Telco~ Detect the topi~ TRAINED     NA           en      </span></a>
+<a class="sourceLine" id="cb6-15" data-line-number="15"><span class="co">#&gt; # ... with 35 more rows, and 13 more variables: ngram_range &lt;chr&gt;,</span></a>
+<a class="sourceLine" id="cb6-16" data-line-number="16"><span class="co">#&gt; #   use_stemmer &lt;lgl&gt;, stop_words &lt;chr&gt;, max_features &lt;int&gt;,</span></a>
+<a class="sourceLine" id="cb6-17" data-line-number="17"><span class="co">#&gt; #   strip_stopwords &lt;lgl&gt;, is_multilabel &lt;lgl&gt;, is_twitter_data &lt;lgl&gt;,</span></a>
+<a class="sourceLine" id="cb6-18" data-line-number="18"><span class="co">#&gt; #   normalize_weights &lt;lgl&gt;, classifier &lt;chr&gt;, industry &lt;chr&gt;,</span></a>
+<a class="sourceLine" id="cb6-19" data-line-number="19"><span class="co">#&gt; #   classifier_type &lt;chr&gt;, text_type &lt;chr&gt;, permissions &lt;chr&gt;</span></a></code></pre></div>
+<p>Here are a few other examples:</p>
+<ul>
+<li><a href="https://app.monkeylearn.com/categorizer/projects/cl_oJNMkt2V/tab/main-tab">Language detection</a>, <code>classifier_id = &quot;cl_oJNMkt2V&quot;</code>. Detect language in text. New languages were added for a total of 48 different languages arranged in language families.</li>
+</ul>
+<div class="sourceCode" id="cb7"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb7-1" data-line-number="1">text1 &lt;-<span class="st"> &quot;Hauràs de dirigir-te al punt de trobada del grup al que et vulguis unir.&quot;</span></a>
+<a class="sourceLine" id="cb7-2" data-line-number="2">text2 &lt;-<span class="st"> &quot;i want to buy an iphone&quot;</span></a>
+<a class="sourceLine" id="cb7-3" data-line-number="3">text3 &lt;-<span class="st"> &quot;Je déteste ne plus avoir de dentifrice.&quot;</span></a>
+<a class="sourceLine" id="cb7-4" data-line-number="4">request &lt;-<span class="st"> </span><span class="kw">c</span>(text1, text2, text3)</a>
+<a class="sourceLine" id="cb7-5" data-line-number="5"></a>
+<a class="sourceLine" id="cb7-6" data-line-number="6"><span class="kw">monkey_classify</span>(request, <span class="dt">classifier_id =</span> <span class="st">&quot;cl_oJNMkt2V&quot;</span>)</a>
+<a class="sourceLine" id="cb7-7" data-line-number="7"><span class="co">#&gt; # A tibble: 6 x 4</span></a>
+<a class="sourceLine" id="cb7-8" data-line-number="8"><span class="co">#&gt;   req                                      category_id probability label  </span></a>
+<a class="sourceLine" id="cb7-9" data-line-number="9"><span class="co">#&gt;   &lt;chr&gt;                                          &lt;int&gt;       &lt;dbl&gt; &lt;chr&gt;  </span></a>
+<a class="sourceLine" id="cb7-10" data-line-number="10"><span class="co">#&gt; 1 Hauràs de dirigir-te al punt de trobada~    53876647       1.00  Italic </span></a>
+<a class="sourceLine" id="cb7-11" data-line-number="11"><span class="co">#&gt; 2 Hauràs de dirigir-te al punt de trobada~    53876648       0.642 Catala~</span></a>
+<a class="sourceLine" id="cb7-12" data-line-number="12"><span class="co">#&gt; 3 i want to buy an iphone                     53876636       0.384 German~</span></a>
+<a class="sourceLine" id="cb7-13" data-line-number="13"><span class="co">#&gt; 4 i want to buy an iphone                     53876639       0.613 Englis~</span></a>
+<a class="sourceLine" id="cb7-14" data-line-number="14"><span class="co">#&gt; 5 Je déteste ne plus avoir de dentifrice.     53876647       0.995 Italic </span></a>
+<a class="sourceLine" id="cb7-15" data-line-number="15"><span class="co">#&gt; 6 Je déteste ne plus avoir de dentifrice.     53876649       0.887 French~</span></a></code></pre></div>
+<ul>
+<li><a href="https://app.monkeylearn.com/categorizer/projects/cl_KFXhoTdt/tab/main-tab">Profanity and abuse detection</a>, <code>classifier_id = &quot;cl_KFXhoTdt&quot;</code>.</li>
+</ul>
+<div class="sourceCode" id="cb8"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb8-1" data-line-number="1">text1 &lt;-<span class="st"> &quot;I think this is awesome.&quot;</span></a>
+<a class="sourceLine" id="cb8-2" data-line-number="2">text2 &lt;-<span class="st"> &quot;Holy shit! You did great!&quot;</span></a>
+<a class="sourceLine" id="cb8-3" data-line-number="3">request &lt;-<span class="st"> </span><span class="kw">c</span>(text1, text2)</a>
+<a class="sourceLine" id="cb8-4" data-line-number="4"></a>
+<a class="sourceLine" id="cb8-5" data-line-number="5"><span class="kw">monkey_classify</span>(request, <span class="dt">classifier_id =</span> <span class="st">&quot;cl_KFXhoTdt&quot;</span>)</a>
+<a class="sourceLine" id="cb8-6" data-line-number="6"><span class="co">#&gt; # A tibble: 2 x 4</span></a>
+<a class="sourceLine" id="cb8-7" data-line-number="7"><span class="co">#&gt;   req                       category_id probability label    </span></a>
+<a class="sourceLine" id="cb8-8" data-line-number="8"><span class="co">#&gt;   &lt;chr&gt;                           &lt;int&gt;       &lt;dbl&gt; &lt;chr&gt;    </span></a>
+<a class="sourceLine" id="cb8-9" data-line-number="9"><span class="co">#&gt; 1 I think this is awesome.     22375077       0.803 clean    </span></a>
+<a class="sourceLine" id="cb8-10" data-line-number="10"><span class="co">#&gt; 2 Holy shit! You did great!    22375076       0.997 profanity</span></a></code></pre></div>
+<ul>
+<li><a href="https://app.monkeylearn.com/categorizer/projects/cl_5icAVzKR/tab/">General topic classifier</a>, <code>classifier_id = &quot;cl_5icAVzKR&quot;</code>.</li>
+</ul>
+<div class="sourceCode" id="cb9"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb9-1" data-line-number="1">text1 &lt;-<span class="st"> &quot;Let me tell you about my dog and my cat. They are really friendly and like going on walks. They both like chasing mice.&quot;</span></a>
+<a class="sourceLine" id="cb9-2" data-line-number="2">text2 &lt;-<span class="st"> &quot;My first R package was probably a disaster but I keep learning how to program.&quot;</span></a>
+<a class="sourceLine" id="cb9-3" data-line-number="3">request &lt;-<span class="st"> </span><span class="kw">c</span>(text1, text2)</a>
+<a class="sourceLine" id="cb9-4" data-line-number="4"><span class="kw">monkey_classify</span>(request, <span class="dt">classifier_id =</span> <span class="st">&quot;cl_5icAVzKR&quot;</span>)</a>
+<a class="sourceLine" id="cb9-5" data-line-number="5"><span class="co">#&gt; # A tibble: 5 x 4</span></a>
+<a class="sourceLine" id="cb9-6" data-line-number="6"><span class="co">#&gt;   req                                    category_id probability label    </span></a>
+<a class="sourceLine" id="cb9-7" data-line-number="7"><span class="co">#&gt;   &lt;chr&gt;                                        &lt;int&gt;       &lt;dbl&gt; &lt;chr&gt;    </span></a>
+<a class="sourceLine" id="cb9-8" data-line-number="8"><span class="co">#&gt; 1 Let me tell you about my dog and my c~       64600       0.894 Animals  </span></a>
+<a class="sourceLine" id="cb9-9" data-line-number="9"><span class="co">#&gt; 2 Let me tell you about my dog and my c~       64608       0.649 Mammals  </span></a>
+<a class="sourceLine" id="cb9-10" data-line-number="10"><span class="co">#&gt; 3 Let me tell you about my dog and my c~       64611       0.869 Land Mam~</span></a>
+<a class="sourceLine" id="cb9-11" data-line-number="11"><span class="co">#&gt; 4 My first R package was probably a dis~       64638       0.240 Computer~</span></a>
+<a class="sourceLine" id="cb9-12" data-line-number="12"><span class="co">#&gt; 5 My first R package was probably a dis~       64640       0.252 Internet</span></a></code></pre></div>
+</div>
+</div>
+<div id="get-what-you-paid-for" class="section level1">
+<h1>Get what you paid for</h1>
+<p>Monkeylearn offers a different service based on your current plan, that is, “free”, “team” or “business”. Your plan influences both your <em>rate limiting</em> (how fast?) and your <em>query limiting</em> (how many queries?). See <a href="https://monkeylearn.com/pricing/" class="uri">https://monkeylearn.com/pricing/</a>. Based on your MONKEYLEARN_PLAN environment variable, the rate will be handled automatically thanks to <a href="https://github.com/tarakc02/ratelimitr"><code>ratelimitr</code></a>.</p>
+<div id="check-the-number-of-remaining-calls" class="section level2">
+<h2>Check the number of remaining calls</h2>
+<p>After each call to a function you can check how many calls to the API you can still make using <code>attr(output, &quot;headers&quot;)$x.query.limit.remaining</code> and <code>attr(output, &quot;headers&quot;)$x.query.limit.limit</code>. The period after which <code>attr(output, &quot;headers&quot;)$x.query.limit.remaining</code> is reset depends on your subscription and is not included in the output.</p>
+</div>
+</div>
+<div id="fit-monkeylearn-into-your-pipeline" class="section level1">
+<h1>Fit <code>monkeylearn</code> into your pipeline!</h1>
+<p>You can:</p>
+<ul>
+<li>Send a vector of texts <em>or</em> a dataframe and a named column (unquoted)</li>
+<li>Output either a nested or unnested dataframe
+<ul>
+<li>Nested = 1 row per input; unnested = 1 row per output</li>
+</ul></li>
+<li>This output
+<ul>
+<li>Relates each input text to its (usually) multiple classifications/extractions</li>
+<li>Retains a record of inputs that could not be classified/extracted (e.g., empty strings)</li>
+</ul></li>
+<li>Batch requests</li>
+</ul>
+<div id="in-a-bit-more-detail" class="section level2">
+<h2>In a bit more detail</h2>
+<p>You can classify or extract a vector or dataframe of texts while relating the original input text to its classifications. This is important, because the input:output relationship may not always (and in fact, is not usually) 1:1. These functions retain the tie between each <code>input</code><a href="#fn1" class="footnote-ref" id="fnref1"><sup>1</sup></a> element and all of its output elements.</p>
+<div class="sourceCode" id="cb10"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb10-1" data-line-number="1">input &lt;-<span class="st"> </span><span class="kw">c</span>(<span class="st">&quot;Emma Woodhouse, handsome, clever, and rich, with a comfortable home&quot;</span>,     </a>
+<a class="sourceLine" id="cb10-2" data-line-number="2"> <span class="st">&quot;and happy disposition, seemed to unite some of the best blessings of&quot;</span>,  </a>
+<a class="sourceLine" id="cb10-3" data-line-number="3"> <span class="st">&quot;existence; and had lived nearly twenty-one years in the world with very&quot;</span>, </a>
+<a class="sourceLine" id="cb10-4" data-line-number="4"> <span class="st">&quot;little to distress or vex her.&quot;</span>,                                          </a>
+<a class="sourceLine" id="cb10-5" data-line-number="5"> <span class="st">&quot;&quot;</span>,                   <span class="co"># &lt;--- note the empty string!                                                   </span></a>
+<a class="sourceLine" id="cb10-6" data-line-number="6"> <span class="st">&quot;She was the youngest of the two daughters of a most affectionate,&quot;</span>,       </a>
+<a class="sourceLine" id="cb10-7" data-line-number="7"> <span class="st">&quot;indulgent father; and had, in consequence of her sister's marriage, been&quot;</span>,</a>
+<a class="sourceLine" id="cb10-8" data-line-number="8"> <span class="st">&quot;mistress of his house from a very early period. Her mother had died&quot;</span>,     </a>
+<a class="sourceLine" id="cb10-9" data-line-number="9"> <span class="st">&quot;too long ago for her to have more than an indistinct remembrance of&quot;</span>,     </a>
+<a class="sourceLine" id="cb10-10" data-line-number="10"> <span class="st">&quot;her caresses; and her place had been supplied by an excellent woman as&quot;</span>,  </a>
+<a class="sourceLine" id="cb10-11" data-line-number="11"> <span class="st">&quot;governess, who had fallen little short of a mother in affection.&quot;</span>)</a></code></pre></div>
+<p>That is true even if you have inputs that cannot be processed. For instance, empty string and <code>NA</code> input elements are not sent to the API for classification/extraction. (You’ll get a warning of this if <code>verbose = TRUE</code>.) We’ve included one empty string above to illustrate. Elements that returned no classifications/extractions are still included in the resulting dataframe. This way you’ll know which inputs could not be processed.</p>
+<div class="sourceCode" id="cb11"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb11-1" data-line-number="1">(output &lt;-<span class="st"> </span><span class="kw">monkey_classify</span>(input, <span class="dt">unnest =</span> <span class="ot">FALSE</span>))</a>
+<a class="sourceLine" id="cb11-2" data-line-number="2"><span class="co">#&gt; Using classifier ID cl_oFKL5wft; to find other classifiers, run monkeylearn_classifiers() or visit https://app.monkeylearn.com/main/explore/</span></a>
+<a class="sourceLine" id="cb11-3" data-line-number="3"><span class="co">#&gt; The following indices were empty strings and could not be sent to the API: 5. They will still be included in the output.</span></a>
+<a class="sourceLine" id="cb11-4" data-line-number="4"><span class="co">#&gt; Processing batch 1 of 1 batches: texts 1 to 10</span></a>
+<a class="sourceLine" id="cb11-5" data-line-number="5"><span class="co">#&gt; # A tibble: 11 x 2</span></a>
+<a class="sourceLine" id="cb11-6" data-line-number="6"><span class="co">#&gt;    req                                                     res            </span></a>
+<a class="sourceLine" id="cb11-7" data-line-number="7"><span class="co">#&gt;    &lt;chr&gt;                                                   &lt;list&gt;         </span></a>
+<a class="sourceLine" id="cb11-8" data-line-number="8"><span class="co">#&gt;  1 Emma Woodhouse, handsome, clever, and rich, with a com~ &lt;data.frame [4~</span></a>
+<a class="sourceLine" id="cb11-9" data-line-number="9"><span class="co">#&gt;  2 and happy disposition, seemed to unite some of the bes~ &lt;data.frame [3~</span></a>
+<a class="sourceLine" id="cb11-10" data-line-number="10"><span class="co">#&gt;  3 existence; and had lived nearly twenty-one years in th~ &lt;data.frame [3~</span></a>
+<a class="sourceLine" id="cb11-11" data-line-number="11"><span class="co">#&gt;  4 little to distress or vex her.                          &lt;data.frame [4~</span></a>
+<a class="sourceLine" id="cb11-12" data-line-number="12"><span class="co">#&gt;  5 &quot;&quot;                                                      &lt;data.frame [1~</span></a>
+<a class="sourceLine" id="cb11-13" data-line-number="13"><span class="co">#&gt;  6 She was the youngest of the two daughters of a most af~ &lt;data.frame [4~</span></a>
+<a class="sourceLine" id="cb11-14" data-line-number="14"><span class="co">#&gt;  7 indulgent father; and had, in consequence of her siste~ &lt;data.frame [3~</span></a>
+<a class="sourceLine" id="cb11-15" data-line-number="15"><span class="co">#&gt;  8 mistress of his house from a very early period. Her mo~ &lt;data.frame [3~</span></a>
+<a class="sourceLine" id="cb11-16" data-line-number="16"><span class="co">#&gt;  9 too long ago for her to have more than an indistinct r~ &lt;data.frame [4~</span></a>
+<a class="sourceLine" id="cb11-17" data-line-number="17"><span class="co">#&gt; 10 her caresses; and her place had been supplied by an ex~ &lt;data.frame [3~</span></a>
+<a class="sourceLine" id="cb11-18" data-line-number="18"><span class="co">#&gt; 11 governess, who had fallen little short of a mother in ~ &lt;data.frame [4~</span></a></code></pre></div>
+<p><br></p>
+<p>If there are more than 20 empty inputs, we save your console by messaging only the first 20 indices.</p>
+<div class="sourceCode" id="cb12"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb12-1" data-line-number="1">(very_empty_input &lt;-<span class="st"> </span><span class="kw">rep</span>(<span class="st">&quot;&quot;</span>, <span class="dv">25</span>) <span class="op">%&gt;%</span><span class="st"> </span><span class="kw">c</span>(input) <span class="op">%&gt;%</span><span class="st"> </span><span class="kw">sample</span>())</a>
+<a class="sourceLine" id="cb12-2" data-line-number="2"><span class="co">#&gt;  [1] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-3" data-line-number="3"><span class="co">#&gt;  [2] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-4" data-line-number="4"><span class="co">#&gt;  [3] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-5" data-line-number="5"><span class="co">#&gt;  [4] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-6" data-line-number="6"><span class="co">#&gt;  [5] &quot;little to distress or vex her.&quot;                                          </span></a>
+<a class="sourceLine" id="cb12-7" data-line-number="7"><span class="co">#&gt;  [6] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-8" data-line-number="8"><span class="co">#&gt;  [7] &quot;existence; and had lived nearly twenty-one years in the world with very&quot; </span></a>
+<a class="sourceLine" id="cb12-9" data-line-number="9"><span class="co">#&gt;  [8] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-10" data-line-number="10"><span class="co">#&gt;  [9] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-11" data-line-number="11"><span class="co">#&gt; [10] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-12" data-line-number="12"><span class="co">#&gt; [11] &quot;too long ago for her to have more than an indistinct remembrance of&quot;     </span></a>
+<a class="sourceLine" id="cb12-13" data-line-number="13"><span class="co">#&gt; [12] &quot;governess, who had fallen little short of a mother in affection.&quot;        </span></a>
+<a class="sourceLine" id="cb12-14" data-line-number="14"><span class="co">#&gt; [13] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-15" data-line-number="15"><span class="co">#&gt; [14] &quot;and happy disposition, seemed to unite some of the best blessings of&quot;    </span></a>
+<a class="sourceLine" id="cb12-16" data-line-number="16"><span class="co">#&gt; [15] &quot;She was the youngest of the two daughters of a most affectionate,&quot;       </span></a>
+<a class="sourceLine" id="cb12-17" data-line-number="17"><span class="co">#&gt; [16] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-18" data-line-number="18"><span class="co">#&gt; [17] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-19" data-line-number="19"><span class="co">#&gt; [18] &quot;mistress of his house from a very early period. Her mother had died&quot;     </span></a>
+<a class="sourceLine" id="cb12-20" data-line-number="20"><span class="co">#&gt; [19] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-21" data-line-number="21"><span class="co">#&gt; [20] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-22" data-line-number="22"><span class="co">#&gt; [21] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-23" data-line-number="23"><span class="co">#&gt; [22] &quot;indulgent father; and had, in consequence of her sister's marriage, been&quot;</span></a>
+<a class="sourceLine" id="cb12-24" data-line-number="24"><span class="co">#&gt; [23] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-25" data-line-number="25"><span class="co">#&gt; [24] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-26" data-line-number="26"><span class="co">#&gt; [25] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-27" data-line-number="27"><span class="co">#&gt; [26] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-28" data-line-number="28"><span class="co">#&gt; [27] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-29" data-line-number="29"><span class="co">#&gt; [28] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-30" data-line-number="30"><span class="co">#&gt; [29] &quot;her caresses; and her place had been supplied by an excellent woman as&quot;  </span></a>
+<a class="sourceLine" id="cb12-31" data-line-number="31"><span class="co">#&gt; [30] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-32" data-line-number="32"><span class="co">#&gt; [31] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-33" data-line-number="33"><span class="co">#&gt; [32] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-34" data-line-number="34"><span class="co">#&gt; [33] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-35" data-line-number="35"><span class="co">#&gt; [34] &quot;Emma Woodhouse, handsome, clever, and rich, with a comfortable home&quot;     </span></a>
+<a class="sourceLine" id="cb12-36" data-line-number="36"><span class="co">#&gt; [35] &quot;&quot;                                                                        </span></a>
+<a class="sourceLine" id="cb12-37" data-line-number="37"><span class="co">#&gt; [36] &quot;&quot;</span></a></code></pre></div>
+<p>Since the entire original input is represented in the output, if you need to find all of the empty inputs you can easily filter the output to all of the rows containing empty strings.</p>
+<div class="sourceCode" id="cb13"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb13-1" data-line-number="1"><span class="kw">monkey_classify</span>(very_empty_input, <span class="dt">unnest =</span> <span class="ot">FALSE</span>)</a>
+<a class="sourceLine" id="cb13-2" data-line-number="2"><span class="co">#&gt; Using classifier ID cl_oFKL5wft; to find other classifiers, run monkeylearn_classifiers() or visit https://app.monkeylearn.com/main/explore/</span></a>
+<a class="sourceLine" id="cb13-3" data-line-number="3"><span class="co">#&gt; The following indices were empty strings and could not be sent to the API. (Displaying first 20): 1, 2, 3, 4, 6, 8, 9, 10, 13, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28... They will still be included in the output.</span></a>
+<a class="sourceLine" id="cb13-4" data-line-number="4"><span class="co">#&gt; Processing batch 1 of 1 batches: texts 1 to 10</span></a>
+<a class="sourceLine" id="cb13-5" data-line-number="5"><span class="co">#&gt; # A tibble: 36 x 2</span></a>
+<a class="sourceLine" id="cb13-6" data-line-number="6"><span class="co">#&gt;    req                                                    res             </span></a>
+<a class="sourceLine" id="cb13-7" data-line-number="7"><span class="co">#&gt;    &lt;chr&gt;                                                  &lt;list&gt;          </span></a>
+<a class="sourceLine" id="cb13-8" data-line-number="8"><span class="co">#&gt;  1 &quot;&quot;                                                     &lt;data.frame [1 ~</span></a>
+<a class="sourceLine" id="cb13-9" data-line-number="9"><span class="co">#&gt;  2 &quot;&quot;                                                     &lt;data.frame [1 ~</span></a>
+<a class="sourceLine" id="cb13-10" data-line-number="10"><span class="co">#&gt;  3 &quot;&quot;                                                     &lt;data.frame [1 ~</span></a>
+<a class="sourceLine" id="cb13-11" data-line-number="11"><span class="co">#&gt;  4 &quot;&quot;                                                     &lt;data.frame [1 ~</span></a>
+<a class="sourceLine" id="cb13-12" data-line-number="12"><span class="co">#&gt;  5 little to distress or vex her.                         &lt;data.frame [4 ~</span></a>
+<a class="sourceLine" id="cb13-13" data-line-number="13"><span class="co">#&gt;  6 &quot;&quot;                                                     &lt;data.frame [1 ~</span></a>
+<a class="sourceLine" id="cb13-14" data-line-number="14"><span class="co">#&gt;  7 existence; and had lived nearly twenty-one years in t~ &lt;data.frame [3 ~</span></a>
+<a class="sourceLine" id="cb13-15" data-line-number="15"><span class="co">#&gt;  8 &quot;&quot;                                                     &lt;data.frame [1 ~</span></a>
+<a class="sourceLine" id="cb13-16" data-line-number="16"><span class="co">#&gt;  9 &quot;&quot;                                                     &lt;data.frame [1 ~</span></a>
+<a class="sourceLine" id="cb13-17" data-line-number="17"><span class="co">#&gt; 10 &quot;&quot;                                                     &lt;data.frame [1 ~</span></a>
+<a class="sourceLine" id="cb13-18" data-line-number="18"><span class="co">#&gt; # ... with 26 more rows</span></a></code></pre></div>
+<div id="configuring-the-output" class="section level3">
+<h3>Configuring the Output</h3>
+<p>With <code>unnest = FALSE</code>, the output is a nested dataframe with the same number of rows as your input dataframe or the same length as your input vector, depending on which one you sent in.</p>
+<p>Let’s take a look at the <code>res</code> output column.</p>
+<div class="sourceCode" id="cb14"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb14-1" data-line-number="1">output<span class="op">$</span>res</a>
+<a class="sourceLine" id="cb14-2" data-line-number="2"><span class="co">#&gt; [[1]]</span></a>
+<a class="sourceLine" id="cb14-3" data-line-number="3"><span class="co">#&gt;   category_id probability         label</span></a>
+<a class="sourceLine" id="cb14-4" data-line-number="4"><span class="co">#&gt; 1    18313280       0.058         Music</span></a>
+<a class="sourceLine" id="cb14-5" data-line-number="5"><span class="co">#&gt; 2    18313356       0.052           Pop</span></a>
+<a class="sourceLine" id="cb14-6" data-line-number="6"><span class="co">#&gt; 3    18313357       0.338      Pop Rock</span></a>
+<a class="sourceLine" id="cb14-7" data-line-number="7"><span class="co">#&gt; 4    18313358       0.209 Joni Mitchell</span></a>
+<a class="sourceLine" id="cb14-8" data-line-number="8"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb14-9" data-line-number="9"><span class="co">#&gt; [[2]]</span></a>
+<a class="sourceLine" id="cb14-10" data-line-number="10"><span class="co">#&gt;   category_id probability                    label</span></a>
+<a class="sourceLine" id="cb14-11" data-line-number="11"><span class="co">#&gt; 1    18313280       0.088                    Music</span></a>
+<a class="sourceLine" id="cb14-12" data-line-number="12"><span class="co">#&gt; 2    18313701       0.051         Special Interest</span></a>
+<a class="sourceLine" id="cb14-13" data-line-number="13"><span class="co">#&gt; 3    18313702       0.816 See all Special Interest</span></a>
+<a class="sourceLine" id="cb14-14" data-line-number="14"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb14-15" data-line-number="15"><span class="co">#&gt; [[3]]</span></a>
+<a class="sourceLine" id="cb14-16" data-line-number="16"><span class="co">#&gt;   category_id probability         label</span></a>
+<a class="sourceLine" id="cb14-17" data-line-number="17"><span class="co">#&gt; 1    18314767       0.076         Books</span></a>
+<a class="sourceLine" id="cb14-18" data-line-number="18"><span class="co">#&gt; 2    18315016       0.049      Religion</span></a>
+<a class="sourceLine" id="cb14-19" data-line-number="19"><span class="co">#&gt; 3    18315024       0.139 Inspirational</span></a>
+<a class="sourceLine" id="cb14-20" data-line-number="20"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb14-21" data-line-number="21"><span class="co">#&gt; [[4]]</span></a>
+<a class="sourceLine" id="cb14-22" data-line-number="22"><span class="co">#&gt;   category_id probability         label</span></a>
+<a class="sourceLine" id="cb14-23" data-line-number="23"><span class="co">#&gt; 1    18313280       0.060         Music</span></a>
+<a class="sourceLine" id="cb14-24" data-line-number="24"><span class="co">#&gt; 2    18313601       0.057         Blues</span></a>
+<a class="sourceLine" id="cb14-25" data-line-number="25"><span class="co">#&gt; 3    18313612       0.262 Chicago Blues</span></a>
+<a class="sourceLine" id="cb14-26" data-line-number="26"><span class="co">#&gt; 4    18313614       0.227 Little Milton</span></a>
+<a class="sourceLine" id="cb14-27" data-line-number="27"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb14-28" data-line-number="28"><span class="co">#&gt; [[5]]</span></a>
+<a class="sourceLine" id="cb14-29" data-line-number="29"><span class="co">#&gt;   category_id probability label</span></a>
+<a class="sourceLine" id="cb14-30" data-line-number="30"><span class="co">#&gt; 1          NA          NA    NA</span></a>
+<a class="sourceLine" id="cb14-31" data-line-number="31"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb14-32" data-line-number="32"><span class="co">#&gt; [[6]]</span></a>
+<a class="sourceLine" id="cb14-33" data-line-number="33"><span class="co">#&gt;   category_id probability      label</span></a>
+<a class="sourceLine" id="cb14-34" data-line-number="34"><span class="co">#&gt; 1    18313280       0.059      Music</span></a>
+<a class="sourceLine" id="cb14-35" data-line-number="35"><span class="co">#&gt; 2    18313459       0.058     World </span></a>
+<a class="sourceLine" id="cb14-36" data-line-number="36"><span class="co">#&gt; 3    18313469       0.352     Celtic</span></a>
+<a class="sourceLine" id="cb14-37" data-line-number="37"><span class="co">#&gt; 4    18313471       0.440 Celtic Man</span></a>
+<a class="sourceLine" id="cb14-38" data-line-number="38"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb14-39" data-line-number="39"><span class="co">#&gt; [[7]]</span></a>
+<a class="sourceLine" id="cb14-40" data-line-number="40"><span class="co">#&gt;   category_id probability                label</span></a>
+<a class="sourceLine" id="cb14-41" data-line-number="41"><span class="co">#&gt; 1    18314767       0.075                Books</span></a>
+<a class="sourceLine" id="cb14-42" data-line-number="42"><span class="co">#&gt; 2    18314983       0.057 Parenting &amp; Families</span></a>
+<a class="sourceLine" id="cb14-43" data-line-number="43"><span class="co">#&gt; 3    18314999       0.057             Marriage</span></a>
+<a class="sourceLine" id="cb14-44" data-line-number="44"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb14-45" data-line-number="45"><span class="co">#&gt; [[8]]</span></a>
+<a class="sourceLine" id="cb14-46" data-line-number="46"><span class="co">#&gt;   category_id probability            label</span></a>
+<a class="sourceLine" id="cb14-47" data-line-number="47"><span class="co">#&gt; 1    18314767       0.078            Books</span></a>
+<a class="sourceLine" id="cb14-48" data-line-number="48"><span class="co">#&gt; 2    18314769       0.046 Children's Books</span></a>
+<a class="sourceLine" id="cb14-49" data-line-number="49"><span class="co">#&gt; 3    18314788       0.044      Educational</span></a>
+<a class="sourceLine" id="cb14-50" data-line-number="50"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb14-51" data-line-number="51"><span class="co">#&gt; [[9]]</span></a>
+<a class="sourceLine" id="cb14-52" data-line-number="52"><span class="co">#&gt;   category_id probability                        label</span></a>
+<a class="sourceLine" id="cb14-53" data-line-number="53"><span class="co">#&gt; 1    18313280       0.061                        Music</span></a>
+<a class="sourceLine" id="cb14-54" data-line-number="54"><span class="co">#&gt; 2    18313584       0.063             Children's Music</span></a>
+<a class="sourceLine" id="cb14-55" data-line-number="55"><span class="co">#&gt; 3    18313589       0.383       Children's Sing-a-Long</span></a>
+<a class="sourceLine" id="cb14-56" data-line-number="56"><span class="co">#&gt; 4    18313590       0.285 Various Artists-Sing-A-Longs</span></a>
+<a class="sourceLine" id="cb14-57" data-line-number="57"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb14-58" data-line-number="58"><span class="co">#&gt; [[10]]</span></a>
+<a class="sourceLine" id="cb14-59" data-line-number="59"><span class="co">#&gt;   category_id probability               label</span></a>
+<a class="sourceLine" id="cb14-60" data-line-number="60"><span class="co">#&gt; 1    18314767       0.058               Books</span></a>
+<a class="sourceLine" id="cb14-61" data-line-number="61"><span class="co">#&gt; 2    18314839       0.045 Biography &amp; Memoirs</span></a>
+<a class="sourceLine" id="cb14-62" data-line-number="62"><span class="co">#&gt; 3    18314851       0.082           Religious</span></a>
+<a class="sourceLine" id="cb14-63" data-line-number="63"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb14-64" data-line-number="64"><span class="co">#&gt; [[11]]</span></a>
+<a class="sourceLine" id="cb14-65" data-line-number="65"><span class="co">#&gt;   category_id probability            label</span></a>
+<a class="sourceLine" id="cb14-66" data-line-number="66"><span class="co">#&gt; 1    18314767       0.068            Books</span></a>
+<a class="sourceLine" id="cb14-67" data-line-number="67"><span class="co">#&gt; 2    18314769       0.049 Children's Books</span></a>
+<a class="sourceLine" id="cb14-68" data-line-number="68"><span class="co">#&gt; 3    18314784       0.042          Animals</span></a>
+<a class="sourceLine" id="cb14-69" data-line-number="69"><span class="co">#&gt; 4    18314785       0.504          Rabbits</span></a></code></pre></div>
+<p>You can easily choose an unnested output by setting the <strong>unnest flag</strong> to TRUE (which it is by default) to get one row per classification/extraction.</p>
+<div class="sourceCode" id="cb15"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb15-1" data-line-number="1">(output_unnested &lt;-<span class="st"> </span><span class="kw">monkey_classify</span>(input, <span class="dt">verbose =</span> <span class="ot">FALSE</span>, <span class="dt">unnest =</span> <span class="ot">TRUE</span>))</a>
+<a class="sourceLine" id="cb15-2" data-line-number="2"><span class="co">#&gt; # A tibble: 36 x 4</span></a>
+<a class="sourceLine" id="cb15-3" data-line-number="3"><span class="co">#&gt;    req                               category_id probability label        </span></a>
+<a class="sourceLine" id="cb15-4" data-line-number="4"><span class="co">#&gt;    &lt;chr&gt;                                   &lt;int&gt;       &lt;dbl&gt; &lt;chr&gt;        </span></a>
+<a class="sourceLine" id="cb15-5" data-line-number="5"><span class="co">#&gt;  1 Emma Woodhouse, handsome, clever~    18313280      0.0580 Music        </span></a>
+<a class="sourceLine" id="cb15-6" data-line-number="6"><span class="co">#&gt;  2 Emma Woodhouse, handsome, clever~    18313356      0.0520 Pop          </span></a>
+<a class="sourceLine" id="cb15-7" data-line-number="7"><span class="co">#&gt;  3 Emma Woodhouse, handsome, clever~    18313357      0.338  Pop Rock     </span></a>
+<a class="sourceLine" id="cb15-8" data-line-number="8"><span class="co">#&gt;  4 Emma Woodhouse, handsome, clever~    18313358      0.209  Joni Mitchell</span></a>
+<a class="sourceLine" id="cb15-9" data-line-number="9"><span class="co">#&gt;  5 and happy disposition, seemed to~    18313280      0.0880 Music        </span></a>
+<a class="sourceLine" id="cb15-10" data-line-number="10"><span class="co">#&gt;  6 and happy disposition, seemed to~    18313701      0.0510 Special Inte~</span></a>
+<a class="sourceLine" id="cb15-11" data-line-number="11"><span class="co">#&gt;  7 and happy disposition, seemed to~    18313702      0.816  See all Spec~</span></a>
+<a class="sourceLine" id="cb15-12" data-line-number="12"><span class="co">#&gt;  8 existence; and had lived nearly ~    18314767      0.0760 Books        </span></a>
+<a class="sourceLine" id="cb15-13" data-line-number="13"><span class="co">#&gt;  9 existence; and had lived nearly ~    18315016      0.0490 Religion     </span></a>
+<a class="sourceLine" id="cb15-14" data-line-number="14"><span class="co">#&gt; 10 existence; and had lived nearly ~    18315024      0.139  Inspirational</span></a>
+<a class="sourceLine" id="cb15-15" data-line-number="15"><span class="co">#&gt; # ... with 26 more rows</span></a></code></pre></div>
+<p>We could have gotten the same result by sending in a dataframe and a named column. If a dataframe is supplied, the input column is not renamed to <code>req</code> as it is when the input is a vector; the original column name is retained.</p>
+<div class="sourceCode" id="cb16"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb16-1" data-line-number="1">input_df &lt;-<span class="st"> </span>tibble<span class="op">::</span><span class="kw">tibble</span>(<span class="dt">text =</span> input) </a>
+<a class="sourceLine" id="cb16-2" data-line-number="2">output_df_unnested &lt;-<span class="st"> </span><span class="kw">monkey_classify</span>(input_df, text, <span class="dt">unnest =</span> <span class="ot">TRUE</span>, <span class="dt">verbose =</span> <span class="ot">FALSE</span>) <span class="op">%&gt;%</span><span class="st"> </span></a>
+<a class="sourceLine" id="cb16-3" data-line-number="3"><span class="st">    </span>dplyr<span class="op">::</span><span class="kw">rename</span>(<span class="dt">req =</span> text)</a>
+<a class="sourceLine" id="cb16-4" data-line-number="4"></a>
+<a class="sourceLine" id="cb16-5" data-line-number="5">testthat<span class="op">::</span><span class="kw">expect_equal</span>(output_unnested, output_df_unnested)</a></code></pre></div>
+<p><br></p>
+<p>If the input is a dataframe, setting the <code>.keep_all</code> option to TRUE allows you to retain all input columns. If FALSE, only the column you specify for classification will be retained.</p>
+<div class="sourceCode" id="cb17"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb17-1" data-line-number="1">sw &lt;-<span class="st"> </span>dplyr<span class="op">::</span>starwars <span class="op">%&gt;%</span><span class="st"> </span></a>
+<a class="sourceLine" id="cb17-2" data-line-number="2"><span class="st">  </span>dplyr<span class="op">::</span><span class="kw">select</span>(name, height) <span class="op">%&gt;%</span><span class="st"> </span></a>
+<a class="sourceLine" id="cb17-3" data-line-number="3"><span class="st">  </span>dplyr<span class="op">::</span><span class="kw">sample_n</span>(<span class="kw">nrow</span>(input_df))</a>
+<a class="sourceLine" id="cb17-4" data-line-number="4"></a>
+<a class="sourceLine" id="cb17-5" data-line-number="5">sw_input_df &lt;-<span class="st"> </span>input_df <span class="op">%&gt;%</span><span class="st"> </span></a>
+<a class="sourceLine" id="cb17-6" data-line-number="6"><span class="st">  </span>dplyr<span class="op">::</span><span class="kw">bind_cols</span>(sw)</a>
+<a class="sourceLine" id="cb17-7" data-line-number="7"></a>
+<a class="sourceLine" id="cb17-8" data-line-number="8">sw_input_df <span class="op">%&gt;%</span><span class="st"> </span><span class="kw">monkey_classify</span>(text, <span class="dt">unnest =</span> <span class="ot">FALSE</span>, <span class="dt">verbose =</span> <span class="ot">FALSE</span>)</a>
+<a class="sourceLine" id="cb17-9" data-line-number="9"><span class="co">#&gt; # A tibble: 11 x 4</span></a>
+<a class="sourceLine" id="cb17-10" data-line-number="10"><span class="co">#&gt;    name              height text                               res        </span></a>
+<a class="sourceLine" id="cb17-11" data-line-number="11"><span class="co">#&gt;    &lt;chr&gt;              &lt;int&gt; &lt;chr&gt;                              &lt;list&gt;     </span></a>
+<a class="sourceLine" id="cb17-12" data-line-number="12"><span class="co">#&gt;  1 Jek Tono Porkins     180 Emma Woodhouse, handsome, clever,~ &lt;data.fram~</span></a>
+<a class="sourceLine" id="cb17-13" data-line-number="13"><span class="co">#&gt;  2 Lobot                175 and happy disposition, seemed to ~ &lt;data.fram~</span></a>
+<a class="sourceLine" id="cb17-14" data-line-number="14"><span class="co">#&gt;  3 Gregar Typho         185 existence; and had lived nearly t~ &lt;data.fram~</span></a>
+<a class="sourceLine" id="cb17-15" data-line-number="15"><span class="co">#&gt;  4 Jocasta Nu           167 little to distress or vex her.     &lt;data.fram~</span></a>
+<a class="sourceLine" id="cb17-16" data-line-number="16"><span class="co">#&gt;  5 Poe Dameron           NA &quot;&quot;                                 &lt;data.fram~</span></a>
+<a class="sourceLine" id="cb17-17" data-line-number="17"><span class="co">#&gt;  6 Luminara Unduli      170 She was the youngest of the two d~ &lt;data.fram~</span></a>
+<a class="sourceLine" id="cb17-18" data-line-number="18"><span class="co">#&gt;  7 Owen Lars            178 indulgent father; and had, in con~ &lt;data.fram~</span></a>
+<a class="sourceLine" id="cb17-19" data-line-number="19"><span class="co">#&gt;  8 Taun We              213 mistress of his house from a very~ &lt;data.fram~</span></a>
+<a class="sourceLine" id="cb17-20" data-line-number="20"><span class="co">#&gt;  9 C-3PO                167 too long ago for her to have more~ &lt;data.fram~</span></a>
+<a class="sourceLine" id="cb17-21" data-line-number="21"><span class="co">#&gt; 10 Biggs Darklighter    183 her caresses; and her place had b~ &lt;data.fram~</span></a>
+<a class="sourceLine" id="cb17-22" data-line-number="22"><span class="co">#&gt; 11 Boba Fett            183 governess, who had fallen little ~ &lt;data.fram~</span></a></code></pre></div>
+</div>
+<div id="batching" class="section level3">
+<h3>Batching</h3>
+<p>Retaining the relationship between input and output doesn’t mean you’ll need to send requests one-by-one. <strong>Batch requests</strong> by setting the <code>texts_per_req</code> value, which governs the number of texts that are sent per request. Per the <a href="http://help.monkeylearn.com/frequently-asked-questions/queries/can-i-classify-or-extract-more-than-one-text-with-one-api-request">MonkeyLearn documentation</a>, the maximum recommended number of texts to send in a single request is 200.</p>
+<p>If <code>texts_per_req</code> is NULL, the default, we try to optimize the response time from the API by setting <code>texts_per_req</code> to 200 when your input has more than 200 texts or to the length of the <code>input</code> if you’ve got fewer. You’ll see a significant speedup by batching your requests this way. However, batching doesn’t save you on queries; a batch of 150 texts still uses up 150 queries.</p>
+<p>These functions also include some more verbose <strong>progress reporting</strong>, letting you know what batch you’re on out of the total, and which texts are set to be processed in that batch.</p>
+<div class="sourceCode" id="cb18"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb18-1" data-line-number="1">one_by_one &lt;-<span class="st"> </span><span class="kw">system.time</span>(output &lt;-<span class="st"> </span><span class="kw">monkey_classify</span>(input, <span class="dt">texts_per_req =</span> <span class="dv">1</span>))</a>
+<a class="sourceLine" id="cb18-2" data-line-number="2"><span class="co">#&gt; Using classifier ID cl_oFKL5wft; to find other classifiers, run monkeylearn_classifiers() or visit https://app.monkeylearn.com/main/explore/</span></a>
+<a class="sourceLine" id="cb18-3" data-line-number="3"><span class="co">#&gt; The following indices were empty strings and could not be sent to the API: 5. They will still be included in the output.</span></a>
+<a class="sourceLine" id="cb18-4" data-line-number="4"><span class="co">#&gt; Processing batch 1 of 10 batches: texts 1 to 1</span></a>
+<a class="sourceLine" id="cb18-5" data-line-number="5"><span class="co">#&gt; Processing batch 2 of 10 batches: texts 1 to 2</span></a>
+<a class="sourceLine" id="cb18-6" data-line-number="6"><span class="co">#&gt; Processing batch 3 of 10 batches: texts 2 to 3</span></a>
+<a class="sourceLine" id="cb18-7" data-line-number="7"><span class="co">#&gt; Processing batch 4 of 10 batches: texts 3 to 4</span></a>
+<a class="sourceLine" id="cb18-8" data-line-number="8"><span class="co">#&gt; Processing batch 5 of 10 batches: texts 4 to 5</span></a>
+<a class="sourceLine" id="cb18-9" data-line-number="9"><span class="co">#&gt; Processing batch 6 of 10 batches: texts 5 to 6</span></a>
+<a class="sourceLine" id="cb18-10" data-line-number="10"><span class="co">#&gt; Processing batch 7 of 10 batches: texts 6 to 7</span></a>
+<a class="sourceLine" id="cb18-11" data-line-number="11"><span class="co">#&gt; Processing batch 8 of 10 batches: texts 7 to 8</span></a>
+<a class="sourceLine" id="cb18-12" data-line-number="12"><span class="co">#&gt; Processing batch 9 of 10 batches: texts 8 to 9</span></a>
+<a class="sourceLine" id="cb18-13" data-line-number="13"><span class="co">#&gt; Processing batch 10 of 10 batches: texts 9 to 10</span></a>
+<a class="sourceLine" id="cb18-14" data-line-number="14"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb18-15" data-line-number="15"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb18-16" data-line-number="16"><span class="co">#&gt;  ------------- </span></a>
+<a class="sourceLine" id="cb18-17" data-line-number="17"><span class="co">#&gt; Still working! </span></a>
+<a class="sourceLine" id="cb18-18" data-line-number="18"><span class="co">#&gt;  -------------- </span></a>
+<a class="sourceLine" id="cb18-19" data-line-number="19"><span class="co">#&gt;               \   </span></a>
+<a class="sourceLine" id="cb18-20" data-line-number="20"><span class="co">#&gt;                \  </span></a>
+<a class="sourceLine" id="cb18-21" data-line-number="21"><span class="co">#&gt;                 \</span></a>
+<a class="sourceLine" id="cb18-22" data-line-number="22"><span class="co">#&gt; </span></a>
+<a class="sourceLine" id="cb18-23" data-line-number="23"><span class="co">#&gt;                   .=&quot;=.</span></a>
+<a class="sourceLine" id="cb18-24" data-line-number="24"><span class="co">#&gt;                 _/.-.-.\_     _</span></a>
+<a class="sourceLine" id="cb18-25" data-line-number="25"><span class="co">#&gt;                ( ( o o ) )    ))</span></a>
+<a class="sourceLine" id="cb18-26" data-line-number="26"><span class="co">#&gt;                 |/  &quot;  \|    //</span></a>
+<a class="sourceLine" id="cb18-27" data-line-number="27"><span class="co">#&gt;                  \'---'/    //</span></a>
+<a class="sourceLine" id="cb18-28" data-line-number="28"><span class="co">#&gt;            jgs   /`&quot;&quot;&quot;`\\  ((</span></a>
+<a class="sourceLine" id="cb18-29" data-line-number="29"><span class="co">#&gt;                 / /_,_\ \\  \\</span></a>
+<a class="sourceLine" id="cb18-30" data-line-number="30"><span class="co">#&gt;                 \_\_'__/  \  ))</span></a>
+<a class="sourceLine" id="cb18-31" data-line-number="31"><span class="co">#&gt;                 /`  /`~\   |//</span></a>
+<a class="sourceLine" id="cb18-32" data-line-number="32"><span class="co">#&gt;                /   /    \  /</span></a>
+<a class="sourceLine" id="cb18-33" data-line-number="33"><span class="co">#&gt;           ,--`,--'\/\    /</span></a>
+<a class="sourceLine" id="cb18-34" data-line-number="34"><span class="co">#&gt;           '-- &quot;--'  '--'</span></a></code></pre></div>
+<div class="sourceCode" id="cb19"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb19-1" data-line-number="1">batch_of_five &lt;-<span class="st"> </span><span class="kw">system.time</span>(output &lt;-<span class="st"> </span><span class="kw">monkey_classify</span>(input, <span class="dt">texts_per_req =</span> <span class="dv">5</span>))</a>
+<a class="sourceLine" id="cb19-2" data-line-number="2"><span class="co">#&gt; Using classifier ID cl_oFKL5wft; to find other classifiers, run monkeylearn_classifiers() or visit https://app.monkeylearn.com/main/explore/</span></a>
+<a class="sourceLine" id="cb19-3" data-line-number="3"><span class="co">#&gt; The following indices were empty strings and could not be sent to the API: 5. They will still be included in the output.</span></a>
+<a class="sourceLine" id="cb19-4" data-line-number="4"><span class="co">#&gt; Processing batch 1 of 2 batches: texts 1 to 5</span></a>
+<a class="sourceLine" id="cb19-5" data-line-number="5"><span class="co">#&gt; Processing batch 2 of 2 batches: texts 5 to 10</span></a></code></pre></div>
+<p>How much does sending 5 texts in a batch vs. 1 text improve our processing time?</p>
+<div class="sourceCode" id="cb20"><pre class="sourceCode r"><code class="sourceCode r"><a class="sourceLine" id="cb20-1" data-line-number="1">(speedup &lt;-<span class="st"> </span>one_by_one[<span class="dv">1</span>] <span class="op">/</span><span class="st"> </span>batch_of_five[<span class="dv">1</span>])</a>
+<a class="sourceLine" id="cb20-2" data-line-number="2"><span class="co">#&gt; user.self </span></a>
+<a class="sourceLine" id="cb20-3" data-line-number="3"><span class="co">#&gt;  2.428571</span></a></code></pre></div>
+<p>A roughly 2.4x speedup isn’t so bad! It’s worth keeping in mind that if you need blazing-fast speeds, you might consider upgrading to a higher MonkeyLearn price tier.</p>
+<p><br></p>
+<hr />
+<p><br></p>
+</div>
+</div>
+</div>
+<div id="meta" class="section level1">
+<h1>Meta</h1>
+<ul>
+<li>Please <a href="https://github.com/ropensci/monkeylearn/issues">report any issues or bugs</a>.</li>
+<li>License: GPL</li>
+<li>Get citation information for <code>monkeylearn</code> in R by running <code>citation(package = 'monkeylearn')</code></li>
+<li>Please note that this project is released with a <a href="CONDUCT.md">Contributor Code of Conduct</a>. By participating in this project you agree to abide by its terms.</li>
+<li>This package is part of the <a href="https://ropensci.org/">rOpenSci project</a>.</li>
+</ul>
+</div>
+<div class="footnotes">
+<hr />
+<ol>
+<li id="fn1"><p>Thanks to <a href="https://juliasilge.com/">Julia Silge</a>’s fantastic <a href="https://github.com/juliasilge/janeaustenr"><code>janeaustenr</code></a> package for this text!<a href="#fnref1" class="footnote-back">↩</a></p></li>
+</ol>
+</div>
+
+
+
+<!-- dynamically load mathjax for compatibility with self-contained -->
+<script>
+  (function () {
+    var script = document.createElement("script");
+    script.type = "text/javascript";
+    script.src  = "https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML";
+    document.getElementsByTagName("head")[0].appendChild(script);
+  })();
+</script>
+
+</body>
+</html>