Remove HTML tags from the text of a document or corpus.

strip_html_tags(text)

# S3 method for corpus
strip_html_tags(text)

# S3 method for documents
strip_html_tags(text)

# S3 method for document
strip_html_tags(text)

Arguments

text

An object inheriting from class document, documents, or corpus.

Examples

# NOT RUN {
init_textanalysis()

# build document
# must be lowercase
doc <- string_document("This is a <span>document</span>.")

# modifies `doc` in place -- no reassignment needed!
strip_html_tags(doc)
get_text(doc)
# }