17 #ifndef REMWHAREAD_URI_HPP 18 #define REMWHAREAD_URI_HPP 37 bool successful =
false;
57 bool successful =
false;
82 explicit URI(
const string &uri);
140 const string &tag =
"");
158 #endif // REMWHAREAD_URI_HPP const string unescape_html(string html)
Convert HTML entities to UTF-8.
Definition: uri.cpp:306
URI(const string &uri)
Construct object and set URL.
Definition: uri.cpp:64
const string remove_html_tags(const string &html, const string &tag="")
Remove HTML tags.
Definition: uri.cpp:268
const string strip_html(const string &html)
Removes HTML tags and superfluous spaces from an HTML page.
Definition: uri.cpp:247
const string remove_newlines(string text)
Replace newlines with spaces.
Definition: uri.cpp:631
The result of the call to the archive service.
Definition: uri.hpp:55
const html_extract get()
Download URI and extract title, description and full text.
Definition: uri.cpp:114
const string extract_title(const string &html)
Extract the title from an HTML page.
Definition: uri.cpp:212
Download, archive and process a URI.
Definition: uri.hpp:71
const string make_request(const string &uri, bool archive=false) const
Make an HTTP(S) request.
Definition: uri.cpp:139
const archive_answer archive()
Save URI in archive and return archive-URI.
Definition: uri.cpp:606
const string extract_description(const string &html)
Extract the description from an HTML page.
Definition: uri.cpp:229