unescape selftext_html from json api, fixes #354

This commit is contained in:
Martin Lindhe 2025-01-24 11:23:22 +01:00
parent d7ec07cd0d
commit 3212029458
3 changed files with 10 additions and 1 deletions

7
Cargo.lock generated
View file

@ -770,6 +770,12 @@ version = "0.4.0"
source = "registry+https://github.com/rust-lang/crates.io-index" source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "fbf6a919d6cf397374f7dfeeea91d974c7c0a7221d0d0f4f20d859d329e53fcc" checksum = "fbf6a919d6cf397374f7dfeeea91d974c7c0a7221d0d0f4f20d859d329e53fcc"
[[package]]
name = "htmlescape"
version = "0.3.1"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "e9025058dae765dee5070ec375f591e2ba14638c63feff74f13805a72e523163"
[[package]] [[package]]
name = "http" name = "http"
version = "0.2.12" version = "0.2.12"
@ -1367,6 +1373,7 @@ dependencies = [
"dotenvy", "dotenvy",
"fastrand", "fastrand",
"futures-lite", "futures-lite",
"htmlescape",
"hyper", "hyper",
"hyper-rustls", "hyper-rustls",
"libflate", "libflate",

View file

@ -51,6 +51,7 @@ common-words-all = { version = "0.0.2", default-features = false, features = ["e
hyper-rustls = { version = "0.24.2", features = [ "http2" ] } hyper-rustls = { version = "0.24.2", features = [ "http2" ] }
tegen = "0.1.4" tegen = "0.1.4"
serde_urlencoded = "0.7.1" serde_urlencoded = "0.7.1"
htmlescape = "0.3.1"
[dev-dependencies] [dev-dependencies]

View file

@ -22,6 +22,7 @@ use std::str::FromStr;
use std::string::ToString; use std::string::ToString;
use time::{macros::format_description, Duration, OffsetDateTime}; use time::{macros::format_description, Duration, OffsetDateTime};
use url::Url; use url::Url;
use htmlescape::decode_html;
/// Write a message to stderr on debug mode. This function is a no-op on /// Write a message to stderr on debug mode. This function is a no-op on
/// release code. /// release code.
@ -376,7 +377,7 @@ impl Post {
let awards = Awards::parse(&data["all_awardings"]); let awards = Awards::parse(&data["all_awardings"]);
// selftext_html is set for text posts when browsing. // selftext_html is set for text posts when browsing.
let mut body = rewrite_urls(&val(post, "selftext_html")); let mut body = rewrite_urls(&decode_html(&val(post, "selftext_html")).unwrap());
if body.is_empty() { if body.is_empty() {
body = rewrite_urls(&val(post, "body_html")); body = rewrite_urls(&val(post, "body_html"));
} }