mirror of
https://github.com/MarginaliaSearch/MarginaliaSearch.git
synced 2025-02-24 13:19:02 +00:00
(encyclopedia) Add URLencoding to path element
This prevents corruption of the links to the sideloaded encyclopedia data when the article path contains characters that are not valid in a URL.
This commit is contained in:
parent
9689f3faee
commit
29bf473d74
@ -1,6 +1,7 @@
|
|||||||
package nu.marginalia.converting.sideload.encyclopedia;
|
package nu.marginalia.converting.sideload.encyclopedia;
|
||||||
|
|
||||||
import com.github.luben.zstd.ZstdInputStream;
|
import com.github.luben.zstd.ZstdInputStream;
|
||||||
|
import com.google.common.base.Charsets;
|
||||||
import com.google.gson.Gson;
|
import com.google.gson.Gson;
|
||||||
import lombok.SneakyThrows;
|
import lombok.SneakyThrows;
|
||||||
import nu.marginalia.atags.AnchorTextKeywords;
|
import nu.marginalia.atags.AnchorTextKeywords;
|
||||||
@ -110,7 +111,7 @@ public class EncyclopediaMarginaliaNuSideloader implements SideloadSource, AutoC
|
|||||||
}
|
}
|
||||||
|
|
||||||
private ProcessedDocument convertDocument(List<String> parts, String title, String url, DomainLinks domainLinks) throws URISyntaxException, DisqualifiedException {
|
private ProcessedDocument convertDocument(List<String> parts, String title, String url, DomainLinks domainLinks) throws URISyntaxException, DisqualifiedException {
|
||||||
String fullUrl = baseUrl.toString() + url;
|
String fullUrl = baseUrl.toString() + URLEncoder.encode(url, Charsets.UTF_8);
|
||||||
|
|
||||||
StringBuilder fullHtml = new StringBuilder();
|
StringBuilder fullHtml = new StringBuilder();
|
||||||
fullHtml
|
fullHtml
|
||||||
|
Loading…
Reference in New Issue
Block a user