fix html comments

This commit is contained in:
yausername 2019-11-16 03:20:35 +05:30
parent 193442d01c
commit bb5ad49fac
1 changed file with 8 additions and 1 deletion

View File

@@ -5,6 +5,8 @@ import java.text.ParseException;
import java.text.SimpleDateFormat;
import java.util.Locale;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.schabi.newpipe.extractor.ServiceList;
import org.schabi.newpipe.extractor.comments.CommentsInfoItemExtractor;
import org.schabi.newpipe.extractor.exceptions.ParsingException;
@@ -59,7 +61,12 @@ public class PeertubeCommentsInfoItemExtractor implements CommentsInfoItemExtrac
/**
 * Returns the comment text with its HTML markup removed.
 *
 * <p>The raw value is read from the {@code "text"} entry of {@code item}. It is parsed with
 * Jsoup and the text of the resulting document body is returned. If that fails for any reason,
 * the method falls back to stripping tag sequences with a regular expression.
 *
 * @return the comment text without HTML tags
 * @throws ParsingException declared by the interface; presumably raised by
 *                          {@code JsonUtils.getString} when the value cannot be read
 *                          (TODO confirm against JsonUtils)
 */
@Override
public String getCommentText() throws ParsingException {
    final String htmlText = JsonUtils.getString(item, "text");
    try {
        // Preferred path: let a real HTML parser extract the text content.
        final Document doc = Jsoup.parse(htmlText);
        return doc.body().text();
    } catch (final Exception ignored) {
        // Deliberate best-effort fallback: if Jsoup cannot handle the input, strip runs of
        // tags (including whitespace between adjacent tags) instead of failing the extraction.
        return htmlText.replaceAll("(?s)<[^>]*>(\\s*<[^>]*>)*", "");
    }
}
@Override