NewPipeExtractor/extractor/src/main/java/org/schabi/newpipe/extractor/services/peertube/extractors/PeertubeStreamExtractor.java

492 lines
17 KiB
Java
Raw Normal View History

2018-10-11 21:10:22 +02:00
package org.schabi.newpipe.extractor.services.peertube.extractors;
2022-03-18 10:25:16 +01:00
import static org.schabi.newpipe.extractor.utils.Utils.UTF_8;
import static org.schabi.newpipe.extractor.utils.Utils.isNullOrEmpty;
import com.grack.nanojson.JsonArray;
import com.grack.nanojson.JsonObject;
import com.grack.nanojson.JsonParser;
import com.grack.nanojson.JsonParserException;
2022-03-18 10:25:16 +01:00
2018-10-11 21:10:22 +02:00
import org.schabi.newpipe.extractor.MediaFormat;
import org.schabi.newpipe.extractor.NewPipe;
2018-10-11 21:10:22 +02:00
import org.schabi.newpipe.extractor.StreamingService;
2019-11-19 22:38:17 +01:00
import org.schabi.newpipe.extractor.downloader.Downloader;
import org.schabi.newpipe.extractor.downloader.Response;
2018-10-11 21:10:22 +02:00
import org.schabi.newpipe.extractor.exceptions.ExtractionException;
import org.schabi.newpipe.extractor.exceptions.ParsingException;
import org.schabi.newpipe.extractor.exceptions.ReCaptchaException;
import org.schabi.newpipe.extractor.linkhandler.LinkHandler;
2019-11-19 22:38:17 +01:00
import org.schabi.newpipe.extractor.localization.DateWrapper;
2018-10-11 21:10:22 +02:00
import org.schabi.newpipe.extractor.services.peertube.PeertubeParsingHelper;
import org.schabi.newpipe.extractor.services.peertube.linkHandler.PeertubeSearchQueryHandlerFactory;
import org.schabi.newpipe.extractor.services.peertube.linkHandler.PeertubeStreamLinkHandlerFactory;
2022-03-18 10:25:16 +01:00
import org.schabi.newpipe.extractor.stream.AudioStream;
import org.schabi.newpipe.extractor.stream.Description;
import org.schabi.newpipe.extractor.stream.Stream;
import org.schabi.newpipe.extractor.stream.StreamExtractor;
import org.schabi.newpipe.extractor.stream.StreamInfoItemsCollector;
import org.schabi.newpipe.extractor.stream.StreamType;
import org.schabi.newpipe.extractor.stream.SubtitlesStream;
import org.schabi.newpipe.extractor.stream.VideoStream;
2018-10-11 21:10:22 +02:00
import org.schabi.newpipe.extractor.utils.JsonUtils;
2020-05-02 08:21:47 +02:00
import org.schabi.newpipe.extractor.utils.Utils;
2018-10-11 21:10:22 +02:00
import java.io.IOException;
import java.io.UnsupportedEncodingException;
import java.net.URLEncoder;
import java.util.ArrayList;
import java.util.Collections;
import java.util.List;
import java.util.Locale;
2022-03-18 10:25:16 +01:00
import javax.annotation.Nonnull;
import javax.annotation.Nullable;
2021-02-07 22:12:22 +01:00
2018-10-11 21:10:22 +02:00
public class PeertubeStreamExtractor extends StreamExtractor {
private final String baseUrl;
2018-10-11 21:10:22 +02:00
private JsonObject json;
private final List<SubtitlesStream> subtitles = new ArrayList<>();
2022-03-18 10:25:16 +01:00
public PeertubeStreamExtractor(final StreamingService service, final LinkHandler linkHandler)
throws ParsingException {
2019-11-19 22:38:17 +01:00
super(service, linkHandler);
2019-11-22 19:35:49 +01:00
this.baseUrl = getBaseUrl();
2018-10-11 21:10:22 +02:00
}
2018-10-11 21:10:22 +02:00
@Override
2019-11-19 22:38:17 +01:00
public String getTextualUploadDate() throws ParsingException {
return JsonUtils.getString(json, "publishedAt");
2018-10-11 21:10:22 +02:00
}
2019-11-19 22:38:17 +01:00
@Override
public DateWrapper getUploadDate() throws ParsingException {
final String textualUploadDate = getTextualUploadDate();
if (textualUploadDate == null) {
return null;
}
return new DateWrapper(PeertubeParsingHelper.parseDateFrom(textualUploadDate));
}
@Nonnull
2018-10-11 21:10:22 +02:00
@Override
public String getThumbnailUrl() throws ParsingException {
return baseUrl + JsonUtils.getString(json, "previewPath");
2018-10-11 21:10:22 +02:00
}
@Nonnull
2018-10-11 21:10:22 +02:00
@Override
2020-02-06 23:35:46 +01:00
public Description getDescription() throws ParsingException {
String text;
2018-10-11 22:29:13 +02:00
try {
2020-02-06 23:35:46 +01:00
text = JsonUtils.getString(json, "description");
2022-03-18 10:25:16 +01:00
} catch (final ParsingException e) {
return Description.EMPTY_DESCRIPTION;
2018-10-11 22:29:13 +02:00
}
2022-03-18 10:25:16 +01:00
2020-02-06 23:35:46 +01:00
if (text.length() == 250 && text.substring(247).equals("...")) {
//if description is shortened, get full description
final Downloader dl = NewPipe.getDownloader();
try {
final Response response = dl.get(baseUrl
+ PeertubeStreamLinkHandlerFactory.VIDEO_API_ENDPOINT
+ getId() + "/description");
final JsonObject jsonObject = JsonParser.object().from(response.responseBody());
2020-02-06 23:35:46 +01:00
text = JsonUtils.getString(jsonObject, "description");
} catch (ReCaptchaException | IOException | JsonParserException e) {
e.printStackTrace();
}
}
return new Description(text, Description.MARKDOWN);
2018-10-11 21:10:22 +02:00
}
@Override
public int getAgeLimit() throws ParsingException {
final boolean isNSFW = JsonUtils.getBoolean(json, "nsfw");
if (isNSFW) {
return 18;
} else {
return NO_AGE_LIMIT;
}
2018-10-11 21:10:22 +02:00
}
@Override
2020-06-13 20:25:38 +02:00
public long getLength() {
return json.getLong("duration");
2018-10-11 21:10:22 +02:00
}
@Override
public long getTimeStamp() throws ParsingException {
final long timestamp =
getTimestampSeconds("((#|&|\\?)start=\\d{0,3}h?\\d{0,3}m?\\d{1,3}s?)");
if (timestamp == -2) {
// regex for timestamp was not found
return 0;
} else {
return timestamp;
}
2018-10-11 21:10:22 +02:00
}
@Override
2020-06-13 20:25:38 +02:00
public long getViewCount() {
return json.getLong("views");
2018-10-11 21:10:22 +02:00
}
@Override
2020-06-13 20:25:38 +02:00
public long getLikeCount() {
return json.getLong("likes");
2018-10-11 21:10:22 +02:00
}
@Override
2020-06-13 20:25:38 +02:00
public long getDislikeCount() {
return json.getLong("dislikes");
2018-10-11 21:10:22 +02:00
}
@Nonnull
2018-10-11 21:10:22 +02:00
@Override
public String getUploaderUrl() throws ParsingException {
final String name = JsonUtils.getString(json, "account.name");
final String host = JsonUtils.getString(json, "account.host");
2022-03-18 10:25:16 +01:00
return getService().getChannelLHFactory()
.fromId("accounts/" + name + "@" + host, baseUrl).getUrl();
2018-10-11 21:10:22 +02:00
}
@Nonnull
2018-10-11 21:10:22 +02:00
@Override
public String getUploaderName() throws ParsingException {
return JsonUtils.getString(json, "account.displayName");
}
@Nonnull
2018-10-11 21:10:22 +02:00
@Override
public String getUploaderAvatarUrl() {
2018-10-11 22:29:13 +02:00
String value;
try {
value = JsonUtils.getString(json, "account.avatar.path");
2022-03-18 10:25:16 +01:00
} catch (final Exception e) {
2018-10-11 22:29:13 +02:00
value = "/client/assets/images/default-avatar.png";
}
return baseUrl + value;
2018-10-11 21:10:22 +02:00
}
@Nonnull
@Override
public String getSubChannelUrl() throws ParsingException {
return JsonUtils.getString(json, "channel.url");
}
@Nonnull
@Override
public String getSubChannelName() throws ParsingException {
return JsonUtils.getString(json, "channel.displayName");
}
@Nonnull
@Override
public String getSubChannelAvatarUrl() {
String value;
try {
value = JsonUtils.getString(json, "channel.avatar.path");
2022-03-18 10:25:16 +01:00
} catch (final Exception e) {
value = "/client/assets/images/default-avatar.png";
}
return baseUrl + value;
}
@Nonnull
2018-10-11 21:10:22 +02:00
@Override
public String getHlsUrl() {
2021-06-18 16:25:10 +02:00
return json.getArray("streamingPlaylists").getObject(0).getString("playlistUrl");
2018-10-11 21:10:22 +02:00
}
@Override
public List<AudioStream> getAudioStreams() {
return Collections.emptyList();
2018-10-11 21:10:22 +02:00
}
@Override
public List<VideoStream> getVideoStreams() throws ExtractionException {
2018-10-11 21:10:22 +02:00
assertPageFetched();
final List<VideoStream> videoStreams = new ArrayList<>();
2022-03-18 10:25:16 +01:00
2021-05-15 12:39:23 +02:00
// mp4
2018-10-11 21:10:22 +02:00
try {
2021-05-15 12:39:23 +02:00
videoStreams.addAll(getVideoStreamsFromArray(json.getArray("files")));
2022-03-18 10:25:16 +01:00
} catch (final Exception ignored) { }
2021-05-15 12:39:23 +02:00
// HLS
try {
final JsonArray streamingPlaylists = json.getArray("streamingPlaylists");
for (final Object p : streamingPlaylists) {
2022-03-18 10:25:16 +01:00
if (!(p instanceof JsonObject)) {
continue;
}
2021-05-15 12:39:23 +02:00
final JsonObject playlist = (JsonObject) p;
videoStreams.addAll(getVideoStreamsFromArray(playlist.getArray("files")));
}
2022-03-18 10:25:16 +01:00
} catch (final Exception e) {
2021-05-15 12:39:23 +02:00
throw new ParsingException("Could not get video streams", e);
}
2021-06-18 16:25:10 +02:00
if (getStreamType() == StreamType.LIVE_STREAM) {
2022-03-18 10:25:16 +01:00
videoStreams.add(new VideoStream(getHlsUrl(), MediaFormat.MPEG_4, "720p"));
2021-06-18 16:25:10 +02:00
}
2021-05-15 12:39:23 +02:00
return videoStreams;
}
2022-03-18 10:25:16 +01:00
private List<VideoStream> getVideoStreamsFromArray(final JsonArray streams)
throws ParsingException {
2021-05-15 12:39:23 +02:00
try {
final List<VideoStream> videoStreams = new ArrayList<>();
for (final Object s : streams) {
2022-03-18 10:25:16 +01:00
if (!(s instanceof JsonObject)) {
continue;
}
final JsonObject stream = (JsonObject) s;
2021-05-15 12:39:23 +02:00
final String url;
if (stream.has("fileDownloadUrl")) {
url = JsonUtils.getString(stream, "fileDownloadUrl");
} else {
url = JsonUtils.getString(stream, "fileUrl");
}
final String torrentUrl = JsonUtils.getString(stream, "torrentUrl");
final String resolution = JsonUtils.getString(stream, "resolution.label");
final String extension = url.substring(url.lastIndexOf(".") + 1);
final MediaFormat format = MediaFormat.getFromSuffix(extension);
2022-03-18 10:25:16 +01:00
final VideoStream videoStream
= new VideoStream(url, torrentUrl, format, resolution);
2018-10-11 21:10:22 +02:00
if (!Stream.containSimilarStream(videoStream, videoStreams)) {
videoStreams.add(videoStream);
}
}
2021-05-15 12:39:23 +02:00
return videoStreams;
2022-03-18 10:25:16 +01:00
} catch (final Exception e) {
2021-05-15 12:39:23 +02:00
throw new ParsingException("Could not get video streams from array");
2018-10-11 21:10:22 +02:00
}
}
@Override
public List<VideoStream> getVideoOnlyStreams() {
2020-06-13 20:25:38 +02:00
return Collections.emptyList();
2018-10-11 21:10:22 +02:00
}
@Nonnull
2018-10-11 21:10:22 +02:00
@Override
public List<SubtitlesStream> getSubtitlesDefault() {
2019-11-16 00:00:13 +01:00
return subtitles;
2018-10-11 21:10:22 +02:00
}
@Nonnull
2018-10-11 21:10:22 +02:00
@Override
public List<SubtitlesStream> getSubtitles(final MediaFormat format) {
final List<SubtitlesStream> filteredSubs = new ArrayList<>();
for (final SubtitlesStream sub : subtitles) {
if (sub.getFormat() == format) {
2019-11-16 00:00:13 +01:00
filteredSubs.add(sub);
}
}
return filteredSubs;
2018-10-11 21:10:22 +02:00
}
@Override
public StreamType getStreamType() {
2021-06-18 16:25:10 +02:00
return json.getBoolean("isLive") ? StreamType.LIVE_STREAM : StreamType.VIDEO_STREAM;
2018-10-11 21:10:22 +02:00
}
@Nullable
2018-10-11 21:10:22 +02:00
@Override
public StreamInfoItemsCollector getRelatedItems() throws IOException, ExtractionException {
final List<String> tags = getTags();
final String apiUrl;
if (tags.isEmpty()) {
apiUrl = baseUrl + "/api/v1/accounts/" + JsonUtils.getString(json, "account.name")
2022-03-18 10:25:16 +01:00
+ "@" + JsonUtils.getString(json, "account.host")
+ "/videos?start=0&count=8";
} else {
apiUrl = getRelatedItemsUrl(tags);
}
if (Utils.isBlank(apiUrl)) {
return null;
} else {
final StreamInfoItemsCollector collector = new StreamInfoItemsCollector(getServiceId());
getStreamsFromApi(collector, apiUrl);
return collector;
}
2018-10-11 21:10:22 +02:00
}
@Nonnull
@Override
public List<String> getTags() {
return JsonUtils.getStringListFromJsonArray(json.getArray("tags"));
}
@Nonnull
@Override
public String getSupportInfo() {
try {
return JsonUtils.getString(json, "support");
2022-03-18 10:25:16 +01:00
} catch (final ParsingException e) {
return "";
}
}
private String getRelatedItemsUrl(final List<String> tags) throws UnsupportedEncodingException {
final String url = baseUrl + PeertubeSearchQueryHandlerFactory.SEARCH_ENDPOINT;
final StringBuilder params = new StringBuilder();
params.append("start=0&count=8&sort=-createdAt");
for (final String tag : tags) {
params.append("&tagsOneOf=");
2021-02-07 22:12:22 +01:00
params.append(URLEncoder.encode(tag, UTF_8));
}
2022-03-18 10:25:16 +01:00
return url + "?" + params;
}
2018-10-11 21:10:22 +02:00
2022-03-18 10:25:16 +01:00
private void getStreamsFromApi(final StreamInfoItemsCollector collector, final String apiUrl)
throws ReCaptchaException, IOException, ParsingException {
final Response response = getDownloader().get(apiUrl);
2018-10-11 21:10:22 +02:00
JsonObject relatedVideosJson = null;
if (response != null && !Utils.isBlank(response.responseBody())) {
2018-10-11 21:10:22 +02:00
try {
2019-11-19 22:38:17 +01:00
relatedVideosJson = JsonParser.object().from(response.responseBody());
2022-03-18 10:25:16 +01:00
} catch (final JsonParserException e) {
2018-10-11 21:10:22 +02:00
throw new ParsingException("Could not parse json data for related videos", e);
}
}
if (relatedVideosJson != null) {
2018-10-11 21:10:22 +02:00
collectStreamsFrom(collector, relatedVideosJson);
}
}
2022-03-18 10:25:16 +01:00
private void collectStreamsFrom(final StreamInfoItemsCollector collector,
final JsonObject jsonObject)
throws ParsingException {
final JsonArray contents;
2018-10-11 21:10:22 +02:00
try {
2022-03-18 10:25:16 +01:00
contents = (JsonArray) JsonUtils.getValue(jsonObject, "data");
} catch (final Exception e) {
2018-10-11 21:10:22 +02:00
throw new ParsingException("unable to extract related videos", e);
}
for (final Object c : contents) {
if (c instanceof JsonObject) {
2018-10-11 21:10:22 +02:00
final JsonObject item = (JsonObject) c;
2022-03-18 10:25:16 +01:00
final PeertubeStreamInfoItemExtractor extractor
= new PeertubeStreamInfoItemExtractor(item, baseUrl);
//do not add the same stream in related streams
2022-03-18 10:25:16 +01:00
if (!extractor.getUrl().equals(getUrl())) {
collector.commit(extractor);
}
2018-10-11 21:10:22 +02:00
}
}
}
2018-10-11 21:10:22 +02:00
@Override
public void onFetchPage(@Nonnull final Downloader downloader)
throws IOException, ExtractionException {
2022-03-18 10:25:16 +01:00
final Response response = downloader.get(
baseUrl + PeertubeStreamLinkHandlerFactory.VIDEO_API_ENDPOINT + getId());
2021-03-14 00:45:44 +01:00
if (response != null) {
2019-11-19 22:38:17 +01:00
setInitialData(response.responseBody());
} else {
2020-04-15 14:09:46 +02:00
throw new ExtractionException("Unable to extract PeerTube channel data");
2018-10-11 21:10:22 +02:00
}
2019-11-16 00:00:13 +01:00
loadSubtitles();
2018-10-11 21:10:22 +02:00
}
private void setInitialData(final String responseBody) throws ExtractionException {
2018-10-11 21:10:22 +02:00
try {
json = JsonParser.object().from(responseBody);
2022-03-18 10:25:16 +01:00
} catch (final JsonParserException e) {
2020-04-15 14:09:46 +02:00
throw new ExtractionException("Unable to extract PeerTube stream data", e);
2018-10-11 21:10:22 +02:00
}
if (json == null) {
throw new ExtractionException("Unable to extract PeerTube stream data");
}
2019-03-09 19:03:51 +01:00
PeertubeParsingHelper.validate(json);
2018-10-11 21:10:22 +02:00
}
2019-11-16 00:00:13 +01:00
private void loadSubtitles() {
if (subtitles.isEmpty()) {
try {
final Response response = getDownloader().get(baseUrl
+ PeertubeStreamLinkHandlerFactory.VIDEO_API_ENDPOINT
+ getId() + "/captions");
final JsonObject captionsJson = JsonParser.object().from(response.responseBody());
final JsonArray captions = JsonUtils.getArray(captionsJson, "data");
for (final Object c : captions) {
if (c instanceof JsonObject) {
final JsonObject caption = (JsonObject) c;
final String url = baseUrl + JsonUtils.getString(caption, "captionPath");
final String languageCode = JsonUtils.getString(caption, "language.id");
final String ext = url.substring(url.lastIndexOf(".") + 1);
final MediaFormat fmt = MediaFormat.getFromSuffix(ext);
2022-03-18 10:25:16 +01:00
if (fmt != null && !isNullOrEmpty(languageCode)) {
subtitles.add(new SubtitlesStream(fmt, languageCode, url, false));
2022-03-18 10:25:16 +01:00
}
2019-11-16 00:00:13 +01:00
}
}
2022-03-18 10:25:16 +01:00
} catch (final Exception e) {
2019-11-16 00:00:13 +01:00
// ignore all exceptions
}
}
}
2018-10-11 21:10:22 +02:00
@Nonnull
2018-10-11 21:10:22 +02:00
@Override
public String getName() throws ParsingException {
return JsonUtils.getString(json, "name");
}
@Nonnull
@Override
public String getHost() throws ParsingException {
return JsonUtils.getString(json, "account.host");
}
@Nonnull
@Override
public Privacy getPrivacy() {
switch (json.getObject("privacy").getInt("id")) {
case 1:
return Privacy.PUBLIC;
case 2:
return Privacy.UNLISTED;
case 3:
return Privacy.PRIVATE;
case 4:
return Privacy.INTERNAL;
default:
2021-02-12 20:34:46 +01:00
return Privacy.OTHER;
}
}
@Nonnull
@Override
public String getCategory() throws ParsingException {
return JsonUtils.getString(json, "category.label");
}
@Nonnull
@Override
public String getLicence() throws ParsingException {
return JsonUtils.getString(json, "licence.label");
}
@Override
public Locale getLanguageInfo() {
try {
return new Locale(JsonUtils.getString(json, "language.id"));
2022-03-18 10:25:16 +01:00
} catch (final ParsingException e) {
return null;
}
}
2018-10-11 21:10:22 +02:00
}