2018-05-08 21:19:03 +02:00
|
|
|
package org.schabi.newpipe.extractor.services.youtube.extractors;
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-11-22 18:39:38 +01:00
|
|
|
import com.grack.nanojson.JsonArray;
|
2017-08-16 04:40:03 +02:00
|
|
|
import com.grack.nanojson.JsonObject;
|
|
|
|
import com.grack.nanojson.JsonParser;
|
2017-11-22 18:39:38 +01:00
|
|
|
import com.grack.nanojson.JsonParserException;
|
2017-03-01 18:47:52 +01:00
|
|
|
import org.jsoup.Jsoup;
|
|
|
|
import org.jsoup.nodes.Document;
|
|
|
|
import org.jsoup.nodes.Element;
|
2018-09-24 21:04:22 +02:00
|
|
|
import org.jsoup.select.Elements;
|
2017-03-01 18:47:52 +01:00
|
|
|
import org.mozilla.javascript.Context;
|
|
|
|
import org.mozilla.javascript.Function;
|
|
|
|
import org.mozilla.javascript.ScriptableObject;
|
2019-04-28 22:03:16 +02:00
|
|
|
import org.schabi.newpipe.extractor.MediaFormat;
|
|
|
|
import org.schabi.newpipe.extractor.NewPipe;
|
|
|
|
import org.schabi.newpipe.extractor.StreamingService;
|
|
|
|
import org.schabi.newpipe.extractor.downloader.Downloader;
|
|
|
|
import org.schabi.newpipe.extractor.downloader.Request;
|
|
|
|
import org.schabi.newpipe.extractor.downloader.Response;
|
2017-07-11 05:08:03 +02:00
|
|
|
import org.schabi.newpipe.extractor.exceptions.ContentNotAvailableException;
|
2017-04-12 02:55:53 +02:00
|
|
|
import org.schabi.newpipe.extractor.exceptions.ExtractionException;
|
|
|
|
import org.schabi.newpipe.extractor.exceptions.ParsingException;
|
|
|
|
import org.schabi.newpipe.extractor.exceptions.ReCaptchaException;
|
2018-07-13 18:02:40 +02:00
|
|
|
import org.schabi.newpipe.extractor.linkhandler.LinkHandler;
|
2019-04-28 22:03:16 +02:00
|
|
|
import org.schabi.newpipe.extractor.localization.TimeAgoParser;
|
2018-05-08 21:19:03 +02:00
|
|
|
import org.schabi.newpipe.extractor.services.youtube.ItagItem;
|
2019-10-29 06:00:29 +01:00
|
|
|
import org.schabi.newpipe.extractor.services.youtube.linkHandler.YoutubeParsingHelper;
|
2017-08-10 19:50:59 +02:00
|
|
|
import org.schabi.newpipe.extractor.stream.*;
|
2019-04-28 22:03:16 +02:00
|
|
|
import org.schabi.newpipe.extractor.utils.JsonUtils;
|
2017-06-29 20:12:55 +02:00
|
|
|
import org.schabi.newpipe.extractor.utils.Parser;
|
2017-07-11 05:08:03 +02:00
|
|
|
import org.schabi.newpipe.extractor.utils.Utils;
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-11-25 01:10:04 +01:00
|
|
|
import javax.annotation.Nonnull;
|
|
|
|
import javax.annotation.Nullable;
|
2017-03-01 18:47:52 +01:00
|
|
|
import java.io.IOException;
|
2018-08-16 17:11:18 +02:00
|
|
|
import java.io.UnsupportedEncodingException;
|
|
|
|
import java.net.MalformedURLException;
|
|
|
|
import java.net.URL;
|
2017-11-22 18:39:38 +01:00
|
|
|
import java.util.*;
|
2019-08-18 05:48:15 +02:00
|
|
|
import java.util.regex.Matcher;
|
|
|
|
import java.util.regex.Pattern;
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-06-29 20:12:55 +02:00
|
|
|
/*
|
2017-03-01 18:47:52 +01:00
|
|
|
* Created by Christian Schabesberger on 06.08.15.
|
|
|
|
*
|
2019-03-14 08:49:11 +01:00
|
|
|
* Copyright (C) Christian Schabesberger 2019 <chris.schabesberger@mailbox.org>
|
2017-03-01 18:47:52 +01:00
|
|
|
* YoutubeStreamExtractor.java is part of NewPipe.
|
|
|
|
*
|
|
|
|
* NewPipe is free software: you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
|
|
* (at your option) any later version.
|
|
|
|
*
|
|
|
|
* NewPipe is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with NewPipe. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
*/
|
|
|
|
|
|
|
|
public class YoutubeStreamExtractor extends StreamExtractor {
|
2017-07-11 05:08:03 +02:00
|
|
|
// Simple class name of this extractor; presumably intended as a log tag (no use is visible in this part of the file).
private static final String TAG = YoutubeStreamExtractor.class.getSimpleName();
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
/*//////////////////////////////////////////////////////////////////////////
|
|
|
|
// Exceptions
|
|
|
|
//////////////////////////////////////////////////////////////////////////*/
|
2017-03-01 18:47:52 +01:00
|
|
|
|
|
|
|
public class DecryptException extends ParsingException {
|
|
|
|
DecryptException(String message, Throwable cause) {
|
|
|
|
super(message, cause);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-02-01 22:27:14 +01:00
|
|
|
public class SubtitlesException extends ContentNotAvailableException {
|
|
|
|
SubtitlesException(String message, Throwable cause) {
|
|
|
|
super(message, cause);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
/*//////////////////////////////////////////////////////////////////////////*/
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
private Document doc;
|
2017-11-25 01:10:04 +01:00
|
|
|
@Nullable
|
2017-08-16 04:40:03 +02:00
|
|
|
private JsonObject playerArgs;
|
2017-11-25 01:10:04 +01:00
|
|
|
@Nonnull
|
|
|
|
private final Map<String, String> videoInfoPage = new HashMap<>();
|
2019-09-11 19:05:41 +02:00
|
|
|
private JsonObject playerResponse;
|
2018-02-02 08:24:22 +01:00
|
|
|
|
2018-02-01 22:27:14 +01:00
|
|
|
@Nonnull
|
2018-02-02 08:24:22 +01:00
|
|
|
private List<SubtitlesInfo> subtitlesInfos = new ArrayList<>();
|
2017-08-10 19:50:59 +02:00
|
|
|
|
|
|
|
private boolean isAgeRestricted;
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2019-04-28 22:03:16 +02:00
|
|
|
/**
 * Creates the extractor; both arguments are passed unchanged to the
 * {@link StreamExtractor} constructor.
 *
 * @param service     the streaming service this extractor belongs to
 * @param linkHandler the link handler describing the stream to extract
 */
public YoutubeStreamExtractor(StreamingService service, LinkHandler linkHandler) {
    super(service, linkHandler);
}
|
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
/*//////////////////////////////////////////////////////////////////////////
|
|
|
|
// Impl
|
|
|
|
//////////////////////////////////////////////////////////////////////////*/
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-11-25 01:10:04 +01:00
|
|
|
@Nonnull
|
2017-03-01 18:47:52 +01:00
|
|
|
@Override
|
2017-08-11 03:23:09 +02:00
|
|
|
public String getName() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-11-25 01:10:04 +01:00
|
|
|
String name = getStringFromMetaData("title");
|
|
|
|
if(name == null) {
|
2017-08-11 03:23:09 +02:00
|
|
|
// Fallback to HTML method
|
2017-11-25 01:10:04 +01:00
|
|
|
try {
|
|
|
|
name = doc.select("meta[name=title]").attr(CONTENT);
|
|
|
|
} catch (Exception e) {
|
|
|
|
throw new ParsingException("Could not get the title", e);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if(name == null || name.isEmpty()) {
|
|
|
|
throw new ParsingException("Could not get the title");
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
2017-11-25 01:10:04 +01:00
|
|
|
return name;
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
2019-04-28 22:03:16 +02:00
|
|
|
public String getTextualUploadDate() throws ParsingException {
|
|
|
|
if (getStreamType().equals(StreamType.LIVE_STREAM)) {
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
|
2017-03-01 18:47:52 +01:00
|
|
|
try {
|
2017-08-11 03:23:09 +02:00
|
|
|
return doc.select("meta[itemprop=datePublished]").attr(CONTENT);
|
|
|
|
} catch (Exception e) {//todo: add fallback method
|
|
|
|
throw new ParsingException("Could not get upload date", e);
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-04-28 22:03:16 +02:00
|
|
|
@Override
|
|
|
|
public Calendar getUploadDate() throws ParsingException {
|
|
|
|
final String textualUploadDate = getTextualUploadDate();
|
|
|
|
|
|
|
|
if (textualUploadDate == null) {
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
|
|
|
|
return YoutubeParsingHelper.parseDateFrom(textualUploadDate);
|
|
|
|
}
|
|
|
|
|
2017-11-25 01:10:04 +01:00
|
|
|
@Nonnull
|
2017-03-01 18:47:52 +01:00
|
|
|
@Override
|
2017-08-11 03:23:09 +02:00
|
|
|
public String getThumbnailUrl() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-08-11 03:23:09 +02:00
|
|
|
// Try to get high resolution thumbnail first, if it fails, use low res from the player instead
|
2017-03-01 18:47:52 +01:00
|
|
|
try {
|
2017-08-11 03:23:09 +02:00
|
|
|
return doc.select("link[itemprop=\"thumbnailUrl\"]").first().attr("abs:href");
|
2017-08-10 19:50:59 +02:00
|
|
|
} catch (Exception ignored) {
|
|
|
|
// Try other method...
|
|
|
|
}
|
|
|
|
|
|
|
|
try {
|
2017-11-25 01:10:04 +01:00
|
|
|
if (playerArgs != null && playerArgs.isString("thumbnail_url")) return playerArgs.getString("thumbnail_url");
|
2017-08-10 19:50:59 +02:00
|
|
|
} catch (Exception ignored) {
|
|
|
|
// Try other method...
|
2017-06-29 20:12:55 +02:00
|
|
|
}
|
2017-08-10 19:50:59 +02:00
|
|
|
|
|
|
|
try {
|
2017-08-11 03:23:09 +02:00
|
|
|
return videoInfoPage.get("thumbnail_url");
|
2017-03-01 18:47:52 +01:00
|
|
|
} catch (Exception e) {
|
2017-08-11 03:23:09 +02:00
|
|
|
throw new ParsingException("Could not get thumbnail url", e);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-11-25 01:10:04 +01:00
|
|
|
@Nonnull
|
2017-08-11 03:23:09 +02:00
|
|
|
@Override
|
|
|
|
public String getDescription() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-08-11 03:23:09 +02:00
|
|
|
try {
|
2018-08-16 17:11:18 +02:00
|
|
|
return parseHtmlAndGetFullLinks(doc.select("p[id=\"eow-description\"]").first().html());
|
2018-08-16 17:37:19 +02:00
|
|
|
} catch (Exception e) {
|
2017-08-11 03:23:09 +02:00
|
|
|
throw new ParsingException("Could not get the description", e);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-08-18 05:48:15 +02:00
|
|
|
// onclick="yt.www.watch.player.seekTo(0*3600+00*60+00);return false;"
|
|
|
|
// :00 is NOT recognized as a timestamp in description or comments.
|
|
|
|
// 0:00 is recognized in both description and comments.
|
|
|
|
// https://www.youtube.com/watch?v=4cccfDXu1vA
|
|
|
|
private final static Pattern DESCRIPTION_TIMESTAMP_ONCLICK_REGEX = Pattern.compile(
|
|
|
|
"seekTo\\("
|
|
|
|
+ "(?:(\\d+)\\*3600\\+)?" // hours?
|
|
|
|
+ "(\\d+)\\*60\\+" // minutes
|
|
|
|
+ "(\\d+)" // seconds
|
|
|
|
+ "\\)");
|
|
|
|
|
|
|
|
@SafeVarargs
|
|
|
|
private static <T> T coalesce(T... args) {
|
|
|
|
for (T arg : args) {
|
|
|
|
if (arg != null) return arg;
|
|
|
|
}
|
|
|
|
throw new IllegalArgumentException("all arguments to coalesce() were null");
|
|
|
|
}
|
|
|
|
|
2018-08-16 17:11:18 +02:00
|
|
|
private String parseHtmlAndGetFullLinks(String descriptionHtml)
|
|
|
|
throws MalformedURLException, UnsupportedEncodingException, ParsingException {
|
|
|
|
final Document description = Jsoup.parse(descriptionHtml, getUrl());
|
|
|
|
for(Element a : description.select("a")) {
|
2019-07-30 20:53:23 +02:00
|
|
|
final String rawUrl = a.attr("abs:href");
|
|
|
|
final URL redirectLink = new URL(rawUrl);
|
2019-08-18 05:48:15 +02:00
|
|
|
|
|
|
|
final Matcher onClickTimestamp;
|
|
|
|
final String queryString;
|
|
|
|
if ((onClickTimestamp = DESCRIPTION_TIMESTAMP_ONCLICK_REGEX.matcher(a.attr("onclick")))
|
|
|
|
.find()) {
|
|
|
|
a.removeAttr("onclick");
|
|
|
|
|
|
|
|
String hours = coalesce(onClickTimestamp.group(1), "0");
|
|
|
|
String minutes = onClickTimestamp.group(2);
|
|
|
|
String seconds = onClickTimestamp.group(3);
|
|
|
|
|
|
|
|
int timestamp = 0;
|
|
|
|
timestamp += Integer.parseInt(hours) * 3600;
|
|
|
|
timestamp += Integer.parseInt(minutes) * 60;
|
|
|
|
timestamp += Integer.parseInt(seconds);
|
|
|
|
|
|
|
|
String setTimestamp = "&t=" + timestamp;
|
|
|
|
|
|
|
|
// Even after clicking https://youtu.be/...?t=6,
|
|
|
|
// getUrl() is https://www.youtube.com/watch?v=..., never youtu.be, never &t=.
|
|
|
|
a.attr("href", getUrl() + setTimestamp);
|
|
|
|
|
|
|
|
} else if((queryString = redirectLink.getQuery()) != null) {
|
2018-08-16 17:37:19 +02:00
|
|
|
// if the query string is null we are not dealing with a redirect link,
|
|
|
|
// so we don't need to override it.
|
|
|
|
final String link =
|
|
|
|
Parser.compatParseMap(queryString).get("q");
|
2018-08-17 16:22:50 +02:00
|
|
|
|
|
|
|
if(link != null) {
|
2018-08-27 20:45:43 +02:00
|
|
|
// if link is null the a tag is a hashtag.
|
|
|
|
// They refer to the youtube search. We do not handle them.
|
2018-08-28 11:55:12 +02:00
|
|
|
a.text(link);
|
2019-07-30 20:53:23 +02:00
|
|
|
a.attr("href", link);
|
2018-09-20 13:51:06 +02:00
|
|
|
} else if(redirectLink.toString().contains("https://www.youtube.com/")) {
|
|
|
|
a.text(redirectLink.toString());
|
2019-07-30 20:53:23 +02:00
|
|
|
a.attr("href", redirectLink.toString());
|
2018-08-17 16:22:50 +02:00
|
|
|
}
|
2018-09-20 13:51:06 +02:00
|
|
|
} else if(redirectLink.toString().contains("https://www.youtube.com/")) {
|
2019-07-30 20:53:23 +02:00
|
|
|
descriptionHtml = descriptionHtml.replace(rawUrl, redirectLink.toString());
|
2018-09-07 22:18:22 +02:00
|
|
|
a.text(redirectLink.toString());
|
2019-07-30 20:53:23 +02:00
|
|
|
a.attr("href", redirectLink.toString());
|
2018-08-16 17:37:19 +02:00
|
|
|
}
|
2018-08-16 17:11:18 +02:00
|
|
|
}
|
|
|
|
return description.select("body").first().html();
|
|
|
|
}
|
|
|
|
|
2017-08-11 03:23:09 +02:00
|
|
|
@Override
|
|
|
|
public int getAgeLimit() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-08-11 03:23:09 +02:00
|
|
|
if (!isAgeRestricted) {
|
2017-11-25 02:03:30 +01:00
|
|
|
return NO_AGE_LIMIT;
|
2017-08-11 03:23:09 +02:00
|
|
|
}
|
|
|
|
try {
|
|
|
|
return Integer.valueOf(doc.select("meta[property=\"og:restrictions:age\"]")
|
|
|
|
.attr(CONTENT).replace("+", ""));
|
|
|
|
} catch (Exception e) {
|
|
|
|
throw new ParsingException("Could not get age restriction");
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
2017-08-10 19:50:59 +02:00
|
|
|
public long getLength() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2019-07-30 20:53:23 +02:00
|
|
|
|
|
|
|
// try getting duration from playerargs
|
2017-08-10 19:50:59 +02:00
|
|
|
try {
|
2019-07-30 20:53:23 +02:00
|
|
|
String durationMs = playerResponse
|
|
|
|
.getObject("streamingData")
|
|
|
|
.getArray("formats")
|
|
|
|
.getObject(0)
|
|
|
|
.getString("approxDurationMs");
|
|
|
|
return Long.parseLong(durationMs)/1000;
|
|
|
|
} catch (Exception e) {
|
2017-08-10 19:50:59 +02:00
|
|
|
}
|
|
|
|
|
2019-07-30 20:53:23 +02:00
|
|
|
//try getting value from age gated video
|
2017-08-10 19:50:59 +02:00
|
|
|
try {
|
2019-07-30 20:53:23 +02:00
|
|
|
String duration = playerResponse
|
|
|
|
.getObject("videoDetails")
|
|
|
|
.getString("lengthSeconds");
|
|
|
|
return Long.parseLong(duration);
|
2017-08-10 19:50:59 +02:00
|
|
|
} catch (Exception e) {
|
2019-07-30 20:53:23 +02:00
|
|
|
throw new ParsingException("Every methode to get the duration has failed: ", e);
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-08-11 03:23:09 +02:00
|
|
|
/**
|
|
|
|
* Attempts to parse (and return) the offset to start playing the video from.
|
|
|
|
*
|
|
|
|
* @return the offset (in seconds), or 0 if no timestamp is found.
|
|
|
|
*/
|
|
|
|
@Override
|
|
|
|
public long getTimeStamp() throws ParsingException {
|
2017-11-22 18:45:49 +01:00
|
|
|
return getTimestampSeconds("((#|&|\\?)t=\\d{0,3}h?\\d{0,3}m?\\d{1,3}s?)");
|
2017-08-11 03:23:09 +02:00
|
|
|
}
|
|
|
|
|
2017-03-01 18:47:52 +01:00
|
|
|
@Override
|
|
|
|
public long getViewCount() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-03-01 18:47:52 +01:00
|
|
|
try {
|
2019-04-28 22:03:17 +02:00
|
|
|
if (getStreamType().equals(StreamType.LIVE_STREAM)) {
|
|
|
|
return getLiveStreamWatchingCount();
|
|
|
|
}
|
|
|
|
|
2017-08-10 19:50:59 +02:00
|
|
|
return Long.parseLong(doc.select("meta[itemprop=interactionCount]").attr(CONTENT));
|
2017-03-01 18:47:52 +01:00
|
|
|
} catch (Exception e) {//todo: find fallback method
|
2017-08-10 19:50:59 +02:00
|
|
|
throw new ParsingException("Could not get number of views", e);
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-04-28 22:03:17 +02:00
|
|
|
private long getLiveStreamWatchingCount() throws ExtractionException, IOException, JsonParserException {
|
|
|
|
// https://www.youtube.com/youtubei/v1/updated_metadata?alt=json&key=
|
|
|
|
String innerTubeKey = null, clientVersion = null;
|
|
|
|
if (playerArgs != null && !playerArgs.isEmpty()) {
|
|
|
|
innerTubeKey = playerArgs.getString("innertube_api_key");
|
|
|
|
clientVersion = playerArgs.getString("innertube_context_client_version");
|
|
|
|
} else if (!videoInfoPage.isEmpty()) {
|
|
|
|
innerTubeKey = videoInfoPage.get("innertube_api_key");
|
|
|
|
clientVersion = videoInfoPage.get("innertube_context_client_version");
|
|
|
|
}
|
|
|
|
|
|
|
|
if (innerTubeKey == null || innerTubeKey.isEmpty()) {
|
|
|
|
throw new ExtractionException("Couldn't get innerTube key");
|
|
|
|
}
|
|
|
|
|
|
|
|
if (clientVersion == null || clientVersion.isEmpty()) {
|
|
|
|
throw new ExtractionException("Couldn't get innerTube client version");
|
|
|
|
}
|
|
|
|
|
|
|
|
final String metadataUrl = "https://www.youtube.com/youtubei/v1/updated_metadata?alt=json&key=" + innerTubeKey;
|
|
|
|
final byte[] dataBody = ("{\"context\":{\"client\":{\"clientName\":1,\"clientVersion\":\"" + clientVersion + "\"}}" +
|
|
|
|
",\"videoId\":\"" + getId() + "\"}").getBytes("UTF-8");
|
|
|
|
final Response response = getDownloader().execute(Request.newBuilder()
|
|
|
|
.post(metadataUrl, dataBody)
|
|
|
|
.addHeader("Content-Type", "application/json")
|
|
|
|
.build());
|
|
|
|
final JsonObject jsonObject = JsonParser.object().from(response.responseBody());
|
|
|
|
|
|
|
|
for (Object actionEntry : jsonObject.getArray("actions")) {
|
|
|
|
if (!(actionEntry instanceof JsonObject)) continue;
|
|
|
|
final JsonObject entry = (JsonObject) actionEntry;
|
|
|
|
|
|
|
|
final JsonObject updateViewershipAction = entry.getObject("updateViewershipAction", null);
|
|
|
|
if (updateViewershipAction == null) continue;
|
|
|
|
|
|
|
|
final JsonArray viewCountRuns = JsonUtils.getArray(updateViewershipAction, "viewership.videoViewCountRenderer.viewCount.runs");
|
|
|
|
if (viewCountRuns.isEmpty()) continue;
|
|
|
|
|
|
|
|
final JsonObject textObject = viewCountRuns.getObject(0);
|
|
|
|
if (!textObject.has("text")) {
|
|
|
|
throw new ExtractionException("Response don't have \"text\" element");
|
|
|
|
}
|
|
|
|
|
|
|
|
return Long.parseLong(Utils.removeNonDigitCharacters(textObject.getString("text")));
|
|
|
|
}
|
|
|
|
|
|
|
|
throw new ExtractionException("Could not find correct results in response");
|
|
|
|
}
|
|
|
|
|
2017-03-01 18:47:52 +01:00
|
|
|
@Override
|
2017-08-11 03:23:09 +02:00
|
|
|
public long getLikeCount() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-08-11 03:23:09 +02:00
|
|
|
String likesString = "";
|
2017-03-01 18:47:52 +01:00
|
|
|
try {
|
2017-08-11 03:23:09 +02:00
|
|
|
Element button = doc.select("button.like-button-renderer-like-button").first();
|
|
|
|
try {
|
|
|
|
likesString = button.select("span.yt-uix-button-content").first().text();
|
|
|
|
} catch (NullPointerException e) {
|
2017-11-11 01:21:43 +01:00
|
|
|
//if this kicks in our button has no content and therefore likes/dislikes are disabled
|
2017-08-11 03:23:09 +02:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
return Integer.parseInt(Utils.removeNonDigitCharacters(likesString));
|
|
|
|
} catch (NumberFormatException nfe) {
|
|
|
|
throw new ParsingException("Could not parse \"" + likesString + "\" as an Integer", nfe);
|
|
|
|
} catch (Exception e) {
|
|
|
|
throw new ParsingException("Could not get like count", e);
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
2017-08-11 03:23:09 +02:00
|
|
|
public long getDislikeCount() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-08-11 03:23:09 +02:00
|
|
|
String dislikesString = "";
|
2017-03-01 18:47:52 +01:00
|
|
|
try {
|
2017-08-11 03:23:09 +02:00
|
|
|
Element button = doc.select("button.like-button-renderer-dislike-button").first();
|
|
|
|
try {
|
|
|
|
dislikesString = button.select("span.yt-uix-button-content").first().text();
|
|
|
|
} catch (NullPointerException e) {
|
|
|
|
//if this kicks in our button has no content and therefore likes/dislikes are disabled
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
return Integer.parseInt(Utils.removeNonDigitCharacters(dislikesString));
|
|
|
|
} catch (NumberFormatException nfe) {
|
|
|
|
throw new ParsingException("Could not parse \"" + dislikesString + "\" as an Integer", nfe);
|
|
|
|
} catch (Exception e) {
|
|
|
|
throw new ParsingException("Could not get dislike count", e);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-11-25 01:10:04 +01:00
|
|
|
@Nonnull
|
2017-08-11 03:23:09 +02:00
|
|
|
@Override
|
|
|
|
public String getUploaderUrl() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-08-11 03:23:09 +02:00
|
|
|
try {
|
|
|
|
return doc.select("div[class=\"yt-user-info\"]").first().children()
|
|
|
|
.select("a").first().attr("abs:href");
|
|
|
|
} catch (Exception e) {
|
|
|
|
throw new ParsingException("Could not get channel link", e);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-11-25 01:10:04 +01:00
|
|
|
|
|
|
|
@Nullable
|
|
|
|
private String getStringFromMetaData(String field) {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-11-25 01:10:04 +01:00
|
|
|
String value = null;
|
|
|
|
if(playerArgs != null) {
|
|
|
|
// This can not fail
|
|
|
|
value = playerArgs.getString(field);
|
|
|
|
}
|
|
|
|
if(value == null) {
|
|
|
|
// This can not fail too
|
|
|
|
value = videoInfoPage.get(field);
|
|
|
|
}
|
|
|
|
return value;
|
|
|
|
}
|
|
|
|
|
|
|
|
@Nonnull
|
2017-08-11 03:23:09 +02:00
|
|
|
@Override
|
|
|
|
public String getUploaderName() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-11-25 01:10:04 +01:00
|
|
|
String name = getStringFromMetaData("author");
|
2017-08-10 19:50:59 +02:00
|
|
|
|
2017-11-25 01:10:04 +01:00
|
|
|
if(name == null) {
|
|
|
|
try {
|
|
|
|
// Fallback to HTML method
|
|
|
|
name = doc.select("div.yt-user-info").first().text();
|
|
|
|
} catch (Exception e) {
|
|
|
|
throw new ParsingException("Could not get uploader name", e);
|
|
|
|
}
|
2017-08-10 19:50:59 +02:00
|
|
|
}
|
2017-11-25 01:10:04 +01:00
|
|
|
if(name == null || name.isEmpty()) {
|
|
|
|
throw new ParsingException("Could not get uploader name");
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
2017-11-25 01:10:04 +01:00
|
|
|
return name;
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
|
2017-11-25 01:10:04 +01:00
|
|
|
@Nonnull
|
2017-03-01 18:47:52 +01:00
|
|
|
@Override
|
2017-08-08 23:36:11 +02:00
|
|
|
public String getUploaderAvatarUrl() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-03-01 18:47:52 +01:00
|
|
|
try {
|
|
|
|
return doc.select("a[class*=\"yt-user-photo\"]").first()
|
|
|
|
.select("img").first()
|
|
|
|
.attr("abs:data-thumb");
|
|
|
|
} catch (Exception e) {//todo: add fallback method
|
2017-08-10 19:50:59 +02:00
|
|
|
throw new ParsingException("Could not get uploader thumbnail URL.", e);
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-02-25 22:03:32 +01:00
|
|
|
@Nonnull
|
2017-03-01 18:47:52 +01:00
|
|
|
@Override
|
|
|
|
public String getDashMpdUrl() throws ParsingException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-03-01 18:47:52 +01:00
|
|
|
try {
|
2017-07-11 05:08:03 +02:00
|
|
|
String dashManifestUrl;
|
2017-11-25 01:10:04 +01:00
|
|
|
if (videoInfoPage.containsKey("dashmpd")) {
|
2017-03-01 18:47:52 +01:00
|
|
|
dashManifestUrl = videoInfoPage.get("dashmpd");
|
2017-11-25 01:10:04 +01:00
|
|
|
} else if (playerArgs != null && playerArgs.isString("dashmpd")) {
|
2017-08-16 04:40:03 +02:00
|
|
|
dashManifestUrl = playerArgs.getString("dashmpd", "");
|
2017-03-01 18:47:52 +01:00
|
|
|
} else {
|
|
|
|
return "";
|
|
|
|
}
|
2017-08-10 19:50:59 +02:00
|
|
|
|
2017-06-29 20:12:55 +02:00
|
|
|
if (!dashManifestUrl.contains("/signature/")) {
|
2017-03-01 18:47:52 +01:00
|
|
|
String encryptedSig = Parser.matchGroup1("/s/([a-fA-F0-9\\.]+)", dashManifestUrl);
|
|
|
|
String decryptedSig;
|
|
|
|
|
|
|
|
decryptedSig = decryptSignature(encryptedSig, decryptionCode);
|
|
|
|
dashManifestUrl = dashManifestUrl.replace("/s/" + encryptedSig, "/signature/" + decryptedSig);
|
|
|
|
}
|
2017-08-10 19:50:59 +02:00
|
|
|
|
2017-03-01 18:47:52 +01:00
|
|
|
return dashManifestUrl;
|
|
|
|
} catch (Exception e) {
|
2017-08-10 19:50:59 +02:00
|
|
|
throw new ParsingException("Could not get dash manifest url", e);
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-02-25 22:03:32 +01:00
|
|
|
@Nonnull
|
|
|
|
@Override
|
|
|
|
public String getHlsUrl() throws ParsingException {
|
|
|
|
assertPageFetched();
|
2019-01-19 13:50:02 +01:00
|
|
|
|
2019-09-11 20:12:30 +02:00
|
|
|
try {
|
|
|
|
return playerResponse.getObject("streamingData").getString("hlsManifestUrl");
|
2018-02-25 22:03:32 +01:00
|
|
|
} catch (Exception e) {
|
2019-09-11 20:12:30 +02:00
|
|
|
if (playerArgs != null && playerArgs.isString("hlsvp")) {
|
|
|
|
return playerArgs.getString("hlsvp");
|
|
|
|
} else {
|
|
|
|
throw new ParsingException("Could not get hls manifest url", e);
|
|
|
|
}
|
2018-02-25 22:03:32 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-03-01 18:47:52 +01:00
|
|
|
@Override
|
2019-09-11 20:04:28 +02:00
|
|
|
public List<AudioStream> getAudioStreams() throws ExtractionException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-08-06 22:20:15 +02:00
|
|
|
List<AudioStream> audioStreams = new ArrayList<>();
|
2017-06-29 20:12:55 +02:00
|
|
|
try {
|
2019-09-11 20:04:28 +02:00
|
|
|
for (Map.Entry<String, ItagItem> entry : getItags(ADAPTIVE_FORMATS, ItagItem.ItagType.AUDIO).entrySet()) {
|
2017-08-10 19:50:59 +02:00
|
|
|
ItagItem itag = entry.getValue();
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-11-11 01:21:43 +01:00
|
|
|
AudioStream audioStream = new AudioStream(entry.getKey(), itag.getMediaFormat(), itag.avgBitrate);
|
2017-08-10 19:50:59 +02:00
|
|
|
if (!Stream.containSimilarStream(audioStream, audioStreams)) {
|
|
|
|
audioStreams.add(audioStream);
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
} catch (Exception e) {
|
2017-08-10 19:50:59 +02:00
|
|
|
throw new ParsingException("Could not get audio streams", e);
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
2017-08-10 19:50:59 +02:00
|
|
|
|
2017-03-01 18:47:52 +01:00
|
|
|
return audioStreams;
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
2019-09-11 20:04:28 +02:00
|
|
|
public List<VideoStream> getVideoStreams() throws ExtractionException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-08-06 22:20:15 +02:00
|
|
|
List<VideoStream> videoStreams = new ArrayList<>();
|
2017-06-29 20:12:55 +02:00
|
|
|
try {
|
2019-09-11 20:04:28 +02:00
|
|
|
for (Map.Entry<String, ItagItem> entry : getItags(FORMATS, ItagItem.ItagType.VIDEO).entrySet()) {
|
2017-08-10 19:50:59 +02:00
|
|
|
ItagItem itag = entry.getValue();
|
|
|
|
|
2017-11-11 01:21:43 +01:00
|
|
|
VideoStream videoStream = new VideoStream(entry.getKey(), itag.getMediaFormat(), itag.resolutionString);
|
2017-08-10 19:50:59 +02:00
|
|
|
if (!Stream.containSimilarStream(videoStream, videoStreams)) {
|
|
|
|
videoStreams.add(videoStream);
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
} catch (Exception e) {
|
2017-08-10 19:50:59 +02:00
|
|
|
throw new ParsingException("Could not get video streams", e);
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
return videoStreams;
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
2018-08-21 17:23:56 +02:00
|
|
|
public List<VideoStream> getVideoOnlyStreams() throws ExtractionException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-08-06 22:20:15 +02:00
|
|
|
List<VideoStream> videoOnlyStreams = new ArrayList<>();
|
2017-04-12 02:55:53 +02:00
|
|
|
try {
|
2019-09-11 20:04:28 +02:00
|
|
|
for (Map.Entry<String, ItagItem> entry : getItags(ADAPTIVE_FORMATS, ItagItem.ItagType.VIDEO_ONLY).entrySet()) {
|
2017-08-10 19:50:59 +02:00
|
|
|
ItagItem itag = entry.getValue();
|
2017-04-12 02:55:53 +02:00
|
|
|
|
2017-11-11 01:21:43 +01:00
|
|
|
VideoStream videoStream = new VideoStream(entry.getKey(), itag.getMediaFormat(), itag.resolutionString, true);
|
2017-08-10 19:50:59 +02:00
|
|
|
if (!Stream.containSimilarStream(videoStream, videoOnlyStreams)) {
|
|
|
|
videoOnlyStreams.add(videoStream);
|
2017-04-12 02:55:53 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
} catch (Exception e) {
|
2017-08-10 19:50:59 +02:00
|
|
|
throw new ParsingException("Could not get video only streams", e);
|
2017-04-12 02:55:53 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
return videoOnlyStreams;
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
|
2017-11-22 18:39:38 +01:00
|
|
|
@Override
|
2018-02-01 22:27:14 +01:00
|
|
|
@Nonnull
|
2018-09-24 21:04:22 +02:00
|
|
|
public List<SubtitlesStream> getSubtitlesDefault() throws IOException, ExtractionException {
|
|
|
|
return getSubtitles(MediaFormat.TTML);
|
2017-11-23 16:33:03 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
2018-02-01 22:27:14 +01:00
|
|
|
@Nonnull
|
2018-09-24 21:04:22 +02:00
|
|
|
public List<SubtitlesStream> getSubtitles(final MediaFormat format) throws IOException, ExtractionException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2018-09-24 21:04:22 +02:00
|
|
|
List<SubtitlesStream> subtitles = new ArrayList<>();
|
2018-02-02 08:24:22 +01:00
|
|
|
for (final SubtitlesInfo subtitlesInfo : subtitlesInfos) {
|
|
|
|
subtitles.add(subtitlesInfo.getSubtitle(format));
|
2017-11-23 11:47:05 +01:00
|
|
|
}
|
2018-02-01 22:27:14 +01:00
|
|
|
return subtitles;
|
2017-11-22 18:39:38 +01:00
|
|
|
}
|
|
|
|
|
2017-03-01 18:47:52 +01:00
|
|
|
@Override
|
2017-08-11 03:23:09 +02:00
|
|
|
public StreamType getStreamType() throws ParsingException {
|
2018-02-25 23:31:42 +01:00
|
|
|
assertPageFetched();
|
|
|
|
try {
|
2018-02-28 03:16:29 +01:00
|
|
|
if (playerArgs != null && (playerArgs.has("ps") && playerArgs.get("ps").toString().equals("live") ||
|
2019-09-12 15:07:07 +02:00
|
|
|
(!playerResponse.getObject("streamingData").has(FORMATS)))) {
|
2018-02-25 23:31:42 +01:00
|
|
|
return StreamType.LIVE_STREAM;
|
|
|
|
}
|
|
|
|
} catch (Exception e) {
|
|
|
|
throw new ParsingException("Could not get hls manifest url", e);
|
|
|
|
}
|
2017-08-11 03:23:09 +02:00
|
|
|
return StreamType.VIDEO_STREAM;
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
2018-11-07 18:28:44 +01:00
|
|
|
public StreamInfoItem getNextStream() throws IOException, ExtractionException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-03-01 18:47:52 +01:00
|
|
|
try {
|
2018-02-24 22:20:50 +01:00
|
|
|
StreamInfoItemsCollector collector = new StreamInfoItemsCollector(getServiceId());
|
2019-04-28 22:03:16 +02:00
|
|
|
final TimeAgoParser timeAgoParser = getTimeAgoParser();
|
2017-08-10 19:50:59 +02:00
|
|
|
|
2018-09-24 21:04:22 +02:00
|
|
|
Elements watch = doc.select("div[class=\"watch-sidebar-section\"]");
|
|
|
|
if (watch.size() < 1) {
|
|
|
|
return null;// prevent the snackbar notification "report error" on age-restricted videos
|
|
|
|
}
|
2019-10-29 06:00:29 +01:00
|
|
|
|
2019-04-28 22:03:16 +02:00
|
|
|
collector.commit(extractVideoPreviewInfo(watch.first().select("li").first(), timeAgoParser));
|
2018-03-11 21:50:40 +01:00
|
|
|
return collector.getItems().get(0);
|
2017-06-29 20:12:55 +02:00
|
|
|
} catch (Exception e) {
|
2017-03-01 18:47:52 +01:00
|
|
|
throw new ParsingException("Could not get next video", e);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
2018-11-07 18:28:44 +01:00
|
|
|
public StreamInfoItemsCollector getRelatedStreams() throws IOException, ExtractionException {
|
2017-11-30 10:49:27 +01:00
|
|
|
assertPageFetched();
|
2017-03-01 18:47:52 +01:00
|
|
|
try {
|
2018-02-24 22:20:50 +01:00
|
|
|
StreamInfoItemsCollector collector = new StreamInfoItemsCollector(getServiceId());
|
2019-04-28 22:03:16 +02:00
|
|
|
final TimeAgoParser timeAgoParser = getTimeAgoParser();
|
|
|
|
|
2017-03-01 18:47:52 +01:00
|
|
|
Element ul = doc.select("ul[id=\"watch-related\"]").first();
|
2017-06-29 20:12:55 +02:00
|
|
|
if (ul != null) {
|
2017-03-01 18:47:52 +01:00
|
|
|
for (Element li : ul.children()) {
|
|
|
|
// first check if we have a playlist. If so leave them out
|
|
|
|
if (li.select("a[class*=\"content-link\"]").first() != null) {
|
2019-04-28 22:03:16 +02:00
|
|
|
collector.commit(extractVideoPreviewInfo(li, timeAgoParser));
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return collector;
|
2017-06-29 20:12:55 +02:00
|
|
|
} catch (Exception e) {
|
2017-03-01 18:47:52 +01:00
|
|
|
throw new ParsingException("Could not get related videos", e);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-06-29 20:12:55 +02:00
|
|
|
/**
|
2017-07-11 05:08:03 +02:00
|
|
|
* {@inheritDoc}
|
2017-06-29 20:12:55 +02:00
|
|
|
*/
|
2017-07-11 05:08:03 +02:00
|
|
|
@Override
|
|
|
|
public String getErrorMessage() {
|
|
|
|
StringBuilder errorReason;
|
2019-09-23 10:44:17 +02:00
|
|
|
Element errorElement = doc.select("h1[id=\"unavailable-message\"]").first();
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2019-09-23 10:44:17 +02:00
|
|
|
if (errorElement == null) {
|
2017-07-11 05:08:03 +02:00
|
|
|
errorReason = null;
|
|
|
|
} else {
|
2019-09-23 10:44:17 +02:00
|
|
|
String errorMessage = errorElement.text();
|
|
|
|
if (errorMessage == null || errorMessage.isEmpty()) {
|
|
|
|
errorReason = null;
|
|
|
|
} else {
|
|
|
|
errorReason = new StringBuilder(errorMessage);
|
|
|
|
errorReason.append(" ");
|
|
|
|
errorReason.append(doc.select("[id=\"unavailable-submessage\"]").first().text());
|
|
|
|
}
|
2017-07-11 05:08:03 +02:00
|
|
|
}
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
return errorReason != null ? errorReason.toString() : null;
|
|
|
|
}
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
/*//////////////////////////////////////////////////////////////////////////
|
2017-08-10 19:50:59 +02:00
|
|
|
// Fetch page
|
2017-07-11 05:08:03 +02:00
|
|
|
//////////////////////////////////////////////////////////////////////////*/
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2019-09-11 20:04:28 +02:00
|
|
|
private static final String FORMATS = "formats";
|
|
|
|
private static final String ADAPTIVE_FORMATS = "adaptiveFormats";
|
2017-07-11 05:08:03 +02:00
|
|
|
private static final String HTTPS = "https:";
|
|
|
|
private static final String CONTENT = "content";
|
|
|
|
private static final String DECRYPTION_FUNC_NAME = "decrypt";
|
|
|
|
|
2018-03-02 01:31:36 +01:00
|
|
|
private static final String VERIFIED_URL_PARAMS = "&has_verified=1&bpctr=9999999999";
|
|
|
|
|
2018-09-08 07:25:07 +02:00
|
|
|
private final static String DECYRYPTION_SIGNATURE_FUNCTION_REGEX =
|
2019-03-14 08:49:11 +01:00
|
|
|
"([\\w$]+)\\s*=\\s*function\\((\\w+)\\)\\{\\s*\\2=\\s*\\2\\.split\\(\"\"\\)\\s*;";
|
2018-09-08 07:25:07 +02:00
|
|
|
private final static String DECRYPTION_AKAMAIZED_STRING_REGEX =
|
2019-01-18 11:47:34 +01:00
|
|
|
"yt\\.akamaized\\.net/\\)\\s*\\|\\|\\s*.*?\\s*c\\s*&&\\s*d\\.set\\([^,]+\\s*,\\s*(:encodeURIComponent\\s*\\()([a-zA-Z0-9$]+)\\(";
|
2018-09-08 07:25:07 +02:00
|
|
|
private final static String DECRYPTION_AKAMAIZED_SHORT_STRING_REGEX =
|
2019-01-18 11:47:34 +01:00
|
|
|
"\\bc\\s*&&\\s*d\\.set\\([^,]+\\s*,\\s*(:encodeURIComponent\\s*\\()([a-zA-Z0-9$]+)\\(";
|
2018-09-08 07:25:07 +02:00
|
|
|
|
2017-11-30 11:20:49 +01:00
|
|
|
private volatile String decryptionCode = "";
|
2017-07-11 05:08:03 +02:00
|
|
|
|
2017-11-30 11:20:49 +01:00
|
|
|
private String pageHtml = null;
|
2017-11-22 18:39:38 +01:00
|
|
|
|
2017-08-06 22:20:15 +02:00
|
|
|
@Override
|
2017-11-28 13:37:01 +01:00
|
|
|
public void onFetchPage(@Nonnull Downloader downloader) throws IOException, ExtractionException {
|
2019-10-29 06:00:29 +01:00
|
|
|
final String verifiedUrl = getUrl() + VERIFIED_URL_PARAMS;
|
2019-04-28 22:03:16 +02:00
|
|
|
final Response response = downloader.get(verifiedUrl, getExtractorLocalization());
|
|
|
|
pageHtml = response.responseBody();
|
2019-10-29 06:00:29 +01:00
|
|
|
doc = YoutubeParsingHelper.parseAndCheckPage(verifiedUrl, response);
|
2017-07-11 05:08:03 +02:00
|
|
|
|
2017-12-18 23:05:58 +01:00
|
|
|
final String playerUrl;
|
2017-07-11 05:08:03 +02:00
|
|
|
// Check if the video is age restricted
|
2019-10-29 06:00:28 +01:00
|
|
|
if (!doc.select("meta[property=\"og:restrictions:age\"").isEmpty()) {
|
2017-12-18 23:05:58 +01:00
|
|
|
final EmbeddedInfo info = getEmbeddedInfo();
|
|
|
|
final String videoInfoUrl = getVideoInfoUrl(getId(), info.sts);
|
2019-04-28 22:03:16 +02:00
|
|
|
final String infoPageResponse = downloader.get(videoInfoUrl, getExtractorLocalization()).responseBody();
|
2017-11-25 01:10:04 +01:00
|
|
|
videoInfoPage.putAll(Parser.compatParseMap(infoPageResponse));
|
2017-12-18 23:05:58 +01:00
|
|
|
playerUrl = info.url;
|
2017-07-11 05:08:03 +02:00
|
|
|
isAgeRestricted = true;
|
|
|
|
} else {
|
2019-10-29 06:00:29 +01:00
|
|
|
final JsonObject ytPlayerConfig = getPlayerConfig();
|
2017-07-11 05:08:03 +02:00
|
|
|
playerArgs = getPlayerArgs(ytPlayerConfig);
|
|
|
|
playerUrl = getPlayerUrl(ytPlayerConfig);
|
|
|
|
isAgeRestricted = false;
|
|
|
|
}
|
2019-09-11 19:05:41 +02:00
|
|
|
playerResponse = getPlayerResponse();
|
2017-07-11 05:08:03 +02:00
|
|
|
|
|
|
|
if (decryptionCode.isEmpty()) {
|
|
|
|
decryptionCode = loadDecryptionCode(playerUrl);
|
|
|
|
}
|
2018-02-01 22:27:14 +01:00
|
|
|
|
2018-02-02 08:24:22 +01:00
|
|
|
if (subtitlesInfos.isEmpty()) {
|
|
|
|
subtitlesInfos.addAll(getAvailableSubtitlesInfo());
|
2018-02-01 22:27:14 +01:00
|
|
|
}
|
2017-07-11 05:08:03 +02:00
|
|
|
}
|
|
|
|
|
2019-10-29 06:00:29 +01:00
|
|
|
private JsonObject getPlayerConfig() throws ParsingException {
|
2017-07-11 05:08:03 +02:00
|
|
|
try {
|
2019-10-29 06:00:29 +01:00
|
|
|
String ytPlayerConfigRaw = Parser.matchGroup1("ytplayer.config\\s*=\\s*(\\{.*?\\});", pageHtml);
|
2017-08-16 04:40:03 +02:00
|
|
|
return JsonParser.object().from(ytPlayerConfigRaw);
|
2017-07-11 05:08:03 +02:00
|
|
|
} catch (Parser.RegexException e) {
|
|
|
|
String errorReason = getErrorMessage();
|
|
|
|
switch (errorReason) {
|
|
|
|
case "":
|
|
|
|
throw new ContentNotAvailableException("Content not available: player config empty", e);
|
|
|
|
default:
|
|
|
|
throw new ContentNotAvailableException("Content not available", e);
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
2017-08-10 19:50:59 +02:00
|
|
|
} catch (Exception e) {
|
2017-07-11 05:08:03 +02:00
|
|
|
throw new ParsingException("Could not parse yt player config", e);
|
|
|
|
}
|
|
|
|
}
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-08-16 04:40:03 +02:00
|
|
|
private JsonObject getPlayerArgs(JsonObject playerConfig) throws ParsingException {
|
|
|
|
JsonObject playerArgs;
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
//attempt to load the youtube js player JSON arguments
|
|
|
|
try {
|
2017-08-16 04:40:03 +02:00
|
|
|
playerArgs = playerConfig.getObject("args");
|
2017-08-10 19:50:59 +02:00
|
|
|
} catch (Exception e) {
|
2017-07-11 05:08:03 +02:00
|
|
|
throw new ParsingException("Could not parse yt player config", e);
|
|
|
|
}
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
return playerArgs;
|
|
|
|
}
|
|
|
|
|
2017-08-16 04:40:03 +02:00
|
|
|
private String getPlayerUrl(JsonObject playerConfig) throws ParsingException {
|
2017-07-11 05:08:03 +02:00
|
|
|
try {
|
|
|
|
// The Youtube service needs to be initialized by downloading the
|
|
|
|
// js-Youtube-player. This is done in order to get the algorithm
|
|
|
|
// for decrypting cryptic signatures inside certain stream urls.
|
|
|
|
String playerUrl;
|
|
|
|
|
2017-08-16 04:40:03 +02:00
|
|
|
JsonObject ytAssets = playerConfig.getObject("assets");
|
2017-07-11 05:08:03 +02:00
|
|
|
playerUrl = ytAssets.getString("js");
|
|
|
|
|
|
|
|
if (playerUrl.startsWith("//")) {
|
|
|
|
playerUrl = HTTPS + playerUrl;
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
2017-07-11 05:08:03 +02:00
|
|
|
return playerUrl;
|
2017-08-10 19:50:59 +02:00
|
|
|
} catch (Exception e) {
|
2017-08-16 04:40:03 +02:00
|
|
|
throw new ParsingException("Could not load decryption code for the Youtube service.", e);
|
2017-07-11 05:08:03 +02:00
|
|
|
}
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
|
|
|
|
2019-09-11 19:05:41 +02:00
|
|
|
private JsonObject getPlayerResponse() throws ParsingException {
|
|
|
|
try {
|
|
|
|
String playerResponseStr;
|
|
|
|
if(playerArgs != null) {
|
|
|
|
playerResponseStr = playerArgs.getString("player_response");
|
|
|
|
} else {
|
|
|
|
playerResponseStr = videoInfoPage.get("player_response");
|
|
|
|
}
|
|
|
|
return JsonParser.object().from(playerResponseStr);
|
|
|
|
} catch (Exception e) {
|
|
|
|
throw new ParsingException("Could not parse yt player response", e);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-12-18 23:05:58 +01:00
|
|
|
@Nonnull
|
|
|
|
private EmbeddedInfo getEmbeddedInfo() throws ParsingException, ReCaptchaException {
|
2017-07-11 05:08:03 +02:00
|
|
|
try {
|
2017-12-18 23:05:58 +01:00
|
|
|
final Downloader downloader = NewPipe.getDownloader();
|
|
|
|
final String embedUrl = "https://www.youtube.com/embed/" + getId();
|
2019-04-28 22:03:16 +02:00
|
|
|
final String embedPageContent = downloader.get(embedUrl, getExtractorLocalization()).responseBody();
|
2017-12-18 23:05:58 +01:00
|
|
|
|
|
|
|
// Get player url
|
|
|
|
final String assetsPattern = "\"assets\":.+?\"js\":\\s*(\"[^\"]+\")";
|
|
|
|
String playerUrl = Parser.matchGroup1(assetsPattern, embedPageContent)
|
|
|
|
.replace("\\", "").replace("\"", "");
|
2017-07-11 05:08:03 +02:00
|
|
|
if (playerUrl.startsWith("//")) {
|
|
|
|
playerUrl = HTTPS + playerUrl;
|
|
|
|
}
|
2017-12-18 23:05:58 +01:00
|
|
|
|
2019-07-30 20:53:23 +02:00
|
|
|
try {
|
|
|
|
// Get embed sts
|
|
|
|
final String stsPattern = "\"sts\"\\s*:\\s*(\\d+)";
|
|
|
|
final String sts = Parser.matchGroup1(stsPattern, embedPageContent);
|
|
|
|
return new EmbeddedInfo(playerUrl, sts);
|
|
|
|
} catch (Exception i) {
|
|
|
|
// if it failes we simply reply with no sts as then it does not seem to be necessary
|
|
|
|
return new EmbeddedInfo(playerUrl, "");
|
|
|
|
}
|
2017-12-18 23:05:58 +01:00
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
} catch (IOException e) {
|
|
|
|
throw new ParsingException(
|
|
|
|
"Could load decryption code form restricted video for the Youtube service.", e);
|
|
|
|
}
|
|
|
|
}
|
2017-03-01 18:47:52 +01:00
|
|
|
|
|
|
|
private String loadDecryptionCode(String playerUrl) throws DecryptException {
|
|
|
|
try {
|
|
|
|
Downloader downloader = NewPipe.getDownloader();
|
2017-06-29 20:12:55 +02:00
|
|
|
if (!playerUrl.contains("https://youtube.com")) {
|
2017-03-01 18:47:52 +01:00
|
|
|
//sometimes the https://youtube.com part does not get send with
|
|
|
|
//than we have to add it by hand
|
|
|
|
playerUrl = "https://youtube.com" + playerUrl;
|
|
|
|
}
|
|
|
|
|
2019-04-28 22:03:16 +02:00
|
|
|
final String playerCode = downloader.get(playerUrl, getExtractorLocalization()).responseBody();
|
2019-03-14 09:07:19 +01:00
|
|
|
final String decryptionFunctionName = getDecryptionFuncName(playerCode);
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2018-09-08 07:25:07 +02:00
|
|
|
final String functionPattern = "("
|
|
|
|
+ decryptionFunctionName.replace("$", "\\$")
|
2017-03-01 18:47:52 +01:00
|
|
|
+ "=function\\([a-zA-Z0-9_]+\\)\\{.+?\\})";
|
2018-09-08 07:25:07 +02:00
|
|
|
final String decryptionFunction = "var " + Parser.matchGroup1(functionPattern, playerCode) + ";";
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2018-09-08 07:25:07 +02:00
|
|
|
final String helperObjectName =
|
|
|
|
Parser.matchGroup1(";([A-Za-z0-9_\\$]{2})\\...\\(", decryptionFunction);
|
|
|
|
final String helperPattern =
|
|
|
|
"(var " + helperObjectName.replace("$", "\\$") + "=\\{.+?\\}\\};)";
|
|
|
|
final String helperObject =
|
|
|
|
Parser.matchGroup1(helperPattern, playerCode.replace("\n", ""));
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2018-09-08 07:25:07 +02:00
|
|
|
final String callerFunction =
|
|
|
|
"function " + DECRYPTION_FUNC_NAME + "(a){return " + decryptionFunctionName + "(a);}";
|
2017-03-01 18:47:52 +01:00
|
|
|
|
2018-09-08 07:25:07 +02:00
|
|
|
return helperObject + decryptionFunction + callerFunction;
|
2017-06-29 20:12:55 +02:00
|
|
|
} catch (IOException ioe) {
|
2017-03-01 18:47:52 +01:00
|
|
|
throw new DecryptException("Could not load decrypt function", ioe);
|
2017-06-29 20:12:55 +02:00
|
|
|
} catch (Exception e) {
|
2017-03-01 18:47:52 +01:00
|
|
|
throw new DecryptException("Could not parse decrypt function ", e);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
private String decryptSignature(String encryptedSig, String decryptionCode) throws DecryptException {
|
2017-03-01 18:47:52 +01:00
|
|
|
Context context = Context.enter();
|
|
|
|
context.setOptimizationLevel(-1);
|
2017-11-23 11:47:05 +01:00
|
|
|
Object result;
|
2017-03-01 18:47:52 +01:00
|
|
|
try {
|
|
|
|
ScriptableObject scope = context.initStandardObjects();
|
|
|
|
context.evaluateString(scope, decryptionCode, "decryptionCode", 1, null);
|
|
|
|
Function decryptionFunc = (Function) scope.get("decrypt", scope);
|
|
|
|
result = decryptionFunc.call(context, scope, scope, new Object[]{encryptedSig});
|
|
|
|
} catch (Exception e) {
|
|
|
|
throw new DecryptException("could not get decrypt signature", e);
|
|
|
|
} finally {
|
|
|
|
Context.exit();
|
|
|
|
}
|
|
|
|
return result == null ? "" : result.toString();
|
|
|
|
}
|
|
|
|
|
2019-03-14 09:07:19 +01:00
|
|
|
private String getDecryptionFuncName(String playerCode) throws DecryptException {
|
|
|
|
String decryptionFunctionName;
|
|
|
|
// Cascading things in catch is ugly, but its faster than running a match before getting the actual name
|
|
|
|
// to se if the function can actually be found with the given regex.
|
|
|
|
// However if this cascading should propably be cleaned up somehow as it looks a bit weird.
|
|
|
|
try {
|
|
|
|
decryptionFunctionName = Parser.matchGroup1(DECYRYPTION_SIGNATURE_FUNCTION_REGEX, playerCode);
|
|
|
|
} catch (Parser.RegexException re) {
|
|
|
|
try {
|
|
|
|
decryptionFunctionName = Parser.matchGroup1(DECRYPTION_AKAMAIZED_SHORT_STRING_REGEX, playerCode);
|
|
|
|
} catch (Parser.RegexException re2) {
|
|
|
|
try {
|
2019-03-14 16:49:30 +01:00
|
|
|
decryptionFunctionName = Parser.matchGroup1(DECRYPTION_AKAMAIZED_STRING_REGEX, playerCode);
|
2019-03-14 09:07:19 +01:00
|
|
|
} catch (Parser.RegexException re3) {
|
|
|
|
throw new DecryptException("Could not find decrypt function with any of the given patterns.", re);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return decryptionFunctionName;
|
|
|
|
}
|
|
|
|
|
2018-02-02 06:48:34 +01:00
|
|
|
@Nonnull
|
2018-02-02 08:24:22 +01:00
|
|
|
private List<SubtitlesInfo> getAvailableSubtitlesInfo() throws SubtitlesException {
|
2018-02-02 06:48:34 +01:00
|
|
|
// If the video is age restricted getPlayerConfig will fail
|
|
|
|
if(isAgeRestricted) return Collections.emptyList();
|
|
|
|
|
|
|
|
final JsonObject captions;
|
2019-09-11 19:35:08 +02:00
|
|
|
if (!playerResponse.has("captions")) {
|
|
|
|
// Captions does not exist
|
|
|
|
return Collections.emptyList();
|
2018-02-02 06:48:34 +01:00
|
|
|
}
|
2019-09-11 19:35:08 +02:00
|
|
|
captions = playerResponse.getObject("captions");
|
2018-02-02 06:48:34 +01:00
|
|
|
|
2018-02-06 19:45:58 +01:00
|
|
|
final JsonObject renderer = captions.getObject("playerCaptionsTracklistRenderer", new JsonObject());
|
|
|
|
final JsonArray captionsArray = renderer.getArray("captionTracks", new JsonArray());
|
2018-02-02 07:51:53 +01:00
|
|
|
// todo: use this to apply auto translation to different language from a source language
|
2018-02-06 19:45:58 +01:00
|
|
|
final JsonArray autoCaptionsArray = renderer.getArray("translationLanguages", new JsonArray());
|
2018-02-02 06:48:34 +01:00
|
|
|
|
2018-02-06 19:45:58 +01:00
|
|
|
// This check is necessary since there may be cases where subtitles metadata do not contain caption track info
|
|
|
|
// e.g. https://www.youtube.com/watch?v=-Vpwatutnko
|
2018-02-02 06:48:34 +01:00
|
|
|
final int captionsSize = captionsArray.size();
|
|
|
|
if(captionsSize == 0) return Collections.emptyList();
|
|
|
|
|
2018-02-02 08:24:22 +01:00
|
|
|
List<SubtitlesInfo> result = new ArrayList<>();
|
2018-02-02 06:48:34 +01:00
|
|
|
for (int i = 0; i < captionsSize; i++) {
|
2018-02-02 07:51:53 +01:00
|
|
|
final String languageCode = captionsArray.getObject(i).getString("languageCode");
|
|
|
|
final String baseUrl = captionsArray.getObject(i).getString("baseUrl");
|
2018-02-06 19:45:58 +01:00
|
|
|
final String vssId = captionsArray.getObject(i).getString("vssId");
|
2018-02-02 07:51:53 +01:00
|
|
|
|
2018-02-06 19:45:58 +01:00
|
|
|
if (languageCode != null && baseUrl != null && vssId != null) {
|
|
|
|
final boolean isAutoGenerated = vssId.startsWith("a.");
|
|
|
|
result.add(new SubtitlesInfo(baseUrl, languageCode, isAutoGenerated));
|
|
|
|
}
|
2018-02-01 22:27:14 +01:00
|
|
|
}
|
2018-02-02 06:48:34 +01:00
|
|
|
|
|
|
|
return result;
|
2018-02-01 22:27:14 +01:00
|
|
|
}
|
2017-12-18 23:05:58 +01:00
|
|
|
/*//////////////////////////////////////////////////////////////////////////
|
|
|
|
// Data Class
|
|
|
|
//////////////////////////////////////////////////////////////////////////*/
|
|
|
|
|
|
|
|
private class EmbeddedInfo {
|
|
|
|
final String url;
|
|
|
|
final String sts;
|
|
|
|
|
|
|
|
EmbeddedInfo(final String url, final String sts) {
|
|
|
|
this.url = url;
|
|
|
|
this.sts = sts;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-02-02 08:24:22 +01:00
|
|
|
private class SubtitlesInfo {
|
|
|
|
final String cleanUrl;
|
|
|
|
final String languageCode;
|
|
|
|
final boolean isGenerated;
|
|
|
|
|
|
|
|
public SubtitlesInfo(final String baseUrl, final String languageCode, final boolean isGenerated) {
|
|
|
|
this.cleanUrl = baseUrl
|
|
|
|
.replaceAll("&fmt=[^&]*", "") // Remove preexisting format if exists
|
|
|
|
.replaceAll("&tlang=[^&]*", ""); // Remove translation language
|
|
|
|
this.languageCode = languageCode;
|
|
|
|
this.isGenerated = isGenerated;
|
|
|
|
}
|
|
|
|
|
2018-09-24 21:04:22 +02:00
|
|
|
public SubtitlesStream getSubtitle(final MediaFormat format) {
|
|
|
|
return new SubtitlesStream(format, languageCode, cleanUrl + "&fmt=" + format.getSuffix(), isGenerated);
|
2018-02-02 08:24:22 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-08-10 19:50:59 +02:00
|
|
|
/*//////////////////////////////////////////////////////////////////////////
|
|
|
|
// Utils
|
|
|
|
//////////////////////////////////////////////////////////////////////////*/
|
|
|
|
|
2017-12-18 23:05:58 +01:00
|
|
|
@Nonnull
|
2018-02-01 22:27:14 +01:00
|
|
|
private static String getVideoInfoUrl(final String id, final String sts) {
|
2017-12-18 23:05:58 +01:00
|
|
|
return "https://www.youtube.com/get_video_info?" + "video_id=" + id +
|
|
|
|
"&eurl=https://youtube.googleapis.com/v/" + id +
|
|
|
|
"&sts=" + sts + "&ps=default&gl=US&hl=en";
|
|
|
|
}
|
|
|
|
|
2019-09-11 19:05:41 +02:00
|
|
|
private Map<String, ItagItem> getItags(String streamingDataKey, ItagItem.ItagType itagTypeWanted) throws ParsingException {
|
2017-08-10 19:50:59 +02:00
|
|
|
Map<String, ItagItem> urlAndItags = new LinkedHashMap<>();
|
2019-09-12 15:08:17 +02:00
|
|
|
JsonObject streamingData = playerResponse.getObject("streamingData");
|
|
|
|
if (!streamingData.has(streamingDataKey)) {
|
|
|
|
return urlAndItags;
|
2017-08-10 19:50:59 +02:00
|
|
|
}
|
|
|
|
|
2019-09-12 15:08:17 +02:00
|
|
|
JsonArray formats = streamingData.getArray(streamingDataKey);
|
2019-09-11 19:05:41 +02:00
|
|
|
for (int i = 0; i != formats.size(); ++i) {
|
|
|
|
JsonObject formatData = formats.getObject(i);
|
|
|
|
int itag = formatData.getInt("itag");
|
2017-08-10 19:50:59 +02:00
|
|
|
|
2019-09-11 19:05:41 +02:00
|
|
|
if (ItagItem.isSupported(itag)) {
|
2019-09-11 19:56:16 +02:00
|
|
|
try {
|
2017-08-10 19:50:59 +02:00
|
|
|
ItagItem itagItem = ItagItem.getItag(itag);
|
|
|
|
if (itagItem.itagType == itagTypeWanted) {
|
2019-09-11 19:56:16 +02:00
|
|
|
String streamUrl;
|
|
|
|
if (formatData.has("url")) {
|
|
|
|
streamUrl = formatData.getString("url");
|
|
|
|
} else {
|
|
|
|
// this url has an encrypted signature
|
|
|
|
Map<String, String> cipher = Parser.compatParseMap(formatData.getString("cipher"));
|
|
|
|
streamUrl = cipher.get("url") + "&" + cipher.get("sp") + "=" + decryptSignature(cipher.get("s"), decryptionCode);
|
2017-08-10 19:50:59 +02:00
|
|
|
}
|
2019-09-11 19:56:16 +02:00
|
|
|
|
2017-08-10 19:50:59 +02:00
|
|
|
urlAndItags.put(streamUrl, itagItem);
|
|
|
|
}
|
2019-09-11 19:56:16 +02:00
|
|
|
} catch (UnsupportedEncodingException ignored) {
|
|
|
|
|
2017-08-10 19:50:59 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return urlAndItags;
|
|
|
|
}
|
|
|
|
|
2017-05-27 14:23:48 +02:00
|
|
|
/**
|
2017-07-11 05:08:03 +02:00
|
|
|
* Provides information about links to other videos on the video page, such as related videos.
|
2017-08-10 19:50:59 +02:00
|
|
|
* This is encapsulated in a StreamInfoItem object, which is a subset of the fields in a full StreamInfo.
|
2017-05-27 14:23:48 +02:00
|
|
|
*/
|
2019-04-28 22:03:16 +02:00
|
|
|
private StreamInfoItemExtractor extractVideoPreviewInfo(final Element li, final TimeAgoParser timeAgoParser) {
|
2019-10-02 07:02:01 +02:00
|
|
|
return new YoutubeStreamInfoItemExtractor(li, timeAgoParser) {
|
2017-05-27 14:23:48 +02:00
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
@Override
|
2017-08-11 20:21:49 +02:00
|
|
|
public String getUrl() throws ParsingException {
|
2017-07-11 05:08:03 +02:00
|
|
|
return li.select("a.content-link").first().attr("abs:href");
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
2017-08-11 20:21:49 +02:00
|
|
|
public String getName() throws ParsingException {
|
2017-07-11 05:08:03 +02:00
|
|
|
//todo: check NullPointerException causing
|
|
|
|
return li.select("span.title").first().text();
|
|
|
|
//this page causes the NullPointerException, after finding it by searching for "tjvg":
|
|
|
|
//https://www.youtube.com/watch?v=Uqg0aEhLFAg
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
2017-08-10 04:50:29 +02:00
|
|
|
public String getUploaderName() throws ParsingException {
|
2017-10-31 14:10:52 +01:00
|
|
|
return li.select("span[class*=\"attribution\"").first()
|
|
|
|
.select("span").first().text();
|
2017-07-11 05:08:03 +02:00
|
|
|
}
|
|
|
|
|
2017-11-26 17:12:20 +01:00
|
|
|
@Override
|
|
|
|
public String getUploaderUrl() throws ParsingException {
|
|
|
|
return ""; // The uploader is not linked
|
|
|
|
}
|
|
|
|
|
2017-07-11 05:08:03 +02:00
|
|
|
@Override
|
2019-10-02 07:02:01 +02:00
|
|
|
public String getTextualUploadDate() throws ParsingException {
|
2017-08-10 19:50:59 +02:00
|
|
|
return "";
|
2017-07-11 05:08:03 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
|
|
|
public String getThumbnailUrl() throws ParsingException {
|
|
|
|
Element img = li.select("img").first();
|
|
|
|
String thumbnailUrl = img.attr("abs:src");
|
|
|
|
// Sometimes youtube sends links to gif files which somehow seem to not exist
|
|
|
|
// anymore. Items with such gif also offer a secondary image source. So we are going
|
|
|
|
// to use that if we caught such an item.
|
|
|
|
if (thumbnailUrl.contains(".gif")) {
|
|
|
|
thumbnailUrl = img.attr("data-thumb");
|
|
|
|
}
|
|
|
|
if (thumbnailUrl.startsWith("//")) {
|
|
|
|
thumbnailUrl = HTTPS + thumbnailUrl;
|
|
|
|
}
|
|
|
|
return thumbnailUrl;
|
|
|
|
}
|
|
|
|
};
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|
2019-08-26 18:14:09 +02:00
|
|
|
|
2019-09-10 18:38:51 +02:00
|
|
|
@Nonnull
|
|
|
|
@Override
|
|
|
|
public List<Frameset> getFrames() throws ExtractionException {
|
|
|
|
try {
|
|
|
|
final String script = doc.select("#player-api").first().siblingElements().select("script").html();
|
|
|
|
int p = script.indexOf("ytplayer.config");
|
|
|
|
if (p == -1) {
|
|
|
|
return Collections.emptyList();
|
|
|
|
}
|
|
|
|
p = script.indexOf('{', p);
|
|
|
|
int e = script.indexOf("ytplayer.load", p);
|
|
|
|
if (e == -1) {
|
|
|
|
return Collections.emptyList();
|
|
|
|
}
|
|
|
|
JsonObject jo = JsonParser.object().from(script.substring(p, e - 1));
|
|
|
|
final String resp = jo.getObject("args").getString("player_response");
|
|
|
|
jo = JsonParser.object().from(resp);
|
|
|
|
final String[] spec = jo.getObject("storyboards").getObject("playerStoryboardSpecRenderer").getString("spec").split("\\|");
|
|
|
|
final String url = spec[0];
|
|
|
|
final ArrayList<Frameset> result = new ArrayList<>(spec.length - 1);
|
|
|
|
for (int i = 1; i < spec.length; ++i) {
|
|
|
|
final String[] parts = spec[i].split("#");
|
|
|
|
if (parts.length != 8) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
final int frameWidth = Integer.parseInt(parts[0]);
|
|
|
|
final int frameHeight = Integer.parseInt(parts[1]);
|
|
|
|
final int totalCount = Integer.parseInt(parts[2]);
|
|
|
|
final int framesPerPageX = Integer.parseInt(parts[3]);
|
|
|
|
final int framesPerPageY = Integer.parseInt(parts[4]);
|
|
|
|
final String baseUrl = url.replace("$L", String.valueOf(i - 1)).replace("$N", parts[6]) + "&sigh=" + parts[7];
|
|
|
|
final List<String> urls;
|
|
|
|
if (baseUrl.contains("$M")) {
|
|
|
|
final int totalPages = (int) Math.ceil(totalCount / (double) (framesPerPageX * framesPerPageY));
|
|
|
|
urls = new ArrayList<>(totalPages);
|
|
|
|
for (int j = 0; j < totalPages; j++) {
|
|
|
|
urls.add(baseUrl.replace("$M", String.valueOf(j)));
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
urls = Collections.singletonList(baseUrl);
|
|
|
|
}
|
|
|
|
result.add(new Frameset(
|
|
|
|
urls,
|
|
|
|
frameWidth,
|
|
|
|
frameHeight,
|
|
|
|
totalCount,
|
|
|
|
framesPerPageX,
|
|
|
|
framesPerPageY
|
|
|
|
));
|
|
|
|
}
|
|
|
|
result.trimToSize();
|
|
|
|
return result;
|
|
|
|
} catch (Exception e) {
|
|
|
|
throw new ExtractionException(e);
|
|
|
|
}
|
|
|
|
}
|
2017-03-01 18:47:52 +01:00
|
|
|
}
|