NewPipeExtractor/extractor/src/main/java/org/schabi/newpipe/extractor/services/youtube/extractors/YoutubeTrendingExtractor.java

/*
 * Created by Christian Schabesberger on 12.08.17.
 *
 * Copyright (C) Christian Schabesberger 2018 <chris.schabesberger@mailbox.org>
 * YoutubeTrendingExtractor.java is part of NewPipe Extractor.
 *
 * NewPipe Extractor is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * NewPipe Extractor is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with NewPipe Extractor. If not, see <https://www.gnu.org/licenses/>.
 */

package org.schabi.newpipe.extractor.services.youtube.extractors;

import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.getJsonPostResponse;
import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.getTextAtKey;
import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.prepareDesktopJsonBuilder;
import static org.schabi.newpipe.extractor.utils.Utils.isNullOrEmpty;

import com.grack.nanojson.JsonObject;
import com.grack.nanojson.JsonWriter;

import org.schabi.newpipe.extractor.Page;
import org.schabi.newpipe.extractor.StreamingService;
import org.schabi.newpipe.extractor.downloader.Downloader;
import org.schabi.newpipe.extractor.exceptions.ExtractionException;
import org.schabi.newpipe.extractor.exceptions.ParsingException;
import org.schabi.newpipe.extractor.kiosk.KioskExtractor;
import org.schabi.newpipe.extractor.linkhandler.ListLinkHandler;
import org.schabi.newpipe.extractor.localization.TimeAgoParser;
import org.schabi.newpipe.extractor.stream.StreamInfoItem;
import org.schabi.newpipe.extractor.stream.StreamInfoItemsCollector;

import java.io.IOException;
import java.nio.charset.StandardCharsets;

import javax.annotation.Nonnull;

public class YoutubeTrendingExtractor extends KioskExtractor<StreamInfoItem> {
    private JsonObject initialData;

    public YoutubeTrendingExtractor(final StreamingService service,
                                    final ListLinkHandler linkHandler,
                                    final String kioskId) {
        super(service, linkHandler, kioskId);
    }

    @Override
    public void onFetchPage(@Nonnull final Downloader downloader)
            throws IOException, ExtractionException {
        // @formatter:off
        final byte[] body = JsonWriter.string(prepareDesktopJsonBuilder(getExtractorLocalization(),
                getExtractorContentCountry())
                .value("browseId", "FEtrending")
                .done())
                .getBytes(StandardCharsets.UTF_8);
        // @formatter:on

        initialData = getJsonPostResponse("browse", body, getExtractorLocalization());
    }

    @Override
    public InfoItemsPage<StreamInfoItem> getPage(final Page page) {
        return InfoItemsPage.emptyPage();
    }

    @Nonnull
    @Override
    public String getName() throws ParsingException {
        final JsonObject header = initialData.getObject("header");
        String name = null;
        if (header.has("feedTabbedHeaderRenderer")) {
            name = getTextAtKey(header.getObject("feedTabbedHeaderRenderer"), "title");
        } else if (header.has("c4TabbedHeaderRenderer")) {
            name = getTextAtKey(header.getObject("c4TabbedHeaderRenderer"), "title");
        }

        if (isNullOrEmpty(name)) {
            throw new ParsingException("Could not get Trending name");
        }
        return name;
    }

    @Nonnull
    @Override
    public InfoItemsPage<StreamInfoItem> getInitialPage() throws ParsingException {
        final StreamInfoItemsCollector collector = new StreamInfoItemsCollector(getServiceId());
        final TimeAgoParser timeAgoParser = getTimeAgoParser();
        final JsonObject tabContent = getTrendingTabContent();

        if (tabContent.has("richGridRenderer")) {
            tabContent.getObject("richGridRenderer")
                    .getArray("contents")
                    .stream()
                    .filter(JsonObject.class::isInstance)
                    .map(JsonObject.class::cast)
                    // Filter Trending shorts and Recently trending sections
                    .filter(content -> content.has("richItemRenderer"))
                    .map(content -> content.getObject("richItemRenderer")
                            .getObject("content")
                            .getObject("videoRenderer"))
                    .forEachOrdered(videoRenderer -> collector.commit(
                            new YoutubeStreamInfoItemExtractor(videoRenderer, timeAgoParser)));
        } else if (tabContent.has("sectionListRenderer")) {
            tabContent.getObject("sectionListRenderer")
                    .getArray("contents")
                    .stream()
                    .filter(JsonObject.class::isInstance)
                    .map(JsonObject.class::cast)
                    .flatMap(content -> content.getObject("itemSectionRenderer")
                            .getArray("contents")
                            .stream())
                    .filter(JsonObject.class::isInstance)
                    .map(JsonObject.class::cast)
                    .map(content -> content.getObject("shelfRenderer"))
                    // Filter Trending shorts and Recently trending sections which have a title,
                    // contrary to normal trends
                    .filter(shelfRenderer -> !shelfRenderer.has("title"))
                    .flatMap(shelfRenderer -> shelfRenderer.getObject("content")
                            .getObject("expandedShelfContentsRenderer")
                            .getArray("items")
                            .stream())
                    .filter(JsonObject.class::isInstance)
                    .map(JsonObject.class::cast)
                    .map(item -> item.getObject("videoRenderer"))
                    .forEachOrdered(videoRenderer -> collector.commit(
                            new YoutubeStreamInfoItemExtractor(videoRenderer, timeAgoParser)));
        }

        return new InfoItemsPage<>(collector, null);
    }

    private JsonObject getTrendingTabContent() throws ParsingException {
        return initialData.getObject("contents")
                .getObject("twoColumnBrowseResultsRenderer")
                .getArray("tabs")
                .stream()
                .filter(JsonObject.class::isInstance)
                .map(JsonObject.class::cast)
                .map(tab -> tab.getObject("tabRenderer"))
                .filter(tabRenderer -> tabRenderer.getBoolean("selected"))
                .filter(tabRenderer -> tabRenderer.has("content"))
                // There should be at most one tab selected
                .findFirst()
                .orElseThrow(() -> new ParsingException("Could not get \"Now\" trending tab"))
                .getObject("content");
    }
}
Fix license. 2022-11-09 04:34:16 +01:00			`/*`
			`* Created by Christian Schabesberger on 12.08.17.`
			`*`
			`* Copyright (C) Christian Schabesberger 2018 <chris.schabesberger@mailbox.org>`
			`* YoutubeTrendingExtractor.java is part of NewPipe Extractor.`
			`*`
			`* NewPipe Extractor is free software: you can redistribute it and/or modify`
			`* it under the terms of the GNU General Public License as published by`
			`* the Free Software Foundation, either version 3 of the License, or`
			`* (at your option) any later version.`
			`*`
			`* NewPipe Extractor is distributed in the hope that it will be useful,`
			`* but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`* GNU General Public License for more details.`
			`*`
			`* You should have received a copy of the GNU General Public License`
			`* along with NewPipe Extractor. If not, see <https://www.gnu.org/licenses/>.`
			`*/`

Add Utils methods for URL encoding/decoding using UTF-8. 2022-08-09 04:03:29 +02:00			`package org.schabi.newpipe.extractor.services.youtube.extractors;`
add youtube trending extractor 2017-08-12 21:10:21 +02:00
Use StandardCharsets.UTF_8. 2022-07-28 04:19:21 +02:00			`import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.getJsonPostResponse;`
			`import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.getTextAtKey;`
			`import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.prepareDesktopJsonBuilder;`
			`import static org.schabi.newpipe.extractor.utils.Utils.isNullOrEmpty;`
[YouTube] Support new trending structure and filter recently trending section This new structure allow us to filter easily Trending shorts and Recently trending sections. On the previous one, this Recently trending section is now filtered, by checking whether sections have a title, which isn't the case for normal trends contrary to the other ones. This makes that the extractor returns now only the real 50 "Now" YouTube trends. Elements inside arrays are now extracted dynamically instead of only the ones of the first index, using Java 8's Stream API. The getInitialPage() method of YoutubeTrendingExtractor can now throw a ParsingException if no selected tab (corresponding to the one of the trends type extracted) has been found. Finally, the licence header has been moved to the top of the file and updated. 2022-08-28 18:20:07 +02:00
Detect disabled subriber count correctly Fix parsing of kiosk name 2020-02-17 17:30:22 +01:00			`import com.grack.nanojson.JsonObject;`
Use the youtubei API for YouTube trends 2021-04-11 17:01:43 +02:00			`import com.grack.nanojson.JsonWriter;`
Use plain YoutubeStreamInfoItemExtractor in YoutubeTrendingExtractor 2020-02-22 20:33:48 +01:00
Introduce Page class 2020-04-15 14:09:46 +02:00			`import org.schabi.newpipe.extractor.Page;`
Fix bug and some re-structure 2018-03-01 01:02:43 +01:00			`import org.schabi.newpipe.extractor.StreamingService;`
Implement time ago parser and improve localization handling - Handle special cases for languages where the number is not shown - Rework the Downloader base implementation, allowing for more advanced things to be done - Separate the localization from the content country (just like YouTube let's the user choose both). 2019-04-28 22:03:16 +02:00			`import org.schabi.newpipe.extractor.downloader.Downloader;`
add youtube trending extractor 2017-08-12 21:10:21 +02:00			`import org.schabi.newpipe.extractor.exceptions.ExtractionException;`
made YoutubeTrendingExtractor work 2017-08-13 00:58:29 +02:00			`import org.schabi.newpipe.extractor.exceptions.ParsingException;`
add youtube trending extractor 2017-08-12 21:10:21 +02:00			`import org.schabi.newpipe.extractor.kiosk.KioskExtractor;`
Implement time ago parser and improve localization handling - Handle special cases for languages where the number is not shown - Rework the Downloader base implementation, allowing for more advanced things to be done - Separate the localization from the content country (just like YouTube let's the user choose both). 2019-04-28 22:03:16 +02:00			`import org.schabi.newpipe.extractor.linkhandler.ListLinkHandler;`
			`import org.schabi.newpipe.extractor.localization.TimeAgoParser;`
Fix bug and some re-structure 2018-03-01 01:02:43 +01:00			`import org.schabi.newpipe.extractor.stream.StreamInfoItem;`
architecture refacturing 2018-02-24 22:20:50 +01:00			`import org.schabi.newpipe.extractor.stream.StreamInfoItemsCollector;`
made YoutubeTrendingExtractor work 2017-08-13 00:58:29 +02:00
add youtube trending extractor 2017-08-12 21:10:21 +02:00			`import java.io.IOException;`
Use StandardCharsets.UTF_8. 2022-07-28 04:19:21 +02:00			`import java.nio.charset.StandardCharsets;`
add youtube trending extractor 2017-08-12 21:10:21 +02:00
Use plain YoutubeStreamInfoItemExtractor in YoutubeTrendingExtractor 2020-02-22 20:33:48 +01:00			`import javax.annotation.Nonnull;`

add kiosk for conferences 2019-01-28 12:18:16 +01:00			`public class YoutubeTrendingExtractor extends KioskExtractor<StreamInfoItem> {`
Detect disabled subriber count correctly Fix parsing of kiosk name 2020-02-17 17:30:22 +01:00			`private JsonObject initialData;`
made YoutubeTrendingExtractor work 2017-08-13 00:58:29 +02:00
Use the youtubei API for YouTube trends 2021-04-11 17:01:43 +02:00			`public YoutubeTrendingExtractor(final StreamingService service,`
			`final ListLinkHandler linkHandler,`
			`final String kioskId) {`
Implement time ago parser and improve localization handling - Handle special cases for languages where the number is not shown - Rework the Downloader base implementation, allowing for more advanced things to be done - Separate the localization from the content country (just like YouTube let's the user choose both). 2019-04-28 22:03:16 +02:00			`super(service, linkHandler, kioskId);`
add youtube trending extractor 2017-08-12 21:10:21 +02:00			`}`

			`@Override`
[YouTube] Fix checkstyle issues 2022-03-18 15:09:06 +01:00			`public void onFetchPage(@Nonnull final Downloader downloader)`
			`throws IOException, ExtractionException {`
Use the youtubei API for YouTube trends 2021-04-11 17:01:43 +02:00			`// @formatter:off`
Rebase + some code improvements + fix extraction of age-restricted videos + update clients version Here is now the requests which will be made by the `onFetchPage` method of `YoutubeStreamExtractor`: - the desktop API is fetched. If there is no streaming data, the desktop player API with the embed client screen will be fetched (and also the player code), then the Android mobile API. - if there is no streaming data, a `ContentNotAvailableException` will be thrown by using the message provided in playability status If the video is age restricted, a request to the next endpoint of the desktop player with the embed client screen will be sent. Otherwise, the next endpoint will be fetched normally, if the content is available. If the video is not age-restricted, a request to the player endpoint of the Android mobile API will be made. We can get more streams by using the Android mobile API but some streams may be not available on this API, so the streaming data of the Android mobile API will be first used to get itags and then the streaming data of the desktop internal API will be used. If the parsing of the Android mobile API went wrong, only the streams of the desktop API will be used. Other code changes: - `prepareJsonBuilder` in `YoutubeParsingHelper` was renamed to `prepareDesktopJsonBuilder` - `prepareMobileJsonBuilder` in `YoutubeParsingHelper` was renamed to `prepareAndroidMobileJsonBuilder` - two new methods in `YoutubeParsingHelper` were added: `prepareDesktopEmbedVideoJsonBuilder` and `prepareAndroidMobileEmbedVideoJsonBuilder` - `createPlayerBodyWithSts` is now public and was moved to `YoutubeParsingHelper` - a new method in `YoutubeJavaScriptExtractor` was added: `resetJavaScriptCode`, which was needed for the method `resetDebofuscationCode` of `YoutubeStreamExtractor` - `areHardcodedClientVersionAndKeyValid` in `YoutubeParsingHelper` returns now a `boolean` instead of an `Optional<Boolean>` - the `fetchVideoInfoPage` method of `YoutubeStreamExtractor` was removed because YouTube returns now 404 for every client with the `get_video_info` page - some unused objects and some warnings in `YoutubeStreamExtractor` were removed and fixed Co-authored-by: TiA4f8R <74829229+TiA4f8R@users.noreply.github.com> 2021-07-28 23:55:09 +02:00			`final byte[] body = JsonWriter.string(prepareDesktopJsonBuilder(getExtractorLocalization(),`
Fix localization and update client version 2021-04-30 19:06:56 +02:00			`getExtractorContentCountry())`
Use the youtubei API for YouTube trends 2021-04-11 17:01:43 +02:00			`.value("browseId", "FEtrending")`
Do some improvements to YoutubeStreamExtractor Get the real name of the uploader (for autogenerated channels and music artist channels), like before the migration to the JSON pbj. Do some other improvements, especially reformatting some code to be in the 100 characters line limit and use final where possible. 2021-04-15 18:58:59 +02:00			`.done())`
Use StandardCharsets.UTF_8. 2022-07-28 04:19:21 +02:00			`.getBytes(StandardCharsets.UTF_8);`
Use the youtubei API for YouTube trends 2021-04-11 17:01:43 +02:00			`// @formatter:on`

			`initialData = getJsonPostResponse("browse", body, getExtractorLocalization());`
add youtube trending extractor 2017-08-12 21:10:21 +02:00			`}`

made getPage() function be stand alone 2018-02-26 15:55:27 +01:00			`@Override`
Throw IllegalArgumentException when Page is invalid 2020-05-11 15:25:18 +02:00			`public InfoItemsPage<StreamInfoItem> getPage(final Page page) {`
			`return InfoItemsPage.emptyPage();`
add youtube trending extractor 2017-08-12 21:10:21 +02:00			`}`

Fix bugs and present some in the future 2017-11-25 01:10:04 +01:00			`@Nonnull`
remove type from kiosk and make getName() crawl the translated kiosk name 2017-09-25 12:43:40 +02:00			`@Override`
			`public String getName() throws ParsingException {`
fix tests 2021-02-12 22:22:11 +01:00			`final JsonObject header = initialData.getObject("header");`
[YouTube] Fix trending getName() 2021-03-24 09:04:43 +01:00			`String name = null;`
fix tests 2021-02-12 22:22:11 +01:00			`if (header.has("feedTabbedHeaderRenderer")) {`
[YouTube] Fix trending getName() 2021-03-24 09:04:43 +01:00			`name = getTextAtKey(header.getObject("feedTabbedHeaderRenderer"), "title");`
fix tests 2021-02-12 22:22:11 +01:00			`} else if (header.has("c4TabbedHeaderRenderer")) {`
[YouTube] Fix trending getName() 2021-03-24 09:04:43 +01:00			`name = getTextAtKey(header.getObject("c4TabbedHeaderRenderer"), "title");`
fix tests 2021-02-12 22:22:11 +01:00			`}`

[YouTube] Fix trending getName() 2021-03-24 09:04:43 +01:00			`if (isNullOrEmpty(name)) {`
			`throw new ParsingException("Could not get Trending name");`
Detect disabled subriber count correctly Fix parsing of kiosk name 2020-02-17 17:30:22 +01:00			`}`
[YouTube] Fix trending getName() 2021-03-24 09:04:43 +01:00			`return name;`
remove type from kiosk and make getName() crawl the translated kiosk name 2017-09-25 12:43:40 +02:00			`}`

Add @Nonnull annotations 2017-11-25 02:03:30 +01:00			`@Nonnull`
add youtube trending extractor 2017-08-12 21:10:21 +02:00			`@Override`
[YouTube] Support new trending structure and filter recently trending section This new structure allow us to filter easily Trending shorts and Recently trending sections. On the previous one, this Recently trending section is now filtered, by checking whether sections have a title, which isn't the case for normal trends contrary to the other ones. This makes that the extractor returns now only the real 50 "Now" YouTube trends. Elements inside arrays are now extracted dynamically instead of only the ones of the first index, using Java 8's Stream API. The getInitialPage() method of YoutubeTrendingExtractor can now throw a ParsingException if no selected tab (corresponding to the one of the trends type extracted) has been found. Finally, the licence header has been moved to the top of the file and updated. 2022-08-28 18:20:07 +02:00			`public InfoItemsPage<StreamInfoItem> getInitialPage() throws ParsingException {`
[YouTube] Fix checkstyle issues 2022-03-18 15:09:06 +01:00			`final StreamInfoItemsCollector collector = new StreamInfoItemsCollector(getServiceId());`
Implement time ago parser and improve localization handling - Handle special cases for languages where the number is not shown - Rework the Downloader base implementation, allowing for more advanced things to be done - Separate the localization from the content country (just like YouTube let's the user choose both). 2019-04-28 22:03:16 +02:00			`final TimeAgoParser timeAgoParser = getTimeAgoParser();`
[YouTube] Support new trending structure and filter recently trending section This new structure allow us to filter easily Trending shorts and Recently trending sections. On the previous one, this Recently trending section is now filtered, by checking whether sections have a title, which isn't the case for normal trends contrary to the other ones. This makes that the extractor returns now only the real 50 "Now" YouTube trends. Elements inside arrays are now extracted dynamically instead of only the ones of the first index, using Java 8's Stream API. The getInitialPage() method of YoutubeTrendingExtractor can now throw a ParsingException if no selected tab (corresponding to the one of the trends type extracted) has been found. Finally, the licence header has been moved to the top of the file and updated. 2022-08-28 18:20:07 +02:00			`final JsonObject tabContent = getTrendingTabContent();`

			`if (tabContent.has("richGridRenderer")) {`
			`tabContent.getObject("richGridRenderer")`
			`.getArray("contents")`
			`.stream()`
			`.filter(JsonObject.class::isInstance)`
			`.map(JsonObject.class::cast)`
			`// Filter Trending shorts and Recently trending sections`
			`.filter(content -> content.has("richItemRenderer"))`
			`.map(content -> content.getObject("richItemRenderer")`
			`.getObject("content")`
			`.getObject("videoRenderer"))`
			`.forEachOrdered(videoRenderer -> collector.commit(`
			`new YoutubeStreamInfoItemExtractor(videoRenderer, timeAgoParser)));`
			`} else if (tabContent.has("sectionListRenderer")) {`
			`tabContent.getObject("sectionListRenderer")`
			`.getArray("contents")`
			`.stream()`
			`.filter(JsonObject.class::isInstance)`
			`.map(JsonObject.class::cast)`
			`.flatMap(content -> content.getObject("itemSectionRenderer")`
			`.getArray("contents")`
			`.stream())`
			`.filter(JsonObject.class::isInstance)`
			`.map(JsonObject.class::cast)`
			`.map(content -> content.getObject("shelfRenderer"))`
			`// Filter Trending shorts and Recently trending sections which have a title,`
			`// contrary to normal trends`
			`.filter(shelfRenderer -> !shelfRenderer.has("title"))`
			`.flatMap(shelfRenderer -> shelfRenderer.getObject("content")`
			`.getObject("expandedShelfContentsRenderer")`
			`.getArray("items")`
			`.stream())`
			`.filter(JsonObject.class::isInstance)`
			`.map(JsonObject.class::cast)`
			`.map(item -> item.getObject("videoRenderer"))`
			`.forEachOrdered(videoRenderer -> collector.commit(`
			`new YoutubeStreamInfoItemExtractor(videoRenderer, timeAgoParser)));`
made YoutubeTrendingExtractor work 2017-08-13 00:58:29 +02:00			`}`
Remove getNextPageUrl() function from ListExtractor 2020-04-10 10:25:53 +02:00
			`return new InfoItemsPage<>(collector, null);`
add youtube trending extractor 2017-08-12 21:10:21 +02:00			`}`
[YouTube] Support new trending structure and filter recently trending section This new structure allow us to filter easily Trending shorts and Recently trending sections. On the previous one, this Recently trending section is now filtered, by checking whether sections have a title, which isn't the case for normal trends contrary to the other ones. This makes that the extractor returns now only the real 50 "Now" YouTube trends. Elements inside arrays are now extracted dynamically instead of only the ones of the first index, using Java 8's Stream API. The getInitialPage() method of YoutubeTrendingExtractor can now throw a ParsingException if no selected tab (corresponding to the one of the trends type extracted) has been found. Finally, the licence header has been moved to the top of the file and updated. 2022-08-28 18:20:07 +02:00
			`private JsonObject getTrendingTabContent() throws ParsingException {`
			`return initialData.getObject("contents")`
			`.getObject("twoColumnBrowseResultsRenderer")`
			`.getArray("tabs")`
			`.stream()`
			`.filter(JsonObject.class::isInstance)`
			`.map(JsonObject.class::cast)`
			`.map(tab -> tab.getObject("tabRenderer"))`
			`.filter(tabRenderer -> tabRenderer.getBoolean("selected"))`
			`.filter(tabRenderer -> tabRenderer.has("content"))`
			`// There should be at most one tab selected`
			`.findFirst()`
			`.orElseThrow(() -> new ParsingException("Could not get \"Now\" trending tab"))`
			`.getObject("content");`
			`}`
add youtube trending extractor 2017-08-12 21:10:21 +02:00			`}`