mirror of
https://github.com/TeamNewPipe/NewPipe
synced 2025-01-11 09:50:32 +00:00
YTStreamExtractor: add support for age restricted
YouTube age restricted videos are now kind of supported. This is not a final solution to this problem and this commit still crashes because of some problem with the thumbnail.
This commit is contained in:
parent
d8281aeb34
commit
4d727245e1
@ -24,6 +24,8 @@ import java.io.IOException;
|
|||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
import java.util.Vector;
|
import java.util.Vector;
|
||||||
|
import java.util.regex.Matcher;
|
||||||
|
import java.util.regex.Pattern;
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Created by Christian Schabesberger on 06.08.15.
|
* Created by Christian Schabesberger on 06.08.15.
|
||||||
@ -160,7 +162,8 @@ public class YoutubeStreamExtractor implements StreamExtractor {
|
|||||||
private static final String TAG = YoutubeStreamExtractor.class.toString();
|
private static final String TAG = YoutubeStreamExtractor.class.toString();
|
||||||
private final Document doc;
|
private final Document doc;
|
||||||
private JSONObject playerArgs;
|
private JSONObject playerArgs;
|
||||||
//private Map<String, String> videoInfoPage;
|
private boolean isAgeRestricted;
|
||||||
|
private Map<String, String> videoInfoPage;
|
||||||
|
|
||||||
// static values
|
// static values
|
||||||
private static final String DECRYPTION_FUNC_NAME="decrypt";
|
private static final String DECRYPTION_FUNC_NAME="decrypt";
|
||||||
@ -180,42 +183,37 @@ public class YoutubeStreamExtractor implements StreamExtractor {
|
|||||||
String pageContent = downloader.download(urlidhandler.cleanUrl(pageUrl));
|
String pageContent = downloader.download(urlidhandler.cleanUrl(pageUrl));
|
||||||
doc = Jsoup.parse(pageContent, pageUrl);
|
doc = Jsoup.parse(pageContent, pageUrl);
|
||||||
String ytPlayerConfigRaw;
|
String ytPlayerConfigRaw;
|
||||||
JSONObject ytPlayerConfig;
|
JSONObject ytPlayerConfig = new JSONObject();
|
||||||
|
|
||||||
//attempt to load the youtube js player JSON arguments
|
// Check if the video is age restricted
|
||||||
try {
|
if (pageContent.contains("<meta property=\"og:restrictions:age")) {
|
||||||
ytPlayerConfigRaw =
|
String videoInfoUrl = GET_VIDEO_INFO_URL.replace("%%video_id%%",
|
||||||
Parser.matchGroup1("ytplayer.config\\s*=\\s*(\\{.*?\\});", pageContent);
|
|
||||||
ytPlayerConfig = new JSONObject(ytPlayerConfigRaw);
|
|
||||||
playerArgs = ytPlayerConfig.getJSONObject("args");
|
|
||||||
} catch (Parser.RegexException e) {
|
|
||||||
String errorReason = findErrorReason(doc);
|
|
||||||
switch(errorReason) {
|
|
||||||
case "GEMA":
|
|
||||||
throw new GemaException(errorReason);
|
|
||||||
case "":
|
|
||||||
throw new ParsingException("player config empty", e);
|
|
||||||
default:
|
|
||||||
throw new ContentNotAvailableException("Content not available", e);
|
|
||||||
}
|
|
||||||
} catch (JSONException e) {
|
|
||||||
throw new ParsingException("Could not parse yt player config");
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
/* not yet nececeary
|
|
||||||
|
|
||||||
|
|
||||||
// get videoInfo page
|
|
||||||
try {
|
|
||||||
//Parser.unescapeEntities(url_data_str, true).split("&")
|
|
||||||
String getVideoInfoUrl = GET_VIDEO_INFO_URL.replace("%%video_id%%",
|
|
||||||
urlidhandler.getVideoId(pageUrl)).replace("$$el_type$$", "&" + EL_INFO);
|
urlidhandler.getVideoId(pageUrl)).replace("$$el_type$$", "&" + EL_INFO);
|
||||||
videoInfoPage = Parser.compatParseMap(downloader.download(getVideoInfoUrl));
|
String videoInfoPageString = downloader.download(videoInfoUrl);
|
||||||
} catch(Exception e) {
|
videoInfoPage = Parser.compatParseMap(videoInfoPageString);
|
||||||
throw new ParsingException("Could not load video info page.", e);
|
isAgeRestricted = true;
|
||||||
|
} else {
|
||||||
|
//attempt to load the youtube js player JSON arguments
|
||||||
|
try {
|
||||||
|
ytPlayerConfigRaw =
|
||||||
|
Parser.matchGroup1("ytplayer.config\\s*=\\s*(\\{.*?\\});", pageContent);
|
||||||
|
ytPlayerConfig = new JSONObject(ytPlayerConfigRaw);
|
||||||
|
playerArgs = ytPlayerConfig.getJSONObject("args");
|
||||||
|
isAgeRestricted = false;
|
||||||
|
} catch (Parser.RegexException e) {
|
||||||
|
String errorReason = findErrorReason(doc);
|
||||||
|
switch(errorReason) {
|
||||||
|
case "GEMA":
|
||||||
|
throw new GemaException(errorReason);
|
||||||
|
case "":
|
||||||
|
throw new ParsingException("player config empty", e);
|
||||||
|
default:
|
||||||
|
throw new ContentNotAvailableException("Content not available", e);
|
||||||
|
}
|
||||||
|
} catch (JSONException e) {
|
||||||
|
throw new ParsingException("Could not parse yt player config");
|
||||||
|
}
|
||||||
}
|
}
|
||||||
*/
|
|
||||||
|
|
||||||
//----------------------------------
|
//----------------------------------
|
||||||
// load and parse description code, if it isn't already initialised
|
// load and parse description code, if it isn't already initialised
|
||||||
@ -225,9 +223,21 @@ public class YoutubeStreamExtractor implements StreamExtractor {
|
|||||||
// The Youtube service needs to be initialized by downloading the
|
// The Youtube service needs to be initialized by downloading the
|
||||||
// js-Youtube-player. This is done in order to get the algorithm
|
// js-Youtube-player. This is done in order to get the algorithm
|
||||||
// for decrypting cryptic signatures inside certain stream urls.
|
// for decrypting cryptic signatures inside certain stream urls.
|
||||||
JSONObject ytAssets = ytPlayerConfig.getJSONObject("assets");
|
String playerUrl = "";
|
||||||
String playerUrl = ytAssets.getString("js");
|
if (isAgeRestricted) {
|
||||||
|
String videoId = urlidhandler.getVideoId(pageUrl);
|
||||||
|
String embedUrl = "https://www.youtube.com/embed/" + videoId;
|
||||||
|
String embedPageContent = downloader.download(embedUrl);
|
||||||
|
Pattern assetsPattern = Pattern.compile("\"assets\":.+?\"js\":\\s*(\"[^\"]+\")");
|
||||||
|
Matcher patternMatcher = assetsPattern.matcher(embedPageContent);
|
||||||
|
while (patternMatcher.find()) {
|
||||||
|
playerUrl = patternMatcher.group(1);
|
||||||
|
}
|
||||||
|
playerUrl = playerUrl.replace("\\", "").replace("\"", "");
|
||||||
|
} else {
|
||||||
|
JSONObject ytAssets = ytPlayerConfig.getJSONObject("assets");
|
||||||
|
playerUrl = ytAssets.getString("js");
|
||||||
|
}
|
||||||
if (playerUrl.startsWith("//")) {
|
if (playerUrl.startsWith("//")) {
|
||||||
playerUrl = "https:" + playerUrl;
|
playerUrl = "https:" + playerUrl;
|
||||||
}
|
}
|
||||||
@ -241,7 +251,11 @@ public class YoutubeStreamExtractor implements StreamExtractor {
|
|||||||
|
|
||||||
@Override
|
@Override
|
||||||
public String getTitle() throws ParsingException {
|
public String getTitle() throws ParsingException {
|
||||||
try {//json player args method
|
try {
|
||||||
|
if (playerArgs == null) {
|
||||||
|
return videoInfoPage.get("title");
|
||||||
|
}
|
||||||
|
//json player args method
|
||||||
return playerArgs.getString("title");
|
return playerArgs.getString("title");
|
||||||
} catch(JSONException je) {//html <meta> method
|
} catch(JSONException je) {//html <meta> method
|
||||||
je.printStackTrace();
|
je.printStackTrace();
|
||||||
@ -265,7 +279,11 @@ public class YoutubeStreamExtractor implements StreamExtractor {
|
|||||||
|
|
||||||
@Override
|
@Override
|
||||||
public String getUploader() throws ParsingException {
|
public String getUploader() throws ParsingException {
|
||||||
try {//json player args method
|
try {
|
||||||
|
if (playerArgs == null) {
|
||||||
|
return videoInfoPage.get("author");
|
||||||
|
}
|
||||||
|
//json player args method
|
||||||
return playerArgs.getString("author");
|
return playerArgs.getString("author");
|
||||||
} catch(JSONException je) {
|
} catch(JSONException je) {
|
||||||
je.printStackTrace();
|
je.printStackTrace();
|
||||||
@ -281,6 +299,9 @@ public class YoutubeStreamExtractor implements StreamExtractor {
|
|||||||
@Override
|
@Override
|
||||||
public int getLength() throws ParsingException {
|
public int getLength() throws ParsingException {
|
||||||
try {
|
try {
|
||||||
|
if (playerArgs == null) {
|
||||||
|
return Integer.valueOf(videoInfoPage.get("length_seconds"));
|
||||||
|
}
|
||||||
return playerArgs.getInt("length_seconds");
|
return playerArgs.getInt("length_seconds");
|
||||||
} catch (JSONException e) {//todo: find fallback method
|
} catch (JSONException e) {//todo: find fallback method
|
||||||
throw new ParsingException("failed to load video duration from JSON args", e);
|
throw new ParsingException("failed to load video duration from JSON args", e);
|
||||||
@ -321,6 +342,9 @@ public class YoutubeStreamExtractor implements StreamExtractor {
|
|||||||
} catch (JSONException je) {
|
} catch (JSONException je) {
|
||||||
throw new ParsingException(
|
throw new ParsingException(
|
||||||
"failed to extract thumbnail URL from JSON args; trying to extract it from HTML", je);
|
"failed to extract thumbnail URL from JSON args; trying to extract it from HTML", je);
|
||||||
|
} catch (NullPointerException ne) {
|
||||||
|
// Get from the video info page instead
|
||||||
|
return videoInfoPage.get("thumbnail_url");
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -361,7 +385,12 @@ public class YoutubeStreamExtractor implements StreamExtractor {
|
|||||||
public List<VideoInfo.AudioStream> getAudioStreams() throws ParsingException {
|
public List<VideoInfo.AudioStream> getAudioStreams() throws ParsingException {
|
||||||
Vector<VideoInfo.AudioStream> audioStreams = new Vector<>();
|
Vector<VideoInfo.AudioStream> audioStreams = new Vector<>();
|
||||||
try{
|
try{
|
||||||
String encoded_url_map = playerArgs.getString("adaptive_fmts");
|
String encoded_url_map;
|
||||||
|
if (videoInfoPage == null) {
|
||||||
|
encoded_url_map = videoInfoPage.get("adaptive_fmts");
|
||||||
|
} else {
|
||||||
|
encoded_url_map = playerArgs.getString("adaptive_fmts");
|
||||||
|
}
|
||||||
for(String url_data_str : encoded_url_map.split(",")) {
|
for(String url_data_str : encoded_url_map.split(",")) {
|
||||||
// This loop iterates through multiple streams, therefor tags
|
// This loop iterates through multiple streams, therefor tags
|
||||||
// is related to one and the same stream at a time.
|
// is related to one and the same stream at a time.
|
||||||
@ -398,7 +427,12 @@ public class YoutubeStreamExtractor implements StreamExtractor {
|
|||||||
Vector<VideoInfo.VideoStream> videoStreams = new Vector<>();
|
Vector<VideoInfo.VideoStream> videoStreams = new Vector<>();
|
||||||
|
|
||||||
try{
|
try{
|
||||||
String encoded_url_map = playerArgs.getString("url_encoded_fmt_stream_map");
|
String encoded_url_map;
|
||||||
|
if (playerArgs == null) {
|
||||||
|
encoded_url_map = videoInfoPage.get("url_encoded_fmt_stream_map");
|
||||||
|
} else {
|
||||||
|
encoded_url_map = playerArgs.getString("url_encoded_fmt_stream_map");
|
||||||
|
}
|
||||||
for(String url_data_str : encoded_url_map.split(",")) {
|
for(String url_data_str : encoded_url_map.split(",")) {
|
||||||
try {
|
try {
|
||||||
// This loop iterates through multiple streams, therefor tags
|
// This loop iterates through multiple streams, therefor tags
|
||||||
@ -504,6 +538,9 @@ public class YoutubeStreamExtractor implements StreamExtractor {
|
|||||||
@Override
|
@Override
|
||||||
public String getAverageRating() throws ParsingException {
|
public String getAverageRating() throws ParsingException {
|
||||||
try {
|
try {
|
||||||
|
if (playerArgs == null) {
|
||||||
|
videoInfoPage.get("avg_rating");
|
||||||
|
}
|
||||||
return playerArgs.getString("avg_rating");
|
return playerArgs.getString("avg_rating");
|
||||||
} catch (JSONException e) {
|
} catch (JSONException e) {
|
||||||
throw new ParsingException("Could not get Average rating", e);
|
throw new ParsingException("Could not get Average rating", e);
|
||||||
|
Loading…
Reference in New Issue
Block a user