package org.schabi.newpipe.extractor.services.youtube; import org.jsoup.nodes.Element; import org.schabi.newpipe.extractor.AbstractStreamInfo; import org.schabi.newpipe.extractor.Parser; import org.schabi.newpipe.extractor.exceptions.FoundAdException; import org.schabi.newpipe.extractor.exceptions.ParsingException; import org.schabi.newpipe.extractor.stream_info.StreamInfoItemExtractor; /** * Copyright (C) Christian Schabesberger 2016 * YoutubeStreamInfoItemExtractor.java is part of NewPipe. * * NewPipe is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * NewPipe is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with NewPipe. If not, see . */ public class YoutubeStreamInfoItemExtractor implements StreamInfoItemExtractor { private final Element item; public YoutubeStreamInfoItemExtractor(Element item) throws FoundAdException { this.item = item; } @Override public String getWebPageUrl() throws ParsingException { try { Element el = item.select("div[class*=\"yt-lockup-video\"").first(); Element dl = el.select("h3").first().select("a").first(); return dl.attr("abs:href"); } catch (Exception e) { throw new ParsingException("Could not get web page url for the video", e); } } @Override public String getTitle() throws ParsingException { try { Element el = item.select("div[class*=\"yt-lockup-video\"").first(); Element dl = el.select("h3").first().select("a").first(); return dl.text(); } catch (Exception e) { throw new ParsingException("Could not get title", e); } } @Override public int getDuration() throws ParsingException { try { return YoutubeParsingHelper.parseDurationString( item.select("span[class=\"video-time\"]").first().text()); } catch(Exception e) { if(isLiveStream(item)) { // -1 for no duration return -1; } else { throw new ParsingException("Could not get Duration: " + getTitle(), e); } } } @Override public String getUploader() throws ParsingException { try { return item.select("div[class=\"yt-lockup-byline\"]").first() .select("a").first() .text(); } catch (Exception e) { throw new ParsingException("Could not get uploader", e); } } @Override public String getUploadDate() throws ParsingException { try { Element div = item.select("div[class=\"yt-lockup-meta\"]").first(); if(div == null) { return null; } else { return div.select("li").first().text(); } } catch(Exception e) { throw new ParsingException("Could not get uplaod date", e); } } @Override public long getViewCount() throws ParsingException { String output; String input; try { Element div = item.select("div[class=\"yt-lockup-meta\"]").first(); if(div == null) { return -1; } else { input = div.select("li").get(1) .text(); } } catch (IndexOutOfBoundsException e) { if(isLiveStream(item)) { // -1 for no view count return -1; } else { throw new ParsingException( "Could not parse yt-lockup-meta although available: " + getTitle(), e); } } output = Parser.matchGroup1("([0-9,\\. ]*)", input) .replace(" ", "") .replace(".", "") .replace(",", ""); try { return Long.parseLong(output); } catch (NumberFormatException e) { // if this happens the video probably has no views if(!input.isEmpty()) { return 0; } else { throw new ParsingException("Could not handle input: " + input, e); } } } @Override public String getThumbnailUrl() throws ParsingException { try { String url; Element te = item.select("div[class=\"yt-thumb video-thumb\"]").first() .select("img").first(); url = te.attr("abs:src"); // Sometimes youtube sends links to gif files which somehow seem to not exist // anymore. Items with such gif also offer a secondary image source. So we are going // to use that if we've caught such an item. if (url.contains(".gif")) { url = te.attr("abs:data-thumb"); } return url; } catch (Exception e) { throw new ParsingException("Could not get thumbnail url", e); } } @Override public AbstractStreamInfo.StreamType getStreamType() { if(isLiveStream(item)) { return AbstractStreamInfo.StreamType.LIVE_STREAM; } else { return AbstractStreamInfo.StreamType.VIDEO_STREAM; } } @Override public boolean isAd() throws ParsingException { if(!item.select("span[class*=\"icon-not-available\"]").isEmpty()) { return true; } else { return false; } } private boolean isLiveStream(Element item) { Element bla = item.select("span[class*=\"yt-badge-live\"]").first(); if(bla == null) { // sometimes livestreams dont have badges but sill are live streams // if video time is not available we most likly have an offline livestream if(item.select("span[class*=\"video-time\"]").first() == null) { return true; } } return bla != null; } }