X-Git-Url: https://git.sur5r.net/?a=blobdiff_plain;ds=sidebyside;f=src%2Fvideo.cpp;h=f7b3107da01d33221a4801d3e86c684eae9c344a;hb=43c391d91acfaa16f226b4b8dd467e5cde027c23;hp=0fb30b3cbb6b4d65ee22a39b94c5e7f3b3efb767;hpb=fe37e0824b725d2b6cb9163bc21e41618ab3e6ef;p=minitube diff --git a/src/video.cpp b/src/video.cpp index 0fb30b3..f7b3107 100644 --- a/src/video.cpp +++ b/src/video.cpp @@ -1,103 +1,484 @@ +/* $BEGIN_LICENSE + +This file is part of Minitube. +Copyright 2009, Flavio Tordini + +Minitube is free software: you can redistribute it and/or modify +it under the terms of the GNU General Public License as published by +the Free Software Foundation, either version 3 of the License, or +(at your option) any later version. + +Minitube is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. + +You should have received a copy of the GNU General Public License +along with Minitube. If not, see . + +$END_LICENSE */ + #include "video.h" #include "networkaccess.h" #include +#include "videodefinition.h" +#include "jsfunctions.h" +#include "temporary.h" +#include "compatibility/qurlqueryhelper.h" +#include "datautils.h" namespace The { - NetworkAccess* http(); +NetworkAccess* http(); } -Video::Video() : m_thumbnailUrls(QList()) { - m_duration = 0; - m_viewCount = -1; +namespace { +static const QString jsNameChars = "a-zA-Z0-9\\$_"; } -void Video::preloadThumbnail() { - if (m_thumbnailUrls.isEmpty()) return; - QObject *reply = The::http()->get(m_thumbnailUrls.first()); - connect(reply, SIGNAL(data(QByteArray)), SLOT(setThumbnail(QByteArray))); +Video::Video() : m_duration(0), + m_viewCount(-1), + m_license(LicenseYouTube), + definitionCode(0), + elIndex(0), + ageGate(false), + loadingStreamUrl(false), + loadingThumbnail(false) { } -void Video::setThumbnail(QByteArray bytes) { - m_thumbnail = QImage::fromData(bytes); - emit gotThumbnail(); +Video* Video::clone() { + Video* cloneVideo = new Video(); + cloneVideo->m_title = m_title; + cloneVideo->m_description = m_description; + cloneVideo->m_channelTitle = m_channelTitle; + cloneVideo->m_channelId = m_channelId; + cloneVideo->m_webpage = m_webpage; + cloneVideo->m_streamUrl = m_streamUrl; + cloneVideo->m_thumbnail = m_thumbnail; + cloneVideo->m_thumbnailUrl = m_thumbnailUrl; + cloneVideo->m_mediumThumbnailUrl = m_mediumThumbnailUrl; + cloneVideo->m_duration = m_duration; + cloneVideo->m_published = m_published; + cloneVideo->m_viewCount = m_viewCount; + cloneVideo->videoId = videoId; + cloneVideo->videoToken = videoToken; + cloneVideo->definitionCode = definitionCode; + return cloneVideo; } -const QImage Video::thumbnail() const { - return m_thumbnail; +const QString &Video::webpage() { + if (m_webpage.isEmpty() && !videoId.isEmpty()) + m_webpage.append("https://www.youtube.com/watch?v=").append(videoId); + return m_webpage; } -void Video::scrapeStreamUrl() { +void Video::setWebpage(const QString &value) { + m_webpage = value; + + // Get Video ID + if (videoId.isEmpty()) { + QRegExp re(JsFunctions::instance()->videoIdRE()); + if (re.indexIn(m_webpage) == -1) { + qWarning() << QString("Cannot get video id for %1").arg(m_webpage); + // emit errorStreamUrl(QString("Cannot get video id for %1").arg(m_webpage.toString())); + // loadingStreamUrl = false; + return; + } + videoId = re.cap(1); + } +} - // https://develop.participatoryculture.org/trac/democracy/browser/trunk/tv/portable/flashscraper.py +void Video::loadThumbnail() { + if (m_thumbnailUrl.isEmpty() || loadingThumbnail) return; + loadingThumbnail = true; + QObject *reply = The::http()->get(m_thumbnailUrl); + connect(reply, SIGNAL(data(QByteArray)), SLOT(setThumbnail(QByteArray))); +} - QUrl webpage = m_webpage; - // qDebug() << webpage.toString(); +void Video::setThumbnail(const QByteArray &bytes) { + loadingThumbnail = false; + qreal ratio = qApp->devicePixelRatio(); + m_thumbnail = QPixmap(); + m_thumbnail.loadFromData(bytes); + m_thumbnail.setDevicePixelRatio(ratio); + const int thumbWidth = 160 * ratio; + if (m_thumbnail.width() > thumbWidth) + m_thumbnail = m_thumbnail.scaledToWidth(thumbWidth, Qt::SmoothTransformation); + emit gotThumbnail(); +} - // Get Video ID - // youtube-dl line 428 - // QRegExp re("^((?:http://)?(?:\\w+\\.)?youtube\\.com/(?:(?:v/)|(?:(?:watch(?:\\.php)?)?\\?(?:.+&)?v=)))?([0-9A-Za-z_-]+)(?(1).+)?$"); - QRegExp re("^http://www\\.youtube\\.com/watch\\?v=([0-9A-Za-z_-]+).*"); - bool match = re.exactMatch(webpage.toString()); - if (!match || re.numCaptures() < 1) { - emit errorStreamUrl(QString("Cannot get video id for %1").arg(webpage.toString())); +void Video::loadStreamUrl() { + if (loadingStreamUrl) { + qDebug() << "Already loading stream URL for" << this->title(); return; } - videoId = re.cap(1); - // if (!videoId) return false; - // qDebug() << videoId; + loadingStreamUrl = true; + elIndex = 0; + ageGate = false; + + getVideoInfo(); +} + +void Video::getVideoInfo() { + static const QStringList elTypes = QStringList() << "&el=embedded" << "&el=detailpage" << "&el=vevo" << ""; + + QUrl url; + if (elIndex == elTypes.size()) { + // qDebug() << "Trying special embedded el param"; + url = QUrl("https://www.youtube.com/get_video_info"); - // Get Video Token - QUrl normalizedUrl = QUrl(QString("http://www.youtube.com/get_video_info?video_id=") - .append(videoId).append("&el=embedded&ps=default&eurl=")); + QUrlQueryHelper urlHelper(url); + urlHelper.addQueryItem("video_id", videoId); + urlHelper.addQueryItem("el", "embedded"); + urlHelper.addQueryItem("gl", "US"); + urlHelper.addQueryItem("hl", "en"); + urlHelper.addQueryItem("eurl", "https://youtube.googleapis.com/v/" + videoId); + urlHelper.addQueryItem("asv", "3"); + urlHelper.addQueryItem("sts", "1588"); + } else if (elIndex > elTypes.size() - 1) { + qWarning() << "Cannot get video info"; + loadingStreamUrl = false; + emit errorStreamUrl("Cannot get video info"); + return; + } else { + // qDebug() << "Trying el param:" << elTypes.at(elIndex) << elIndex; + url = QUrl(QString( + "https://www.youtube.com/get_video_info?video_id=%1%2&ps=default&eurl=&gl=US&hl=en" + ).arg(videoId, elTypes.at(elIndex))); + } - QObject *reply = The::http()->get(normalizedUrl); + QObject *reply = The::http()->get(url); connect(reply, SIGNAL(data(QByteArray)), SLOT(gotVideoInfo(QByteArray))); connect(reply, SIGNAL(error(QNetworkReply*)), SLOT(errorVideoInfo(QNetworkReply*))); // see you in gotVideoInfo... } -void Video::gotVideoInfo(QByteArray data) { - QString videoInfo = QString::fromUtf8(data); - - QRegExp re = QRegExp("^.*&token=([^&]+).*$"); - bool match = re.exactMatch(videoInfo); - - // on regexp failure, stop and report error - if (!match || re.numCaptures() < 1) { - qDebug() << videoInfo; - re = QRegExp("^.*&reason=([^&]+).*$"); - match = re.exactMatch(videoInfo); - if (match) { - // report the error in the status bar - QMainWindow* mainWindow = dynamic_cast(qApp->topLevelWidgets().first()); - QString errorMessage = QUrl::fromEncoded(re.cap(1).toUtf8()).toString().replace("+", " "); - int indexOfTag = errorMessage.indexOf("<"); - if (indexOfTag != -1) { - errorMessage = errorMessage.left(indexOfTag); - } - if (mainWindow) mainWindow->statusBar()->showMessage(errorMessage); - emit errorStreamUrl(errorMessage); - } else - emit errorStreamUrl("Error parsing video info"); +void Video::gotVideoInfo(const QByteArray &bytes) { + QString videoInfo = QString::fromUtf8(bytes); + // qDebug() << "videoInfo" << videoInfo; + + // get video token + QRegExp videoTokeRE(JsFunctions::instance()->videoTokenRE()); + if (videoTokeRE.indexIn(videoInfo) == -1) { + qDebug() << "Cannot get token. Trying next el param" << videoInfo << videoTokeRE.pattern(); + // Don't panic! We're gonna try another magic "el" param + elIndex++; + getVideoInfo(); return; } - QString videoToken = re.cap(1); - // FIXME proper decode - videoToken = videoToken.replace("%3D", "="); - // qDebug() << "token" << videoToken; + QString videoToken = videoTokeRE.cap(1); + // qDebug() << "got token" << videoToken; + while (videoToken.contains('%')) + videoToken = QByteArray::fromPercentEncoding(videoToken.toLatin1()); + // qDebug() << "videoToken" << videoToken; + this->videoToken = videoToken; - QUrl videoUrl = QUrl(QString("http://www.youtube.com/get_video?video_id=") - .append(videoId) - .append("&t=").append(videoToken) - .append("&eurl=&el=embedded&ps=default&fmt=18")); + // get fmt_url_map + QRegExp fmtMapRE(JsFunctions::instance()->videoInfoFmtMapRE()); + if (fmtMapRE.indexIn(videoInfo) == -1) { + // qDebug() << "Cannot get urlMap. Trying next el param"; + // Don't panic! We're gonna try another magic "el" param + elIndex++; + getVideoInfo(); + return; + } - m_streamUrl = videoUrl; + // qDebug() << "Got token and urlMap" << elIndex; - emit gotStreamUrl(videoUrl); + QString fmtUrlMap = fmtMapRE.cap(1); + // qDebug() << "got fmtUrlMap" << fmtUrlMap; + fmtUrlMap = QByteArray::fromPercentEncoding(fmtUrlMap.toUtf8()); + parseFmtUrlMap(fmtUrlMap); +} + +void Video::parseFmtUrlMap(const QString &fmtUrlMap, bool fromWebPage) { + const QString definitionName = QSettings().value("definition", "360p").toString(); + const VideoDefinition& definition = VideoDefinition::getDefinitionFor(definitionName); + + // qDebug() << "fmtUrlMap" << fmtUrlMap; + const QStringList formatUrls = fmtUrlMap.split(',', QString::SkipEmptyParts); + QHash urlMap; + foreach(const QString &formatUrl, formatUrls) { + // qDebug() << "formatUrl" << formatUrl; + const QStringList urlParams = formatUrl.split('&', QString::SkipEmptyParts); + // qDebug() << "urlParams" << urlParams; + + int format = -1; + QString url; + QString sig; + foreach(const QString &urlParam, urlParams) { + // qWarning() << urlParam; + if (urlParam.startsWith("itag=")) { + int separator = urlParam.indexOf("="); + format = urlParam.mid(separator + 1).toInt(); + } else if (urlParam.startsWith("url=")) { + int separator = urlParam.indexOf("="); + url = urlParam.mid(separator + 1); + url = QByteArray::fromPercentEncoding(url.toUtf8()); + } else if (urlParam.startsWith("sig=")) { + int separator = urlParam.indexOf("="); + sig = urlParam.mid(separator + 1); + sig = QByteArray::fromPercentEncoding(sig.toUtf8()); + } else if (urlParam.startsWith("s=")) { + if (fromWebPage || ageGate) { + int separator = urlParam.indexOf("="); + sig = urlParam.mid(separator + 1); + sig = QByteArray::fromPercentEncoding(sig.toUtf8()); + if (ageGate) + sig = JsFunctions::instance()->decryptAgeSignature(sig); + else { + sig = decryptSignature(sig); + if (sig.isEmpty()) + sig = JsFunctions::instance()->decryptSignature(sig); + } + } else { + + QUrl url("http://www.youtube.com/watch"); + { + QUrlQueryHelper urlHelper(url); + urlHelper.addQueryItem("v", videoId); + urlHelper.addQueryItem("gl", "US"); + urlHelper.addQueryItem("hl", "en"); + urlHelper.addQueryItem("has_verified", "1"); + } + // qDebug() << "Loading webpage" << url; + QObject *reply = The::http()->get(url); + connect(reply, SIGNAL(data(QByteArray)), SLOT(scrapeWebPage(QByteArray))); + connect(reply, SIGNAL(error(QNetworkReply*)), SLOT(errorVideoInfo(QNetworkReply*))); + // see you in scrapWebPage(QByteArray) + return; + } + } + } + if (format == -1 || url.isNull()) continue; + + url += "&signature=" + sig; + + if (!url.contains("ratebypass")) + url += "&ratebypass=yes"; + + // qWarning() << url; + + if (format == definition.getCode()) { + // qDebug() << "Found format" << definitionCode; + saveDefinitionForUrl(url, definition); + return; + } + + urlMap.insert(format, url); + } + + const QList& definitions = VideoDefinition::getDefinitions(); + int previousIndex = std::max(definitions.indexOf(definition) - 1, 0); + for (; previousIndex >= 0; previousIndex--) { + const VideoDefinition& previousDefinition = definitions.at(previousIndex); + if (urlMap.contains(previousDefinition.getCode())) { + // qDebug() << "Found format" << definitionCode; + saveDefinitionForUrl(urlMap.value(previousDefinition.getCode()), + previousDefinition); + return; + } + } + + emit errorStreamUrl(tr("Cannot get video stream for %1").arg(m_webpage)); } void Video::errorVideoInfo(QNetworkReply *reply) { + loadingStreamUrl = false; emit errorStreamUrl(tr("Network error: %1 for %2").arg(reply->errorString(), reply->url().toString())); } + +void Video::scrapeWebPage(const QByteArray &bytes) { + QString html = QString::fromUtf8(bytes); + + QRegExp ageGateRE(JsFunctions::instance()->ageGateRE()); + if (ageGateRE.indexIn(html) != -1) { + // qDebug() << "Found ageGate"; + ageGate = true; + elIndex = 4; + getVideoInfo(); + return; + } + + QRegExp fmtMapRE(JsFunctions::instance()->webPageFmtMapRE()); + if (fmtMapRE.indexIn(html) == -1) { + qWarning() << "Error parsing video page"; + // emit errorStreamUrl("Error parsing video page"); + // loadingStreamUrl = false; + elIndex++; + getVideoInfo(); + return; + } + fmtUrlMap = fmtMapRE.cap(1); + fmtUrlMap.replace("\\u0026", "&"); + // parseFmtUrlMap(fmtUrlMap, true); + +#ifdef APP_DASH + QSettings settings; + QString definitionName = settings.value("definition", "360p").toString(); + if (definitionName == QLatin1String("1080p")) { + QRegExp dashManifestRe("\"dashmpd\":\\s*\"([^\"]+)\""); + if (dashManifestRe.indexIn(html) != -1) { + dashManifestUrl = dashManifestRe.cap(1); + dashManifestUrl.remove('\\'); + qDebug() << "dashManifestUrl" << dashManifestUrl; + } + } +#endif + + QRegExp jsPlayerRe(JsFunctions::instance()->jsPlayerRE()); + if (jsPlayerRe.indexIn(html) != -1) { + QString jsPlayerUrl = jsPlayerRe.cap(1); + jsPlayerUrl.remove('\\'); + jsPlayerUrl = "http:" + jsPlayerUrl; + // qDebug() << "jsPlayerUrl" << jsPlayerUrl; + /* + QRegExp jsPlayerIdRe("-(.+)\\.js"); + jsPlayerIdRe.indexIn(jsPlayerUrl); + QString jsPlayerId = jsPlayerRe.cap(1); + */ + QObject *reply = The::http()->get(jsPlayerUrl); + connect(reply, SIGNAL(data(QByteArray)), SLOT(parseJsPlayer(QByteArray))); + connect(reply, SIGNAL(error(QNetworkReply*)), SLOT(errorVideoInfo(QNetworkReply*))); + } +} + +void Video::parseJsPlayer(const QByteArray &bytes) { + QString js = QString::fromUtf8(bytes); + // qWarning() << "jsPlayer" << js; + + // QRegExp funcNameRe("\"signature\"\\w*,\\w*([" + jsNameChars + "]+)"); + QRegExp funcNameRe(JsFunctions::instance()->signatureFunctionNameRE().arg(jsNameChars)); + + if (funcNameRe.indexIn(js) == -1) { + qWarning() << "Cannot capture signature function name" << js; + } else { + sigFuncName = funcNameRe.cap(1); + captureFunction(sigFuncName, js); + // qWarning() << sigFunctions; + } + +#ifdef APP_DASH + if (!dashManifestUrl.isEmpty()) { + QRegExp sigRe("/s/([\\w\\.]+)"); + if (sigRe.indexIn(dashManifestUrl) != -1) { + qDebug() << "Decrypting signature for dash manifest"; + QString sig = sigRe.cap(1); + sig = decryptSignature(sig); + dashManifestUrl.replace(sigRe, "/signature/" + sig); + qDebug() << dashManifestUrl; + + if (false) { + // let phonon play the manifest + m_streamUrl = dashManifestUrl; + this->definitionCode = 37; + emit gotStreamUrl(m_streamUrl); + loadingStreamUrl = false; + } else { + // download the manifest + QObject *reply = The::http()->get(QUrl::fromEncoded(dashManifestUrl.toUtf8())); + connect(reply, SIGNAL(data(QByteArray)), SLOT(parseDashManifest(QByteArray))); + connect(reply, SIGNAL(error(QNetworkReply*)), SLOT(errorVideoInfo(QNetworkReply*))); + } + + return; + } + } +#endif + + parseFmtUrlMap(fmtUrlMap, true); +} + +void Video::parseDashManifest(const QByteArray &bytes) { + QFile file(Temporary::filename() + ".mpd"); + if (!file.open(QIODevice::WriteOnly)) + qWarning() << file.errorString() << file.fileName(); + QDataStream stream(&file); + stream.writeRawData(bytes.constData(), bytes.size()); + + m_streamUrl = "file://" + file.fileName(); + this->definitionCode = 37; + emit gotStreamUrl(m_streamUrl); + loadingStreamUrl = false; +} + +void Video::captureFunction(const QString &name, const QString &js) { + QRegExp funcRe("function\\s+" + QRegExp::escape(name) + "\\s*\\([" + jsNameChars + ",\\s]*\\)\\s*\\{[^\\}]+\\}"); + if (funcRe.indexIn(js) == -1) { + qWarning() << "Cannot capture function" << name; + return; + } + QString func = funcRe.cap(0); + sigFunctions.insert(name, func); + + // capture inner functions + QRegExp invokedFuncRe("[\\s=;\\(]([" + jsNameChars + "]+)\\s*\\([" + jsNameChars + ",\\s]+\\)"); + int pos = name.length() + 9; + while ((pos = invokedFuncRe.indexIn(func, pos)) != -1) { + QString funcName = invokedFuncRe.cap(1); + if (!sigFunctions.contains(funcName)) + captureFunction(funcName, js); + pos += invokedFuncRe.matchedLength(); + } + + // capture referenced objects + QRegExp objRe("[\\s=;\\(]([" + jsNameChars + "]+)\\.[" + jsNameChars + "]+"); + pos = name.length() + 9; + while ((pos = objRe.indexIn(func, pos)) != -1) { + QString objName = objRe.cap(1); + if (!sigObjects.contains(objName)) + captureObject(objName, js); + pos += objRe.matchedLength(); + } +} + +void Video::captureObject(const QString &name, const QString &js) { + QRegExp re("var\\s+" + QRegExp::escape(name) + "\\s*=\\s*\\{.+\\}\\s*;"); + re.setMinimal(true); + if (re.indexIn(js) == -1) { + qWarning() << "Cannot capture object" << name; + return; + } + QString obj = re.cap(0); + sigObjects.insert(name, obj); +} + +QString Video::decryptSignature(const QString &s) { + if (sigFuncName.isEmpty()) return QString(); + QScriptEngine engine; + foreach (const QString &f, sigObjects.values()) { + QScriptValue value = engine.evaluate(f); + if (value.isError()) + qWarning() << "Error in" << f << value.toString(); + } + foreach (const QString &f, sigFunctions.values()) { + QScriptValue value = engine.evaluate(f); + if (value.isError()) + qWarning() << "Error in" << f << value.toString(); + } + QString js = sigFuncName + "('" + s + "');"; + QScriptValue value = engine.evaluate(js); + if (value.isUndefined()) { + qWarning() << "Undefined result for" << js; + return QString(); + } + if (value.isError()) { + qWarning() << "Error in" << js << value.toString(); + return QString(); + } + return value.toString(); +} + +QString Video::formattedDuration() const { + return DataUtils::formatDuration(m_duration); +} + +void Video::saveDefinitionForUrl(const QString& url, const VideoDefinition& definition) { + const QUrl videoUrl = QUrl::fromEncoded(url.toUtf8(), QUrl::StrictMode); + m_streamUrl = videoUrl; + definitionCode = definition.getCode(); + emit gotStreamUrl(videoUrl); + loadingStreamUrl = false; +} +