// youtube.js (22 KB)
  1. console.log('bundle2!')
  2. printable = (platform) => {
  3. return platform === "WEB";
  4. }
  5. parseCodecs = (format) => {
  6. const mimeType = format['mimeType']
  7. if (!mimeType) {
  8. return {};
  9. }
  10. const regex = /(?<mimetype>[^/]+\/[^;]+)(?:;\s*codecs="?(?<codecs>[^"]+))?/;
  11. const match = mimeType.match(regex);
  12. if (!match) {
  13. return {};
  14. }
  15. const codecs = match.groups.codecs;
  16. if (!codecs) {
  17. return {};
  18. }
  19. const splitCodecs = codecs.trim().replace(/,$/, '').split(',').map(str => str.trim()).filter(Boolean);
  20. let vcodec = null;
  21. let acodec = null;
  22. for (const fullCodec of splitCodecs) {
  23. const codec = fullCodec.split('.')[0];
  24. if (['avc1', 'avc2', 'avc3', 'avc4', 'vp9', 'vp8', 'hev1', 'hev2', 'h263', 'h264', 'mp4v', 'hvc1', 'av01', 'theora'].includes(codec)) {
  25. if (!vcodec) {
  26. vcodec = fullCodec;
  27. }
  28. } else if (['mp4a', 'opus', 'vorbis', 'mp3', 'aac', 'ac-3', 'ec-3', 'eac3', 'dtsc', 'dtse', 'dtsh', 'dtsl'].includes(codec)) {
  29. if (!acodec) {
  30. acodec = fullCodec;
  31. }
  32. } else {
  33. console.log(`WARNING: Unknown codec ${fullCodec}`);
  34. }
  35. }
  36. if (!vcodec && !acodec) {
  37. if (splitCodecs.length === 2) {
  38. return {
  39. vcodec: splitCodecs[0],
  40. acodec: splitCodecs[1]
  41. };
  42. }
  43. } else {
  44. return {
  45. vcodec: vcodec,
  46. acodec: acodec
  47. };
  48. }
  49. return {};
  50. }
  51. parseSetCookie = (headers) => {
  52. if (!headers) {
  53. return ""
  54. }
  55. const setCookie = headers['Set-Cookie']
  56. if (!setCookie) {
  57. return ""
  58. }
  59. console.log(`setCookie: ${setCookie}`)
  60. let result = 'PREF=hl=en&tz=UTC; SOCS=CAI; GPS=1; ';
  61. const needCookieNames = ['YSC', 'VISITOR_INFO1_LIVE', 'VISITOR_PRIVACY_METADATA'];
  62. for (const i in needCookieNames) {
  63. const cookieName = needCookieNames[i];
  64. const regexp = new RegExp(`${cookieName}=([^;,]+)`)
  65. const match = setCookie.match(regexp)
  66. if (match && match.length === 2) {
  67. const cookieValue = match[1]
  68. if (i != needCookieNames.length - 1) {
  69. result += `${cookieName}=${cookieValue}; `
  70. } else {
  71. result += `${cookieName}=${cookieValue}`
  72. }
  73. }
  74. }
  75. console.log(`current cookie: ${result}`)
  76. return result;
  77. }
  78. request = async (method, url, data = null, headers = {}, platform) => {
  79. if (platform === "WEB") {
  80. url = url.replace("https://www.youtube.com", "http://127.0.0.1");
  81. url = url.replace("https://music.youtube.com", "http://127.0.0.1");
  82. }
  83. console.log(`request url:${url}`)
  84. console.log(`request data:${data}`)
  85. console.log(`request method:${method}`)
  86. console.log(`request headers:${JSON.stringify((headers))}`)
  87. if (platform === "WEB") {
  88. const res = await fetch(url, {
  89. 'mode': 'cors',
  90. 'method': method,
  91. 'headers': headers,
  92. 'body': data
  93. })
  94. const resData = await res.text()
  95. return Promise.resolve({
  96. 'data': resData,
  97. 'headers': res.headers
  98. });
  99. }
  100. return new Promise((resolve, reject) => {
  101. AF.request(url, method, data, headers, (data, headers, err) => {
  102. if (err) {
  103. reject(err);
  104. } else {
  105. console.log(`response headers: ${headers}`);
  106. resolve({
  107. 'data': data,
  108. 'headers': JSON.parse(headers)
  109. });
  110. }
  111. });
  112. })
  113. }
  114. getStringBetween = (string, needleStart, needleEnd, offsetStart = 0, offsetEnd = 0) => {
  115. const x = string.indexOf(needleStart);
  116. const y = needleEnd ? string.indexOf(needleEnd, x) : string.length;
  117. return string.substring(x + needleStart.length + offsetEnd, y + offsetStart);
  118. }
  119. findFunction = (jsCode, regexp, platform) => {
  120. const match = jsCode.match(regexp)
  121. if (!match && match.length <= 1) {
  122. return null;
  123. }
  124. let result = "";
  125. const dependencyMatches = match[0].match(/([$a-zA-Z0-9]+\.[$a-zA-Z0-9]+)/g)
  126. const existDependencies = [];
  127. if (dependencyMatches && dependencyMatches.length >= 1) {
  128. for (let currentMatch of dependencyMatches) {
  129. const varName = currentMatch.split('.')[0];
  130. if (existDependencies.includes(varName)) {
  131. continue
  132. }
  133. if (!/^[$A-Z]+$/.test(varName)) {
  134. continue
  135. }
  136. const varNameMatch = jsCode.match(new RegExp(`var \\${varName}={(.|\\n)*?};`), 'ig');
  137. if (varNameMatch && varNameMatch.length >= 1) {
  138. result += varNameMatch[0] + "\n";
  139. }
  140. existDependencies.push(varName);
  141. }
  142. }
  143. result += `\n${match[0]}`;
  144. if (printable(platform)) {
  145. console.log(`findFunction result: ` + result);
  146. }
  147. return eval(result);
  148. };
  149. const cache = {};
  150. fetchBaseJSContent = async (baseJsUrl, platform) => {
  151. const cacheKey = `jsContent:${baseJsUrl}`;
  152. if (cache[cacheKey]) {
  153. console.log(`baseContent from cache: ${baseJsUrl}`);
  154. return cache[cacheKey];
  155. }
  156. console.log(`extract baseUrl: ${baseJsUrl}`);
  157. const baseContentResp = await request('GET', baseJsUrl, null, {
  158. 'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/87.0.4280.101 Safari/537.36',
  159. }, platform);
  160. const {data, _} = baseContentResp;
  161. cache[cacheKey] = data;
  162. return data;
  163. }
  164. extractJSSignatureFunction = async (baseJsUrl, platform) => {
  165. const cacheKey = `jsSign:${baseJsUrl}`
  166. if (cache[cacheKey]) {
  167. console.log(`jsSign from cache: ${baseJsUrl}`);
  168. return cache[cacheKey];
  169. }
  170. const baseJsContent = await fetchBaseJSContent(baseJsUrl, platform);
  171. const result = findFunction(baseJsContent, /([a-zA-Z0-9]+)=function\([a-zA-Z0-9]+\)\{a=a\.split\(""\).*};/, platform);
  172. cache[cacheKey] = result
  173. return result
  174. }
  175. extractNJSFunction = async (baseJsUrl, platform) => {
  176. const cacheKey = `jsN:${baseJsUrl}`
  177. if (cache[cacheKey]) {
  178. console.log(`jsN from cache: ${baseJsUrl}`);
  179. return cache[cacheKey];
  180. }
  181. const baseJsContent = await fetchBaseJSContent(baseJsUrl, platform);
  182. const result = findFunction(baseJsContent, /([a-zA-Z0-9]+)=function\([a-zA-Z0-9]+\)\{var b=a\.split\(""\)[\s\S]*?};/, platform);
  183. cache[cacheKey] = result
  184. return result
  185. }
  186. signUrl = async (signatureCipher, baseJsUrl, platform) => {
  187. const searchParams = {}
  188. for (const item of signatureCipher.split('&')) {
  189. const [key, value] = item.split('=');
  190. searchParams[decodeURIComponent(key)] = decodeURIComponent(value);
  191. }
  192. const [url, signature, sp] = [searchParams['url'], searchParams['s'], searchParams['sp']];
  193. const decipher = await extractJSSignatureFunction(baseJsUrl, platform);
  194. if (!decipher) {
  195. return null;
  196. }
  197. if (printable(platform)) {
  198. console.log(`signatureCipher=${signatureCipher}, url=${url}, signature=${signature}, sp=${sp}`)
  199. }
  200. let newUrl = `${url}&${sp}=${decipher(signature)}`;
  201. function replaceUrlParam(url, paramName, paramValue) {
  202. let pattern = new RegExp(`([?&])${paramName}=.*?(&|$)`, 'i');
  203. let newUrl = url.replace(pattern, `$1${paramName}=${paramValue}$2`);
  204. if (newUrl === url && url.indexOf('?') === -1) {
  205. newUrl += `?${paramName}=${paramValue}`;
  206. } else if (newUrl === url) {
  207. newUrl += `&${paramName}=${paramValue}`;
  208. }
  209. return newUrl;
  210. }
  211. for (const item of url.split('&')) {
  212. const [key, value] = item.split('=');
  213. searchParams[decodeURIComponent(key)] = decodeURIComponent(value);
  214. }
  215. const nFunction = await extractNJSFunction(baseJsUrl, platform);
  216. const n = searchParams['n']
  217. if (n && nFunction) {
  218. const newN = nFunction(n);
  219. return replaceUrlParam(newUrl, 'n', newN);
  220. }
  221. return newUrl;
  222. }
  223. detail = async (url, platform) => {
  224. try {
  225. const htmlResp = await request('GET', `${url}&bpctr=9999999999&has_verified=1`, null, {
  226. 'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/92.0.4515.107 Safari/537.36',
  227. 'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
  228. 'Accept-Language': 'en-us,en;q=0.5',
  229. 'Sec-Fetch-Mode': 'navigate',
  230. 'Accept-Encoding': 'gzip, deflate, br',
  231. 'Cookie': 'PREF=hl=en&tz=UTC; SOCS=CAI'
  232. }, platform);
  233. let {data: html, headers: htmlHeaders} = htmlResp;
  234. let regex = /var ytInitialPlayerResponse\s*=\s*({.*?});/;
  235. let match = html.match(regex);
  236. if (!match || !match.length) {
  237. console.log('can not found JSON: ytInitialPlayerResponse');
  238. throw new Error('JSON not found: ytInitialPlayerResponse');
  239. }
  240. const ytInitialPlayerResponse = JSON.parse(match[1]);
  241. if (printable(platform)) {
  242. console.log(ytInitialPlayerResponse);
  243. }
  244. const originVideoDetails = ytInitialPlayerResponse['videoDetails'];
  245. const thumbnails = []
  246. for (const item of originVideoDetails['thumbnail']['thumbnails']) {
  247. thumbnails.push({
  248. 'url': item['url'],
  249. 'width': item['width'] + "",
  250. 'height': item['height'] + ""
  251. })
  252. }
  253. let originFormats = [];
  254. // android
  255. try {
  256. const apiUrl = `https://music.youtube.com/youtubei/v1/player?key=AIzaSyAO_FJ2SlqU8Q4STEHLGCilw_Y9_11qcW8`;
  257. const apiResp = await request('POST', apiUrl, JSON.stringify({
  258. "context": {
  259. "client": {
  260. "clientName": "ANDROID",
  261. "hl": "en",
  262. "clientVersion": "18.49.37",
  263. "gl": "US"
  264. }
  265. },
  266. "videoId": url.replace('https://www.youtube.com/watch?v=', ''),
  267. "params": "CgIQBg"
  268. }), {
  269. 'Host': 'www.youtube.com',
  270. 'Connection': 'keep-alive',
  271. 'User-Agent': 'com.google.android.apps.youtube.music/17.31.35 (Linux; U; Android 11) gzip',
  272. 'Accept-Language': 'en-US,en',
  273. 'Cookie': parseSetCookie(htmlHeaders),
  274. 'Content-Type': 'application/json'
  275. }, platform);
  276. let {data: apiData, _} = apiResp;
  277. console.log(`android api result: ${JSON.stringify(apiResp)}`);
  278. const res = JSON.parse(apiData);
  279. const currentFormats = [];
  280. for (const format of [].concat(res["streamingData"]["formats"]).concat(res["streamingData"]["adaptiveFormats"])) {
  281. if (format) {
  282. format["from"] = "android"
  283. currentFormats.push(format);
  284. }
  285. }
  286. originFormats = originFormats.concat(currentFormats);
  287. } catch (e) {
  288. console.log(`can not found format android api error: ${e}`);
  289. }
  290. console.log(`after android api, format size:${originFormats.length}`);
  291. // web
  292. const currentFormats = [];
  293. for (const format of ytInitialPlayerResponse["streamingData"]["formats"].concat(ytInitialPlayerResponse["streamingData"]["adaptiveFormats"])) {
  294. if (format) {
  295. format["from"] = "web"
  296. currentFormats.push(format);
  297. }
  298. }
  299. originFormats = originFormats.concat(currentFormats);
  300. console.log(`after html, format size:${originFormats.length}`);
  301. const baseJsUrl = `https://www.youtube.com${JSON.parse(html.match(/set\(({.+?})\);/)[1])["PLAYER_JS_URL"]}`
  302. let formatIds = [];
  303. const formats = [];
  304. for (let format of originFormats) {
  305. if (printable(platform)) {
  306. console.log(format);
  307. }
  308. if (format && formatIds.indexOf(format['itag']) === -1) {
  309. if (!format["url"]) {
  310. format["url"] = await signUrl(format["signatureCipher"], baseJsUrl, platform);
  311. }
  312. if (format["url"]) {
  313. const {vcodec, acodec} = parseCodecs(format)
  314. if (vcodec && acodec) {
  315. const current = {
  316. "width": format["width"] + "",
  317. "height": format["height"] + "",
  318. "type": format["mimeType"],
  319. "quality": format["qualityLabel"],
  320. "itag": format["itag"],
  321. "fps": format["fps"] + "",
  322. "bitrate": format["bitrate"] + "",
  323. "url": format["url"],
  324. "ext": "mp4",
  325. "vcodec": vcodec,
  326. "acodec": acodec,
  327. "vbr": "0",
  328. "abr": "0",
  329. "container": "mp4_dash",
  330. "from": format["from"]
  331. }
  332. if (platform === "WEB") {
  333. current["source"] = format
  334. }
  335. formats.push(current)
  336. formatIds.push(format["itag"]);
  337. }
  338. }
  339. }
  340. }
  341. const ytInitialDataMatch = html.match(/var ytInitialData\s*=\s*({.*?});/);
  342. const recommendInfo = [];
  343. if (ytInitialDataMatch && ytInitialDataMatch.length === 2) {
  344. const ytInitialData = JSON.parse(ytInitialDataMatch[1]);
  345. if (printable(platform)) {
  346. console.log(ytInitialData);
  347. }
  348. for (const item of ytInitialData["contents"]?.["twoColumnWatchNextResults"]?.["secondaryResults"]?.["secondaryResults"]?.["results"] || []) {
  349. if (item["compactVideoRenderer"]) {
  350. const recommendVideo = item["compactVideoRenderer"];
  351. console.log(`recommend video: ${JSON.stringify(recommendVideo)}`);
  352. if (recommendVideo["videoId"]) {
  353. recommendInfo.push({
  354. "type": "gridVideoRenderer",
  355. "videoId": recommendVideo["videoId"],
  356. "title": recommendVideo["title"]?.["simpleText"],
  357. "thumbnails": recommendVideo["thumbnail"]?.["thumbnails"],
  358. "channelName": recommendVideo["longBylineText"]?.["runs"]?.[0]?.["text"],
  359. "publishedTimeText": recommendVideo["publishedTimeText"]?.["simpleText"],
  360. "viewCountText": recommendVideo["viewCountText"]?.["simpleText"],
  361. "shortViewCountText": recommendVideo["shortViewCountText"]?.["simpleText"],
  362. "lengthText": recommendVideo["lengthText"]?.["simpleText"]
  363. })
  364. }
  365. }
  366. }
  367. }
  368. formats.sort((a, b) => parseInt(a["height"]) - parseInt(b["height"]));
  369. const videoDetails = {
  370. "isLiveContent": originVideoDetails["isLiveContent"],
  371. "title": originVideoDetails["title"],
  372. "thumbnails": thumbnails,
  373. "description": originVideoDetails["shortDescription"],
  374. "lengthSeconds": originVideoDetails["lengthSeconds"],
  375. "viewCount": originVideoDetails["viewCount"],
  376. "keywords": originVideoDetails["keywords"],
  377. "author": originVideoDetails["author"],
  378. "channelID": originVideoDetails["channelId"],
  379. "recommendInfo": recommendInfo,
  380. "channelURL": `https://www.youtube.com/channel/${originVideoDetails["channelId"]}`,
  381. "videoId": originVideoDetails["videoId"]
  382. }
  383. const ret = {
  384. "code": 200,
  385. "msg": "",
  386. "data": {
  387. "videoDetails": videoDetails,
  388. "streamingData": {
  389. "formats": formats
  390. }
  391. },
  392. "id": "MusicDetailViewModel_detail_url"
  393. }
  394. console.log(`detail result: ${JSON.stringify(ret)}`);
  395. return ret;
  396. } catch (e) {
  397. const ret = {
  398. "code": -1,
  399. "msg": e.toString()
  400. }
  401. console.log(`detail result error: ${JSON.stringify(ret)}`);
  402. console.log(e);
  403. return ret;
  404. }
  405. }
  406. search = async (keyword, next, platform) => {
  407. try {
  408. console.log(`search keyword: ${keyword}`);
  409. console.log(`search next: ${next}`);
  410. if (next) {
  411. const nextObject = JSON.parse(next);
  412. const key = nextObject["key"];
  413. const body = {
  414. context: {
  415. client: {
  416. clientName: "WEB",
  417. clientVersion: "2.20240506.01.00",
  418. },
  419. },
  420. continuation: nextObject["continuation"]
  421. };
  422. let res = await request('POST', `https://www.youtube.com/youtubei/v1/search?key=${key}`, JSON.stringify(body), {}, platform);
  423. const {data, _} = res;
  424. res = JSON.parse(data);
  425. const videos = [];
  426. for (const item of res["onResponseReceivedCommands"][0]["appendContinuationItemsAction"]["continuationItems"][0]["itemSectionRenderer"]["contents"]) {
  427. const video = item["videoRenderer"];
  428. if (printable(platform)) {
  429. console.log(video);
  430. }
  431. if (video && video["videoId"]) {
  432. videos.push({
  433. "type": "videoWithContextRenderer",
  434. "data": {
  435. "videoId": video["videoId"],
  436. "title": video["title"]?.["runs"]?.[0]?.["text"],
  437. "thumbnails": video["thumbnail"]?.["thumbnails"],
  438. "channelName": video["longBylineText"]?.["runs"]?.[0]?.["text"],
  439. "publishedTimeText": video["publishedTimeText"]?.["simpleText"],
  440. "viewCountText": video["viewCountText"]?.["simpleText"],
  441. "shortViewCountText": video["shortViewCountText"]?.["simpleText"],
  442. "lengthText": video["lengthText"]?.["simpleText"]
  443. }
  444. });
  445. }
  446. }
  447. const ret = {
  448. "code": 200,
  449. "msg": "",
  450. "data": {
  451. "data": videos,
  452. "next": JSON.stringify({
  453. "key": nextObject["key"],
  454. "continuation": res["onResponseReceivedCommands"]?.[0]?.["appendContinuationItemsAction"]?.["continuationItems"]?.[1]?.["continuationItemRenderer"]?.["continuationEndpoint"]?.["continuationCommand"]?.["token"],
  455. }),
  456. },
  457. "id": "MusicSearchResultViewModel_search_result"
  458. }
  459. console.log(`[next] search result: ${JSON.stringify(ret)}`);
  460. return ret;
  461. } else {
  462. let url = `https://www.youtube.com/results?q=${encodeURIComponent(keyword)}&sp=EgIQAQ%253D%253D`;
  463. const htmlRes = await request('GET', url, null, {}, platform);
  464. const {data: html, _} = htmlRes;
  465. let regex = /var ytInitialData\s*=\s*({.*?});/;
  466. let match = html.match(regex);
  467. if (!match || !match.length) {
  468. console.log("can not found ytInitialData");
  469. throw new Error('JSON not found: ytInitialData');
  470. }
  471. const ytInitialDataResp = JSON.parse(match[1]);
  472. const videos = [];
  473. for (const item of ytInitialDataResp["contents"]?.["twoColumnSearchResultsRenderer"]?.["primaryContents"]?.["sectionListRenderer"]?.["contents"]?.[0]?.["itemSectionRenderer"]?.["contents"]) {
  474. if (item["videoRenderer"]) {
  475. const video = item["videoRenderer"];
  476. if (printable(platform)) {
  477. console.log(video);
  478. }
  479. if (video && video["videoId"]) {
  480. videos.push({
  481. "type": "videoWithContextRenderer",
  482. "data": {
  483. "videoId": video["videoId"],
  484. "title": video["title"]?.["runs"]?.[0]?.["text"],
  485. "thumbnails": video["thumbnail"]?.["thumbnails"],
  486. "channelName": video["longBylineText"]?.["runs"]?.[0]?.["text"],
  487. "publishedTimeText": video["publishedTimeText"]?.["simpleText"],
  488. "viewCountText": video["viewCountText"]?.["simpleText"],
  489. "shortViewCountText": video["shortViewCountText"]?.["simpleText"],
  490. "lengthText": video["lengthText"]?.["simpleText"]
  491. }
  492. });
  493. }
  494. }
  495. }
  496. let next = {};
  497. if (html.split("innertubeApiKey").length > 0) {
  498. next["key"] = html
  499. .split("innertubeApiKey")[1]
  500. .trim()
  501. .split(",")[0]
  502. .split('"')[2];
  503. }
  504. next["continuation"] = ytInitialDataResp["contents"]?.["twoColumnSearchResultsRenderer"]?.["primaryContents"]?.["sectionListRenderer"]?.["contents"]?.[1]?.["continuationItemRenderer"]?.["continuationEndpoint"]?.["continuationCommand"]?.["token"]
  505. const ret = {
  506. "code": 200,
  507. "msg": "",
  508. "data": {
  509. "data": videos,
  510. "next": JSON.stringify(next),
  511. },
  512. "id": "MusicSearchResultViewModel_search_result"
  513. }
  514. console.log(`unnext search result: ${JSON.stringify(ret)}`);
  515. return ret;
  516. }
  517. } catch (e) {
  518. const ret = {
  519. "code": -1,
  520. "msg": e.toString()
  521. }
  522. console.log(`search result error: ${JSON.stringify(ret)}`);
  523. return ret;
  524. }
  525. }