2019-03-29 16:30:02 -05:00
|
|
|
struct PlaylistVideo
|
2019-06-08 13:31:41 -05:00
|
|
|
def to_json(locale, config, kemal_config, json : JSON::Builder)
|
|
|
|
json.object do
|
|
|
|
json.field "title", self.title
|
|
|
|
json.field "videoId", self.id
|
|
|
|
|
|
|
|
json.field "author", self.author
|
|
|
|
json.field "authorId", self.ucid
|
|
|
|
json.field "authorUrl", "/channel/#{self.ucid}"
|
|
|
|
|
|
|
|
json.field "videoThumbnails" do
|
|
|
|
generate_thumbnails(json, self.id, config, kemal_config)
|
|
|
|
end
|
|
|
|
|
|
|
|
json.field "index", self.index
|
|
|
|
json.field "lengthSeconds", self.length_seconds
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
def to_json(locale, config, kemal_config, json : JSON::Builder | Nil = nil)
|
|
|
|
if json
|
|
|
|
to_json(locale, config, kemal_config, json)
|
|
|
|
else
|
|
|
|
JSON.build do |json|
|
|
|
|
to_json(locale, config, kemal_config, json)
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
2019-04-03 11:35:58 -05:00
|
|
|
db_mapping({
|
2018-09-28 23:12:35 -05:00
|
|
|
title: String,
|
|
|
|
id: String,
|
|
|
|
author: String,
|
|
|
|
ucid: String,
|
|
|
|
length_seconds: Int32,
|
|
|
|
published: Time,
|
2019-06-07 20:23:37 -05:00
|
|
|
plid: String,
|
2018-09-28 23:12:35 -05:00
|
|
|
index: Int32,
|
2019-03-24 09:10:14 -05:00
|
|
|
live_now: Bool,
|
2018-09-28 23:12:35 -05:00
|
|
|
})
|
|
|
|
end
|
|
|
|
|
2019-03-29 16:30:02 -05:00
|
|
|
struct Playlist
|
2019-04-03 11:35:58 -05:00
|
|
|
db_mapping({
|
2018-09-04 19:27:10 -05:00
|
|
|
title: String,
|
|
|
|
id: String,
|
|
|
|
author: String,
|
2018-09-25 10:28:40 -05:00
|
|
|
author_thumbnail: String,
|
2018-09-04 19:27:10 -05:00
|
|
|
ucid: String,
|
|
|
|
description_html: String,
|
|
|
|
video_count: Int32,
|
|
|
|
views: Int64,
|
|
|
|
updated: Time,
|
2019-08-21 19:08:11 -05:00
|
|
|
thumbnail: String?,
|
2018-08-15 10:22:36 -05:00
|
|
|
})
|
|
|
|
end
|
|
|
|
|
2018-12-20 15:32:09 -06:00
|
|
|
def fetch_playlist_videos(plid, page, video_count, continuation = nil, locale = nil)
|
2018-08-15 10:22:36 -05:00
|
|
|
client = make_client(YT_URL)
|
2018-09-22 14:13:10 -05:00
|
|
|
|
2018-10-07 21:11:33 -05:00
|
|
|
if continuation
|
2018-11-10 10:50:09 -06:00
|
|
|
html = client.get("/watch?v=#{continuation}&list=#{plid}&gl=US&hl=en&disable_polymer=1&has_verified=1&bpctr=9999999999")
|
2018-10-07 21:11:33 -05:00
|
|
|
html = XML.parse_html(html.body)
|
|
|
|
|
|
|
|
index = html.xpath_node(%q(//span[@id="playlist-current-index"])).try &.content.to_i?
|
|
|
|
if index
|
|
|
|
index -= 1
|
|
|
|
end
|
|
|
|
index ||= 0
|
|
|
|
else
|
2018-09-22 14:13:10 -05:00
|
|
|
index = (page - 1) * 100
|
2018-10-07 21:11:33 -05:00
|
|
|
end
|
|
|
|
|
|
|
|
if video_count > 100
|
2018-09-22 14:13:10 -05:00
|
|
|
url = produce_playlist_url(plid, index)
|
|
|
|
|
|
|
|
response = client.get(url)
|
|
|
|
response = JSON.parse(response.body)
|
|
|
|
if !response["content_html"]? || response["content_html"].as_s.empty?
|
2019-04-19 18:14:11 +02:00
|
|
|
raise translate(locale, "Empty playlist")
|
2018-09-22 14:13:10 -05:00
|
|
|
end
|
|
|
|
|
|
|
|
document = XML.parse_html(response["content_html"].as_s)
|
|
|
|
nodeset = document.xpath_nodes(%q(.//tr[contains(@class, "pl-video")]))
|
|
|
|
videos = extract_playlist(plid, nodeset, index)
|
|
|
|
else
|
2018-09-28 09:54:01 -05:00
|
|
|
# Playlist has less than one page of videos, so subsequent pages will be empty
|
2018-09-22 14:13:10 -05:00
|
|
|
if page > 1
|
|
|
|
videos = [] of PlaylistVideo
|
|
|
|
else
|
2018-09-28 09:54:01 -05:00
|
|
|
# Extract first page of videos
|
2018-09-25 17:55:32 -05:00
|
|
|
response = client.get("/playlist?list=#{plid}&gl=US&hl=en&disable_polymer=1")
|
2018-09-22 14:13:10 -05:00
|
|
|
document = XML.parse_html(response.body)
|
|
|
|
nodeset = document.xpath_nodes(%q(.//tr[contains(@class, "pl-video")]))
|
|
|
|
|
|
|
|
videos = extract_playlist(plid, nodeset, 0)
|
2018-12-24 17:47:23 -06:00
|
|
|
|
2018-10-10 19:47:51 -05:00
|
|
|
if continuation
|
|
|
|
until videos[0].id == continuation
|
|
|
|
videos.shift
|
|
|
|
end
|
|
|
|
end
|
2018-09-22 14:13:10 -05:00
|
|
|
end
|
2018-08-15 10:22:36 -05:00
|
|
|
end
|
|
|
|
|
2018-09-22 14:13:10 -05:00
|
|
|
return videos
|
|
|
|
end
|
|
|
|
|
|
|
|
def extract_playlist(plid, nodeset, index)
|
2018-08-15 10:22:36 -05:00
|
|
|
videos = [] of PlaylistVideo
|
|
|
|
|
2018-09-22 14:13:10 -05:00
|
|
|
nodeset.each_with_index do |video, offset|
|
|
|
|
anchor = video.xpath_node(%q(.//td[@class="pl-video-title"]))
|
|
|
|
if !anchor
|
|
|
|
next
|
2018-08-15 10:22:36 -05:00
|
|
|
end
|
2018-09-22 14:13:10 -05:00
|
|
|
|
|
|
|
title = anchor.xpath_node(%q(.//a)).not_nil!.content.strip(" \n")
|
|
|
|
id = anchor.xpath_node(%q(.//a)).not_nil!["href"].lchop("/watch?v=")[0, 11]
|
|
|
|
|
|
|
|
anchor = anchor.xpath_node(%q(.//div[@class="pl-video-owner"]/a))
|
|
|
|
if anchor
|
|
|
|
author = anchor.content
|
|
|
|
ucid = anchor["href"].split("/")[2]
|
|
|
|
else
|
|
|
|
author = ""
|
|
|
|
ucid = ""
|
|
|
|
end
|
|
|
|
|
|
|
|
anchor = video.xpath_node(%q(.//td[@class="pl-video-time"]/div/div[1]))
|
|
|
|
if anchor && !anchor.content.empty?
|
|
|
|
length_seconds = decode_length_seconds(anchor.content)
|
2019-03-24 09:10:14 -05:00
|
|
|
live_now = false
|
2018-09-22 14:13:10 -05:00
|
|
|
else
|
|
|
|
length_seconds = 0
|
2019-03-24 09:10:14 -05:00
|
|
|
live_now = true
|
2018-09-22 14:13:10 -05:00
|
|
|
end
|
|
|
|
|
|
|
|
videos << PlaylistVideo.new(
|
2018-12-20 15:32:09 -06:00
|
|
|
title: title,
|
|
|
|
id: id,
|
|
|
|
author: author,
|
|
|
|
ucid: ucid,
|
|
|
|
length_seconds: length_seconds,
|
2019-06-07 20:23:37 -05:00
|
|
|
published: Time.utc,
|
|
|
|
plid: plid,
|
2018-12-20 15:32:09 -06:00
|
|
|
index: index + offset,
|
2019-03-24 09:10:14 -05:00
|
|
|
live_now: live_now
|
2018-09-22 14:13:10 -05:00
|
|
|
)
|
2018-08-15 10:22:36 -05:00
|
|
|
end
|
|
|
|
|
|
|
|
return videos
|
|
|
|
end
|
|
|
|
|
|
|
|
def produce_playlist_url(id, index)
|
|
|
|
if id.starts_with? "UC"
|
|
|
|
id = "UU" + id.lchop("UC")
|
|
|
|
end
|
|
|
|
ucid = "VL" + id
|
|
|
|
|
2019-07-20 20:18:08 -05:00
|
|
|
data = IO::Memory.new
|
|
|
|
data.write_byte 0x08
|
|
|
|
VarInt.to_io(data, index)
|
2019-02-04 15:17:10 -06:00
|
|
|
|
2019-07-20 20:18:08 -05:00
|
|
|
data.rewind
|
|
|
|
data = Base64.urlsafe_encode(data, false)
|
|
|
|
data = "PT:#{data}"
|
2018-09-17 16:38:18 -05:00
|
|
|
|
2019-02-04 15:17:10 -06:00
|
|
|
continuation = IO::Memory.new
|
2019-07-20 20:18:08 -05:00
|
|
|
continuation.write_byte 0x7a
|
|
|
|
VarInt.to_io(continuation, data.bytesize)
|
|
|
|
continuation.print data
|
2018-09-17 16:38:18 -05:00
|
|
|
|
2019-07-20 20:18:08 -05:00
|
|
|
data = Base64.urlsafe_encode(continuation)
|
2019-09-24 19:31:33 +02:00
|
|
|
cursor = URI.encode_www_form(data)
|
2018-09-17 16:38:18 -05:00
|
|
|
|
2019-07-20 20:18:08 -05:00
|
|
|
data = IO::Memory.new
|
|
|
|
|
|
|
|
data.write_byte 0x12
|
|
|
|
VarInt.to_io(data, ucid.bytesize)
|
|
|
|
data.print ucid
|
|
|
|
|
|
|
|
data.write_byte 0x1a
|
|
|
|
VarInt.to_io(data, cursor.bytesize)
|
|
|
|
data.print cursor
|
|
|
|
|
|
|
|
data.rewind
|
|
|
|
|
|
|
|
buffer = IO::Memory.new
|
|
|
|
buffer.write Bytes[0xe2, 0xa9, 0x85, 0xb2, 0x02]
|
|
|
|
VarInt.to_io(buffer, data.bytesize)
|
2018-09-17 16:38:18 -05:00
|
|
|
|
2019-07-20 20:18:08 -05:00
|
|
|
IO.copy data, buffer
|
2018-09-17 16:38:18 -05:00
|
|
|
|
2019-07-20 20:18:08 -05:00
|
|
|
continuation = Base64.urlsafe_encode(buffer)
|
2019-09-24 19:31:33 +02:00
|
|
|
continuation = URI.encode_www_form(continuation)
|
2018-08-15 10:22:36 -05:00
|
|
|
|
2019-07-20 20:18:08 -05:00
|
|
|
url = "/browse_ajax?continuation=#{continuation}&gl=US&hl=en"
|
2018-08-15 10:22:36 -05:00
|
|
|
|
|
|
|
return url
|
|
|
|
end
|
|
|
|
|
2018-12-20 15:32:09 -06:00
|
|
|
def fetch_playlist(plid, locale)
|
2018-08-15 10:22:36 -05:00
|
|
|
client = make_client(YT_URL)
|
2018-09-22 14:13:10 -05:00
|
|
|
|
|
|
|
if plid.starts_with? "UC"
|
|
|
|
plid = "UU#{plid.lchop("UC")}"
|
|
|
|
end
|
|
|
|
|
2018-09-25 17:55:32 -05:00
|
|
|
response = client.get("/playlist?list=#{plid}&hl=en&disable_polymer=1")
|
2018-09-23 12:26:12 -05:00
|
|
|
if response.status_code != 200
|
2019-04-19 18:14:11 +02:00
|
|
|
raise translate(locale, "Not a playlist.")
|
2018-09-23 12:26:12 -05:00
|
|
|
end
|
|
|
|
|
2019-01-04 22:48:00 -06:00
|
|
|
body = response.body.gsub(/<button[^>]+><span[^>]+>\s*less\s*<img[^>]+>\n<\/span><\/button>/, "")
|
2018-09-13 21:00:39 -05:00
|
|
|
document = XML.parse_html(body)
|
2018-08-15 10:22:36 -05:00
|
|
|
|
2018-09-23 12:32:32 -05:00
|
|
|
title = document.xpath_node(%q(//h1[@class="pl-header-title"]))
|
|
|
|
if !title
|
2018-12-20 15:32:09 -06:00
|
|
|
raise translate(locale, "Playlist does not exist.")
|
2018-09-23 12:32:32 -05:00
|
|
|
end
|
|
|
|
title = title.content.strip(" \n")
|
2018-08-15 10:22:36 -05:00
|
|
|
|
2019-06-08 15:08:27 -05:00
|
|
|
description_html = document.xpath_node(%q(//span[@class="pl-header-description-text"]/div/div[1])).try &.to_s ||
|
|
|
|
document.xpath_node(%q(//span[@class="pl-header-description-text"])).try &.to_s || ""
|
2018-08-15 10:22:36 -05:00
|
|
|
|
2019-08-21 19:08:11 -05:00
|
|
|
playlist_thumbnail = document.xpath_node(%q(//div[@class="pl-header-thumb"]/img)).try &.["data-thumb"]? ||
|
|
|
|
document.xpath_node(%q(//div[@class="pl-header-thumb"]/img)).try &.["src"]
|
|
|
|
|
2019-05-01 08:03:58 -05:00
|
|
|
# YouTube allows anonymous playlists, so most of this can be empty or optional
|
|
|
|
anchor = document.xpath_node(%q(//ul[@class="pl-header-details"]))
|
|
|
|
author = anchor.try &.xpath_node(%q(.//li[1]/a)).try &.content
|
|
|
|
author ||= ""
|
2018-09-25 10:28:40 -05:00
|
|
|
author_thumbnail = document.xpath_node(%q(//img[@class="channel-header-profile-image"])).try &.["src"]
|
|
|
|
author_thumbnail ||= ""
|
2019-05-01 08:03:58 -05:00
|
|
|
ucid = anchor.try &.xpath_node(%q(.//li[1]/a)).try &.["href"].split("/")[-1]
|
|
|
|
ucid ||= ""
|
2018-08-15 10:22:36 -05:00
|
|
|
|
2019-05-01 08:03:58 -05:00
|
|
|
video_count = anchor.try &.xpath_node(%q(.//li[2])).try &.content.gsub(/\D/, "").to_i?
|
|
|
|
video_count ||= 0
|
2019-08-21 19:08:11 -05:00
|
|
|
|
|
|
|
views = anchor.try &.xpath_node(%q(.//li[3])).try &.content.gsub(/\D/, "").to_i64?
|
2019-05-01 08:03:58 -05:00
|
|
|
views ||= 0_i64
|
|
|
|
|
2019-08-21 19:08:11 -05:00
|
|
|
updated = anchor.try &.xpath_node(%q(.//li[4])).try &.content.lchop("Last updated on ").lchop("Updated ").try { |date| decode_date(date) }
|
|
|
|
updated ||= Time.utc
|
2018-08-15 10:22:36 -05:00
|
|
|
|
|
|
|
playlist = Playlist.new(
|
2018-12-15 13:02:53 -06:00
|
|
|
title: title,
|
|
|
|
id: plid,
|
|
|
|
author: author,
|
|
|
|
author_thumbnail: author_thumbnail,
|
|
|
|
ucid: ucid,
|
|
|
|
description_html: description_html,
|
|
|
|
video_count: video_count,
|
|
|
|
views: views,
|
2019-08-21 19:08:11 -05:00
|
|
|
updated: updated,
|
|
|
|
thumbnail: playlist_thumbnail,
|
2018-08-15 10:22:36 -05:00
|
|
|
)
|
|
|
|
|
|
|
|
return playlist
|
|
|
|
end
|
2018-10-07 21:11:33 -05:00
|
|
|
|
|
|
|
def template_playlist(playlist)
|
|
|
|
html = <<-END_HTML
|
|
|
|
<h3>
|
|
|
|
<a href="/playlist?list=#{playlist["playlistId"]}">
|
|
|
|
#{playlist["title"]}
|
|
|
|
</a>
|
|
|
|
</h3>
|
|
|
|
<div class="pure-menu pure-menu-scrollable playlist-restricted">
|
|
|
|
<ol class="pure-menu-list">
|
|
|
|
END_HTML
|
|
|
|
|
|
|
|
playlist["videos"].as_a.each do |video|
|
|
|
|
html += <<-END_HTML
|
|
|
|
<li class="pure-menu-item">
|
|
|
|
<a href="/watch?v=#{video["videoId"]}&list=#{playlist["playlistId"]}">
|
2019-03-03 10:03:24 -06:00
|
|
|
<div class="thumbnail">
|
|
|
|
<img class="thumbnail" src="/vi/#{video["videoId"]}/mqdefault.jpg">
|
|
|
|
<p class="length">#{recode_length_seconds(video["lengthSeconds"].as_i)}</p>
|
|
|
|
</div>
|
2018-10-07 21:11:33 -05:00
|
|
|
<p style="width:100%">#{video["title"]}</p>
|
|
|
|
<p>
|
2019-05-01 20:03:39 -05:00
|
|
|
<b style="width:100%">#{video["author"]}</b>
|
2018-10-07 21:11:33 -05:00
|
|
|
</p>
|
|
|
|
</a>
|
|
|
|
</li>
|
|
|
|
END_HTML
|
|
|
|
end
|
|
|
|
|
|
|
|
html += <<-END_HTML
|
|
|
|
</ol>
|
|
|
|
</div>
|
|
|
|
<hr>
|
|
|
|
END_HTML
|
|
|
|
|
|
|
|
html
|
|
|
|
end
|