invidious-experimenting/src/invidious/playlists.cr

# A single video entry belonging to a playlist.
#
# As populated by `extract_playlist` in this file:
# - `playlists` holds the ID of the playlist the entry was scraped from
# - `index` is the starting index passed to the extractor plus the row offset
# - `published` is set to the time of extraction, not the upload date
# - `live_now` is true when no duration text was found for the row, in which
#   case `length_seconds` is 0
struct PlaylistVideo
  add_mapping({
    title:          String,
    id:             String,
    author:         String,
    ucid:           String,
    length_seconds: Int32,
    published:      Time,
    playlists:      Array(String),
    index:          Int32,
    live_now:       Bool,
  })
end

# Metadata describing a playlist, as scraped by `fetch_playlist` in this file.
#
# - `author_thumbnail` is an empty string when no profile image was found
# - `description` and `description_html` are both produced by
#   `html_to_content` from the same header node
# - `views` is 0 when the page reports no views
struct Playlist
  add_mapping({
    title:            String,
    id:               String,
    author:           String,
    author_thumbnail: String,
    ucid:             String,
    description:      String,
    description_html: String,
    video_count:      Int32,
    views:            Int64,
    updated:          Time,
  })
end

# Fetches one page of videos for the playlist `plid`.
#
# Parameters:
# - `plid`: playlist ID
# - `page`: 1-based page number; each page starts at `(page - 1) * 100`
# - `video_count`: total number of videos in the playlist; decides whether the
#   paginated `browse_ajax` endpoint or the plain playlist page is used
# - `continuation`: optional video ID. When given, the starting index is read
#   from that video's watch page instead of being derived from `page`
# - `locale`: passed to `translate` for the error message
#
# Returns an `Array(PlaylistVideo)`. For playlists of 100 videos or fewer, any
# page after the first is empty.
#
# Raises the translated "Playlist is empty" message when the paginated
# endpoint returns no `content_html`.
def fetch_playlist_videos(plid, page, video_count, continuation = nil, locale = nil)
  client = make_client(YT_URL)

  if continuation
    html = client.get("/watch?v=#{continuation}&list=#{plid}&gl=US&hl=en&disable_polymer=1&has_verified=1&bpctr=9999999999")
    html = XML.parse_html(html.body)

    # The watch page reports a 1-based position; convert it to a 0-based index
    # and fall back to the start of the playlist when it cannot be read.
    index = html.xpath_node(%q(//span[@id="playlist-current-index"])).try &.content.to_i?
    if index
      index -= 1
    end
    index ||= 0
  else
    index = (page - 1) * 100
  end

  if video_count > 100
    url = produce_playlist_url(plid, index)

    response = client.get(url)
    response = JSON.parse(response.body)
    if !response["content_html"]? || response["content_html"].as_s.empty?
      raise translate(locale, "Playlist is empty")
    end

    document = XML.parse_html(response["content_html"].as_s)
    nodeset = document.xpath_nodes(%q(.//tr[contains(@class, "pl-video")]))
    videos = extract_playlist(plid, nodeset, index)
  else
    # Playlist has less than one page of videos, so subsequent pages will be empty
    if page > 1
      videos = [] of PlaylistVideo
    else
      # Extract first page of videos
      response = client.get("/playlist?list=#{plid}&gl=US&hl=en&disable_polymer=1")
      document = XML.parse_html(response.body)
      nodeset = document.xpath_nodes(%q(.//tr[contains(@class, "pl-video")]))

      videos = extract_playlist(plid, nodeset, 0)

      if continuation
        # Drop every entry that precedes the continuation video. The emptiness
        # check keeps `videos[0]` from raising IndexError when the continuation
        # video is not part of this page; the result is then an empty list.
        until videos.empty? || videos[0].id == continuation
          videos.shift
        end
      end
    end
  end

  return videos
end

# Converts the playlist table rows in `nodeset` into `PlaylistVideo` records.
#
# `plid` is stored on every record as its only playlist, and `index` is the
# position of the first row; each record's index is `index` plus the row's
# offset within `nodeset`. Rows without a title cell are skipped, but still
# count towards the offset.
def extract_playlist(plid, nodeset, index)
  entries = [] of PlaylistVideo

  nodeset.each_with_index do |row, position|
    title_cell = row.xpath_node(%q(.//td[@class="pl-video-title"]))
    next unless title_cell

    # The first link inside the title cell carries both the title and the video ID
    link = title_cell.xpath_node(%q(.//a)).not_nil!
    title = link.content.strip(" \n")
    id = link["href"].lchop("/watch?v=")[0, 11]

    # The owner link may be missing; author fields are then left blank
    owner = title_cell.xpath_node(%q(.//div[@class="pl-video-owner"]/a))
    author, ucid = owner ? {owner.content, owner["href"].split("/")[2]} : {"", ""}

    # A row with no duration text is treated as a live stream
    duration = row.xpath_node(%q(.//td[@class="pl-video-time"]/div/div[1]))
    live_now = !(duration && !duration.content.empty?)
    length_seconds = 0
    if duration && !live_now
      length_seconds = decode_length_seconds(duration.content)
    end

    entries << PlaylistVideo.new(
      title: title,
      id: id,
      author: author,
      ucid: ucid,
      length_seconds: length_seconds,
      published: Time.now,
      playlists: [plid],
      index: index + position,
      live_now: live_now
    )
  end

  entries
end

# Builds the relative `/browse_ajax` URL used to request playlist videos
# starting at `index` for the playlist (or channel) `id`.
#
# The continuation token is assembled by hand from nested byte strings, each
# Base64-encoded before being embedded in the next layer.
# NOTE(review): the leading bytes look like protobuf field headers (a tag
# followed by a length) — confirm against the format the endpoint expects.
# NOTE(review): every length is written as a single byte, so this presumably
# relies on each payload staying short — TODO confirm.
def produce_playlist_url(id, index)
  # A leading "UC" is swapped for "UU" before the "VL" prefix is added
  if id.starts_with? "UC"
    id = "UU" + id.lchop("UC")
  end
  ucid = "VL" + id

  # Innermost layer: byte 0x08 followed by the encoded index.
  # `write_var_int` is defined elsewhere; presumably a varint encoder.
  meta = IO::Memory.new
  meta.write(Bytes[0x08])
  meta.write(write_var_int(index))

  meta.rewind
  # Second argument `false` presumably disables Base64 padding — verify
  meta = Base64.urlsafe_encode(meta.to_slice, false)
  meta = "PT:#{meta}"

  # Middle layer: byte 0x7a, the length of the "PT:..." string, then the string
  continuation = IO::Memory.new
  continuation.write(Bytes[0x7a, meta.size])
  continuation.print(meta)

  continuation.rewind
  meta = Base64.urlsafe_encode(continuation.to_slice)
  meta = URI.escape(meta)

  # Outer payload: the "VL"-prefixed ID (0x12) followed by the encoded
  # middle layer (0x1a), each preceded by its length
  continuation = IO::Memory.new
  continuation.write(Bytes[0x12, ucid.size])
  continuation.print(ucid)
  continuation.write(Bytes[0x1a, meta.size])
  continuation.print(meta)

  # Wrapper: a fixed five-byte header, the payload length, then the payload
  wrapper = IO::Memory.new
  wrapper.write(Bytes[0xe2, 0xa9, 0x85, 0xb2, 0x02, continuation.size])
  wrapper.print(continuation)
  wrapper.rewind

  wrapper = Base64.urlsafe_encode(wrapper.to_slice)
  wrapper = URI.escape(wrapper)

  url = "/browse_ajax?continuation=#{wrapper}&gl=US&hl=en"

  return url
end

# Fetches and scrapes the metadata of the playlist `plid`.
#
# Parameters:
# - `plid`: playlist ID; a leading "UC" is rewritten to "UU" before the request
# - `locale`: passed to `translate` for error messages
#
# Returns a `Playlist`.
#
# Raises the translated "Invalid playlist." message when the response status
# is not 200, and "Playlist does not exist." when the page has no title header.
# Missing header detail nodes still raise through `not_nil!`.
def fetch_playlist(plid, locale)
  client = make_client(YT_URL)

  if plid.starts_with? "UC"
    plid = "UU#{plid.lchop("UC")}"
  end

  response = client.get("/playlist?list=#{plid}&hl=en&disable_polymer=1")
  if response.status_code != 200
    raise translate(locale, "Invalid playlist.")
  end

  # Remove the "less" toggle button from the markup before parsing, so it is
  # not picked up as part of the description
  body = response.body.gsub(/<button[^>]+><span[^>]+>\s*less\s*<img[^>]+>\n<\/span><\/button>/, "")
  document = XML.parse_html(body)

  title = document.xpath_node(%q(//h1[@class="pl-header-title"]))
  if !title
    raise translate(locale, "Playlist does not exist.")
  end
  title = title.content.strip(" \n")

  # Prefer the nested description node; fall back to the outer span when the
  # nested one is absent
  description_html = document.xpath_node(%q(//span[@class="pl-header-description-text"]/div/div[1]))
  description_html ||= document.xpath_node(%q(//span[@class="pl-header-description-text"]))
  description_html, description = html_to_content(description_html)

  anchor = document.xpath_node(%q(//ul[@class="pl-header-details"])).not_nil!

  # The first detail item links to the author; look it up once for both fields
  author_link = anchor.xpath_node(%q(.//li[1]/a)).not_nil!
  author = author_link.content
  author_thumbnail = document.xpath_node(%q(//img[@class="channel-header-profile-image"])).try &.["src"]
  author_thumbnail ||= ""
  ucid = author_link["href"].split("/")[-1]

  # `delete` strips the listed characters, which leaves only digits for a
  # numeric count. Anything that is not a number (e.g. the leftover of
  # "No videos") is treated as 0 instead of raising from `to_i`.
  video_count = anchor.xpath_node(%q(.//li[2])).not_nil!.content.delete("videos, ").to_i? || 0
  views = anchor.xpath_node(%q(.//li[3])).not_nil!.content.delete("No views, ")
  if views.empty?
    views = 0_i64
  else
    views = views.to_i64
  end

  updated = anchor.xpath_node(%q(.//li[4])).not_nil!.content.lchop("Last updated on ").lchop("Updated ")
  updated = decode_date(updated)

  playlist = Playlist.new(
    title: title,
    id: plid,
    author: author,
    author_thumbnail: author_thumbnail,
    ucid: ucid,
    description: description,
    description_html: description_html,
    video_count: video_count,
    views: views,
    updated: updated
  )

  return playlist
end

# Renders the playlist sidebar markup for `playlist`.
#
# `playlist` is indexed by "playlistId", "title" and "videos"; each entry of
# "videos" is indexed by "videoId", "lengthSeconds", "title" and "author".
# Values are interpolated into the markup as-is.
#
# Returns the markup as a String: a heading linking to the playlist, one list
# item per video, and a closing rule.
def template_playlist(playlist)
  String.build do |markup|
    # Heading and list opener
    markup << <<-END_HTML
    <h3>
      <a href="/playlist?list=#{playlist["playlistId"]}">
        #{playlist["title"]}
      </a>
    </h3>
    <div class="pure-menu pure-menu-scrollable playlist-restricted">
      <ol class="pure-menu-list">
    END_HTML

    # One list item per video
    playlist["videos"].as_a.each do |entry|
      markup << <<-END_HTML
        <li class="pure-menu-item">
          <a href="/watch?v=#{entry["videoId"]}&list=#{playlist["playlistId"]}">
            <div class="thumbnail">
                <img class="thumbnail" src="/vi/#{entry["videoId"]}/mqdefault.jpg">
                <p class="length">#{recode_length_seconds(entry["lengthSeconds"].as_i)}</p>
            </div>
            <p style="width:100%">#{entry["title"]}</p>
            <p>
                <b style="width: 100%">#{entry["author"]}</b>
            </p>
          </a>
        </li>
      END_HTML
    end

    # List closer
    markup << <<-END_HTML
      </ol>
    </div>
    <hr>
    END_HTML
  end
end
Use struct for allocations 2019-03-30 03:00:02 +05:30			`struct PlaylistVideo`
Add mixes 2018-09-29 09:42:35 +05:30			`add_mapping({`
			`title: String,`
			`id: String,`
			`author: String,`
			`ucid: String,`
			`length_seconds: Int32,`
			`published: Time,`
			`playlists: Array(String),`
			`index: Int32,`
Add live now indicator to playlists 2019-03-24 19:40:14 +05:30			`live_now: Bool,`
Add mixes 2018-09-29 09:42:35 +05:30			`})`
			`end`

Use struct for allocations 2019-03-30 03:00:02 +05:30			`struct Playlist`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30			`add_mapping({`
Add descriptionHtml to playlists 2018-09-05 05:57:10 +05:30			`title: String,`
			`id: String,`
			`author: String,`
Add author thumbnails to playlist endpoint 2018-09-25 20:58:40 +05:30			`author_thumbnail: String,`
Add descriptionHtml to playlists 2018-09-05 05:57:10 +05:30			`ucid: String,`
			`description: String,`
			`description_html: String,`
			`video_count: Int32,`
			`views: Int64,`
			`updated: Time,`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30			`})`
			`end`

Add support for translations 2018-12-21 03:02:09 +05:30			`def fetch_playlist_videos(plid, page, video_count, continuation = nil, locale = nil)`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30			`client = make_client(YT_URL)`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30
Add playlist playback support 2018-10-08 07:41:33 +05:30			`if continuation`
Update info extractor 2018-11-10 22:20:09 +05:30			`html = client.get("/watch?v=#{continuation}&list=#{plid}&gl=US&hl=en&disable_polymer=1&has_verified=1&bpctr=9999999999")`
Add playlist playback support 2018-10-08 07:41:33 +05:30			`html = XML.parse_html(html.body)`

			`index = html.xpath_node(%q(//span[@id="playlist-current-index"])).try &.content.to_i?`
			`if index`
			`index -= 1`
			`end`
			`index \|\|= 0`
			`else`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30			`index = (page - 1) * 100`
Add playlist playback support 2018-10-08 07:41:33 +05:30			`end`

			`if video_count > 100`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30			`url = produce_playlist_url(plid, index)`

			`response = client.get(url)`
			`response = JSON.parse(response.body)`
			`if !response["content_html"]? \|\| response["content_html"].as_s.empty?`
Add support for translations 2018-12-21 03:02:09 +05:30			`raise translate(locale, "Playlist is empty")`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30			`end`

			`document = XML.parse_html(response["content_html"].as_s)`
			`nodeset = document.xpath_nodes(%q(.//tr[contains(@class, "pl-video")]))`
			`videos = extract_playlist(plid, nodeset, index)`
			`else`
Fix encoding of playlist index 2018-09-28 20:24:01 +05:30			`# Playlist has less than one page of videos, so subsequent pages will be empty`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30			`if page > 1`
			`videos = [] of PlaylistVideo`
			`else`
Fix encoding of playlist index 2018-09-28 20:24:01 +05:30			`# Extract first page of videos`
Add host language to YouTube requests 2018-09-26 04:25:32 +05:30			`response = client.get("/playlist?list=#{plid}&gl=US&hl=en&disable_polymer=1")`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30			`document = XML.parse_html(response.body)`
			`nodeset = document.xpath_nodes(%q(.//tr[contains(@class, "pl-video")]))`

			`videos = extract_playlist(plid, nodeset, 0)`
Fix param ordering for fetch_playlist_videos 2018-12-25 05:17:23 +05:30
Add fix for continuation on playlists smaller than 100 videos 2018-10-11 06:17:51 +05:30			`if continuation`
			`until videos[0].id == continuation`
			`videos.shift`
			`end`
			`end`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30			`end`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30			`end`

Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30			`return videos`
			`end`

			`def extract_playlist(plid, nodeset, index)`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30			`videos = [] of PlaylistVideo`

Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30			`nodeset.each_with_index do \|video, offset\|`
			`anchor = video.xpath_node(%q(.//td[@class="pl-video-title"]))`
			`if !anchor`
			`next`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30			`end`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30
			`title = anchor.xpath_node(%q(.//a)).not_nil!.content.strip(" \n")`
			`id = anchor.xpath_node(%q(.//a)).not_nil!["href"].lchop("/watch?v=")[0, 11]`

			`anchor = anchor.xpath_node(%q(.//div[@class="pl-video-owner"]/a))`
			`if anchor`
			`author = anchor.content`
			`ucid = anchor["href"].split("/")[2]`
			`else`
			`author = ""`
			`ucid = ""`
			`end`

			`anchor = video.xpath_node(%q(.//td[@class="pl-video-time"]/div/div[1]))`
			`if anchor && !anchor.content.empty?`
			`length_seconds = decode_length_seconds(anchor.content)`
Add live now indicator to playlists 2019-03-24 19:40:14 +05:30			`live_now = false`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30			`else`
			`length_seconds = 0`
Add live now indicator to playlists 2019-03-24 19:40:14 +05:30			`live_now = true`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30			`end`

			`videos << PlaylistVideo.new(`
Add support for translations 2018-12-21 03:02:09 +05:30			`title: title,`
			`id: id,`
			`author: author,`
			`ucid: ucid,`
			`length_seconds: length_seconds,`
			`published: Time.now,`
			`playlists: [plid],`
			`index: index + offset,`
Add live now indicator to playlists 2019-03-24 19:40:14 +05:30			`live_now: live_now`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30			`)`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30			`end`

			`return videos`
			`end`

			`def produce_playlist_url(id, index)`
			`if id.starts_with? "UC"`
			`id = "UU" + id.lchop("UC")`
			`end`
			`ucid = "VL" + id`

Use IO::Memory for creating continuation tokens 2019-02-05 02:47:10 +05:30			`meta = IO::Memory.new`
			`meta.write(Bytes[0x08])`
			`meta.write(write_var_int(index))`

			`meta.rewind`
			`meta = Base64.urlsafe_encode(meta.to_slice, false)`
Refactor protocol buffers 2018-09-18 03:08:18 +05:30			`meta = "PT:#{meta}"`

Use IO::Memory for creating continuation tokens 2019-02-05 02:47:10 +05:30			`continuation = IO::Memory.new`
			`continuation.write(Bytes[0x7a, meta.size])`
			`continuation.print(meta)`
Refactor protocol buffers 2018-09-18 03:08:18 +05:30
Use IO::Memory for creating continuation tokens 2019-02-05 02:47:10 +05:30			`continuation.rewind`
			`meta = Base64.urlsafe_encode(continuation.to_slice)`
			`meta = URI.escape(meta)`
Refactor protocol buffers 2018-09-18 03:08:18 +05:30
Use IO::Memory for creating continuation tokens 2019-02-05 02:47:10 +05:30			`continuation = IO::Memory.new`
			`continuation.write(Bytes[0x12, ucid.size])`
			`continuation.print(ucid)`
			`continuation.write(Bytes[0x1a, meta.size])`
			`continuation.print(meta)`
Refactor protocol buffers 2018-09-18 03:08:18 +05:30
Use IO::Memory for creating continuation tokens 2019-02-05 02:47:10 +05:30			`wrapper = IO::Memory.new`
			`wrapper.write(Bytes[0xe2, 0xa9, 0x85, 0xb2, 0x02, continuation.size])`
			`wrapper.print(continuation)`
			`wrapper.rewind`
Refactor protocol buffers 2018-09-18 03:08:18 +05:30
Use IO::Memory for creating continuation tokens 2019-02-05 02:47:10 +05:30			`wrapper = Base64.urlsafe_encode(wrapper.to_slice)`
			`wrapper = URI.escape(wrapper)`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30
Use IO::Memory for creating continuation tokens 2019-02-05 02:47:10 +05:30			`url = "/browse_ajax?continuation=#{wrapper}&gl=US&hl=en"`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30
			`return url`
			`end`

Add support for translations 2018-12-21 03:02:09 +05:30			`def fetch_playlist(plid, locale)`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30			`client = make_client(YT_URL)`
Add fix for playlists with less than 100 videos 2018-09-23 00:43:10 +05:30
			`if plid.starts_with? "UC"`
			`plid = "UU#{plid.lchop("UC")}"`
			`end`

Add host language to YouTube requests 2018-09-26 04:25:32 +05:30			`response = client.get("/playlist?list=#{plid}&hl=en&disable_polymer=1")`
Add better error for invalid playlists 2018-09-23 22:56:12 +05:30			`if response.status_code != 200`
Add support for translations 2018-12-21 03:02:09 +05:30			`raise translate(locale, "Invalid playlist.")`
Add better error for invalid playlists 2018-09-23 22:56:12 +05:30			`end`

Improve playlist description extractor 2019-01-05 10:18:00 +05:30			`body = response.body.gsub(/<button[^>]+><span[^>]+>\sless\s<img[^>]+>\n<\/span><\/button>/, "")`
Remove 'less' button in playlist descriptions 2018-09-14 07:30:39 +05:30			`document = XML.parse_html(body)`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30
Add error for non-existent playlists 2018-09-23 23:02:32 +05:30			`title = document.xpath_node(%q(//h1[@class="pl-header-title"]))`
			`if !title`
Add support for translations 2018-12-21 03:02:09 +05:30			`raise translate(locale, "Playlist does not exist.")`
Add error for non-existent playlists 2018-09-23 23:02:32 +05:30			`end`
			`title = title.content.strip(" \n")`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30
Add descriptionHtml to playlists 2018-09-05 05:57:10 +05:30			`description_html = document.xpath_node(%q(//span[@class="pl-header-description-text"]/div/div[1]))`
Add fix for short playlist descriptions 2018-09-25 20:58:57 +05:30			`description_html \|\|= document.xpath_node(%q(//span[@class="pl-header-description-text"]))`
Remove 'less' button in playlist descriptions 2018-09-14 07:30:39 +05:30			`description_html, description = html_to_content(description_html)`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30
			`anchor = document.xpath_node(%q(//ul[@class="pl-header-details"])).not_nil!`
			`author = anchor.xpath_node(%q(.//li[1]/a)).not_nil!.content`
Add author thumbnails to playlist endpoint 2018-09-25 20:58:40 +05:30			`author_thumbnail = document.xpath_node(%q(//img[@class="channel-header-profile-image"])).try &.["src"]`
			`author_thumbnail \|\|= ""`
Fix index out of bounds for playlist ucid 2018-11-05 20:30:39 +05:30			`ucid = anchor.xpath_node(%q(.//li[1]/a)).not_nil!["href"].split("/")[-1]`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30
Fix playlist view extractor 2018-08-20 20:55:05 +05:30			`video_count = anchor.xpath_node(%q(.//li[2])).not_nil!.content.delete("videos, ").to_i`
Add fix for playlists with no views 2018-09-18 05:51:13 +05:30			`views = anchor.xpath_node(%q(.//li[3])).not_nil!.content.delete("No views, ")`
			`if views.empty?`
			`views = 0_i64`
			`else`
			`views = views.to_i64`
			`end`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30
			`updated = anchor.xpath_node(%q(.//li[4])).not_nil!.content.lchop("Last updated on ").lchop("Updated ")`
			`updated = decode_date(updated)`

			`playlist = Playlist.new(`
Use named params for SearchChannel 2018-12-16 00:32:53 +05:30			`title: title,`
			`id: plid,`
			`author: author,`
			`author_thumbnail: author_thumbnail,`
			`ucid: ucid,`
			`description: description,`
			`description_html: description_html,`
			`video_count: video_count,`
			`views: views,`
			`updated: updated`
Add playlist page and endpoint 2018-08-15 20:52:36 +05:30			`)`

			`return playlist`
			`end`
Add playlist playback support 2018-10-08 07:41:33 +05:30
			`def template_playlist(playlist)`
			`html = <<-END_HTML`
			`<h3>`
			`<a href="/playlist?list=#{playlist["playlistId"]}">`
			`#{playlist["title"]}`
			`</a>`
			`</h3>`
			`<div class="pure-menu pure-menu-scrollable playlist-restricted">`
			`<ol class="pure-menu-list">`
			`END_HTML`

			`playlist["videos"].as_a.each do \|video\|`
			`html += <<-END_HTML`
			`<li class="pure-menu-item">`
			`<a href="/watch?v=#{video["videoId"]}&list=#{playlist["playlistId"]}">`
Add length_seconds to playlist on watch page 2019-03-03 21:33:24 +05:30			`<div class="thumbnail">`
			`<img class="thumbnail" src="/vi/#{video["videoId"]}/mqdefault.jpg">`
			`<p class="length">#{recode_length_seconds(video["lengthSeconds"].as_i)}</p>`
			`</div>`
Add playlist playback support 2018-10-08 07:41:33 +05:30			`<p style="width:100%">#{video["title"]}</p>`
			`<p>`
			`<b style="width: 100%">#{video["author"]}</b>`
			`</p>`
			`</a>`
			`</li>`
			`END_HTML`
			`end`

			`html += <<-END_HTML`
			`</ol>`
			`</div>`
			`<hr>`
			`END_HTML`

			`html`
			`end`