invidious-experimenting/src/invidious/playlists.cr

# A single entry of a playlist, as built by `extract_playlist` in this file.
#
# `extract_playlist` constructs instances positionally in the field order
# declared below, so the order of the mapping entries matters to callers.
# As populated there: `published` is the time of extraction (`Time.now`),
# `playlists` is a one-element array holding the playlist id, and `index`
# is the starting index plus the row's offset in the scraped node set.
#
# NOTE(review): `add_mapping` is defined outside this file; presumably it
# generates the properties and the positional initializer — confirm.
class PlaylistVideo
  add_mapping({
    title:          String,
    id:             String,
    author:         String,
    ucid:           String,
    length_seconds: Int32,
    published:      Time,
    playlists:      Array(String),
    index:          Int32,
  })
end

# Metadata describing a playlist, as scraped by `fetch_playlist` in this file.
#
# `fetch_playlist` constructs instances positionally in the field order
# declared below, so the order of the mapping entries matters to callers.
# As populated there: `author_thumbnail` is an empty string when no profile
# image is found on the page, and `views` is 0 when the page shows no count.
#
# NOTE(review): `add_mapping` is defined outside this file; presumably it
# generates the properties and the positional initializer — confirm.
class Playlist
  add_mapping({
    title:            String,
    id:               String,
    author:           String,
    author_thumbnail: String,
    ucid:             String,
    description:      String,
    description_html: String,
    video_count:      Int32,
    views:            Int64,
    updated:          Time,
  })
end

# Fetches the videos of playlist `plid` for one page of results.
#
# plid         - playlist id, interpolated into the request URLs.
# page         - 1-based page number; the start index is `(page - 1) * 100`
#                when no continuation is given.
# video_count  - total number of videos in the playlist; selects the strategy:
#                more than 100 uses the `/browse_ajax` continuation endpoint,
#                otherwise the plain `/playlist` page is scraped.
# continuation - optional video id. When given, the start index is read from
#                the watch page of that video within the playlist.
#
# Returns an Array(PlaylistVideo).
# Raises "Playlist is empty" when the ajax response has no `content_html`.
def fetch_playlist_videos(plid, page, video_count, continuation = nil)
  client = make_client(YT_URL)

  # NOTE(review): `index` is only consumed by the `video_count > 100` branch,
  # so for small playlists the watch-page request below fetches a value that
  # is never used — consider moving it into that branch.
  if continuation
    html = client.get("/watch?v=#{continuation}&list=#{plid}&bpctr=#{Time.new.to_unix + 2000}&gl=US&hl=en&disable_polymer=1")
    html = XML.parse_html(html.body)

    # The page's current-index value is decremented by one before use;
    # fall back to 0 when the element is missing or not numeric.
    index = html.xpath_node(%q(//span[@id="playlist-current-index"])).try &.content.to_i?
    if index
      index -= 1
    end
    index ||= 0
  else
    index = (page - 1) * 100
  end

  if video_count > 100
    url = produce_playlist_url(plid, index)

    response = client.get(url)
    response = JSON.parse(response.body)
    if !response["content_html"]? || response["content_html"].as_s.empty?
      raise "Playlist is empty"
    end

    document = XML.parse_html(response["content_html"].as_s)
    nodeset = document.xpath_nodes(%q(.//tr[contains(@class, "pl-video")]))
    videos = extract_playlist(plid, nodeset, index)
  else
    # Playlist has less than one page of videos, so subsequent pages will be empty
    if page > 1
      videos = [] of PlaylistVideo
    else
      # Extract first page of videos
      response = client.get("/playlist?list=#{plid}&gl=US&hl=en&disable_polymer=1")
      document = XML.parse_html(response.body)
      nodeset = document.xpath_nodes(%q(.//tr[contains(@class, "pl-video")]))

      videos = extract_playlist(plid, nodeset, 0)
      if continuation
        # Drop every entry before the continuation video. Stop once the list
        # is drained: if the id is not on the page, `videos[0]` on an empty
        # array would raise IndexError, so an empty result is returned instead.
        until videos.empty? || videos[0].id == continuation
          videos.shift
        end
      end
    end
  end

  return videos
end

# Converts scraped playlist table rows into PlaylistVideo records.
#
# plid    - playlist id, stored as a one-element array on every record.
# nodeset - rows to scan; rows without a `pl-video-title` cell are skipped.
# index   - playlist position assigned to the first row of `nodeset`.
#
# Returns an Array(PlaylistVideo). A skipped row still consumes its position,
# because each record's index is `index` plus the row's offset in `nodeset`.
def extract_playlist(plid, nodeset, index)
  entries = [] of PlaylistVideo

  nodeset.each_with_index do |row, position|
    title_cell = row.xpath_node(%q(.//td[@class="pl-video-title"]))
    next unless title_cell

    # The title link supplies both the display title and the video id
    # (the 11 characters following "/watch?v=" in its href).
    link = title_cell.xpath_node(%q(.//a)).not_nil!
    title = link.content.strip(" \n")
    id = link["href"].lchop("/watch?v=")[0, 11]

    # Author details are left blank when the row has no owner link.
    owner = title_cell.xpath_node(%q(.//div[@class="pl-video-owner"]/a))
    author = owner ? owner.content : ""
    ucid = owner ? owner["href"].split("/")[2] : ""

    # A missing or empty duration cell yields a length of zero.
    duration = row.xpath_node(%q(.//td[@class="pl-video-time"]/div/div[1])).try &.content
    length_seconds = 0
    if duration && !duration.empty?
      length_seconds = decode_length_seconds(duration)
    end

    entries << PlaylistVideo.new(
      title,
      id,
      author,
      ucid,
      length_seconds,
      Time.now,
      [plid],
      index + position,
    )
  end

  entries
end

# Builds the relative `/browse_ajax?continuation=...` URL that
# `fetch_playlist_videos` requests to load playlist entries starting at `index`.
#
# id    - playlist id; an id starting with "UC" has that prefix replaced by "UU".
# index - start position, encoded into the token via `write_var_int`.
#
# Returns the URL path and query as a String.
#
# NOTE(review): the tag byte / length / payload layout below looks like
# hand-rolled protobuf encoding — confirm against `write_var_int` (defined
# outside this file) and the expected continuation format.
def produce_playlist_url(id, index)
  # Same "UC" -> "UU" rewrite that fetch_playlist applies
  # (presumably channel id -> uploads playlist id; verify).
  if id.starts_with? "UC"
    id = "UU" + id.lchop("UC")
  end
  ucid = "VL" + id

  # Inner payload: byte 0x08 followed by the var-int bytes of `index`,
  # Base64-encoded (second argument `false` — presumably disables padding)
  # and prefixed with "PT:".
  meta = [0x08_u8] + write_var_int(index)
  meta = Slice.new(meta.to_unsafe, meta.size)
  meta = Base64.urlsafe_encode(meta, false)
  meta = "PT:#{meta}"

  # Wrap the payload as: 0x7a, one length character, payload.
  # NOTE(review): the length is appended as a single character via
  # `unsafe_chr`; presumably lengths stay below 128 so it remains one byte.
  wrapped = "\x7a"
  wrapped += meta.bytes.size.unsafe_chr
  wrapped += meta

  wrapped = Base64.urlsafe_encode(wrapped)
  meta = URI.escape(wrapped)

  # Outer message: 0x12 + length + "VL"-prefixed id, then 0x1a + length +
  # the escaped, Base64-encoded wrapper from above.
  # NOTE(review): the id length uses `size` (characters) while the other
  # lengths use `bytes.size`; identical only for single-byte characters.
  continuation = "\x12"
  continuation += ucid.size.unsafe_chr
  continuation += ucid
  continuation += "\x1a"
  continuation += meta.bytes.size.unsafe_chr
  continuation += meta

  # Prefix the message with its length, then with a fixed 5-byte header
  # whose meaning is not visible in this file.
  continuation = continuation.size.to_u8.unsafe_chr + continuation
  continuation = "\xe2\xa9\x85\xb2\x02" + continuation

  continuation = Base64.urlsafe_encode(continuation)
  continuation = URI.escape(continuation)

  url = "/browse_ajax?continuation=#{continuation}"

  return url
end

# Scrapes the metadata of playlist `plid` from the YouTube playlist page
# (requested with `disable_polymer=1`) and returns it as a `Playlist`.
#
# A `plid` starting with "UC" is rewritten to its "UU"-prefixed form first,
# and the rewritten id is the one stored on the returned `Playlist`.
#
# Raises "Invalid playlist." when the response status is not 200 and
# "Playlist does not exist." when the page has no `pl-header-title` heading.
# The `not_nil!` lookups raise if the expected header markup is missing.
def fetch_playlist(plid)
  client = make_client(YT_URL)

  if plid.starts_with? "UC"
    plid = "UU#{plid.lchop("UC")}"
  end

  response = client.get("/playlist?list=#{plid}&hl=en&disable_polymer=1")
  if response.status_code != 200
    raise "Invalid playlist."
  end

  # Remove the description expander's 'less' button markup before parsing,
  # so its text does not end up in the extracted description.
  body = response.body.gsub(%(
  <button class="yt-uix-button yt-uix-button-size-default yt-uix-button-link yt-uix-expander-head playlist-description-expander yt-uix-inlineedit-ignore-edit" type="button" onclick=";return false;"><span class="yt-uix-button-content">  less <img alt="" src="/yts/img/pixel-vfl3z5WfW.gif">
  </span></button>
  ), "")
  document = XML.parse_html(body)

  title = document.xpath_node(%q(//h1[@class="pl-header-title"]))
  if !title
    raise "Playlist does not exist."
  end
  title = title.content.strip(" \n")

  # Prefer the nested description node; fall back to the outer span when the
  # nested one is absent.
  description_html = document.xpath_node(%q(//span[@class="pl-header-description-text"]/div/div[1]))
  description_html ||= document.xpath_node(%q(//span[@class="pl-header-description-text"]))
  description_html, description = html_to_content(description_html)

  details = document.xpath_node(%q(//ul[@class="pl-header-details"])).not_nil!

  # The first details item links to the author; its text is the author name
  # and the last path segment of its href is the ucid.
  author_link = details.xpath_node(%q(.//li[1]/a)).not_nil!
  author = author_link.content
  ucid = author_link["href"].split("/")[-1]

  author_thumbnail = document.xpath_node(%q(//img[@class="channel-header-profile-image"])).try &.["src"]
  author_thumbnail ||= ""

  # Strip the label characters and separators so only digits remain. A label
  # without digits (assumed wording "No videos", mirroring the "No views"
  # handling below) leaves an empty string, which counts as 0 instead of
  # making `to_i` raise.
  video_count = details.xpath_node(%q(.//li[2])).not_nil!.content.delete("No videos, ")
  if video_count.empty?
    video_count = 0
  else
    video_count = video_count.to_i
  end

  views = details.xpath_node(%q(.//li[3])).not_nil!.content.delete("No views, ")
  if views.empty?
    views = 0_i64
  else
    views = views.to_i64
  end

  updated = details.xpath_node(%q(.//li[4])).not_nil!.content.lchop("Last updated on ").lchop("Updated ")
  updated = decode_date(updated)

  playlist = Playlist.new(
    title,
    plid,
    author,
    author_thumbnail,
    ucid,
    description,
    description_html,
    video_count,
    views,
    updated
  )

  return playlist
end

# Renders a playlist as an HTML fragment: a linked heading followed by a
# scrollable ordered list with one item per entry of `playlist["videos"]`.
#
# `playlist` must respond to `["playlistId"]`, `["title"]` and `["videos"]`
# (the latter convertible with `as_a`); each video is read through
# `["videoId"]`, `["title"]` and `["author"]`.
#
# Returns the markup as a String.
#
# NOTE(review): all values are interpolated into the markup as-is; nothing in
# this method escapes them — confirm callers supply safe content.
def template_playlist(playlist)
  list_id = playlist["playlistId"]

  String.build do |markup|
    markup << <<-END_HTML
    <h3>
      <a href="/playlist?list=#{list_id}">
        #{playlist["title"]}
      </a>
    </h3>
    <div class="pure-menu pure-menu-scrollable playlist-restricted">
      <ol class="pure-menu-list">
    END_HTML

    playlist["videos"].as_a.each do |entry|
      video_id = entry["videoId"]

      markup << <<-END_HTML
        <li class="pure-menu-item">
          <a href="/watch?v=#{video_id}&list=#{list_id}">
            <img style="width:100%;" src="/vi/#{video_id}/mqdefault.jpg">
            <p style="width:100%">#{entry["title"]}</p>
            <p>
                <b style="width: 100%">#{entry["author"]}</b>
            </p>
          </a>
        </li>
      END_HTML
    end

    markup << <<-END_HTML
      </ol>
    </div>
    <hr>
    END_HTML
  end
end
Add mixes 2018-09-28 23:12:35 -05:00			`class PlaylistVideo`
			`add_mapping({`
			`title: String,`
			`id: String,`
			`author: String,`
			`ucid: String,`
			`length_seconds: Int32,`
			`published: Time,`
			`playlists: Array(String),`
			`index: Int32,`
			`})`
			`end`

Add playlist page and endpoint 2018-08-15 10:22:36 -05:00			`class Playlist`
			`add_mapping({`
Add descriptionHtml to playlists 2018-09-04 19:27:10 -05:00			`title: String,`
			`id: String,`
			`author: String,`
Add author thumbnails to playlist endpoint 2018-09-25 10:28:40 -05:00			`author_thumbnail: String,`
Add descriptionHtml to playlists 2018-09-04 19:27:10 -05:00			`ucid: String,`
			`description: String,`
			`description_html: String,`
			`video_count: Int32,`
			`views: Int64,`
			`updated: Time,`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00			`})`
			`end`

Add playlist playback support 2018-10-07 21:11:33 -05:00			`def fetch_playlist_videos(plid, page, video_count, continuation = nil)`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00			`client = make_client(YT_URL)`
Add fix for playlists with less than 100 videos 2018-09-22 14:13:10 -05:00
Add playlist playback support 2018-10-07 21:11:33 -05:00			`if continuation`
Add support for Crystal 0.27.0 2018-11-04 09:37:12 -06:00			`html = client.get("/watch?v=#{continuation}&list=#{plid}&bpctr=#{Time.new.to_unix + 2000}&gl=US&hl=en&disable_polymer=1")`
Add playlist playback support 2018-10-07 21:11:33 -05:00			`html = XML.parse_html(html.body)`

			`index = html.xpath_node(%q(//span[@id="playlist-current-index"])).try &.content.to_i?`
			`if index`
			`index -= 1`
			`end`
			`index \|\|= 0`
			`else`
Add fix for playlists with less than 100 videos 2018-09-22 14:13:10 -05:00			`index = (page - 1) * 100`
Add playlist playback support 2018-10-07 21:11:33 -05:00			`end`

			`if video_count > 100`
Add fix for playlists with less than 100 videos 2018-09-22 14:13:10 -05:00			`url = produce_playlist_url(plid, index)`

			`response = client.get(url)`
			`response = JSON.parse(response.body)`
			`if !response["content_html"]? \|\| response["content_html"].as_s.empty?`
			`raise "Playlist is empty"`
			`end`

			`document = XML.parse_html(response["content_html"].as_s)`
			`nodeset = document.xpath_nodes(%q(.//tr[contains(@class, "pl-video")]))`
			`videos = extract_playlist(plid, nodeset, index)`
			`else`
Fix encoding of playlist index 2018-09-28 09:54:01 -05:00			`# Playlist has less than one page of videos, so subsequent pages will be empty`
Add fix for playlists with less than 100 videos 2018-09-22 14:13:10 -05:00			`if page > 1`
			`videos = [] of PlaylistVideo`
			`else`
Fix encoding of playlist index 2018-09-28 09:54:01 -05:00			`# Extract first page of videos`
Add host language to YouTube requests 2018-09-25 17:55:32 -05:00			`response = client.get("/playlist?list=#{plid}&gl=US&hl=en&disable_polymer=1")`
Add fix for playlists with less than 100 videos 2018-09-22 14:13:10 -05:00			`document = XML.parse_html(response.body)`
			`nodeset = document.xpath_nodes(%q(.//tr[contains(@class, "pl-video")]))`

			`videos = extract_playlist(plid, nodeset, 0)`
Add fix for continuation on playlists smaller than 100 videos 2018-10-10 19:47:51 -05:00			`if continuation`
			`until videos[0].id == continuation`
			`videos.shift`
			`end`
			`end`
Add fix for playlists with less than 100 videos 2018-09-22 14:13:10 -05:00			`end`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00			`end`

Add fix for playlists with less than 100 videos 2018-09-22 14:13:10 -05:00			`return videos`
			`end`

			`def extract_playlist(plid, nodeset, index)`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00			`videos = [] of PlaylistVideo`

Add fix for playlists with less than 100 videos 2018-09-22 14:13:10 -05:00			`nodeset.each_with_index do \|video, offset\|`
			`anchor = video.xpath_node(%q(.//td[@class="pl-video-title"]))`
			`if !anchor`
			`next`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00			`end`
Add fix for playlists with less than 100 videos 2018-09-22 14:13:10 -05:00
			`title = anchor.xpath_node(%q(.//a)).not_nil!.content.strip(" \n")`
			`id = anchor.xpath_node(%q(.//a)).not_nil!["href"].lchop("/watch?v=")[0, 11]`

			`anchor = anchor.xpath_node(%q(.//div[@class="pl-video-owner"]/a))`
			`if anchor`
			`author = anchor.content`
			`ucid = anchor["href"].split("/")[2]`
			`else`
			`author = ""`
			`ucid = ""`
			`end`

			`anchor = video.xpath_node(%q(.//td[@class="pl-video-time"]/div/div[1]))`
			`if anchor && !anchor.content.empty?`
			`length_seconds = decode_length_seconds(anchor.content)`
			`else`
			`length_seconds = 0`
			`end`

			`videos << PlaylistVideo.new(`
			`title,`
			`id,`
			`author,`
			`ucid,`
			`length_seconds,`
			`Time.now,`
			`[plid],`
			`index + offset,`
			`)`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00			`end`

			`return videos`
			`end`

			`def produce_playlist_url(id, index)`
			`if id.starts_with? "UC"`
			`id = "UU" + id.lchop("UC")`
			`end`
			`ucid = "VL" + id`

Fix encoding of playlist index 2018-09-28 09:54:01 -05:00			`meta = [0x08_u8] + write_var_int(index)`
			`meta = Slice.new(meta.to_unsafe, meta.size)`
Refactor protocol buffers 2018-09-17 16:38:18 -05:00			`meta = Base64.urlsafe_encode(meta, false)`
			`meta = "PT:#{meta}"`

			`wrapped = "\x7a"`
			`wrapped += meta.bytes.size.unsafe_chr`
			`wrapped += meta`

			`wrapped = Base64.urlsafe_encode(wrapped)`
			`meta = URI.escape(wrapped)`

			`continuation = "\x12"`
			`continuation += ucid.size.unsafe_chr`
			`continuation += ucid`
			`continuation += "\x1a"`
			`continuation += meta.bytes.size.unsafe_chr`
			`continuation += meta`

			`continuation = continuation.size.to_u8.unsafe_chr + continuation`
			`continuation = "\xe2\xa9\x85\xb2\x02" + continuation`

			`continuation = Base64.urlsafe_encode(continuation)`
			`continuation = URI.escape(continuation)`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00
Add fix for playlists with less than 100 videos 2018-09-22 14:13:10 -05:00			`url = "/browse_ajax?continuation=#{continuation}"`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00
			`return url`
			`end`

			`def fetch_playlist(plid)`
			`client = make_client(YT_URL)`
Add fix for playlists with less than 100 videos 2018-09-22 14:13:10 -05:00
			`if plid.starts_with? "UC"`
			`plid = "UU#{plid.lchop("UC")}"`
			`end`

Add host language to YouTube requests 2018-09-25 17:55:32 -05:00			`response = client.get("/playlist?list=#{plid}&hl=en&disable_polymer=1")`
Add better error for invalid playlists 2018-09-23 12:26:12 -05:00			`if response.status_code != 200`
			`raise "Invalid playlist."`
			`end`

Add support for Crystal 0.27.0 2018-11-04 09:37:12 -06:00			`body = response.body.gsub(%(`
Remove 'less' button in playlist descriptions 2018-09-13 21:00:39 -05:00			`<button class="yt-uix-button yt-uix-button-size-default yt-uix-button-link yt-uix-expander-head playlist-description-expander yt-uix-inlineedit-ignore-edit" type="button" onclick=";return false;"><span class="yt-uix-button-content"> less <img alt="" src="/yts/img/pixel-vfl3z5WfW.gif">`
			`</span></button>`
Add support for Crystal 0.27.0 2018-11-04 09:37:12 -06:00			`), "")`
Remove 'less' button in playlist descriptions 2018-09-13 21:00:39 -05:00			`document = XML.parse_html(body)`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00
Add error for non-existent playlists 2018-09-23 12:32:32 -05:00			`title = document.xpath_node(%q(//h1[@class="pl-header-title"]))`
			`if !title`
			`raise "Playlist does not exist."`
			`end`
			`title = title.content.strip(" \n")`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00
Add descriptionHtml to playlists 2018-09-04 19:27:10 -05:00			`description_html = document.xpath_node(%q(//span[@class="pl-header-description-text"]/div/div[1]))`
Add fix for short playlist descriptions 2018-09-25 10:28:57 -05:00			`description_html \|\|= document.xpath_node(%q(//span[@class="pl-header-description-text"]))`
Remove 'less' button in playlist descriptions 2018-09-13 21:00:39 -05:00			`description_html, description = html_to_content(description_html)`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00
			`anchor = document.xpath_node(%q(//ul[@class="pl-header-details"])).not_nil!`
			`author = anchor.xpath_node(%q(.//li[1]/a)).not_nil!.content`
Add author thumbnails to playlist endpoint 2018-09-25 10:28:40 -05:00			`author_thumbnail = document.xpath_node(%q(//img[@class="channel-header-profile-image"])).try &.["src"]`
			`author_thumbnail \|\|= ""`
Fix index out of bounds for playlist ucid 2018-11-05 09:00:39 -06:00			`ucid = anchor.xpath_node(%q(.//li[1]/a)).not_nil!["href"].split("/")[-1]`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00
Fix playlist view extractor 2018-08-20 10:25:05 -05:00			`video_count = anchor.xpath_node(%q(.//li[2])).not_nil!.content.delete("videos, ").to_i`
Add fix for playlists with no views 2018-09-17 19:21:13 -05:00			`views = anchor.xpath_node(%q(.//li[3])).not_nil!.content.delete("No views, ")`
			`if views.empty?`
			`views = 0_i64`
			`else`
			`views = views.to_i64`
			`end`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00
			`updated = anchor.xpath_node(%q(.//li[4])).not_nil!.content.lchop("Last updated on ").lchop("Updated ")`
			`updated = decode_date(updated)`

			`playlist = Playlist.new(`
			`title,`
			`plid,`
			`author,`
Add author thumbnails to playlist endpoint 2018-09-25 10:28:40 -05:00			`author_thumbnail,`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00			`ucid,`
			`description,`
Add descriptionHtml to playlists 2018-09-04 19:27:10 -05:00			`description_html,`
Add playlist page and endpoint 2018-08-15 10:22:36 -05:00			`video_count,`
			`views,`
			`updated`
			`)`

			`return playlist`
			`end`
Add playlist playback support 2018-10-07 21:11:33 -05:00
			`def template_playlist(playlist)`
			`html = <<-END_HTML`
			`<h3>`
			`<a href="/playlist?list=#{playlist["playlistId"]}">`
			`#{playlist["title"]}`
			`</a>`
			`</h3>`
			`<div class="pure-menu pure-menu-scrollable playlist-restricted">`
			`<ol class="pure-menu-list">`
			`END_HTML`

			`playlist["videos"].as_a.each do \|video\|`
			`html += <<-END_HTML`
			`<li class="pure-menu-item">`
			`<a href="/watch?v=#{video["videoId"]}&list=#{playlist["playlistId"]}">`
			`<img style="width:100%;" src="/vi/#{video["videoId"]}/mqdefault.jpg">`
			`<p style="width:100%">#{video["title"]}</p>`
			`<p>`
			`<b style="width: 100%">#{video["author"]}</b>`
			`</p>`
			`</a>`
			`</li>`
			`END_HTML`
			`end`

			`html += <<-END_HTML`
			`</ol>`
			`</div>`
			`<hr>`
			`END_HTML`

			`html`
			`end`