# invidious-mod-JP/src/helpers.cr

macro add_mapping(mapping)
  def initialize({{*mapping.keys.map { |id| "@#{id}".id }}})
  end

  def to_a
    return [{{*mapping.keys.map { |id| "@#{id}".id }}}]
  end

  DB.mapping({{mapping}})
end
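
# Illustrative expansion (not part of the original file): a call like
# add_mapping({id: String}) generates roughly the following:
#
#   def initialize(@id)
#   end
#
#   def to_a
#     return [@id]
#   end
#
#   DB.mapping({id: String})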

macro templated(filename)
  render "src/views/#{{{filename}}}.ecr", "src/views/layout.ecr"
end

class Config
  YAML.mapping({
    pool_size: Int32,
    threads:   Int32,
    db: NamedTuple(
      user: String,
      password: String,
      host: String,
      port: Int32,
      dbname: String,
    ),
    dl_api_key: String?,
  })
end
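
# A matching config.yml might look like this (values below are placeholders,
# not from the original file; dl_api_key presumably keys the DetectLanguage
# calls in rank_videos and may be omitted):
#
#   pool_size: 10
#   threads: 5
#   db:
#     user: invidious
#     password: hunter2
#     host: localhost
#     port: 5432
#     dbname: invidious
#   dl_api_key: abc123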

class Video
  module HTTPParamConverter
    def self.from_rs(rs)
      HTTP::Params.parse(rs.read(String))
    end
  end

  add_mapping({
    id:   String,
    info: {
      type:      HTTP::Params,
      default:   HTTP::Params.parse(""),
      converter: Video::HTTPParamConverter,
    },
    updated:      Time,
    title:        String,
    views:        Int64,
    likes:        Int32,
    dislikes:     Int32,
    wilson_score: Float64,
    published:    Time,
    description:  String,
    language:     String?,
  })
end

class RedditSubmit
  JSON.mapping({
    data: RedditSubmitData,
  })
end

class RedditSubmitData
  JSON.mapping({
    children: Array(RedditThread),
  })
end

class RedditThread
  JSON.mapping({
    data: RedditThreadData,
  })
end

class RedditThreadData
  JSON.mapping({
    subreddit:    String,
    id:           String,
    num_comments: Int32,
    score:        Int32,
    author:       String,
    permalink:    String,
    title:        String,
  })
end

# See http://www.evanmiller.org/how-not-to-sort-by-average-rating.html
def ci_lower_bound(pos, n)
  if n == 0
    return 0.0
  end

  # z value here represents a confidence level of 0.95
  z = 1.96
  phat = 1.0*pos/n

  return (phat + z*z/(2*n) - z*Math.sqrt((phat*(1 - phat) + z*z/(4*n))/n))/(1 + z*z/n)
end
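
# Worked example (illustrative): 90 likes out of 100 ratings gives phat = 0.9,
# but the lower bound of the Wilson score interval is only about 0.826, and
# the same ratio backed by less data scores lower still:
#
#   ci_lower_bound(90, 100) # => ~0.826
#   ci_lower_bound(9, 10)   # => ~0.596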

def elapsed_text(elapsed)
  millis = elapsed.total_milliseconds
  return "#{millis.round(2)}ms" if millis >= 1

  "#{(millis * 1000).round(2)}µs"
end
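
# For example (illustrative): a 1.5 ms span formats as "1.5ms", while a
# 0.25 ms span falls below the threshold and formats as "250.0µs".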

def get_client(pool)
  while pool.empty?
    sleep rand(0..10).milliseconds
  end

  return pool.shift
end
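
# Checkout/return sketch (usage mirrors rank_videos below): take a client out
# of the shared pool, use it, and push it back so other fibers can proceed.
#
#   client = get_client(pool)
#   video = fetch_video(id, client)
#   pool << client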

def fetch_video(id, client)
  info = client.get("/get_video_info?video_id=#{id}&el=detailpage&ps=default&eurl=&gl=US&hl=en").body
  html = client.get("/watch?v=#{id}&bpctr=#{Time.new.epoch + 2000}").body

  html = XML.parse_html(html)
  info = HTTP::Params.parse(info)

  if info["reason"]?
    info = client.get("/get_video_info?video_id=#{id}&ps=default&eurl=&gl=US&hl=en").body
    info = HTTP::Params.parse(info)
    if info["reason"]?
      raise info["reason"]
    end
  end

  title = info["title"]
  views = info["view_count"].to_i64

  likes = html.xpath_node(%q(//button[@title="I like this"]/span))
  likes = likes.try &.content.delete(",").try &.to_i
  likes ||= 0

  dislikes = html.xpath_node(%q(//button[@title="I dislike this"]/span))
  dislikes = dislikes.try &.content.delete(",").try &.to_i
  dislikes ||= 0

  description = html.xpath_node(%q(//p[@id="eow-description"]))
  description = description ? description.to_xml : ""

  wilson_score = ci_lower_bound(likes, likes + dislikes)

  published = html.xpath_node(%q(//strong[contains(@class,"watch-time-text")]))
  if published
    published = published.content
  else
    raise "Could not find date published"
  end

  published = published.lchop("Published ")
  published = published.lchop("Started streaming ")
  published = published.lchop("Streamed live ")
  published = published.lchop("Uploaded ")
  published = published.lchop("on ")
  published = published.lchop("Scheduled for ")

  if !published.includes?("ago")
    published = Time.parse(published, "%b %-d, %Y")
  else
    # Time matches format "20 hours ago", "40 minutes ago"...
    delta = published.split(" ")[0].to_i
    case published
    when .includes? "minute"
      published = Time.now - delta.minutes
    when .includes? "hour"
      published = Time.now - delta.hours
    else
      raise "Could not parse #{published}"
    end
  end

  video = Video.new(id, info, Time.now, title, views, likes, dislikes, wilson_score, published, description, nil)

  return video
end

def get_video(id, client, db, refresh = true)
  if db.query_one?("SELECT EXISTS (SELECT true FROM videos WHERE id = $1)", id, as: Bool)
    video = db.query_one("SELECT * FROM videos WHERE id = $1", id, as: Video)

    # If the record was last updated over an hour ago, refresh it
    # (the expire param in the response lasts for 6 hours)
    if refresh && Time.now - video.updated > 1.hours
      db.exec("DELETE FROM videos * WHERE id = $1", id)
      video = fetch_video(id, client)
      args = arg_array(video.to_a)
      db.exec("INSERT INTO videos VALUES (#{args})", video.to_a)
    end
  else
    video = fetch_video(id, client)
    args = arg_array(video.to_a)
    db.exec("INSERT INTO videos VALUES (#{args})", video.to_a)
  end

  return video
end

def search(query, client)
  html = client.get("https://www.youtube.com/results?q=#{query}&sp=EgIQAVAU").body

  html = XML.parse_html(html)
  html.xpath_nodes(%q(//ol[@class="item-section"]/li)).each do |item|
    root = item.xpath_node(%q(div[contains(@class,"yt-lockup-video")]/div))
    if root
      link = root.xpath_node(%q(div[contains(@class,"yt-lockup-thumbnail")]/a/@href))
      if link
        yield link.content.split("=")[1]
      end
    end
  end
end
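
# Usage sketch (illustrative): the method yields the video id of each search
# result to the caller's block.
#
#   search(query, client) do |id|
#     puts id
#   end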

def splice(a, b)
  c = a[0]
  a[0] = a[b % a.size]
  a[b % a.size] = c
  return a
end

def decrypt_signature(a)
  a = a.split("")

  a = splice(a, 12)
  a = splice(a, 18)
  a.reverse!
  a.delete_at(0..2)
  a.reverse!
  a.delete_at(0..2)
  a = splice(a, 69)
  a.reverse!
  a.delete_at(0..2)

  return a.join("")
end
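
# Note (assumption, not stated in the original file): this fixed sequence of
# swaps, reversals, and slices mirrors the scrambling routine in YouTube's
# player JS at the time, so it breaks whenever the player updates and must be
# re-derived. A hypothetical use, where fmt holds a stream's parsed params:
#
#   url = "#{fmt["url"]}&signature=#{decrypt_signature(fmt["s"])}"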

def rank_videos(db, n, pool, filter)
  top = [] of {Float64, String}

  db.query("SELECT id, wilson_score, published FROM videos WHERE views > 5000 ORDER BY published DESC LIMIT 1000") do |rs|
    rs.each do
      id = rs.read(String)
      wilson_score = rs.read(Float64)
      published = rs.read(Time)

      # Exponential decay, older videos tend to rank lower
      temperature = wilson_score * Math.exp(-0.000005*((Time.now - published).total_minutes))
      top << {temperature, id}
    end
  end

  top.sort!

  # Make hottest come first
  top.reverse!

  top = top.map { |a, b| b }

  if filter
    language_list = [] of String

    top.each do |id|
      if language_list.size == n
        break
      else
        client = get_client(pool)

        begin
          video = get_video(id, client, db)
        rescue ex
          next
        ensure
          # Return the client to the pool even when fetching fails, so the
          # pool does not drain over time
          pool << client
        end

        if video.language
          language = video.language
        else
          description = XML.parse(video.description)
          content = [video.title, description.content].join(" ")
          content = content[0, 10000]

          results = DetectLanguage.detect(content)
          language = results[0].language

          db.exec("UPDATE videos SET language = $1 WHERE id = $2", language, id)
        end

        if language == "en"
          language_list << id
        end
      end
    end

    return language_list
  else
    return top[0..n - 1]
  end
end

def make_client(url)
  context = OpenSSL::SSL::Context::Client.new
  context.add_options(
    OpenSSL::SSL::Options::ALL |
    OpenSSL::SSL::Options::NO_SSL_V2 |
    OpenSSL::SSL::Options::NO_SSL_V3
  )

  client = HTTP::Client.new(url, context)
  client.read_timeout = 10.seconds
  client.connect_timeout = 10.seconds

  return client
end
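
# Usage sketch (illustrative): build a small pool of clients pointed at
# YouTube, of the kind passed to get_client and rank_videos above.
#
#   YT_URL = URI.parse("https://www.youtube.com")
#   pool = [] of HTTP::Client
#   10.times { pool << make_client(YT_URL) }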

def get_reddit_comments(id, client, headers)
  query = "(url:3D#{id}%20OR%20url:#{id})%20(site:youtube.com%20OR%20site:youtu.be)"
  search_results = client.get("/search.json?q=#{query}", headers)

  if search_results.status_code == 200
    search_results = RedditSubmit.from_json(search_results.body)

    thread = search_results.data.children.sort_by { |child| child.data.score }[-1]
    result = client.get("/r/#{thread.data.subreddit}/comments/#{thread.data.id}?limit=100&sort=top", headers).body
    result = JSON.parse(result)
  elsif search_results.status_code == 302
    search_results = client.get(search_results.headers["Location"], headers).body

    result = JSON.parse(search_results)
    thread = RedditThread.from_json(result[0]["data"]["children"][0].to_json)
  else
    raise "Got error code #{search_results.status_code}"
  end

  comments = result[1]["data"]["children"]

  return comments, thread
end

def template_comments(root)
  html = ""
  root.each do |child|
    if child["data"]["body_html"]?
      author = child["data"]["author"]
      score = child["data"]["score"]
      body_html = HTML.unescape(child["data"]["body_html"].as_s)

      # Replace local links with links back to Reddit
      body_html = fill_links(body_html, "https", "www.reddit.com")

      replies_html = ""
      if child["data"]["replies"] != ""
        replies_html = template_comments(child["data"]["replies"]["data"]["children"])
      end

      content = <<-END_HTML
      <p>
        <a href="javascript:void(0)" onclick="toggle(this)">[ - ]</a> #{score} <b>#{author}</b>
      </p>
      <div>
      #{body_html}
      #{replies_html}
      </div>
      END_HTML

      if child["data"]["depth"].as_i > 0
        html += <<-END_HTML
        <div class="pure-g">
          <div class="pure-u-1-24"></div>
          <div class="pure-u-23-24">
            #{content}
          </div>
        </div>
        END_HTML
      else
        html += <<-END_HTML
        <div class="pure-g">
          <div class="pure-u-1">
            #{content}
          </div>
        </div>
        END_HTML
      end
    end
  end

  return html
end
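
# Usage sketch (illustrative): render the comment tree fetched by
# get_reddit_comments above.
#
#   comments, thread = get_reddit_comments(id, client, headers)
#   content_html = template_comments(comments)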

def number_with_separator(number)
  number.to_s.reverse.gsub(/(\d{3})(?=\d)/, "\\1,").reverse
end
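
# For example: number_with_separator(1234567) # => "1,234,567"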

def arg_array(array)
  args = [] of String
  (1..array.size).each { |i| args << "($#{i})" }
  args = args.join(",")

  return args
end
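
# For example: arg_array([1, 2, 3]) # => "($1),($2),($3)", which get_video
# interpolates into "INSERT INTO videos VALUES (($1),($2),($3))"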

def add_alt_links(html)
  alt_links = [] of {Int32, String}

  # This is painful but is likely the only way to accomplish this in Crystal,
  # as Crystagiri and others are not able to insert XML Nodes into a document.
  # The goal here is to use as little regex as possible.
  html.scan(/<a[^>]*>([^<]+)<\/a>/) do |match|
    anchor = XML.parse_html(match[0])
    anchor = anchor.xpath_node("//a").not_nil!
    url = URI.parse(HTML.unescape(anchor["href"]))

    if ["www.youtube.com", "m.youtube.com"].includes?(url.host) && url.path == "/watch"
      alt_link = <<-END_HTML
      <a href="#{url.full_path}">
        <i class="fa fa-link" aria-hidden="true"></i>
      </a>
      END_HTML
    elsif url.host == "youtu.be"
      alt_link = <<-END_HTML
      <a href="/watch?v=#{url.full_path.lchop("/")}">
        <i class="fa fa-link" aria-hidden="true"></i>
      </a>
      END_HTML
    else
      alt_link = ""
    end

    alt_links << {match.end.not_nil!, alt_link}
  end

  # Insert from the end of the string backwards so earlier positions stay valid
  alt_links.reverse!
  alt_links.each do |position, alt_link|
    html = html.insert(position, alt_link)
  end

  return html
end

def fill_links(html, scheme, host)
  html = XML.parse_html(html)
  html.xpath_nodes("//a").each do |match|
    url = URI.parse(match["href"])

    if !url.host # Relative URL, i.e. a Reddit-local link
      url.scheme = scheme
      url.host = host
      match["href"] = url
    end
  end

  html = html.to_xml
end
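
# For example (illustrative, hypothetical permalink): fill_links rewrites
# <a href="/r/crystal/comments/abc123/"> to
# <a href="https://www.reddit.com/r/crystal/comments/abc123/">.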

def login_req(login_form, f_req)
  data = {
    "pstMsg"          => "1",
    "checkConnection" => "youtube",
    "checkedDomains"  => "youtube",
    "hl"              => "en",
    "deviceinfo"      => %q([null,null,null,[],null,"US",null,null,[],"GlifWebSignIn",null,[null,null,[]]]),
    "f.req"           => f_req,
    "flowName"        => "GlifWebSignIn",
    "flowEntry"       => "ServiceLogin",
  }

  data = data.merge(login_form)

  return HTTP::Params.encode(data)
end
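
# Note (assumption based on the parameter names above, not a documented API):
# the encoded body is meant to be POSTed as part of Google's GlifWebSignIn
# flow, with f_req and the hidden fields in login_form scraped from the
# sign-in page itself; this helper only fills in the constant parameters.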