require "./macros"

struct Nonce
  include DB::Serializable

  property nonce : String
  property expire : Time
end

struct SessionId
  include DB::Serializable

  property id : String
  property email : String
  property issued : String
end

struct Annotation
  include DB::Serializable

  property id : String
  property annotations : String
end

struct ConfigPreferences
  include YAML::Serializable

  property annotations : Bool = false
  property annotations_subscribed : Bool = false
  property autoplay : Bool = false
  property captions : Array(String) = ["", "", ""]
  property comments : Array(String) = ["youtube", ""]
  property continue : Bool = false
  property continue_autoplay : Bool = true
  property dark_mode : String = ""
  property latest_only : Bool = false
  property listen : Bool = false
  property local : Bool = false
  property locale : String = "en-US"
  property max_results : Int32 = 40
  property notifications_only : Bool = false
  property player_style : String = "invidious"
  property quality : String = "hd720"
  property quality_dash : String = "auto"
  property default_home : String? = "Popular"
  property feed_menu : Array(String) = ["Popular", "Trending", "Subscriptions", "Playlists"]
  property related_videos : Bool = true
  property sort : String = "published"
  property speed : Float32 = 1.0_f32
  property thin_mode : Bool = false
  property unseen_only : Bool = false
  property video_loop : Bool = false
  property extend_desc : Bool = false
  property volume : Int32 = 100
  property vr_mode : Bool = true
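
  # Expands at compile time into a NamedTuple containing every preference,
  # keyed by field name. A minimal usage sketch (field list abridged):
  #
  # ```
  # prefs = ConfigPreferences.from_yaml("")
  # prefs.to_tuple # => {annotations: false, annotations_subscribed: false, ...}
  # ```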
  def to_tuple
    {% begin %}
      {
        {{*@type.instance_vars.map { |var| "#{var.name}: #{var.name}".id }}}
      }
    {% end %}
  end
end

class Config
  include YAML::Serializable

  property channel_threads : Int32 = 1 # Number of threads to use for crawling videos from channels (for updating subscriptions)
  property feed_threads : Int32 = 1 # Number of threads to use for updating feeds
  property output : String = "STDOUT" # Log file path or STDOUT
  property log_level : LogLevel = LogLevel::Info # Default log level, valid YAML values are ints and strings, see src/invidious/helpers/logger.cr
  property db : DBConfig? = nil # Database configuration with separate parameters (username, hostname, etc)

  @[YAML::Field(converter: Preferences::URIConverter)]
  property database_url : URI = URI.parse("") # Database configuration using 12-Factor "Database URL" syntax
  property decrypt_polling : Bool = true # Use polling to keep decryption function up to date
  property full_refresh : Bool = false # Used for crawling channels: threads should check all videos uploaded by a channel
  property https_only : Bool? # Used to tell Invidious it is behind a proxy, so links to resources should be https://
  property hmac_key : String? # HMAC signing key for CSRF tokens and verifying pubsub subscriptions
  property domain : String? # Domain to be used for links to resources on the site where an absolute URL is required
  property use_pubsub_feeds : Bool | Int32 = false # Subscribe to channels using PubSubHubbub (requires domain, hmac_key)
  property popular_enabled : Bool = true
  property captcha_enabled : Bool = true
  property login_enabled : Bool = true
  property registration_enabled : Bool = true
  property statistics_enabled : Bool = false
  property admins : Array(String) = [] of String
  property external_port : Int32? = nil
  property default_user_preferences : ConfigPreferences = ConfigPreferences.from_yaml("")
  property dmca_content : Array(String) = [] of String # For compliance with DMCA, disables download widget using list of video IDs
  property check_tables : Bool = false # Check table integrity, automatically try to add any missing columns, create tables, etc.
  property cache_annotations : Bool = false # Cache annotations requested from IA, will not cache empty annotations or annotations that only contain cards
  property banner : String? = nil # Optional banner to be displayed along top of page for announcements, etc.
  property hsts : Bool? = true # Enables 'Strict-Transport-Security'. Ensure that `domain` and all subdomains are served securely
  property disable_proxy : Bool? | Array(String)? = false # Disable proxying server-wide: options: 'dash', 'livestreams', 'downloads', 'local'

  @[YAML::Field(converter: Preferences::FamilyConverter)]
  property force_resolve : Socket::Family = Socket::Family::UNSPEC # Connect to YouTube over 'ipv6' or 'ipv4'; can sometimes fix rate-limiting issues (see https://github.com/ytdl-org/youtube-dl/issues/21729)
  property port : Int32 = 3000 # Port to listen for connections (overridden by command line argument)
  property host_binding : String = "0.0.0.0" # Host to bind (overridden by command line argument)
  property pool_size : Int32 = 100 # Pool size for HTTP requests to youtube.com and ytimg.com (each domain has a separate pool of `pool_size`)
  property use_quic : Bool = true # Use QUIC transport for the YouTube API

  @[YAML::Field(converter: Preferences::StringToCookies)]
  property cookies : HTTP::Cookies = HTTP::Cookies.new # Saved cookies in "name1=value1; name2=value2..." format
  property captcha_key : String? = nil # Key for Anti-Captcha
  property captcha_api_url : String = "https://api.anti-captcha.com" # API URL for Anti-Captcha
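
  # Returns whether proxying is disabled for the given *option*
  # (`disable_proxy` may be a Bool or a list of feature names).
  # A minimal usage sketch, assuming `CONFIG` is the loaded instance:
  #
  # ```
  # CONFIG.disabled?("downloads") # => true when disable_proxy is true or includes "downloads"
  # ```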
  def disabled?(option)
    case disabled = CONFIG.disable_proxy
    when Bool
      return disabled
    when Array
      if disabled.includes? option
        return true
      else
        return false
      end
    else
      return false
    end
  end
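
  # Builds the runtime configuration from `config/config.yml` (or the
  # `INVIDIOUS_CONFIG` / `INVIDIOUS_CONFIG_FILE` env vars) and then applies
  # any `INVIDIOUS_*`-prefixed environment overrides. An illustrative
  # override (values are examples only):
  #
  # ```text
  # INVIDIOUS_PORT=8080 INVIDIOUS_STATISTICS_ENABLED=true ./invidious
  # ```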
  def self.load
    # Load config from file or YAML string env var
    env_config_file = "INVIDIOUS_CONFIG_FILE"
    env_config_yaml = "INVIDIOUS_CONFIG"

    config_file = ENV.has_key?(env_config_file) ? ENV.fetch(env_config_file) : "config/config.yml"
    config_yaml = ENV.has_key?(env_config_yaml) ? ENV.fetch(env_config_yaml) : File.read(config_file)

    config = Config.from_yaml(config_yaml)

    # Update config from env vars (upcased and prefixed with "INVIDIOUS_")
    {% for ivar in Config.instance_vars %}
      {% env_id = "INVIDIOUS_#{ivar.id.upcase}" %}

      if ENV.has_key?({{env_id}})
        # puts %(Config.{{ivar.id}}: Loading from env var {{env_id}})
        env_value = ENV.fetch({{env_id}})
        success = false

        # Use YAML converter if specified
        {% ann = ivar.annotation(::YAML::Field) %}
        {% if ann && ann[:converter] %}
          puts %(Config.{{ivar.id}}: Parsing "#{env_value}" as {{ivar.type}} with {{ann[:converter]}} converter)
          config.{{ivar.id}} = {{ann[:converter]}}.from_yaml(YAML::ParseContext.new, YAML::Nodes.parse(ENV.fetch({{env_id}})).nodes[0])
          puts %(Config.{{ivar.id}}: Set to #{config.{{ivar.id}}})
          success = true

          # Use regular YAML parser otherwise
        {% else %}
          {% ivar_types = ivar.type.union? ? ivar.type.union_types : [ivar.type] %}
          # Sort types to avoid parsing nulls and numbers as strings
          {% ivar_types = ivar_types.sort_by { |ivar_type| ivar_type == Nil ? 0 : ivar_type == Int32 ? 1 : 2 } %}

          {{ivar_types}}.each do |ivar_type|
            if !success
              begin
                # puts %(Config.{{ivar.id}}: Trying to parse "#{env_value}" as #{ivar_type})
                config.{{ivar.id}} = ivar_type.from_yaml(env_value)
                puts %(Config.{{ivar.id}}: Set to #{config.{{ivar.id}}} (#{ivar_type}))
                success = true
              rescue
                # nop
              end
            end
          end
        {% end %}

        # Exit on fail
        if !success
          puts %(Config.{{ivar.id}} failed to parse #{env_value} as {{ivar.type}})
          exit(1)
        end
      end
    {% end %}

    # Build database_url from db.* if it's not set directly
    if config.database_url.to_s.empty?
      if db = config.db
        config.database_url = URI.new(
          scheme: "postgres",
          user: db.user,
          password: db.password,
          host: db.host,
          port: db.port,
          path: db.dbname,
        )
      else
        puts "Config: Either database_url or db.* is required"
        exit(1)
      end
    end

    return config
  end
end
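
# Per-field database settings. When `database_url` is left empty,
# `Config.load` assembles a postgres URI from these values. A sketch of the
# matching YAML (values are illustrative):
#
# ```yaml
# db:
#   user: postgres
#   password: secret
#   host: localhost
#   port: 5432
#   dbname: invidious
# ```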
struct DBConfig
  include YAML::Serializable

  property user : String
  property password : String
  property host : String
  property port : Int32
  property dbname : String
end
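
# Builds the URL-encoded form body POSTed during the Google account sign-in
# flow. `f_req` is the serialized request blob produced by the preceding
# login step; everything else is filled with the fixed values below.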
def login_req(f_req)
  data = {
    # Unfortunately there's not much information available on `bgRequest`; part of Google's BotGuard
    # Generally this is much longer (>1250 characters), see also
    # https://github.com/ytdl-org/youtube-dl/commit/baf67a604d912722b0fe03a40e9dc5349a2208cb .
    # For now this can be empty.
    "bgRequest"       => %|["identifier",""]|,
    "pstMsg"          => "1",
    "checkConnection" => "youtube",
    "checkedDomains"  => "youtube",
    "hl"              => "en",
    "deviceinfo"      => %|[null,null,null,[],null,"US",null,null,[],"GlifWebSignIn",null,[null,null,[]]]|,
    "f.req"           => f_req,
    "flowName"        => "GlifWebSignIn",
    "flowEntry"       => "ServiceLogin",
    # "cookiesDisabled" => "false",
    # "gmscoreversion"  => "undefined",
    # "continue"        => "https://accounts.google.com/ManageAccount",
    # "azt"             => "",
    # "bgHash"          => "",
  }

  return HTTP::Params.encode(data)
end
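
# Converts an HTML description to plain text, turning `<br>`/`<br/>` into
# newlines before stripping the remaining markup. For example (sketch):
#
# ```
# html_to_content("Hello<br>world") # => "Hello\nworld"
# ```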
def html_to_content(description_html : String)
  description = description_html.gsub(/(<br>)|(<br\/>)/, {
    "<br>":  "\n",
    "<br/>": "\n",
  })

  if !description.empty?
    description = XML.parse_html(description).content.strip("\n")
  end

  return description
end
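
# Convenience wrapper around `extract_items` that keeps only the
# `SearchVideo` results.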
def extract_videos(initial_data : Hash(String, JSON::Any), author_fallback : String? = nil, author_id_fallback : String? = nil)
  extract_items(initial_data, author_fallback, author_id_fallback).select(&.is_a?(SearchVideo)).map(&.as(SearchVideo))
end
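
# Parses a single InnerTube renderer (videoRenderer, channelRenderer,
# playlistRenderer, etc.) into the matching SearchVideo / SearchChannel /
# SearchPlaylist struct. Returns nil for renderer types that are not handled
# (mixes, shows, shelves, ads). *author_fallback* and *author_id_fallback*
# are used when the renderer itself carries no owner information.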
def extract_item(item : JSON::Any, author_fallback : String? = nil, author_id_fallback : String? = nil)
  if i = (item["videoRenderer"]? || item["gridVideoRenderer"]?)
    video_id = i["videoId"].as_s
    title = i["title"].try { |t| t["simpleText"]?.try &.as_s || t["runs"]?.try &.as_a.map(&.["text"].as_s).join("") } || ""

    author_info = i["ownerText"]?.try &.["runs"]?.try &.as_a?.try &.[0]?
    author = author_info.try &.["text"].as_s || author_fallback || ""
    author_id = author_info.try &.["navigationEndpoint"]?.try &.["browseEndpoint"]["browseId"].as_s || author_id_fallback || ""

    published = i["publishedTimeText"]?.try &.["simpleText"]?.try { |t| decode_date(t.as_s) } || Time.local
    view_count = i["viewCountText"]?.try &.["simpleText"]?.try &.as_s.gsub(/\D+/, "").to_i64? || 0_i64
    description_html = i["descriptionSnippet"]?.try { |t| parse_content(t) } || ""
    length_seconds = i["lengthText"]?.try &.["simpleText"]?.try &.as_s.try { |t| decode_length_seconds(t) } ||
                     i["thumbnailOverlays"]?.try &.as_a.find(&.["thumbnailOverlayTimeStatusRenderer"]?).try &.["thumbnailOverlayTimeStatusRenderer"]?
                       .try &.["text"]?.try &.["simpleText"]?.try &.as_s.try { |t| decode_length_seconds(t) } || 0

    live_now = false
    paid = false
    premium = false

    premiere_timestamp = i["upcomingEventData"]?.try &.["startTime"]?.try { |t| Time.unix(t.as_s.to_i64) }

    i["badges"]?.try &.as_a.each do |badge|
      b = badge["metadataBadgeRenderer"]
      case b["label"].as_s
      when "LIVE NOW"
        live_now = true
      when "New", "4K", "CC"
        # TODO
      when "Premium"
        paid = true

        # TODO: Potentially available as i["topStandaloneBadge"]["metadataBadgeRenderer"]
        premium = true
      else nil # Ignore
      end
    end

    SearchVideo.new({
      title:              title,
      id:                 video_id,
      author:             author,
      ucid:               author_id,
      published:          published,
      views:              view_count,
      description_html:   description_html,
      length_seconds:     length_seconds,
      live_now:           live_now,
      paid:               paid,
      premium:            premium,
      premiere_timestamp: premiere_timestamp,
    })
  elsif i = item["channelRenderer"]?
    author = i["title"]["simpleText"]?.try &.as_s || author_fallback || ""
    author_id = i["channelId"]?.try &.as_s || author_id_fallback || ""

    author_thumbnail = i["thumbnail"]["thumbnails"]?.try &.as_a[0]?.try &.["url"]?.try &.as_s || ""
    subscriber_count = i["subscriberCountText"]?.try &.["simpleText"]?.try &.as_s.try { |s| short_text_to_number(s.split(" ")[0]) } || 0

    auto_generated = false
    auto_generated = true if !i["videoCountText"]?
    video_count = i["videoCountText"]?.try &.["runs"].as_a[0]?.try &.["text"].as_s.gsub(/\D/, "").to_i || 0
    description_html = i["descriptionSnippet"]?.try { |t| parse_content(t) } || ""

    SearchChannel.new({
      author:           author,
      ucid:             author_id,
      author_thumbnail: author_thumbnail,
      subscriber_count: subscriber_count,
      video_count:      video_count,
      description_html: description_html,
      auto_generated:   auto_generated,
    })
  elsif i = item["gridPlaylistRenderer"]?
    title = i["title"]["runs"].as_a[0]?.try &.["text"].as_s || ""
    plid = i["playlistId"]?.try &.as_s || ""

    video_count = i["videoCountText"]["runs"].as_a[0]?.try &.["text"].as_s.gsub(/\D/, "").to_i || 0
    playlist_thumbnail = i["thumbnail"]["thumbnails"][0]?.try &.["url"]?.try &.as_s || ""

    SearchPlaylist.new({
      title:       title,
      id:          plid,
      author:      author_fallback || "",
      ucid:        author_id_fallback || "",
      video_count: video_count,
      videos:      [] of SearchPlaylistVideo,
      thumbnail:   playlist_thumbnail,
    })
  elsif i = item["playlistRenderer"]?
    title = i["title"]["simpleText"]?.try &.as_s || ""
    plid = i["playlistId"]?.try &.as_s || ""

    video_count = i["videoCount"]?.try &.as_s.to_i || 0
    playlist_thumbnail = i["thumbnails"].as_a[0]?.try &.["thumbnails"]?.try &.as_a[0]?.try &.["url"].as_s || ""

    author_info = i["shortBylineText"]?.try &.["runs"]?.try &.as_a?.try &.[0]?
    author = author_info.try &.["text"].as_s || author_fallback || ""
    author_id = author_info.try &.["navigationEndpoint"]?.try &.["browseEndpoint"]["browseId"].as_s || author_id_fallback || ""

    videos = i["videos"]?.try &.as_a.map do |v|
      v = v["childVideoRenderer"]
      v_title = v["title"]["simpleText"]?.try &.as_s || ""
      v_id = v["videoId"]?.try &.as_s || ""
      v_length_seconds = v["lengthText"]?.try &.["simpleText"]?.try { |t| decode_length_seconds(t.as_s) } || 0
      SearchPlaylistVideo.new({
        title:          v_title,
        id:             v_id,
        length_seconds: v_length_seconds,
      })
    end || [] of SearchPlaylistVideo

    # TODO: i["publishedTimeText"]?

    SearchPlaylist.new({
      title:       title,
      id:          plid,
      author:      author,
      ucid:        author_id,
      video_count: video_count,
      videos:      videos,
      thumbnail:   playlist_thumbnail,
    })
  elsif i = item["radioRenderer"]? # Mix
    # TODO
  elsif i = item["showRenderer"]? # Show
    # TODO
  elsif i = item["shelfRenderer"]?
  elsif i = item["horizontalCardListRenderer"]?
  elsif i = item["searchPyvRenderer"]? # Ad
  end
end
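
# Walks the InnerTube `initial_data` response (browse, search or
# continuation) and collects every renderer that `extract_item` understands
# into an array of `SearchItem`.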
def extract_items(initial_data : Hash(String, JSON::Any), author_fallback : String? = nil, author_id_fallback : String? = nil)
  items = [] of SearchItem

  channel_v2_response = initial_data
    .try &.["continuationContents"]?
      .try &.["gridContinuation"]?
        .try &.["items"]?

  if channel_v2_response
    channel_v2_response.try &.as_a.each { |item|
      extract_item(item, author_fallback, author_id_fallback)
        .try { |t| items << t }
    }
  else
    initial_data.try { |t| t["contents"]? || t["response"]? }
      .try { |t| t["twoColumnBrowseResultsRenderer"]?.try &.["tabs"].as_a.select(&.["tabRenderer"]?.try &.["selected"].as_bool)[0]?.try &.["tabRenderer"]["content"] ||
                 t["twoColumnSearchResultsRenderer"]?.try &.["primaryContents"] ||
                 t["continuationContents"]? }
      .try { |t| t["sectionListRenderer"]? || t["sectionListContinuation"]? }
      .try &.["contents"].as_a
        .each { |c| c.try &.["itemSectionRenderer"]?.try &.["contents"].as_a
          .try { |t| t[0]?.try &.["shelfRenderer"]?.try &.["content"]["expandedShelfContentsRenderer"]?.try &.["items"].as_a ||
                     t[0]?.try &.["gridRenderer"]?.try &.["items"].as_a || t }
            .each { |item|
              extract_item(item, author_fallback, author_id_fallback)
                .try { |t| items << t }
            } }
  end

  items
end
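
# Creates the Postgres enum type *enum_name* from
# `config/sql/<enum_name>.sql` if it does not exist yet. Currently
# short-circuited (see the TODO below).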
def check_enum(db, enum_name, struct_type = nil)
  return # TODO

  if !db.query_one?("SELECT true FROM pg_type WHERE typname = $1", enum_name, as: Bool)
    LOGGER.info("check_enum: CREATE TYPE #{enum_name}")

    db.using_connection do |conn|
      conn.as(PG::Connection).exec_all(File.read("config/sql/#{enum_name}.sql"))
    end
  end
end
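
# Verifies that *table_name* matches the column layout expected by
# *struct_type*, creating the table from `config/sql/<table_name>.sql` and
# adding, dropping or rotating columns as needed. A hypothetical call
# (arguments are illustrative):
#
# ```
# check_table(PG_DB, "channel_videos", ChannelVideo) if CONFIG.check_tables
# ```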
def check_table(db, table_name, struct_type = nil)
  # Create table if it doesn't exist
  begin
    db.exec("SELECT * FROM #{table_name} LIMIT 0")
  rescue ex
    LOGGER.info("check_table: CREATE TABLE #{table_name}")

    db.using_connection do |conn|
      conn.as(PG::Connection).exec_all(File.read("config/sql/#{table_name}.sql"))
    end
  end

  return if !struct_type

  struct_array = struct_type.type_array
  column_array = get_column_array(db, table_name)
  column_types = File.read("config/sql/#{table_name}.sql").match(/CREATE TABLE public\.#{table_name}\n\((?<types>[\d\D]*?)\);/)
    .try &.["types"].split(",").map { |line| line.strip }.reject &.starts_with?("CONSTRAINT")

  return if !column_types

  struct_array.each_with_index do |name, i|
    if name != column_array[i]?
      if !column_array[i]?
        new_column = column_types.select { |line| line.starts_with? name }[0]
        LOGGER.info("check_table: ALTER TABLE #{table_name} ADD COLUMN #{new_column}")
        db.exec("ALTER TABLE #{table_name} ADD COLUMN #{new_column}")
        next
      end

      # Column doesn't exist
      if !column_array.includes? name
        new_column = column_types.select { |line| line.starts_with? name }[0]
        db.exec("ALTER TABLE #{table_name} ADD COLUMN #{new_column}")
      end

      # Column exists but in the wrong position, rotate
      if struct_array.includes? column_array[i]
        until name == column_array[i]
          new_column = column_types.select { |line| line.starts_with? column_array[i] }[0]?.try &.gsub("#{column_array[i]}", "#{column_array[i]}_new")

          # There's a column we didn't expect
          if !new_column
            LOGGER.info("check_table: ALTER TABLE #{table_name} DROP COLUMN #{column_array[i]}")
            db.exec("ALTER TABLE #{table_name} DROP COLUMN #{column_array[i]} CASCADE")

            column_array = get_column_array(db, table_name)
            next
          end

          LOGGER.info("check_table: ALTER TABLE #{table_name} ADD COLUMN #{new_column}")
          db.exec("ALTER TABLE #{table_name} ADD COLUMN #{new_column}")

          LOGGER.info("check_table: UPDATE #{table_name} SET #{column_array[i]}_new=#{column_array[i]}")
          db.exec("UPDATE #{table_name} SET #{column_array[i]}_new=#{column_array[i]}")

          LOGGER.info("check_table: ALTER TABLE #{table_name} DROP COLUMN #{column_array[i]} CASCADE")
          db.exec("ALTER TABLE #{table_name} DROP COLUMN #{column_array[i]} CASCADE")

          LOGGER.info("check_table: ALTER TABLE #{table_name} RENAME COLUMN #{column_array[i]}_new TO #{column_array[i]}")
          db.exec("ALTER TABLE #{table_name} RENAME COLUMN #{column_array[i]}_new TO #{column_array[i]}")

          column_array = get_column_array(db, table_name)
        end
      else
        LOGGER.info("check_table: ALTER TABLE #{table_name} DROP COLUMN #{column_array[i]} CASCADE")
        db.exec("ALTER TABLE #{table_name} DROP COLUMN #{column_array[i]} CASCADE")
      end
    end
  end

  return if column_array.size <= struct_array.size

  column_array.each do |column|
    if !struct_array.includes? column
      LOGGER.info("check_table: ALTER TABLE #{table_name} DROP COLUMN #{column} CASCADE")
      db.exec("ALTER TABLE #{table_name} DROP COLUMN #{column} CASCADE")
    end
  end
end

class PG::ResultSet
  def field(index = @column_index)
    @fields.not_nil![index]
  end
end
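
# Returns the column names of *table_name* in their current order, using a
# zero-row SELECT so only the result-set metadata is fetched.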
def get_column_array(db, table_name)
  column_array = [] of String
  db.query("SELECT * FROM #{table_name} LIMIT 0") do |rs|
    rs.column_count.times do |i|
      column = rs.as(PG::ResultSet).field(i)
      column_array << column.name
    end
  end

  return column_array
end
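
# Stores the annotation XML for *id* when `cache_annotations` is enabled,
# skipping documents that only contain branding/card/drawer annotations.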
def cache_annotation(db, id, annotations)
  if !CONFIG.cache_annotations
    return
  end

  body = XML.parse(annotations)
  nodeset = body.xpath_nodes(%q(/document/annotations/annotation))

  return if nodeset.size == 0

  has_legacy_annotations = false
  nodeset.each do |node|
    if !{"branding", "card", "drawer"}.includes? node["type"]?
      has_legacy_annotations = true
      break
    end
  end

  db.exec("INSERT INTO annotations VALUES ($1, $2) ON CONFLICT DO NOTHING", id, annotations) if has_legacy_annotations
end
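
# Streams subscription notifications to the client as server-sent events.
# Each event is written in the SSE framing used below, e.g. (illustrative
# payload):
#
# ```text
# id: 0
# data: { ...video JSON... }
#
# ```
#
# A `:keepalive` comment line is emitted every 20-30 seconds so proxies do
# not drop the idle connection.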
def create_notification_stream(env, topics, connection_channel)
  connection = Channel(PQ::Notification).new(8)
  connection_channel.send({true, connection})

  locale = LOCALES[env.get("preferences").as(Preferences).locale]?

  since = env.params.query["since"]?.try &.to_i?
  id = 0

  if topics.includes? "debug"
    spawn do
      begin
        loop do
          time_span = [0, 0, 0, 0]
          time_span[rand(4)] = rand(30) + 5
          published = Time.utc - Time::Span.new(days: time_span[0], hours: time_span[1], minutes: time_span[2], seconds: time_span[3])
          video_id = TEST_IDS[rand(TEST_IDS.size)]

          video = get_video(video_id, PG_DB)
          video.published = published
          response = JSON.parse(video.to_json(locale))

          if fields_text = env.params.query["fields"]?
            begin
              JSONFilter.filter(response, fields_text)
            rescue ex
              env.response.status_code = 400
              response = {"error" => ex.message}
            end
          end

          env.response.puts "id: #{id}"
          env.response.puts "data: #{response.to_json}"
          env.response.puts
          env.response.flush

          id += 1

          sleep 1.minute
          Fiber.yield
        end
      rescue ex
      end
    end
  end

  spawn do
    begin
      if since
        topics.try &.each do |topic|
          case topic
          when .match(/UC[A-Za-z0-9_-]{22}/)
            PG_DB.query_all("SELECT * FROM channel_videos WHERE ucid = $1 AND published > $2 ORDER BY published DESC LIMIT 15",
              topic, Time.unix(since.not_nil!), as: ChannelVideo).each do |video|
              response = JSON.parse(video.to_json(locale))

              if fields_text = env.params.query["fields"]?
                begin
                  JSONFilter.filter(response, fields_text)
                rescue ex
                  env.response.status_code = 400
                  response = {"error" => ex.message}
                end
              end

              env.response.puts "id: #{id}"
              env.response.puts "data: #{response.to_json}"
              env.response.puts
              env.response.flush

              id += 1
            end
          else
            # TODO
          end
        end
      end
    end
  end

  spawn do
    begin
      loop do
        event = connection.receive

        notification = JSON.parse(event.payload)
        topic = notification["topic"].as_s
        video_id = notification["videoId"].as_s
        published = notification["published"].as_i64

        if !topics.try &.includes? topic
          next
        end

        video = get_video(video_id, PG_DB)
        video.published = Time.unix(published)
        response = JSON.parse(video.to_json(locale))

        if fields_text = env.params.query["fields"]?
          begin
            JSONFilter.filter(response, fields_text)
          rescue ex
            env.response.status_code = 400
            response = {"error" => ex.message}
          end
        end

        env.response.puts "id: #{id}"
        env.response.puts "data: #{response.to_json}"
        env.response.puts
        env.response.flush

        id += 1
      end
    rescue ex
    ensure
      connection_channel.send({false, connection})
    end
  end

  begin
    # Send heartbeat
    loop do
      env.response.puts ":keepalive #{Time.utc.to_unix}"
      env.response.puts
      env.response.flush
      sleep (20 + rand(11)).seconds
    end
  rescue ex
  ensure
    connection_channel.send({false, connection})
  end
end
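
# Pulls the `ytInitialData` JSON object out of a watch/browse page body,
# returning an empty hash when it cannot be found.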
def extract_initial_data(body) : Hash(String, JSON::Any)
  return JSON.parse(body.match(/(window\["ytInitialData"\]|var\s*ytInitialData)\s*=\s*(?<info>{.*?});<\/script>/mx).try &.["info"] || "{}").as_h
end
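
# Streams a proxied upstream response body to the client, wrapping it in a
# gzip or deflate writer when the upstream response declares that
# Content-Encoding.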
def proxy_file(response, env)
  if response.headers.includes_word?("Content-Encoding", "gzip")
    Compress::Gzip::Writer.open(env.response) do |deflate|
      IO.copy response.body_io, deflate
    end
  elsif response.headers.includes_word?("Content-Encoding", "deflate")
    Compress::Deflate::Writer.open(env.response) do |deflate|
      IO.copy response.body_io, deflate
    end
  else
    IO.copy response.body_io, env.response
  end
end

# See https://github.com/kemalcr/kemal/pull/576
class HTTP::Server::Response::Output
  def close
    return if closed?

    unless response.wrote_headers?
      response.content_length = @out_count
    end

    ensure_headers_written

    super

    if @chunked
      @io << "0\r\n\r\n"
      @io.flush
    end
  end
end

class HTTP::Client::Response
  def pipe(io)
    HTTP.serialize_body(io, headers, @body, @body_io, @version)
  end
end

# Supports serialize_body without first writing headers
module HTTP
  def self.serialize_body(io, headers, body, body_io, version)
    if body
      io << body
    elsif body_io
      content_length = content_length(headers)
      if content_length
        copied = IO.copy(body_io, io)
        if copied != content_length
          raise ArgumentError.new("Content-Length header is #{content_length} but body had #{copied} bytes")
        end
      elsif Client::Response.supports_chunked?(version)
        headers["Transfer-Encoding"] = "chunked"
        serialize_chunked_body(io, body_io)
      else
        io << body
      end
    end
  end
end
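
# Monkey-patch HTTP::Client and TCPSocket so an address family can be forced
# for outgoing connections; this backs the `force_resolve` config option
# above (pin connections to IPv4 or IPv6).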
class HTTP::Client
  property family : Socket::Family = Socket::Family::UNSPEC

  private def socket
    socket = @socket
    return socket if socket

    hostname = @host.starts_with?('[') && @host.ends_with?(']') ? @host[1..-2] : @host
    socket = TCPSocket.new hostname, @port, @dns_timeout, @connect_timeout, @family
    socket.read_timeout = @read_timeout if @read_timeout
    socket.sync = false

    {% if !flag?(:without_openssl) %}
      if tls = @tls
        socket = OpenSSL::SSL::Socket::Client.new(socket, context: tls, sync_close: true, hostname: @host)
      end
    {% end %}

    @socket = socket
  end
end

class TCPSocket
  def initialize(host, port, dns_timeout = nil, connect_timeout = nil, family = Socket::Family::UNSPEC)
    Addrinfo.tcp(host, port, timeout: dns_timeout, family: family) do |addrinfo|
      super(addrinfo.family, addrinfo.type, addrinfo.protocol)
      connect(addrinfo, timeout: connect_timeout) do |error|
        close
        error
      end
    end
  end
end