2019-03-29 16:30:02 -05:00
|
|
|
# A single video result.
#
# Fields are declared through the project's `db_mapping` macro at the bottom
# of the struct (presumably generating the accessors used below — confirm
# against the macro definition).
struct SearchVideo
  # Writes this video as an Atom-style `<entry>` element into *xml*.
  #
  # * *host_url* is prefixed to every generated watch, channel and thumbnail link.
  # * *auto_generated* is accepted for interface compatibility only: both of
  #   its branches emitted exactly the same author markup, so it no longer
  #   influences the output.
  # * *xml* is the builder the entry is appended to.
  def to_xml(host_url, auto_generated, xml : XML::Builder)
    xml.element("entry") do
      xml.element("id") { xml.text "yt:video:#{self.id}" }
      xml.element("yt:videoId") { xml.text self.id }
      xml.element("yt:channelId") { xml.text self.ucid }
      xml.element("title") { xml.text self.title }
      xml.element("link", rel: "alternate", href: "#{host_url}/watch?v=#{self.id}")

      xml.element("author") do
        xml.element("name") { xml.text self.author }
        xml.element("uri") { xml.text "#{host_url}/channel/#{self.ucid}" }
      end

      # Linked thumbnail embedded as XHTML content.
      xml.element("content", type: "xhtml") do
        xml.element("div", xmlns: "http://www.w3.org/1999/xhtml") do
          xml.element("a", href: "#{host_url}/watch?v=#{self.id}") do
            xml.element("img", src: "#{host_url}/vi/#{self.id}/mqdefault.jpg")
          end
        end
      end

      xml.element("published") { xml.text self.published.to_s("%Y-%m-%dT%H:%M:%S%:z") }

      xml.element("media:group") do
        xml.element("media:title") { xml.text self.title }
        xml.element("media:thumbnail", url: "#{host_url}/vi/#{self.id}/mqdefault.jpg",
          width: "320", height: "180")
        xml.element("media:description") { xml.text self.description }
      end

      xml.element("media:community") do
        xml.element("media:statistics", views: self.views)
      end
    end
  end

  # Convenience overload: appends to *xml* when a builder is given, otherwise
  # builds a standalone document with `XML.build` and returns its result.
  #
  # The builder yielded by `XML.build` must be the one passed down. Passing
  # the (nil) *xml* argument instead re-dispatches to this same overload and
  # recurses without end.
  def to_xml(host_url, auto_generated, xml : XML::Builder | Nil = nil)
    if xml
      to_xml(host_url, auto_generated, xml)
    else
      XML.build do |builder|
        to_xml(host_url, auto_generated, builder)
      end
    end
  end

  db_mapping({
    title:              String,
    id:                 String,
    author:             String,
    ucid:               String,
    published:          Time,
    views:              Int64,
    description:        String,
    description_html:   String,
    length_seconds:     Int32,
    live_now:           Bool,
    paid:               Bool,
    premium:            Bool,
    premiere_timestamp: Time?,
  })
end
|
|
|
|
|
2019-03-29 16:30:02 -05:00
|
|
|
# Minimal description of a video listed inside a `SearchPlaylist`:
# its title, its video id and its length in seconds.
struct SearchPlaylistVideo
  db_mapping({
    title:          String,
    id:             String,
    length_seconds: Int32,
  })
end
|
|
|
|
|
2019-03-29 16:30:02 -05:00
|
|
|
# A playlist result: playlist title and id, the owning channel
# (`author` / `ucid`), the number of videos, a list of
# `SearchPlaylistVideo` entries and an optional thumbnail id.
struct SearchPlaylist
  db_mapping({
    title:        String,
    id:           String,
    author:       String,
    ucid:         String,
    video_count:  Int32,
    videos:       Array(SearchPlaylistVideo),
    thumbnail_id: String?,
  })
end
|
|
|
|
|
2019-03-29 16:30:02 -05:00
|
|
|
# A channel result: channel name (`author`), channel id (`ucid`),
# thumbnail, subscriber and video counts, and the description in both
# plain and HTML form.
struct SearchChannel
  db_mapping({
    author:           String,
    ucid:             String,
    author_thumbnail: String,
    subscriber_count: Int32,
    video_count:      Int32,
    description:      String,
    description_html: String,
  })
end
|
|
|
|
|
|
|
|
# Union of every result type the search functions in this file can return.
alias SearchItem = SearchVideo | SearchChannel | SearchPlaylist
|
|
|
|
|
2018-09-13 17:47:31 -05:00
|
|
|
# Searches within a single channel.
#
# *channel* is tried, in order, as a `/channel/`, `/c/` and `/user/` path;
# the first page exposing a `<link rel="canonical">` element is used, and the
# last path segment of its `href` is taken as the channel id. That id is then
# combined with *query* and *page* into a browse request whose JSON response
# carries the result markup under `content_html`.
#
# Returns `{count, items}`; `{0, []}` when the channel cannot be resolved or
# the response holds no result markup.
def channel_search(query, page, channel)
  client = make_client(YT_URL)

  canonical = nil
  {"channel", "c", "user"}.each do |prefix|
    page_body = client.get("/#{prefix}/#{channel}?disable_polymer=1&hl=en&gl=US").body
    canonical = XML.parse_html(page_body).xpath_node(%q(//link[@rel="canonical"]))
    break if canonical
  end

  if !canonical
    return 0, [] of SearchItem
  end

  ucid = canonical["href"].split("/")[-1]

  search_url = produce_channel_search_url(ucid, query, page)
  json = JSON.parse(client.get(search_url).body)

  content_html = json["content_html"]?
  if content_html && !content_html.as_s.empty?
    results = XML.parse_html(content_html.as_s)
    nodeset = results.xpath_nodes(%q(//li[contains(@class, "feed-item-container")]))

    count = nodeset.size
    items = extract_items(nodeset)
  else
    count = 0
    items = [] of SearchItem
  end

  return count, items
end
|
|
|
|
|
2019-02-06 18:21:40 -06:00
|
|
|
# Runs a site-wide search for *query* and returns `{count, items}`, where
# `count` is the number of result list nodes found on the page and `items`
# is whatever `extract_items` produces from them.
#
# * *page* is the result page number sent with the request.
# * *search_params* is the pre-encoded `sp` filter token (defaults to the
#   token for content type "all").
# * *proxies* and *region* are forwarded to `make_client`.
#
# An empty query or an empty response body yields `{0, []}`.
def search(query, page = 1, search_params = produce_search_params(content_type: "all"), proxies = nil, region = nil)
  client = make_client(YT_URL, proxies, region)
  return {0, [] of SearchItem} if query.empty?

  path = "/results?q=#{URI.escape(query)}&page=#{page}&sp=#{search_params}&hl=en&disable_polymer=1"
  body = client.get(path).body
  return {0, [] of SearchItem} if body.empty?

  document = XML.parse_html(body)
  nodeset = document.xpath_nodes(%q(//ol[@class="item-section"]/li))
  items = extract_items(nodeset)

  return {nodeset.size, items}
end
|
2018-08-04 17:12:58 -05:00
|
|
|
|
2018-09-17 16:38:18 -05:00
|
|
|
# Builds the encoded filter token sent as the `sp` query parameter of a search.
#
# The token is a two-byte header selecting the sort order, optionally followed
# by a length-prefixed block of filter bytes, then Base64 (URL-safe) encoded
# and URI-escaped.
#
# * *sort*: "relevance", "rating", "upload_date"/"date" or "view_count"/"views";
#   anything else raises "No sort ...".
# * *date*: "hour", "today", "week", "month" or "year"; other values add no filter.
# * *content_type*: "video", "channel", "playlist", "movie" or "show"; "all"
#   adds no filter; any other value (including the default "") is treated
#   like "video".
# * *duration*: "short" or "long"; other values add no filter.
# * *features*: each entry must be a known feature name, otherwise
#   "Unknown feature ..." is raised.
def produce_search_params(sort : String = "relevance", date : String = "", content_type : String = "",
                          duration : String = "", features : Array(String) = [] of String)
  sort_byte = case sort
              when "relevance"           then "\x00"
              when "rating"              then "\x01"
              when "upload_date", "date" then "\x02"
              when "view_count", "views" then "\x03"
              else
                raise "No sort #{sort}"
              end
  head = "\x08" + sort_byte

  date_filters = {
    "hour"  => "\x08\x01",
    "today" => "\x08\x02",
    "week"  => "\x08\x03",
    "month" => "\x08\x04",
    "year"  => "\x08\x05",
  }

  type_filters = {
    "video"    => "\x10\x01",
    "channel"  => "\x10\x02",
    "playlist" => "\x10\x03",
    "movie"    => "\x10\x04",
    "show"     => "\x10\x05",
    "all"      => "",
  }

  duration_filters = {
    "short" => "\x18\x01",
    "long"  => "\x18\x02",
  }

  feature_filters = {
    "hd"               => "\x20\x01",
    "subtitles"        => "\x28\x01",
    "creative_commons" => "\x30\x01",
    "cc"               => "\x30\x01",
    "3d"               => "\x38\x01",
    "live"             => "\x40\x01",
    "livestream"       => "\x40\x01",
    "purchased"        => "\x48\x01",
    "4k"               => "\x70\x01",
    "360"              => "\x78\x01",
    "location"         => "\xb8\x01\x01",
    "hdr"              => "\xc8\x01\x01",
  }

  body = date_filters.fetch(date, "")
  # Unrecognised content types fall back to the "video" filter.
  body += type_filters.fetch(content_type, "\x10\x01")
  body += duration_filters.fetch(duration, "")

  features.each do |feature|
    body += feature_filters[feature]? || raise "Unknown feature #{feature}"
  end

  # The filter block is only emitted (tag 0x12 + length + bytes) when non-empty.
  token = body.empty? ? head : head + "\x12" + body.size.unsafe_chr + body

  return URI.escape(Base64.urlsafe_encode(token))
end
|
2018-09-13 17:47:31 -05:00
|
|
|
|
|
|
|
# Appends *value* to *io* as a base-128 varint (7 payload bits per byte,
# high bit set on every byte except the last). Values below 128 occupy a
# single byte.
private def write_length_varint(io : IO, value : Int)
  raise ArgumentError.new("Negative length: #{value}") if value < 0

  loop do
    low_bits = (value & 0x7f).to_u8
    value >>= 7

    if value == 0
      io.write_byte(low_bits)
      break
    end

    io.write_byte(low_bits | 0x80_u8)
  end
end

# Builds the `/browse_ajax` URL used to search inside a channel.
#
# The continuation token is a hand-assembled binary message made of
# length-prefixed fields: the channel id (*ucid*), an encoded "meta" blob
# (the literal "search" tab name, a handful of fixed flag bytes and the
# *page* number as text) and the *query*. That message is wrapped once more
# under a fixed five-byte tag, Base64 (URL-safe) encoded and URI-escaped.
#
# Every length prefix is the field's size in *bytes*, written as a varint.
# Non-ASCII queries and payloads of 128 bytes or more are therefore encoded
# correctly, while short ASCII inputs produce the same token as a plain
# one-byte length would. *ucid* and *query* are expected to be Strings.
#
# Returns the relative URL as a String.
def produce_channel_search_url(ucid, query, page)
  page = "#{page}"

  meta_io = IO::Memory.new
  meta_io.write(Bytes[0x12, 0x06])
  meta_io.print("search")

  # Fixed flag fields, reproduced verbatim.
  meta_io.write(Bytes[0x30, 0x02])
  meta_io.write(Bytes[0x38, 0x01])
  meta_io.write(Bytes[0x60, 0x01])
  meta_io.write(Bytes[0x6a, 0x00])
  meta_io.write(Bytes[0xb8, 0x01, 0x00])

  meta_io.write_byte(0x7a_u8)
  write_length_varint(meta_io, page.bytesize)
  meta_io.print(page)

  # The meta blob is embedded in its encoded *and* URI-escaped text form.
  meta = URI.escape(Base64.urlsafe_encode(meta_io.to_slice))

  continuation = IO::Memory.new
  continuation.write_byte(0x12_u8)
  write_length_varint(continuation, ucid.bytesize)
  continuation.print(ucid)

  continuation.write_byte(0x1a_u8)
  write_length_varint(continuation, meta.bytesize)
  continuation.print(meta)

  continuation.write_byte(0x5a_u8)
  write_length_varint(continuation, query.bytesize)
  continuation.print(query)

  wrapper = IO::Memory.new
  wrapper.write(Bytes[0xe2, 0xa9, 0x85, 0xb2, 0x02])
  write_length_varint(wrapper, continuation.bytesize)
  wrapper.write(continuation.to_slice)

  token = URI.escape(Base64.urlsafe_encode(wrapper.to_slice))

  return "/browse_ajax?continuation=#{token}&gl=US&hl=en"
end
|