Fix crash in video crawler

pull/42/head
Omar Roth 2018-07-26 08:41:23 -05:00
rodzic 3f577650bc
commit 0fba601e91
2 zmienionych plików z 3 dodań i 4 usunięć

Wyświetl plik

@ -86,6 +86,7 @@ crawl_threads.times do
end
loop do
client = make_client(YT_URL)
if ids.empty?
search(random.base64(3), client) do |id|
ids << id
@ -97,7 +98,6 @@ crawl_threads.times do
video = get_video(id, client, PG_DB)
rescue ex
STDOUT << id << " : " << ex.message << "\n"
client = make_client(YT_URL)
next
ensure
ids.delete(id)

Wyświetl plik

@ -307,9 +307,8 @@ def get_video(id, client, db, refresh = true)
return video
end
def search(query, client)
html = client.get("https://www.youtube.com/results?q=#{query}&sp=EgIQAVAU&disable_polymer=1").body
def search(query, client, &block)
html = client.get("/results?q=#{query}&sp=EgIQAVAU&disable_polymer=1").body
html = XML.parse_html(html)
html.xpath_nodes(%q(//ol[@class="item-section"]/li)).each do |item|