Compare commits
2 Commits
5bdb49fb80
...
8872618022
Author | SHA1 | Date |
---|---|---|
TheTechRobo | 8872618022 | |
TheTechRobo | 1e36186c9b | |
9
grab.lua
9
grab.lua
|
@ -59,6 +59,13 @@ wget.callbacks.get_urls = function(file, url, is_css, iri)
|
|||
end
|
||||
table.insert(addedUrls, { url="https://www.tharpsontheimerfh.com/pax/prnobit", post_data="ok=" .. ok .. "&fcf=0&bg=1"})
|
||||
end
|
||||
io.stderr:write(table.show(addedUrls, "Added URLs "))
|
||||
if url:match("^https://www.bestattung%-muellner.at/?.?.?/sterbefall/[^/]+/%\?action=gedenkkerzen") then
|
||||
local root = htmlparser.parse(data)
|
||||
local otherPages = root(".pagination .inactive")
|
||||
for index, pagination in ipairs(otherPages) do
|
||||
table.insert(addedUrls, { url=pagination.attributes.href})
|
||||
end
|
||||
end
|
||||
io.stderr:write(table.show(addedUrls, "Added URLs"))
|
||||
return addedUrls
|
||||
end
|
||||
|
|
10
pipeline.py
10
pipeline.py
|
@ -184,6 +184,16 @@ class WgetArgs(object):
|
|||
item_name = [f'https://downsandsonfuneralhome.com/tribute/details/{i_n[1]}/Dr-Alex-Klym/obituary.html']
|
||||
elif i_n[0] == 'tharpsontheimerfh':
|
||||
item_name = [f'https://www.tharpsontheimerfh.com/tributes/{i_n[1]}', f'https://www.tharpsontheimerfh.com/printnotice/{i_n[1]}/1o/1c/1q/0d/1b', f'https://www.tharpsontheimerfh.com/tributes/{i_n[1]}/guest-book', f'https://www.tharpsontheimerfh.com/tributes/{i_n[1]}/photo-album', f'https://www.tharpsontheimerfh.com/tributes/{i_n[1]}/services']
|
||||
elif i_n[0] == 'bestattung-mullner':
|
||||
ep = 'https://www.bestattung-muellner.at%s/sterbefall/%s/'
|
||||
eps = []
|
||||
for language in ('', '/en', '/sk'): # de, en, sk
|
||||
eps.append(ep % (language, i_n[1]))
|
||||
eps.append(ep % (language, i_n[1]) + '?action=parte')
|
||||
eps.append(ep % (language, i_n[1]) + '?action=sterbebild')
|
||||
eps.append(ep % (language, i_n[1]) + '?action=gedenkkerzen')
|
||||
eps.append(ep % (language, i_n[1]) + '?action=kondolenzbuch')
|
||||
item_name = eps
|
||||
else:
|
||||
raise TypeError("bad item type")
|
||||
item_urls+=(item_name)
|
||||
|
|
Loading…
Reference in New Issue