|
@ -5,14 +5,14 @@ from json import loads, dumps |
|
|
|
|
|
|
|
|
import requests as req |
|
|
import requests as req |
|
|
|
|
|
|
|
|
# Internet Archive advanced-search endpoint, used as a `str.format` template:
# `{0}` is replaced with the already URL-quoted query string.
#   * `fl[]` requests the avg_rating, description, identifier, mediatype and
#     type fields; `mediatype` must be requested because searchIA filters the
#     returned docs on it.
#   * `rows=50&page=1` asks for the first 50 hits.
#   * `output=json&callback=callback` makes the response JSONP, i.e. the JSON
#     wrapped in `callback(...)`; searchIA strips that wrapper by slicing the
#     response text before parsing it.
# NOTE(review): `fl%5B%5D=type` appears twice in the query string; it looks
# redundant -- confirm against the API before removing it.
searchUrl = "https://archive.org/advancedsearch.php?q={0}&fl%5B%5D=avg_rating&fl%5B%5D=description&fl%5B%5D=identifier&fl%5B%5D=mediatype&fl%5B%5D=type&fl%5B%5D=type&sort%5B%5D=&sort%5B%5D=&sort%5B%5D=&rows=50&page=1&output=json&callback=callback&save=yes#raw"
|
|
|
|
|
|
|
|
def searchIA(title, author): |
|
|
def searchIA(title, author): |
|
|
""" |
|
|
""" |
|
|
Do a search on The Internet Archive for a book |
|
|
Do a search on The Internet Archive for a book |
|
|
""" |
|
|
""" |
|
|
print("running a search") |
|
|
print("running a search") |
|
|
requrl = searchUrl.format(quote(title + " " + author)) |
|
|
requrl = searchUrl.format(quote(title) + " AND " + quote(author)) |
|
|
try: |
|
|
try: |
|
|
results = loads(req.get(requrl).text[9:][0:-1]) |
|
|
results = loads(req.get(requrl).text[9:][0:-1]) |
|
|
except ValueError: |
|
|
except ValueError: |
|
@ -24,7 +24,8 @@ def searchIA(title, author): |
|
|
return [] |
|
|
return [] |
|
|
docs = results["response"]["docs"] |
|
|
docs = results["response"]["docs"] |
|
|
urls = [] |
|
|
urls = [] |
|
|
for result in results["response"]["docs"][0:3]: |
|
|
for result in [r for r in results["response"]["docs"][0:10] if r["mediatype"] == "texts"]: |
|
|
|
|
|
print(result) |
|
|
urls.append("https://archive.org/details/%s" % result["identifier"]) |
|
|
urls.append("https://archive.org/details/%s" % result["identifier"]) |
|
|
return urls |
|
|
return urls |
|
|
|
|
|
|
|
|