Compare commits
	
		
			4 Commits
		
	
	
		
			new-taxono
			...
			opds-fetch
		
	
	| Author | SHA1 | Date | |
|---|---|---|---|
| 2db5be3438 | |||
| 028bc1df84 | |||
| 82a017f624 | |||
| 3055ee37df | 
| @ -155,6 +155,8 @@ def parse_enclosures(post_dir, entry): | ||||
|         if "type" in e: | ||||
|             print("found enclosed media", e.type) | ||||
|             if "image/" in e.type: | ||||
|                 if not os.path.exists(post_dir): #this might be redundant with create_post | ||||
|                     os.makedirs(post_dir) | ||||
|                 featured_image = grab_media(post_dir, e.href) | ||||
|                 media_item = urlparse(e.href).path.split('/')[-1] | ||||
|                 entry["featured_image"] = media_item | ||||
| @ -310,12 +312,15 @@ def create_opds_post(post_dir, entry): | ||||
|         ft = item['type'].split('/')[-1] | ||||
|         fn = item['rel'].split('/')[-1] | ||||
|  | ||||
|         if fn == "acquisition": | ||||
|             fn = "publication" #calling the publications acquisition is weird | ||||
|         # entry.links has image, thumbnail and publication/acquisition. | ||||
|         # Only downloading image for now | ||||
|         #if fn == "acquisition":  | ||||
|         #fn = "publication" #calling the publications acquisition is weird  | ||||
|  | ||||
|         prefered_name = "{}-{}.{}".format(fn, slugify(entry['title']), ft) | ||||
|  | ||||
|         grab_media(post_dir, item['href'], prefered_name) | ||||
|         if 'image' in fn: | ||||
|             prefered_name = "{}-{}.{}".format(fn, slugify(entry['title']), ft) | ||||
|             grab_media(post_dir, item['href'], prefered_name) | ||||
|             frontmatter['featured_image'] = prefered_name | ||||
|  | ||||
|         if "summary" in entry: | ||||
|             summary = entry.summary | ||||
| @ -331,6 +336,18 @@ def create_opds_post(post_dir, entry): | ||||
|         timestamp = arrow.get(entry['updated_parsed']) | ||||
|         f.write(timestamp.format('X')) | ||||
|  | ||||
| def opds_fetch_more(data): | ||||
|     """ | ||||
|     Look for mode OPDS feeds to pull, untill we no longer hit the "next" navigation property.  | ||||
|     """ | ||||
|     for link in data.feed.links: | ||||
|         for i in link: | ||||
|             if link[i] == 'next': | ||||
|                 print(link['href']) | ||||
|                 data = grab_feed(link['href']) | ||||
|                 return data | ||||
|     return None | ||||
|  | ||||
|  | ||||
| def main(): | ||||
|     feed_urls = open("feeds_list.txt", "r").read().splitlines() | ||||
| @ -377,12 +394,23 @@ def main(): | ||||
|         if data: #whenever we get a 200 | ||||
|             if data.feed: #only if it is an actual feed | ||||
|                 opds_feed = False | ||||
|                 opds_entries = [] | ||||
|                 if 'links' in data.feed: | ||||
|                     for i in data.feed['links']: | ||||
|                             if i['rel'] == 'self': | ||||
|                                 if 'opds' in i['type']: | ||||
|                                     opds_feed = True | ||||
|                                     print("OPDS type feed!") | ||||
|                                     feed_data = data | ||||
|                                     while feed_data: | ||||
|                                         feed_data = opds_fetch_more(feed_data) | ||||
|                                         if feed_data: | ||||
|                                             for i in feed_data.entries: | ||||
|                                                 opds_entries.append(i) | ||||
|                                     for i in opds_entries: | ||||
|                                         data['entries'].append(i) | ||||
|                                      | ||||
|  | ||||
|  | ||||
|                 for entry in data.entries: | ||||
|                     # if 'tags' in entry: | ||||
|  | ||||
		Reference in New Issue
	
	Block a user
	