Display progress for extracting PDF images as well as for analyzing them
This commit is contained in:
		
							parent
							
								
									18fbc7f8dc
								
							
						
					
					
						commit
						26ec1901c3
					
				
					 1 changed files with 6 additions and 2 deletions
				
			
		|  | @ -388,10 +388,14 @@ class Collator: | |||
|                 return None | ||||
| 
 | ||||
|             self.dest.mkdir(parents=True, exist_ok=True) | ||||
| 
 | ||||
|             print(f'0 pages collated...', end='') | ||||
|             for (idx, image) in enumerate(images, start=self.index): | ||||
|                 file_path = self.dest / f'{idx:04d}.{image["ext"]}' | ||||
|                 with open(file_path, 'wb') as f: | ||||
|                     f.write(image["image"]) | ||||
|                 print(f'\x1b[2K\r{idx+1-self.index} pages collated...', end='') | ||||
|             print() | ||||
| 
 | ||||
|             self.index += pdf.page_count | ||||
|             return True | ||||
|  | @ -575,7 +579,7 @@ def pdf_images(pdf, strategy): | |||
|         return (extract_image(pdf, images[0][0]) for (images, _) in images_by_page) | ||||
| 
 | ||||
|     print("Checking PDF images the quick way failed, trying the slow way") | ||||
|     print(f'0/{pdf.page_count} pages processed...', end='') | ||||
|     print(f'0/{pdf.page_count} pages analyzed...', end='') | ||||
|     image_extractors = [] | ||||
|     for (idx, page) in enumerate(pdf): | ||||
|         page_images = page.get_image_info(xrefs=True) | ||||
|  | @ -610,7 +614,7 @@ def pdf_images(pdf, strategy): | |||
|                     display_sixel_page(page) | ||||
| 
 | ||||
|                 choice = input(f'[N]ope out / [c]onvert page{"" if xref is None else " / e[x]tract image"} / [d]rop page / [s]how page? [n/c{"" if xref is None else "/x"}/d/s] ') | ||||
|         print(f'\x1b[2K\r{idx+1}/{pdf.page_count} pages processed...', end=('' if idx+1 < pdf.page_count else '\n')) | ||||
|         print(f'\x1b[2K\r{idx+1}/{pdf.page_count} pages analyzed...', end=('' if idx+1 < pdf.page_count else '\n')) | ||||
| 
 | ||||
|     return (extractor() for extractor in image_extractors) | ||||
| 
 | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue