import os
import glob
import re
from PIL import Image
from pathlib import Path
import shutil
# ---------------------------------------------------------------------------
# Settings
# ---------------------------------------------------------------------------

# When true, an image that is not referenced in any markdown file is deleted.
delete_unused_images = True

# Maximum image resolution, in dots per inch.
# Set a very big value here if you don't want images to be resized.
max_density = 400

# Width of the page, in pixels.
full_width = 800

# Width of the page, in millimeters, without print margins.
page_width = 190

# All locations are expressed relatively to the directory holding this script.
_script_dir = os.path.dirname(__file__)

# Root of the markdown sources.
source_dir = f'{_script_dir}/../source'

# Where the images are read from (subdirectories are explored too).
images_dir = f'{_script_dir}/../source/img'

# Where the images are written to; can be the same directory as images_dir,
# or another one.
target_dir = f'{_script_dir}/../source/img'

# Every markdown file found under source_dir, at any depth.
md_sources = [*glob.iglob(f'{source_dir}/**/*.md', recursive=True)]
# Replace an image in all source files
def replace_image(original_rel_path, new_rel_path, sources=None):
    """Rewrite every occurrence of an image path in the markdown sources.

    The replacement is a plain substring substitution. A file is only written
    back when its contents actually change.

    Args:
        original_rel_path: Path currently used in the documents.
        new_rel_path: Path that must replace it.
        sources: Iterable of markdown file names to process. Defaults to the
            module-level ``md_sources`` list.
    """
    if sources is None:
        sources = md_sources
    # str.replace('', x) would insert x between every character, and replacing
    # a path by itself is a no-op: neither case should touch any file.
    if not original_rel_path or original_rel_path == new_rel_path:
        return
    for src_name in sources:
        # An explicit encoding avoids depending on the platform locale, and
        # newline='' disables newline translation so that the existing line
        # endings of the document are written back unchanged.
        with open(src_name, encoding='utf-8', newline='') as src_file:
            original_contents = src_file.read()
        new_contents = original_contents.replace(original_rel_path, new_rel_path)
        if new_contents != original_contents:
            with open(src_name, 'w', encoding='utf-8', newline='') as new_file:
                new_file.write(new_contents)
# ---------------------------------------------------------------------------
# Image optimization pass
#
# For every image found under images_dir:
#   1. look for references to it in the markdown sources and work out the
#      largest width at which it is displayed;
#   2. delete it (or raise) when it is not referenced anywhere;
#   3. downscale it so that it does not exceed max_density at that width;
#   4. keep the recompressed file only when it is significantly smaller, and
#      turn a PNG into a JPEG when that is much smaller still.
# ---------------------------------------------------------------------------

# Group 1 of each pattern is the raw size value (e.g. "300", "300px", "50%").
_HTML_WIDTH = re.compile(r'\bwidth\s*=\s*["\']([^"\']*)["\']')
_HTML_HEIGHT = re.compile(r'\bheight\s*=\s*["\']([^"\']*)["\']')
_OPTION_WIDTH = re.compile(r':width:\s*([^\s`]+)')
_OPTION_HEIGHT = re.compile(r':height:\s*([^\s`]+)')
# A number followed by an optional "px" or "%" unit; other units do not match.
_SIZE_VALUE = re.compile(r'(\d+(?:\.\d+)?)\s*(px|%)?')


def _parse_size(value, percent_base=None):
    """Convert a width/height value to a positive whole number of pixels.

    Args:
        value: Raw attribute text, such as "300", "300px" or "50%".
        percent_base: Size in pixels that "100%" stands for, or None when
            percentages cannot be interpreted.

    Returns:
        The size in pixels, or None when the value cannot be interpreted
        (unknown unit, percentage without a base, or a size that rounds to 0).
    """
    match = _SIZE_VALUE.fullmatch(value.strip())
    if match is None:
        return None
    number = float(match.group(1))
    if match.group(2) == '%':
        if percent_base is None:
            return None
        number = percent_base * number / 100
    pixels = int(number + 0.5)
    return pixels if pixels > 0 else None


def _reference_width(snippet, width_pattern, height_pattern, aspect, page_px):
    """Return the display width, in pixels, requested by one image reference.

    An explicit width wins; otherwise the width is derived from an explicit
    height and the image aspect ratio; otherwise the image is assumed to span
    the whole page (page_px), which never under-estimates the needed size.
    """
    width_code = width_pattern.search(snippet)
    if width_code is not None:
        width = _parse_size(width_code.group(1), page_px)
        if width is not None:
            return width
    height_code = height_pattern.search(snippet)
    if height_code is not None:
        height = _parse_size(height_code.group(1))
        if height is not None:
            return int(aspect * height + 0.5)
    return page_px


def _find_display_width(contents, rel_path, aspect, page_px):
    """Return the largest width at which rel_path is displayed in contents.

    Args:
        contents: Text of one markdown document.
        rel_path: Image path, as written in the documents.
        aspect: Width / height ratio of the image.
        page_px: Width of a full page, in pixels.

    Returns:
        The largest display width in pixels, or None when the document does
        not reference the image at all.
    """
    search = re.escape(rel_path)
    widths = []
    # ![alt text](image/path) or ![alt text](image/path "title")
    if re.search(r'!\[.*\]\(' + search + r'(?:\s+"[^"]*")?\s*\)', contents):
        widths.append(page_px)
    # <img src="image/path" width="w" height="h">
    html_tag = r'<img\b[^>]*?\bsrc\s*=\s*["\']' + search + r'["\'][^>]*>'
    for img_code in re.finditer(html_tag, contents):
        widths.append(_reference_width(
            img_code.group(0), _HTML_WIDTH, _HTML_HEIGHT, aspect, page_px))
    # ```{image} img/vhelio.png :width: wpx :height: hpx```
    directive = r'```\{image\} ' + search + r'.*?```'
    for img_code in re.finditer(directive, contents, re.DOTALL):
        widths.append(_reference_width(
            img_code.group(0), _OPTION_WIDTH, _OPTION_HEIGHT, aspect, page_px))
    return max(widths) if widths else None


def _flatten_on_white(picture):
    """Return an RGB version of picture, composited over a white background.

    JPEG has no alpha channel, so anything that is not already RGB is
    flattened before being saved in that format.
    """
    if picture.mode == 'RGB':
        return picture
    background = Image.new('RGBA', picture.size, (255, 255, 255, 255))
    return Image.alpha_composite(background, picture.convert('RGBA')).convert('RGB')


def _is_worth_keeping(new_size, old_size):
    """Tell whether a recompressed file is significantly smaller (100 kB or 20%)."""
    return new_size < old_size - 100 * 1024 or new_size < old_size * 8 / 10


total_saved_space = 0
# The listing is taken up front (and sorted, for a reproducible order) because
# the loop below creates, renames and deletes files inside this very tree.
for image_path in sorted(Path(images_dir).glob("**/*")):
    suffix = image_path.suffix.lower()
    if suffix not in {".jpg", ".jpeg", ".png", ".svg"} or not image_path.is_file():
        continue
    source_path = image_path.resolve()

    # Compute the target path relatively to the source folder. Forward slashes
    # are used on every platform, since this is how markdown writes paths.
    image_rel_path = os.path.relpath(source_path, images_dir)
    image_rel_path = os.path.relpath(target_dir + '/' + image_rel_path, source_dir)
    image_rel_path = image_rel_path.replace(os.sep, '/')
    target_path = source_dir + '/' + image_rel_path
    os.makedirs(os.path.dirname(target_path), exist_ok=True)
    # When writing to a separate directory, an existing target is left alone.
    if images_dir != target_dir and os.path.isfile(target_path):
        continue

    original_size = os.path.getsize(source_path)
    if suffix == '.svg':
        image_aspect = 1
    else:
        # Only the dimensions are needed at this point. The handle is closed
        # right away so that the file can be deleted or replaced afterwards.
        with Image.open(source_path) as probe:
            image_aspect = probe.size[0] / probe.size[1]

    # Largest width at which any document displays the image; None = unused.
    image_display_width = None
    for src_name in md_sources:
        with open(src_name, encoding='utf-8') as src_file:
            src_contents = src_file.read()
        width = _find_display_width(src_contents, image_rel_path, image_aspect, full_width)
        if width is not None and (image_display_width is None or width > image_display_width):
            image_display_width = width

    if image_display_width is None:
        if not delete_unused_images:
            raise Exception('Image not found in source documents: ' + image_rel_path)
        print('WARNING: removing unused image ' + image_rel_path)
        os.remove(source_path)
        continue

    # Vector images are never resampled, only copied when needed.
    if suffix == '.svg':
        if images_dir != target_dir:
            shutil.copyfile(source_path, target_path)
        continue

    # Number of pixels needed to reach max_density at the displayed width.
    image_width_inches = image_display_width / full_width * page_width / 25.4
    target_resolution_width = max(1, int(max_density * image_width_inches + 0.5))

    # Write the candidate files while the image is open; decide what to keep
    # once it is closed again.
    with Image.open(source_path) as image:
        if target_resolution_width >= image.size[0]:
            # Never upscale.
            resized = image
        else:
            target_resolution_height = max(
                1, int(target_resolution_width / image.size[0] * image.size[1] + 0.5))
            resized = image.resize(
                (target_resolution_width, target_resolution_height),
                Image.Resampling.LANCZOS)
        if suffix == '.png':
            # Also try to save the file as JPEG to see if it would be
            # significantly smaller: this helps detecting files that should
            # be JPEG, not PNG. Only the JPEG candidate is flattened; the PNG
            # candidate keeps its own mode, hence its transparency.
            jpeg_target = target_path[:-4] + '.jpg'
            jpeg_tmp = jpeg_target + '.tmp'
            png_tmp = target_path + '.tmp'
            _flatten_on_white(resized).save(jpeg_tmp, format='JPEG', quality=80)
            resized.save(png_tmp, format='PNG')
        else:
            jpeg_tmp = target_path + '.tmp'
            resized.save(jpeg_tmp, format='JPEG', quality=80)

    if suffix == '.png':
        png_size = os.path.getsize(png_tmp)
        jpeg_size = os.path.getsize(jpeg_tmp)
        best_png_size = min(original_size, png_size)
        # Force JPEG compression if it saves at least 200 kB or makes the
        # image at least twice as small (in some cases, PNG can even give a
        # smaller file).
        convert_to_jpeg = (jpeg_size < best_png_size - 200 * 1024
                           or jpeg_size < best_png_size / 2)
        if convert_to_jpeg and os.path.exists(jpeg_target):
            # Never overwrite another image that happens to have that name.
            print('WARNING: ' + image_rel_path + ' has not been converted to JPEG format: '
                  + image_rel_path[:-4] + '.jpg already exists')
            convert_to_jpeg = False
        if convert_to_jpeg:
            os.remove(png_tmp)
            os.replace(jpeg_tmp, jpeg_target)
            # When optimizing in place, target_path is the PNG that has just
            # been superseded; with a separate target it does not exist.
            if os.path.exists(target_path):
                os.remove(target_path)
            print('WARNING: ' + image_rel_path + ' has been converted to JPEG format')
            replace_image(image_rel_path, image_rel_path[:-4] + '.jpg')
            total_saved_space += original_size - jpeg_size
            continue
        os.remove(jpeg_tmp)
        candidate_path = png_tmp
        candidate_size = png_size
        label = 'PNG'
    else:
        candidate_path = jpeg_tmp
        candidate_size = os.path.getsize(jpeg_tmp)
        label = 'JPEG'

    if _is_worth_keeping(candidate_size, original_size):
        total_saved_space += original_size - candidate_size
        # os.replace overwrites the destination, whether or not it exists.
        os.replace(candidate_path, target_path)
        print('Recompressed ' + label + ' ' + image_rel_path)
    else:
        os.remove(candidate_path)
        # Keep the original; a separate target still needs its own copy.
        if images_dir != target_dir:
            shutil.copyfile(source_path, target_path)

print('Done. Saved ' + str(int(total_saved_space/1024+0.5)) + 'kB.')