#!/usr/bin/python
# Image to HTML converter
# Copyright (C) January 2019 Neil Fraser
# https://neil.fraser.name/

# This program is free software; you can redistribute it and/or
# modify it under the terms of version 2 of the GNU General
# Public License as published by the Free Software Foundation.

# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
# http://www.gnu.org/

# Loads JPEGs, PNGs and GIFs from websites and converts them to HTML.
# Usage: img2html.py?img=www.example.com/image.jpg

# NOTE(review): the copy of this file under review had its layout collapsed
# and the HTML tags inside its string literals stripped (the cell format
# strings were empty, which raises TypeError).  The tags below are a
# reconstruction that keeps every piece of visible text; confirm them against
# the deployed page before shipping.

import io
import itertools
import math
import re
import sys

try:
    from html import escape as escape_html  # Python 3
except ImportError:  # Python 2
    from cgi import escape as _cgi_escape

    def escape_html(text):
        """Escape &, <, > and double quotes for safe inclusion in HTML."""
        return _cgi_escape(text, quote=True)

try:
    from urllib.request import urlopen  # Python 3
except ImportError:  # Python 2
    from urllib import urlopen

# Images with more pixels than this are scaled down before conversion.
MAX_PIXELS = 100 * 100

# Reduce load on the server: this request is answered from a cached file.
TUX_URL = 'https://neil.fraser.name/software/img2html/tux.jpg'
TUX_CACHE = '/home/neil/html/software/img2html/tux.html'

TABLE_OPEN = '<table border="0" cellpadding="0" cellspacing="0">'
TABLE_CLOSE = '</table>'

URL_REGEX = re.compile(
    r'^https?://'  # http:// or https://
    r'(?:(?:[A-Z0-9](?:[A-Z0-9-]{0,61}[A-Z0-9])?\.)+[A-Z]{2,6}\.?|'  # domain...
    r'\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3})'  # ...or IP
    r'(?::\d+)?'  # optional port
    r'(?:/?|[/?]\S+)$', re.IGNORECASE)

# Doubled braces are literal braces; single braces are str.format fields.
PAGE_TEMPLATE = """<!DOCTYPE html>
<html>
<head>
<title>img2html: {remoteurl}</title>
<style>
table {{ border-collapse: collapse; }}
td {{ padding: 0; width: 4px; height: 4px; }}
</style>
</head>
<body>
<h2>Original Image</h2>
<p><a href="{remoteurl}">{remoteurl}</a><br>
{oldX}x{oldY}<br>
{oldsize}KB</p>
{msg}
<h2>Text Image</h2>
<p>{newX}x{newY}<br>
{newsize}KB</p>
{table_open}
{table}{table_close}
<p>Done</p>
</body>
</html>"""


def die(msg):
    """Throw a 500 error and terminate the program.

    Prints a plain-text CGI error response containing msg, then exits by
    raising SystemExit.
    """
    print('Status:500')
    print('Content-type: text/plain')
    print('')
    print('Error: ' + msg)
    sys.exit()


def is_valid_url(url):
    """Return a truthy value if url is an http(s) URL on a domain or IPv4 host.

    Returns a regex match object on success, and False or None otherwise.
    """
    return url is not None and URL_REGEX.search(url)


def add_default_scheme(url):
    """Prefix url with 'http://' unless it already starts with a scheme."""
    if re.match(r'\w+://', url):
        return url
    return 'http://' + url


def scaled_size(width, height, max_pixels=MAX_PIXELS):
    """Return the (width, height) to render, at most about max_pixels pixels.

    The size is returned unchanged when it is within the limit; otherwise both
    sides are multiplied by the same factor and rounded (never below 1).
    """
    if width * height <= max_pixels:
        return (width, height)
    factor = math.sqrt(max_pixels / float(width * height))
    return (max(1, int(round(width * factor))),
            max(1, int(round(height * factor))))


def encode_row(colours, use_rle=True):
    """Return the <td> cells for one row of 'rrggbb' colour strings.

    With use_rle, runs of equal neighbouring colours are merged into a single
    cell with a colspan.  Every run is emitted, including the final one.
    """
    if use_rle:
        runs = ((colour, sum(1 for _ in group))
                for colour, group in itertools.groupby(colours))
    else:
        runs = ((colour, 1) for colour in colours)
    cells = []
    for colour, span in runs:
        if span == 1:
            # One pixel.
            cells.append('<td bgcolor="#%s"></td>' % colour)
        else:
            # A run of multiple pixels with the same colour.
            cells.append('<td bgcolor="#%s" colspan="%d"></td>'
                         % (colour, span))
    return ''.join(cells)


def build_table(pixels, width, height):
    """Scan the image pixel by pixel and build the HTML table rows.

    pixels must support pixels[x, y] and return an (r, g, b) sequence, as the
    object returned by PIL's Image.load() does for an RGB image.  The result
    holds the <tr> rows plus the close/open tags that split the table into
    segments; the caller supplies the outermost open and close tags.
    """
    parts = []
    # Disable RLE for the first row of each table segment, so that every
    # column has a cell of its own there (dodges a Mozilla bug).
    first_row = True
    for y in range(height):
        colours = ['%02x%02x%02x' % tuple(pixels[x, y]) for x in range(width)]
        parts.append('<tr>%s</tr>\n'
                     % encode_row(colours, use_rle=not first_row))
        # Segment the table so that MSIE renders it in pieces instead of
        # waiting till the end.
        first_row = (y != 0 and (y == 5 or y % 15 == 0) and y < height - 10)
        if first_row:
            parts.append(TABLE_CLOSE + TABLE_OPEN + '\n')
    return ''.join(parts)


def load_image(data):
    """Decode image bytes into a scaled RGB image on a white background.

    Returns (image, (old_width, old_height), was_scaled).  Calls die() if the
    data cannot be decoded.
    """
    # Imported here so the helpers above stay importable without Pillow.
    from PIL import Image

    try:
        image = Image.open(io.BytesIO(data)).convert('RGBA')
    except Exception as err:
        die('Unable to read image: %s' % err)
    # Flatten any transparency onto white.
    background = Image.new('RGBA', image.size, (255, 255, 255, 255))
    background.paste(image, mask=image.split()[3])  # 3 is the alpha channel
    image = background.convert('RGB')

    old_size = image.size
    target = scaled_size(*old_size)
    was_scaled = old_size[0] * old_size[1] > MAX_PIXELS
    if was_scaled:
        # ANTIALIAS is the older name of the LANCZOS filter.
        resample = getattr(Image, 'LANCZOS', None)
        if resample is None:
            resample = Image.ANTIALIAS
        image.thumbnail(target, resample)
    return image, old_size, was_scaled


def main():
    """Handle one CGI request: fetch the image and print it as an HTML page."""
    # Imported here so the helpers above stay importable on interpreters
    # without the cgi module (it was removed in Python 3.13).
    import cgi

    form = cgi.FieldStorage()
    if 'img' not in form:
        die('"img" parameter not found.')
    # getfirst() copes with the parameter being supplied more than once.
    remoteurl = form.getfirst('img', '').strip()
    if not remoteurl:
        die('No image URL specified.')
    remoteurl = add_default_scheme(remoteurl)
    if not is_valid_url(remoteurl):
        die('Invalid image URL.\nPlease go back and check the address.')

    # Reduce load on my server, use cached tux.html if the request is tux.jpg
    if remoteurl == TUX_URL:
        with open(TUX_CACHE) as cached:
            print("Content-type: text/html\n\n")
            print(cached.read())
        sys.exit()

    # NOTE(review): this fetches an arbitrary caller-supplied URL with no size
    # limit and no block on internal addresses -- consider restricting both.
    try:
        response = urlopen(remoteurl)
        try:
            data = response.read()
        finally:
            response.close()
    except Exception as err:
        die('Invalid image URL: %s' % err)
    oldsize = len(data) // 1024

    image, (old_x, old_y), was_scaled = load_image(data)
    # thumbnail() may not hit the requested size exactly; use the real one.
    new_x, new_y = image.size
    if was_scaled:
        msg = ('<p>[This image is too large to comfortably handle, so it has '
               'been scaled down to %s%% of its original size.]</p>\n'
               % int(100.0 * new_x / old_x))
    else:
        msg = ''

    table = build_table(image.load(), new_x, new_y)
    newsize = len(table) // 1024

    # We're done.  Now print it all out (this is what takes the time).
    print("Content-type: text/html\n")
    print(PAGE_TEMPLATE.format(
        # The URL is untrusted input: escape it before it goes into the page.
        remoteurl=escape_html(remoteurl),
        table=table, table_open=TABLE_OPEN, table_close=TABLE_CLOSE,
        msg=msg, oldsize=oldsize, newsize=newsize,
        oldX=old_x, oldY=old_y, newX=new_x, newY=new_y))


if __name__ == '__main__':
    main()