| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  | __filename__ = "media.py" | 
					
						
							|  |  |  | __author__ = "Bob Mottram" | 
					
						
							|  |  |  | __license__ = "AGPL3+" | 
					
						
							| 
									
										
										
										
											2019-12-14 10:52:19 +00:00
										 |  |  | __version__ = "1.1.0" | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  | __maintainer__ = "Bob Mottram" | 
					
						
							|  |  |  | __email__ = "bob@freedombone.net" | 
					
						
							|  |  |  | __status__ = "Production" | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from blurhash import blurhash_encode as blurencode | 
					
						
							|  |  |  | from PIL import Image | 
					
						
							|  |  |  | import numpy | 
					
						
							|  |  |  | import os | 
					
						
							| 
									
										
										
										
											2019-07-12 19:51:10 +00:00
										 |  |  | import sys | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  | import json | 
					
						
							|  |  |  | import datetime | 
					
						
							| 
									
										
										
										
											2019-12-04 18:52:27 +00:00
										 |  |  | from hashlib import sha1 | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  | from auth import createPassword | 
					
						
							|  |  |  | from shutil import copyfile | 
					
						
							| 
									
										
										
										
											2019-07-12 19:51:10 +00:00
										 |  |  | from shutil import rmtree | 
					
						
							| 
									
										
										
										
											2019-07-12 19:55:23 +00:00
										 |  |  | from shutil import move | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-01-15 10:57:09 +00:00
										 |  |  | def replaceYouTube(postJsonObject: {}) -> None: | 
					
						
							| 
									
										
										
										
											2020-01-15 10:56:39 +00:00
										 |  |  |     """Replace YouTube with invidio.us
 | 
					
						
							|  |  |  |     This denies Google some, but not all, tracking data | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     if not isinstance(postJsonObject['object'], dict): | 
					
						
							|  |  |  |         return | 
					
						
							|  |  |  |     if not postJsonObject['object'].get('content'): | 
					
						
							|  |  |  |         return | 
					
						
							|  |  |  |     if 'www.youtube.com' not in postJsonObject['object']['content']: | 
					
						
							|  |  |  |         return | 
					
						
							|  |  |  |     postJsonObject['object']['content']= \ | 
					
						
							|  |  |  |         postJsonObject['object']['content'].replace('www.youtube.com','invidio.us') | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-10-26 11:56:41 +00:00
										 |  |  | def removeMetaData(imageFilename: str,outputFilename: str) -> None: | 
					
						
							| 
									
										
										
										
											2020-01-08 14:53:28 +00:00
										 |  |  |     """Attempts to do this with pure python didn't work well,
 | 
					
						
							|  |  |  |     so better to use a dedicated tool if one is installed | 
					
						
							| 
									
										
										
										
											2020-01-08 14:31:25 +00:00
										 |  |  |     """
 | 
					
						
							|  |  |  |     copyfile(imageFilename,outputFilename) | 
					
						
							| 
									
										
										
										
											2020-01-08 14:53:28 +00:00
										 |  |  |     if os.path.isfile('/usr/bin/exiftool'): | 
					
						
							|  |  |  |         print('Removing metadata from '+outputFilename+' using exiftool') | 
					
						
							|  |  |  |         os.system('exiftool -all= '+outputFilename) | 
					
						
							|  |  |  |     elif os.path.isfile('/usr/bin/mogrify'): | 
					
						
							|  |  |  |         print('Removing metadata from '+outputFilename+' using mogrify') | 
					
						
							|  |  |  |         os.system('/usr/bin/mogrify -strip '+outputFilename) | 
					
						
							| 
									
										
										
										
											2019-07-24 13:14:23 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-07-12 19:51:10 +00:00
										 |  |  | def getImageHash(imageFilename: str) -> str: | 
					
						
							| 
									
										
										
										
											2019-07-12 19:26:54 +00:00
										 |  |  |     return blurencode(numpy.array(Image.open(imageFilename).convert("RGB"))) | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-08-30 18:01:29 +00:00
										 |  |  | def isMedia(imageFilename: str) -> bool: | 
					
						
							| 
									
										
										
										
											2019-11-14 15:11:20 +00:00
										 |  |  |     permittedMedia=['png','jpg','gif','webp','mp4','ogv','mp3','ogg'] | 
					
						
							| 
									
										
										
										
											2019-08-30 18:01:29 +00:00
										 |  |  |     for m in permittedMedia:         | 
					
						
							|  |  |  |         if imageFilename.endswith('.'+m): | 
					
						
							|  |  |  |             return True | 
					
						
							|  |  |  |     print('WARN: '+imageFilename+' is not a permitted media type') | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  |     return False | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-07-12 19:26:54 +00:00
										 |  |  | def createMediaDirs(baseDir: str,mediaPath: str) -> None:     | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  |     if not os.path.isdir(baseDir+'/media'): | 
					
						
							|  |  |  |         os.mkdir(baseDir+'/media') | 
					
						
							| 
									
										
										
										
											2019-07-12 19:26:54 +00:00
										 |  |  |     if not os.path.isdir(baseDir+'/'+mediaPath): | 
					
						
							|  |  |  |         os.mkdir(baseDir+'/'+mediaPath) | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-07-12 19:26:54 +00:00
										 |  |  | def getMediaPath() -> str: | 
					
						
							|  |  |  |     currTime=datetime.datetime.utcnow() | 
					
						
							| 
									
										
										
										
											2019-07-12 19:51:10 +00:00
										 |  |  |     weeksSinceEpoch=int((currTime - datetime.datetime(1970,1,1)).days/7) | 
					
						
							| 
									
										
										
										
											2019-07-12 19:26:54 +00:00
										 |  |  |     return 'media/'+str(weeksSinceEpoch) | 
					
						
							| 
									
										
										
										
											2019-08-30 15:50:20 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | def getAttachmentMediaType(filename: str) -> str: | 
					
						
							|  |  |  |     """Returns the type of media for the given file
 | 
					
						
							|  |  |  |     image, video or audio | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     mediaType=None | 
					
						
							| 
									
										
										
										
											2019-11-14 15:11:20 +00:00
										 |  |  |     imageTypes=['png','jpg','jpeg','gif','webp'] | 
					
						
							| 
									
										
										
										
											2019-08-30 15:50:20 +00:00
										 |  |  |     for mType in imageTypes: | 
					
						
							|  |  |  |         if filename.endswith('.'+mType): | 
					
						
							|  |  |  |             return 'image' | 
					
						
							|  |  |  |     videoTypes=['mp4','webm','ogv'] | 
					
						
							|  |  |  |     for mType in videoTypes: | 
					
						
							|  |  |  |         if filename.endswith('.'+mType): | 
					
						
							|  |  |  |             return 'video' | 
					
						
							|  |  |  |     audioTypes=['mp3','ogg'] | 
					
						
							|  |  |  |     for mType in audioTypes: | 
					
						
							|  |  |  |         if filename.endswith('.'+mType): | 
					
						
							|  |  |  |             return 'audio' | 
					
						
							|  |  |  |     return mediaType | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-12-04 18:52:27 +00:00
										 |  |  | def updateEtag(mediaFilename: str) -> None: | 
					
						
							|  |  |  |     """ calculate the etag, which is a sha1 of the data
 | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     # only create etags for media | 
					
						
							|  |  |  |     if '/media/' not in mediaFilename: | 
					
						
							|  |  |  |         return | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # check that the media exists | 
					
						
							|  |  |  |     if not os.path.isfile(mediaFilename): | 
					
						
							|  |  |  |         return | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # read the binary data | 
					
						
							|  |  |  |     data=None | 
					
						
							|  |  |  |     try: | 
					
						
							| 
									
										
										
										
											2019-12-04 18:55:40 +00:00
										 |  |  |         with open(mediaFilename, 'rb') as mediaFile: | 
					
						
							| 
									
										
										
										
											2019-12-04 18:52:27 +00:00
										 |  |  |             data=mediaFile.read()                 | 
					
						
							|  |  |  |     except: | 
					
						
							|  |  |  |         pass | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if not data: | 
					
						
							|  |  |  |         return | 
					
						
							|  |  |  |     # calculate hash | 
					
						
							|  |  |  |     etag=sha1(data).hexdigest() | 
					
						
							|  |  |  |     # save the hash | 
					
						
							|  |  |  |     try: | 
					
						
							|  |  |  |         with open(mediaFilename+'.etag', 'w') as etagFile: | 
					
						
							|  |  |  |             etagFile.write(etag) | 
					
						
							|  |  |  |     except: | 
					
						
							|  |  |  |         pass | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-08-30 18:32:34 +00:00
										 |  |  | def attachMedia(baseDir: str,httpPrefix: str,domain: str,port: int, \ | 
					
						
							| 
									
										
										
										
											2019-08-30 15:50:20 +00:00
										 |  |  |                 postJson: {},imageFilename: str, \ | 
					
						
							|  |  |  |                 mediaType: str,description: str, \ | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  |                 useBlurhash: bool) -> {}: | 
					
						
							| 
									
										
										
										
											2019-08-30 18:32:34 +00:00
										 |  |  |     """Attaches media to a json object post
 | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  |     The description can be None | 
					
						
							|  |  |  |     Blurhash is optional, since low power systems may take a long time to calculate it | 
					
						
							|  |  |  |     """
 | 
					
						
							| 
									
										
										
										
											2019-08-30 18:01:29 +00:00
										 |  |  |     if not isMedia(imageFilename): | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  |         return postJson | 
					
						
							| 
									
										
										
										
											2019-08-30 18:01:29 +00:00
										 |  |  |      | 
					
						
							|  |  |  |     fileExtension=None | 
					
						
							| 
									
										
										
										
											2019-11-14 15:11:20 +00:00
										 |  |  |     acceptedTypes=['png','jpg','gif','webp','mp4','webm','ogv','mp3','ogg'] | 
					
						
							| 
									
										
										
										
											2019-08-30 15:50:20 +00:00
										 |  |  |     for mType in acceptedTypes: | 
					
						
							|  |  |  |         if imageFilename.endswith('.'+mType): | 
					
						
							|  |  |  |             if mType=='jpg': | 
					
						
							|  |  |  |                 mType='jpeg' | 
					
						
							| 
									
										
										
										
											2019-08-30 18:44:26 +00:00
										 |  |  |             if mType=='mp3': | 
					
						
							|  |  |  |                 mType='mpeg' | 
					
						
							| 
									
										
										
										
											2019-08-30 18:24:58 +00:00
										 |  |  |             fileExtension=mType | 
					
						
							| 
									
										
										
										
											2019-08-30 18:01:29 +00:00
										 |  |  |     if not fileExtension:         | 
					
						
							|  |  |  |         return postJson | 
					
						
							| 
									
										
										
										
											2019-08-30 15:50:20 +00:00
										 |  |  |     mediaType=mediaType+'/'+fileExtension | 
					
						
							| 
									
										
										
										
											2019-08-30 18:24:58 +00:00
										 |  |  |     print('Attached media type: '+mediaType) | 
					
						
							| 
									
										
										
										
											2019-08-30 15:50:20 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     if fileExtension=='jpeg': | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  |         fileExtension='jpg' | 
					
						
							| 
									
										
										
										
											2019-08-30 19:10:27 +00:00
										 |  |  |     if mediaType=='audio/mpeg': | 
					
						
							| 
									
										
										
										
											2019-08-30 18:44:26 +00:00
										 |  |  |         fileExtension='mp3' | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-08-16 20:35:11 +00:00
										 |  |  |     if port: | 
					
						
							|  |  |  |         if port!=80 and port!=443: | 
					
						
							|  |  |  |             if ':' not in domain: | 
					
						
							|  |  |  |                 domain=domain+':'+str(port) | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-07-12 19:26:54 +00:00
										 |  |  |     mPath=getMediaPath() | 
					
						
							|  |  |  |     mediaPath=mPath+'/'+createPassword(32)+'.'+fileExtension | 
					
						
							| 
									
										
										
										
											2019-07-16 10:19:04 +00:00
										 |  |  |     if baseDir: | 
					
						
							|  |  |  |         createMediaDirs(baseDir,mPath) | 
					
						
							|  |  |  |         mediaFilename=baseDir+'/'+mediaPath | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     attachmentJson={ | 
					
						
							|  |  |  |         'mediaType': mediaType, | 
					
						
							|  |  |  |         'name': description, | 
					
						
							| 
									
										
										
										
											2019-12-04 17:02:38 +00:00
										 |  |  |         'type': 'Document', | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  |         'url': httpPrefix+'://'+domain+'/'+mediaPath | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2019-12-03 23:38:36 +00:00
										 |  |  |     if useBlurhash and mediaType.startswith('image/'): | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  |         attachmentJson['blurhash']=getImageHash(imageFilename) | 
					
						
							|  |  |  |     postJson['attachment']=[attachmentJson] | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-08-30 19:01:16 +00:00
										 |  |  |     if baseDir: | 
					
						
							|  |  |  |         if mediaType=='image': | 
					
						
							|  |  |  |             removeMetaData(imageFilename,mediaFilename) | 
					
						
							|  |  |  |         else: | 
					
						
							|  |  |  |             copyfile(imageFilename,mediaFilename) | 
					
						
							| 
									
										
										
										
											2019-12-04 18:52:27 +00:00
										 |  |  |         updateEtag(mediaFilename) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-07-12 19:08:46 +00:00
										 |  |  |     return postJson | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-07-12 19:55:23 +00:00
										 |  |  | def archiveMedia(baseDir: str,archiveDirectory: str,maxWeeks=4) -> None: | 
					
						
							| 
									
										
										
										
											2019-07-12 19:51:10 +00:00
										 |  |  |     """Any media older than the given number of weeks gets archived
 | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     currTime=datetime.datetime.utcnow() | 
					
						
							|  |  |  |     weeksSinceEpoch=int((currTime - datetime.datetime(1970,1,1)).days/7) | 
					
						
							|  |  |  |     minWeek=weeksSinceEpoch-maxWeeks | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-07-12 20:43:55 +00:00
										 |  |  |     if archiveDirectory: | 
					
						
							|  |  |  |         if not os.path.isdir(archiveDirectory): | 
					
						
							|  |  |  |             os.mkdir(archiveDirectory) | 
					
						
							|  |  |  |         if not os.path.isdir(archiveDirectory+'/media'): | 
					
						
							|  |  |  |             os.mkdir(archiveDirectory+'/media') | 
					
						
							|  |  |  |      | 
					
						
							| 
									
										
										
										
											2019-07-12 19:51:10 +00:00
										 |  |  |     for subdir, dirs, files in os.walk(baseDir+'/media'): | 
					
						
							|  |  |  |         for weekDir in dirs: | 
					
						
							|  |  |  |             if int(weekDir)<minWeek: | 
					
						
							| 
									
										
										
										
											2019-07-12 19:55:23 +00:00
										 |  |  |                 if archiveDirectory: | 
					
						
							| 
									
										
										
										
											2019-07-12 20:43:55 +00:00
										 |  |  |                     move(os.path.join(baseDir+'/media', weekDir),archiveDirectory+'/media') | 
					
						
							| 
									
										
										
										
											2019-07-12 19:55:23 +00:00
										 |  |  |                 else: | 
					
						
							|  |  |  |                     # archive to /dev/null | 
					
						
							|  |  |  |                     rmtree(os.path.join(baseDir+'/media', weekDir)) |