| 
									
										
										
										
											2020-04-03 17:01:25 +00:00
										 |  |  | __filename__ = "migrate.py" | 
					
						
							|  |  |  | __author__ = "Bob Mottram" | 
					
						
							|  |  |  | __license__ = "AGPL3+" | 
					
						
							| 
									
										
										
										
											2021-01-26 10:07:42 +00:00
										 |  |  | __version__ = "1.2.0" | 
					
						
							| 
									
										
										
										
											2020-04-03 17:01:25 +00:00
										 |  |  | __maintainer__ = "Bob Mottram" | 
					
						
							|  |  |  | __email__ = "bob@freedombone.net" | 
					
						
							|  |  |  | __status__ = "Production" | 
					
						
							| 
									
										
										
										
											2019-10-31 10:36:35 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | import os | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  | from utils import getNicknameFromActor | 
					
						
							|  |  |  | from utils import getDomainFromActor | 
					
						
							|  |  |  | from webfinger import webfingerHandle | 
					
						
							|  |  |  | from blocking import isBlocked | 
					
						
							|  |  |  | from session import getJson | 
					
						
							|  |  |  | from posts import getUserUrl | 
					
						
							|  |  |  | from follow import unfollowAccount | 
					
						
							| 
									
										
										
										
											2019-10-31 10:36:35 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-04-03 17:01:25 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  | def _moveFollowingHandlesForAccount(baseDir: str, nickname: str, domain: str, | 
					
						
							|  |  |  |                                     session, | 
					
						
							|  |  |  |                                     httpPrefix: str, cachedWebfingers: {}, | 
					
						
							| 
									
										
										
										
											2021-01-09 20:27:17 +00:00
										 |  |  |                                     debug: bool) -> int: | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     """Goes through all follows for an account and updates any that have moved
 | 
					
						
							| 
									
										
										
										
											2019-10-31 10:36:35 +00:00
										 |  |  |     """
 | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     ctr = 0 | 
					
						
							|  |  |  |     followingFilename = \ | 
					
						
							| 
									
										
										
										
											2021-01-09 20:27:17 +00:00
										 |  |  |         baseDir + '/accounts/' + nickname + '@' + domain + '/following.txt' | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     if not os.path.isfile(followingFilename): | 
					
						
							|  |  |  |         return ctr | 
					
						
							|  |  |  |     with open(followingFilename, "r") as f: | 
					
						
							|  |  |  |         followingHandles = f.readlines() | 
					
						
							|  |  |  |         for followHandle in followingHandles: | 
					
						
							|  |  |  |             followHandle = followHandle.strip("\n").strip("\r") | 
					
						
							|  |  |  |             ctr += \ | 
					
						
							|  |  |  |                 _updateMovedHandle(baseDir, nickname, domain, | 
					
						
							|  |  |  |                                    followHandle, session, | 
					
						
							|  |  |  |                                    httpPrefix, cachedWebfingers, | 
					
						
							| 
									
										
										
										
											2021-01-09 20:27:17 +00:00
										 |  |  |                                    debug) | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     return ctr | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def _updateMovedHandle(baseDir: str, nickname: str, domain: str, | 
					
						
							|  |  |  |                        handle: str, session, | 
					
						
							|  |  |  |                        httpPrefix: str, cachedWebfingers: {}, | 
					
						
							| 
									
										
										
										
											2021-01-09 20:27:17 +00:00
										 |  |  |                        debug: bool) -> int: | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     """Check if an account has moved, and if so then alter following.txt
 | 
					
						
							|  |  |  |     for each account. | 
					
						
							|  |  |  |     Returns 1 if moved, 0 otherwise | 
					
						
							| 
									
										
										
										
											2019-10-31 10:36:35 +00:00
										 |  |  |     """
 | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     ctr = 0 | 
					
						
							|  |  |  |     if '@' not in handle: | 
					
						
							|  |  |  |         return ctr | 
					
						
							|  |  |  |     if len(handle) < 5: | 
					
						
							|  |  |  |         return ctr | 
					
						
							|  |  |  |     if handle.startswith('@'): | 
					
						
							|  |  |  |         handle = handle[1:] | 
					
						
							|  |  |  |     wfRequest = webfingerHandle(session, handle, | 
					
						
							|  |  |  |                                 httpPrefix, cachedWebfingers, | 
					
						
							| 
									
										
										
										
											2021-03-14 19:22:58 +00:00
										 |  |  |                                 None, __version__, debug) | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     if not wfRequest: | 
					
						
							|  |  |  |         print('updateMovedHandle unable to webfinger ' + handle) | 
					
						
							|  |  |  |         return ctr | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if not isinstance(wfRequest, dict): | 
					
						
							|  |  |  |         print('updateMovedHandle webfinger for ' + handle + | 
					
						
							|  |  |  |               ' did not return a dict. ' + str(wfRequest)) | 
					
						
							|  |  |  |         return ctr | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     personUrl = None | 
					
						
							|  |  |  |     if wfRequest.get('errors'): | 
					
						
							|  |  |  |         print('wfRequest error: ' + str(wfRequest['errors'])) | 
					
						
							|  |  |  |         return ctr | 
					
						
							| 
									
										
										
										
											2019-10-31 10:36:35 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     profileStr = 'https://www.w3.org/ns/activitystreams' | 
					
						
							|  |  |  |     asHeader = { | 
					
						
							|  |  |  |         'Accept': 'application/activity+json; profile="' + profileStr + '"' | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     if not personUrl: | 
					
						
							| 
									
										
										
										
											2021-03-14 20:41:37 +00:00
										 |  |  |         personUrl = getUserUrl(wfRequest, 0, debug) | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |         if not personUrl: | 
					
						
							|  |  |  |             return ctr | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     profileStr = 'https://www.w3.org/ns/activitystreams' | 
					
						
							|  |  |  |     asHeader = { | 
					
						
							|  |  |  |         'Accept': 'application/ld+json; profile="' + profileStr + '"' | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     personJson = \ | 
					
						
							| 
									
										
										
										
											2021-03-14 20:55:37 +00:00
										 |  |  |         getJson(session, personUrl, asHeader, None, | 
					
						
							|  |  |  |                 debug, __version__, httpPrefix, None) | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     if not personJson: | 
					
						
							|  |  |  |         return ctr | 
					
						
							|  |  |  |     if not personJson.get('movedTo'): | 
					
						
							|  |  |  |         return ctr | 
					
						
							|  |  |  |     movedToUrl = personJson['movedTo'] | 
					
						
							|  |  |  |     if '://' not in movedToUrl: | 
					
						
							|  |  |  |         return ctr | 
					
						
							|  |  |  |     if '.' not in movedToUrl: | 
					
						
							|  |  |  |         return ctr | 
					
						
							|  |  |  |     movedToNickname = getNicknameFromActor(movedToUrl) | 
					
						
							|  |  |  |     if not movedToNickname: | 
					
						
							|  |  |  |         return ctr | 
					
						
							|  |  |  |     movedToDomain, movedToPort = getDomainFromActor(movedToUrl) | 
					
						
							|  |  |  |     if not movedToDomain: | 
					
						
							|  |  |  |         return ctr | 
					
						
							|  |  |  |     movedToDomainFull = movedToDomain | 
					
						
							|  |  |  |     if movedToPort: | 
					
						
							|  |  |  |         if movedToPort != 80 and movedToPort != 443: | 
					
						
							|  |  |  |             movedToDomainFull = movedToDomain + ':' + str(movedToPort) | 
					
						
							|  |  |  |     if isBlocked(baseDir, nickname, domain, | 
					
						
							|  |  |  |                  movedToNickname, movedToDomain): | 
					
						
							|  |  |  |         # someone that you follow has moved to a blocked domain | 
					
						
							|  |  |  |         # so just unfollow them | 
					
						
							|  |  |  |         unfollowAccount(baseDir, nickname, domain, | 
					
						
							|  |  |  |                         movedToNickname, movedToDomainFull, | 
					
						
							| 
									
										
										
										
											2021-01-09 20:27:17 +00:00
										 |  |  |                         'following.txt', debug) | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |         return ctr | 
					
						
							| 
									
										
										
										
											2021-01-09 20:27:17 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     followingFilename = \ | 
					
						
							| 
									
										
										
										
											2021-01-09 20:27:17 +00:00
										 |  |  |         baseDir + '/accounts/' + nickname + '@' + domain + '/following.txt' | 
					
						
							|  |  |  |     if os.path.isfile(followingFilename): | 
					
						
							|  |  |  |         with open(followingFilename, "r") as f: | 
					
						
							|  |  |  |             followingHandles = f.readlines() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             movedToHandle = movedToNickname + '@' + movedToDomainFull | 
					
						
							|  |  |  |             handleLower = handle.lower() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             refollowFilename = \ | 
					
						
							|  |  |  |                 baseDir + '/accounts/' + \ | 
					
						
							|  |  |  |                 nickname + '@' + domain + '/refollow.txt' | 
					
						
							| 
									
										
										
										
											2021-01-09 17:41:41 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-01-09 20:27:17 +00:00
										 |  |  |             # unfollow the old handle | 
					
						
							|  |  |  |             with open(followingFilename, 'w+') as f: | 
					
						
							|  |  |  |                 for followHandle in followingHandles: | 
					
						
							|  |  |  |                     if followHandle.strip("\n").strip("\r").lower() != \ | 
					
						
							|  |  |  |                        handleLower: | 
					
						
							|  |  |  |                         f.write(followHandle) | 
					
						
							| 
									
										
										
										
											2021-01-09 18:12:36 +00:00
										 |  |  |                     else: | 
					
						
							| 
									
										
										
										
											2021-01-09 20:27:17 +00:00
										 |  |  |                         handleNickname = handle.split('@')[0] | 
					
						
							|  |  |  |                         handleDomain = handle.split('@')[1] | 
					
						
							|  |  |  |                         unfollowAccount(baseDir, nickname, domain, | 
					
						
							|  |  |  |                                         handleNickname, | 
					
						
							|  |  |  |                                         handleDomain, | 
					
						
							|  |  |  |                                         'following.txt', debug) | 
					
						
							|  |  |  |                         ctr += 1 | 
					
						
							|  |  |  |                         print('Unfollowed ' + handle + ' who has moved to ' + | 
					
						
							|  |  |  |                               movedToHandle) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |                         # save the new handles to the refollow list | 
					
						
							|  |  |  |                         if os.path.isfile(refollowFilename): | 
					
						
							|  |  |  |                             with open(refollowFilename, 'a+') as f: | 
					
						
							|  |  |  |                                 f.write(movedToHandle + '\n') | 
					
						
							|  |  |  |                         else: | 
					
						
							|  |  |  |                             with open(refollowFilename, 'w+') as f: | 
					
						
							|  |  |  |                                 f.write(movedToHandle + '\n') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     followersFilename = \ | 
					
						
							|  |  |  |         baseDir + '/accounts/' + nickname + '@' + domain + '/followers.txt' | 
					
						
							|  |  |  |     if os.path.isfile(followersFilename): | 
					
						
							|  |  |  |         with open(followersFilename, "r") as f: | 
					
						
							|  |  |  |             followerHandles = f.readlines() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             handleLower = handle.lower() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             # remove followers who have moved | 
					
						
							|  |  |  |             with open(followersFilename, 'w+') as f: | 
					
						
							|  |  |  |                 for followerHandle in followerHandles: | 
					
						
							|  |  |  |                     if followerHandle.strip("\n").strip("\r").lower() != \ | 
					
						
							|  |  |  |                        handleLower: | 
					
						
							|  |  |  |                         f.write(followerHandle) | 
					
						
							|  |  |  |                     else: | 
					
						
							|  |  |  |                         ctr += 1 | 
					
						
							|  |  |  |                         print('Removed follower who has moved ' + handle) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     return ctr | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def migrateAccounts(baseDir: str, session, | 
					
						
							|  |  |  |                     httpPrefix: str, cachedWebfingers: {}, | 
					
						
							|  |  |  |                     debug: bool) -> int: | 
					
						
							|  |  |  |     """If followed accounts change then this modifies the
 | 
					
						
							|  |  |  |     following lists for each account accordingly. | 
					
						
							|  |  |  |     Returns the number of accounts migrated | 
					
						
							|  |  |  |     """
 | 
					
						
							| 
									
										
										
										
											2019-10-31 10:36:35 +00:00
										 |  |  |     # update followers and following lists for each account | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     ctr = 0 | 
					
						
							| 
									
										
										
										
											2020-04-03 17:01:25 +00:00
										 |  |  |     for subdir, dirs, files in os.walk(baseDir + '/accounts'): | 
					
						
							| 
									
										
										
										
											2019-10-31 10:36:35 +00:00
										 |  |  |         for handle in dirs: | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |             if '@' not in handle: | 
					
						
							|  |  |  |                 continue | 
					
						
							|  |  |  |             if handle.startswith('inbox@'): | 
					
						
							|  |  |  |                 continue | 
					
						
							|  |  |  |             if handle.startswith('news@'): | 
					
						
							|  |  |  |                 continue | 
					
						
							|  |  |  |             nickname = handle.split('@')[0] | 
					
						
							|  |  |  |             domain = handle.split('@')[1] | 
					
						
							|  |  |  |             ctr += \ | 
					
						
							|  |  |  |                 _moveFollowingHandlesForAccount(baseDir, nickname, domain, | 
					
						
							|  |  |  |                                                 session, httpPrefix, | 
					
						
							| 
									
										
										
										
											2021-01-09 20:27:17 +00:00
										 |  |  |                                                 cachedWebfingers, debug) | 
					
						
							| 
									
										
										
										
											2020-12-13 22:13:45 +00:00
										 |  |  |         break | 
					
						
							| 
									
										
										
										
											2021-01-09 15:08:26 +00:00
										 |  |  |     return ctr |