epicyon/utils.py

__filename__ = "utils.py"
__author__ = "Bob Mottram"
__license__ = "AGPL3+"
__version__ = "1.4.0"
__maintainer__ = "Bob Mottram"
__email__ = "bob@libreserver.org"
__status__ = "Production"
__module_group__ = "Core"

import os
import re
import time
import shutil
import datetime
import json
import idna
import locale
from dateutil.tz import tz
from pprint import pprint
from cryptography.hazmat.backends import default_backend
from cryptography.hazmat.primitives import hashes
from followingCalendar import add_person_to_calendar

# Set of individual characters: underscore, ASCII digits, ASCII letters
# and the extended (mostly accented latin) characters listed below.
# NOTE(review): presumably the characters accepted within a hashtag;
# the code which uses this set is outside of this section - confirm
VALID_HASHTAG_CHARS = \
    set('_0123456789' +
        'abcdefghijklmnopqrstuvwxyz' +
        'ABCDEFGHIJKLMNOPQRSTUVWXYZ' +
        '¡¿ÄäÀàÁáÂâÃãÅåǍǎĄąĂăÆæĀā' +
        'ÇçĆćĈĉČčĎđĐďðÈèÉéÊêËëĚěĘęĖėĒē' +
        'ĜĝĢģĞğĤĥÌìÍíÎîÏïıĪīĮįĴĵĶķ' +
        'ĹĺĻļŁłĽľĿŀÑñŃńŇňŅņÖöÒòÓóÔôÕõŐőØøŒœ' +
        'ŔŕŘřẞßŚśŜŝŞşŠšȘșŤťŢţÞþȚțÜüÙùÚúÛûŰűŨũŲųŮůŪū' +
        'ŴŵÝýŸÿŶŷŹźŽžŻż')

# posts containing these strings will always get screened out,
# both incoming and outgoing.
# Could include dubious clacks or admin dogwhistles
INVALID_CHARACTERS = (
    '卐', '卍', '࿕', '࿖', '࿗', '࿘', 'ϟϟ', '🏳️‍🌈🚫', '⚡⚡', ''
)

INVALID_ACTOR_URL_CHARACTERS = (
    ' ', '', '<', '>', '%', '{', '}', '|', '\\', '^', '`',
    '?', '#', '[', ']', '!', '$', '&', "'", '(', ')', '*',
    '+', ',', ';', '='
)


def _standardize_text_range(text: str,
                            range_start: int, range_end: int,
                            offset: str) -> str:
    """Maps every character whose code point lies within
    range_start <= code point < range_end onto the equivalent position
    in the run of characters beginning at the offset character.
    All other characters are returned unchanged
    """
    first_code = ord(offset)
    return "".join(
        chr(ord(char) - range_start + first_code)
        if range_start <= ord(char) < range_end else char
        for char in text
    )


def standardize_text(text: str) -> str:
    """Replaces fancy unicode letters with ordinary a-z and A-Z.
    Empty or missing text is returned as it was given
    """
    if not text:
        return text

    # first code point of each run of 26 characters mapped onto a-z
    lowercase_starts = (
        65345, 119886, 119990, 120042, 120094,
        120146, 120198, 120302, 120354, 120406
    )
    # first code point of each run of 26 characters mapped onto A-Z
    uppercase_starts = (
        65313, 119912, 119964, 120016, 120068, 120120,
        120172, 120224, 120328, 120380, 120432,
        127344, 127312, 127280, 127248
    )
    for first_letter, starts in (('a', lowercase_starts),
                                 ('A', uppercase_starts)):
        for range_start in starts:
            text = _standardize_text_range(text, range_start,
                                           range_start + 26,
                                           first_letter)
    return text


def remove_eol(line: str):
    """Returns the given line with every newline and carriage return
    character removed
    """
    return line.translate({ord('\n'): None, ord('\r'): None})


def text_in_file(text: str, filename: str,
                 case_sensitive: bool = True) -> bool:
    """Returns true if the given text occurs within the given file.
    When case_sensitive is false both are compared in lower case.
    A file which can't be read, or which is empty, gives false
    """
    if not case_sensitive:
        text = text.lower()
    try:
        with open(filename, 'r', encoding='utf-8') as fp_text:
            file_content = fp_text.read()
    except OSError:
        print('EX: unable to find text in missing file ' + filename)
        return False
    if not file_content:
        return False
    if not case_sensitive:
        file_content = file_content.lower()
    return text in file_content


def local_actor_url(http_prefix: str, nickname: str, domain_full: str) -> str:
    """Builds the actor url for an account on this instance, in the form
    http_prefix://domain_full/users/nickname
    """
    url_parts = (http_prefix, '://', domain_full, '/users/', nickname)
    return ''.join(url_parts)


def get_actor_languages_list(actor_json: {}) -> []:
    """Returns a sorted list of the languages declared within the
    attachments of the given actor, or an empty list if there are none.
    The languages attachment is the first PropertyValue whose name
    begins with "languages". Its value may be a list, or a string
    separated by commas, semicolons, slashes, plus signs or spaces
    """
    if not actor_json.get('attachment'):
        return []
    for attached in actor_json['attachment']:
        field_name = attached.get('name') or attached.get('schema:name')
        if not field_name:
            continue
        if not field_name.lower().startswith('languages'):
            continue
        if not attached.get('type'):
            continue
        value_key, _ = get_attachment_property_value(attached)
        if not value_key:
            continue
        if not attached['type'].endswith('PropertyValue'):
            continue

        languages = attached[value_key]
        if isinstance(languages, list):
            # note that the list within the actor is sorted in place
            languages.sort()
            return languages
        if not isinstance(languages, str):
            continue

        # only the first separator found, in this order, is used
        for separator in (',', ';', '/', '+', ' '):
            if separator in languages:
                pieces = languages.split(separator)
                break
        else:
            return [languages]

        unique_langs = []
        for piece in pieces:
            piece = piece.strip()
            if piece not in unique_langs:
                unique_langs.append(piece)
        unique_langs.sort()
        return unique_langs
    return []


def has_object_dict(post_json_object: {}) -> bool:
    """Returns true if the given post has a non-empty 'object' field
    which is a dict
    """
    post_object = post_json_object.get('object')
    return bool(post_object) and isinstance(post_object, dict)


def remove_markup_tag(html: str, tag: str) -> str:
    """Remove the given tag from the given html markup.
    Both the opening tags (including any attributes) and the closing
    tags are removed, and the text between them is kept.
    If there is no opening tag then the markup is returned unchanged.
    An opening or closing tag which is never terminated by '>' is
    dropped together with the text following it, rather than causing
    an exception
    """
    if '<' + tag not in html:
        return html

    without_opening = _remove_tag_prefix(html, '<' + tag)
    return _remove_tag_prefix(without_opening, '</' + tag)


def _remove_tag_prefix(html: str, prefix: str) -> str:
    """Removes every occurrence of prefix, up to and including the
    next '>' character, from the given html
    """
    sections = html.split(prefix)
    # anything before the first occurrence is kept as it is
    result = sections[0]
    for text in sections[1:]:
        if '>' not in text:
            # unterminated tag: there is nothing safe to keep
            continue
        result += text.split('>', 1)[1]
    return result


def get_content_from_post(post_json_object: {}, system_language: str,
                          languages_understood: [],
                          content_type: str = "content") -> str:
    """Returns the content of the post, or of its object if it has one.
    If there is a map (eg. contentMap) then its entry for the system
    language is used, otherwise the first entry matching one of the
    understood languages. Without a map the plain field is used.
    'pre' markup is removed, &amp; is unescaped and fancy unicode
    letters are standardized. Returns an empty string if nothing
    suitable was found
    """
    post_obj = post_json_object
    if has_object_dict(post_json_object):
        post_obj = post_json_object['object']

    content_map = post_obj.get(content_type + 'Map')
    if not post_obj.get(content_type) and not content_map:
        return ''

    if not content_map:
        # no map, so fall back to the plain content field
        content = ''
        if isinstance(post_obj[content_type], str):
            content = post_obj[content_type].replace('&amp;', '&')
            content = remove_markup_tag(content, 'pre')
        return standardize_text(content)

    if isinstance(content_map, dict):
        if content_map.get(system_language):
            # an entry for the system language takes priority
            candidate_langs = [system_language]
        else:
            # is there a contentMap/summaryMap entry for one of
            # the understood languages?
            candidate_langs = languages_understood
        for lang in candidate_langs:
            map_entry = content_map.get(lang)
            if not map_entry or not isinstance(map_entry, str):
                continue
            content = remove_markup_tag(map_entry, 'pre')
            content = content.replace('&amp;', '&')
            return standardize_text(content)

    return standardize_text('')


def get_language_from_post(post_json_object: {}, system_language: str,
                           languages_understood: [],
                           content_type: str = "content") -> str:
    """Returns the language of the post content.
    This is the system language, unless the map (eg. contentMap) lacks
    an entry for it and has an entry for one of the understood
    languages, in which case the first such language is returned
    """
    post_obj = post_json_object
    if has_object_dict(post_json_object):
        post_obj = post_json_object['object']
    if not post_obj.get(content_type):
        return system_language

    content_map = post_obj.get(content_type + 'Map')
    if not content_map or not isinstance(content_map, dict):
        return system_language

    if not content_map.get(system_language):
        # is there a contentMap/summaryMap entry for one of
        # the understood languages?
        for lang in languages_understood:
            if content_map.get(lang):
                return lang
    return system_language


def get_media_descriptions_from_post(post_json_object: {}) -> str:
    """Returns the names (descriptions) of all attachments which have
    one, each followed by the attachment url if there is one, joined
    by spaces into a single text. This is used for filtering
    """
    post_obj = post_json_object
    if has_object_dict(post_json_object):
        post_obj = post_json_object['object']
    if not post_obj.get('attachment'):
        return ''

    text_parts = []
    for attach in post_obj['attachment']:
        if not attach.get('name'):
            # attachments without a description are skipped entirely
            continue
        text_parts.append(attach['name'])
        if attach.get('url'):
            text_parts.append(attach['url'])
    return ' '.join(text_parts).strip()


def get_summary_from_post(post_json_object: {}, system_language: str,
                          languages_understood: []) -> str:
    """Returns the summary of the post in the given language.
    This is get_content_from_post applied to the summary and
    summaryMap fields
    """
    summary = get_content_from_post(post_json_object, system_language,
                                    languages_understood,
                                    content_type="summary")
    return summary


def get_base_content_from_post(post_json_object: {},
                               system_language: str) -> str:
    """Returns the unprocessed content field of the post, or of its
    object if it has one. An empty string is returned if there is
    no content field. The system_language parameter is not used
    """
    post_obj = post_json_object
    if has_object_dict(post_json_object):
        post_obj = post_json_object['object']
    return post_obj['content'] if 'content' in post_obj else ''


def acct_dir(base_dir: str, nickname: str, domain: str) -> str:
    """Returns the directory for the account nickname@domain,
    located within the accounts directory beneath base_dir
    """
    return ''.join((base_dir, '/accounts/', nickname, '@', domain))


def acct_handle_dir(base_dir: str, handle: str) -> str:
    """Returns the directory for the account with the given handle,
    located within the accounts directory beneath base_dir
    """
    return ''.join((base_dir, '/accounts/', handle))


def is_featured_writer(base_dir: str, nickname: str, domain: str) -> bool:
    """Is the given account a featured writer, appearing in the features
    timeline on news instances?
    This is true unless there is a .nofeatures file within the
    account directory
    """
    account_dir = acct_dir(base_dir, nickname, domain)
    opted_out = os.path.isfile(account_dir + '/.nofeatures')
    return not opted_out


def refresh_newswire(base_dir: str):
    """Creates the accounts/.refresh_newswire file, containing a single
    newline, if it doesn't already exist. An existing file is left
    untouched.
    Causes the newswire to be updated after a change to user accounts
    """
    flag_filename = base_dir + '/accounts/.refresh_newswire'
    if not os.path.isfile(flag_filename):
        with open(flag_filename, 'w+', encoding='utf-8') as fp_flag:
            fp_flag.write('\n')


def get_sha_256(msg: str):
    """Returns the SHA256 digest of the given message.
    NOTE(review): the message is passed directly to the hash update,
    which presumably needs bytes rather than str - confirm with callers
    """
    hasher = hashes.Hash(hashes.SHA256(), backend=default_backend())
    hasher.update(msg)
    sha_256_digest = hasher.finalize()
    return sha_256_digest


def get_sha_512(msg: str):
    """Returns the SHA512 digest of the given message.
    NOTE(review): the message is passed directly to the hash update,
    which presumably needs bytes rather than str - confirm with callers
    """
    hasher = hashes.Hash(hashes.SHA512(), backend=default_backend())
    hasher.update(msg)
    sha_512_digest = hasher.finalize()
    return sha_512_digest


def local_network_host(host: str) -> bool:
    """Returns true if the given host is on the local network.
    This is decided only by whether the host begins with
    localhost, 192. 127. or 10.
    """
    local_prefixes = ('localhost', '192.', '127.', '10.')
    return host.startswith(local_prefixes)


def decoded_host(host: str) -> str:
    """Convert hostname to internationalized domain
    https://en.wikipedia.org/wiki/Internationalized_domain_name
    Hosts which include a port number, local network hosts and
    onion or i2p domains are returned unchanged
    """
    if ':' in host:
        # eg. mydomain:8000
        return host
    if local_network_host(host):
        return host
    if host.endswith(('.onion', '.i2p')):
        return host
    return idna.decode(host)


def get_locked_account(actor_json: {}) -> bool:
    """Returns whether the given account requires follower approval,
    which is only the case if manuallyApprovesFollowers is
    exactly True
    """
    return actor_json.get('manuallyApprovesFollowers') is True


def has_users_path(path_str: str) -> bool:
    """Whether there is a /users/ path (or equivalent) in the given string.
    A url consisting of only a domain followed by a single path
    segment containing no dots, such as https://domain/nickname,
    is also accepted
    """
    if any(users_str in path_str for users_str in get_user_paths()):
        return True
    if '://' not in path_str:
        return False

    domain = path_str.split('://')[1].split('/')[0]
    domain_prefix = '://' + domain + '/'
    if domain_prefix not in path_str:
        return False
    # whatever follows the domain is treated as a possible nickname
    nickname = path_str.split(domain_prefix)[1]
    return '/' not in nickname and '.' not in nickname


def valid_post_date(published: str, max_age_days: int, debug: bool) -> bool:
    """Returns true if the published date is recent and is not in the future.
    The published date is expected in the format YYYY-MM-DDTHH:MM:SSZ
    and is compared by whole days since 1970-01-01. A date which can't
    be parsed, which is on a later day than the current UTC day, or
    which is max_age_days or more days old is not valid.
    If debug is true then the reason for rejection is printed
    """
    baseline_time = datetime.datetime(1970, 1, 1)
    now_days_since_epoch = \
        (datetime.datetime.utcnow() - baseline_time).days

    try:
        post_time_object = \
            datetime.datetime.strptime(published, "%Y-%m-%dT%H:%M:%SZ")
    except (ValueError, TypeError):
        # ValueError: the text doesn't match the expected format
        # TypeError: the published value is not a string
        # Other exceptions, such as KeyboardInterrupt, are not suppressed
        if debug:
            print('EX: valid_post_date invalid published date ' +
                  str(published))
        return False

    post_days_since_epoch = (post_time_object - baseline_time).days

    if post_days_since_epoch > now_days_since_epoch:
        if debug:
            print("Inbox post has a published date in the future!")
        return False

    if now_days_since_epoch - post_days_since_epoch >= max_age_days:
        if debug:
            print("Inbox post is not recent enough")
        return False
    return True


def get_full_domain(domain: str, port: int) -> str:
    """Returns the full domain name, including port number.
    The domain alone is returned if no port is given, if the domain
    already contains a colon, or if the port is 80 or 443
    """
    if not port or ':' in domain or port in (80, 443):
        return domain
    return ':'.join((domain, str(port)))


def is_dormant(base_dir: str, nickname: str, domain: str, actor: str,
               dormant_months: int) -> bool:
    """Is the given followed actor dormant, from the standpoint
    of the given account?
    The day on which the actor was last seen is read from the lastseen
    directory of the account, as a number of days since 1970-01-01.
    The actor is dormant if that was dormant_months or more 30 day
    months ago. If there is no readable last seen file then the actor
    is not considered to be dormant
    """
    last_seen_filename = \
        acct_dir(base_dir, nickname, domain) + \
        '/lastseen/' + actor.replace('/', '#') + '.txt'
    if not os.path.isfile(last_seen_filename):
        return False

    try:
        with open(last_seen_filename, 'r',
                  encoding='utf-8') as fp_last_seen:
            last_seen_str = fp_last_seen.read()
    except OSError:
        print('EX: failed to read last seen ' + last_seen_filename)
        return False
    if not last_seen_str:
        return False

    last_seen_days = int(last_seen_str)
    epoch = datetime.datetime(1970, 1, 1)
    today_days = (datetime.datetime.utcnow() - epoch).days
    months_elapsed = int((today_days - last_seen_days) / 30)
    return months_elapsed >= dormant_months


def is_editor(base_dir: str, nickname: str) -> bool:
    """Returns true if the given nickname is an editor.
    Editors are listed one per line within accounts/editors.txt
    If that file doesn't exist, or is empty, then only the admin
    is an editor
    """
    editors_file = base_dir + '/accounts/editors.txt'

    lines = []
    if os.path.isfile(editors_file):
        with open(editors_file, 'r', encoding='utf-8') as fp_editors:
            lines = fp_editors.readlines()

    if not lines:
        # nobody is listed, so fall back to the admin
        admin_name = get_config_param(base_dir, 'admin')
        return bool(admin_name) and admin_name == nickname

    return any(line.strip('\n').strip('\r') == nickname
               for line in lines)


def is_artist(base_dir: str, nickname: str) -> bool:
    """Returns true if the given nickname is an artist.
    Artists are listed one per line within accounts/artists.txt
    If that file doesn't exist, or is empty, then only the admin
    is an artist
    """
    artists_file = base_dir + '/accounts/artists.txt'

    lines = []
    if os.path.isfile(artists_file):
        with open(artists_file, 'r', encoding='utf-8') as fp_artists:
            lines = fp_artists.readlines()

    if not lines:
        # nobody is listed, so fall back to the admin
        admin_name = get_config_param(base_dir, 'admin')
        return bool(admin_name) and admin_name == nickname

    return any(line.strip('\n').strip('\r') == nickname
               for line in lines)


def get_video_extensions() -> []:
    """Returns the possible video file extensions, without any
    leading dot
    """
    video_extensions = ('mp4', 'webm', 'ogv')
    return video_extensions


def get_audio_extensions() -> []:
    """Returns the possible audio file extensions, without any
    leading dot
    """
    audio_extensions = ('mp3', 'ogg', 'flac', 'opus', 'spx', 'wav')
    return audio_extensions


def get_image_extensions() -> []:
    """Returns the possible image file extensions, without any
    leading dot
    """
    image_extensions = (
        'jpg', 'jpeg', 'gif', 'webp', 'avif',
        'heic', 'svg', 'ico', 'jxl', 'png'
    )
    return image_extensions


def get_image_mime_type(image_filename: str) -> str:
    """Returns the mime type for the given image, decided by the
    extension at the end of the filename. The comparison is case
    sensitive. If the extension is not recognized then image/png
    is returned
    """
    extensions_to_mime = {
        'png': 'png',
        'jpg': 'jpeg',
        # .jpeg is one of the image extensions accepted elsewhere in
        # this file and would otherwise be reported as image/png
        'jpeg': 'jpeg',
        'jxl': 'jxl',
        'gif': 'gif',
        'avif': 'avif',
        'heic': 'heic',
        'svg': 'svg+xml',
        'webp': 'webp',
        'ico': 'x-icon'
    }
    for ext, mime_ext in extensions_to_mime.items():
        if image_filename.endswith('.' + ext):
            return 'image/' + mime_ext
    return 'image/png'


def get_image_extension_from_mime_type(content_type: str) -> str:
    """Returns the image extension from a mime type, such as image/jpeg
    The match is made on the end of the mime type, and png is
    returned if the type is not recognized
    """
    mime_endings = (
        ('png', 'png'),
        ('jpeg', 'jpg'),
        ('jxl', 'jxl'),
        ('gif', 'gif'),
        ('svg+xml', 'svg'),
        ('webp', 'webp'),
        ('avif', 'avif'),
        ('heic', 'heic'),
        ('x-icon', 'ico')
    )
    matching = (ext for mime_ext, ext in mime_endings
                if content_type.endswith(mime_ext))
    return next(matching, 'png')


def get_media_extensions() -> []:
    """Returns the possible media file extensions: the image
    extensions, followed by the video and then the audio extensions
    """
    image_ext = get_image_extensions()
    video_ext = get_video_extensions()
    audio_ext = get_audio_extensions()
    return image_ext + video_ext + audio_ext


def get_image_formats() -> str:
    """Returns a string of permissible image formats
    used when selecting an image for a new post.
    Each image extension is given with a leading dot, and they are
    separated by a comma and a space
    """
    return ', '.join('.' + ext for ext in get_image_extensions())


def is_image_file(filename: str) -> bool:
    """Is the given filename an image?
    True if it ends with a dot followed by one of the image extensions
    """
    dotted_extensions = \
        tuple('.' + ext for ext in get_image_extensions())
    return filename.endswith(dotted_extensions)


def get_media_formats() -> str:
    """Returns a string of permissible media formats
    used when selecting an attachment for a new post.
    Each media extension is given with a leading dot, and they are
    separated by a comma and a space
    """
    return ', '.join('.' + ext for ext in get_media_extensions())


def remove_html(content: str) -> str:
    """Removes html markup from the given content, leaving plain text.
    Used to ensure that profile descriptions don't contain dubious content
    Paragraph endings and <br> become newlines, <q> becomes a double
    quote, and a space is inserted after any full stop which is
    directly followed by a capital letter.
    Content without any '<' character is returned unchanged
    """
    if '<' not in content:
        return content

    # make sure that links are separated from the text before them
    content = content.replace('<a href', ' <a href')
    content = content.replace('<q>', '"').replace('</q>', '"')
    content = content.replace('</p>', '\n\n').replace('<br>', '\n')

    # keep only the characters which are outside of tags
    kept_chars = []
    inside_tag = False
    for char in content:
        if char == '<':
            inside_tag = True
        elif char == '>':
            inside_tag = False
        elif not inside_tag:
            kept_chars.append(char)
    plain_text = ''.join(kept_chars).replace('  ', ' ')

    # insert spaces after full stops
    # The padding gives the final character a following character
    # which is never a capital letter
    spaced_chars = []
    for curr_char, next_char in zip(plain_text, plain_text[1:] + ' '):
        spaced_chars.append(curr_char)
        if curr_char == '.' and 'A' <= next_char <= 'Z':
            spaced_chars.append(' ')

    return ''.join(spaced_chars).replace('  ', ' ').strip()


def remove_style_within_html(content: str) -> str:
    """Removes style="something" within html post content.
    Each occurrence of a space followed by style=" is removed, up to
    and including the closing double quote.
    If a style attribute has no closing quote then it is dropped
    together with the text following it, rather than causing
    an exception
    """
    if '<' not in content:
        return content
    if ' style="' not in content:
        return content
    sections = content.split(' style="')
    # anything before the first style attribute is kept as it is
    result = sections[0]
    for section_text in sections[1:]:
        if '"' not in section_text:
            # unterminated attribute value: nothing can safely be kept
            continue
        result += section_text.split('"', 1)[1]
    return result


def first_paragraph_from_string(content: str) -> str:
    """Get the first paragraph from a blog post
    to be used as a summary in the newswire feed.
    Any html markup is removed. If the content has no paragraph
    markup then the whole of it is used
    """
    if '<p>' in content and '</p>' in content:
        first_paragraph = content.split('<p>')[1].split('</p>')[0]
        return remove_html(first_paragraph)
    return remove_html(content)


def is_system_account(nickname: str) -> bool:
    """Returns true if the given nickname is a system account,
    which is either news or inbox
    """
    system_nicknames = ('news', 'inbox')
    return nickname in system_nicknames


def _create_config(base_dir: str) -> None:
    """Creates an empty configuration file, config.json, within the
    base directory unless one already exists
    """
    config_filename = base_dir + '/config.json'
    if not os.path.isfile(config_filename):
        save_json({}, config_filename)


def set_config_param(base_dir: str, variable_name: str,
                     variable_value) -> None:
    """Sets a configuration value within config.json, creating that
    file if needed. The variable name is converted to camel case
    before being used as the key
    """
    _create_config(base_dir)
    config_filename = base_dir + '/config.json'
    if os.path.isfile(config_filename):
        config_json = load_json(config_filename)
    else:
        config_json = {}
    config_key = _convert_to_camel_case(variable_name)
    config_json[config_key] = variable_value
    save_json(config_json, config_filename)


def get_config_param(base_dir: str, variable_name: str):
    """Gets a configuration value from config.json, creating that file
    if needed. The variable name is converted to camel case before
    being looked up. Returns None if there is no such value
    """
    _create_config(base_dir)
    config_json = load_json(base_dir + '/config.json')
    if not config_json:
        return None
    config_key = _convert_to_camel_case(variable_name)
    if config_key not in config_json:
        return None
    return config_json[config_key]


def is_suspended(base_dir: str, nickname: str) -> bool:
    """Returns true if the given nickname is suspended, which means
    that it is listed within accounts/suspended.txt
    The admin is never suspended, and nobody is considered to be
    suspended if no admin has been configured
    """
    admin_nickname = get_config_param(base_dir, 'admin')
    if not admin_nickname or nickname == admin_nickname:
        return False

    suspended_filename = base_dir + '/accounts/suspended.txt'
    if not os.path.isfile(suspended_filename):
        return False
    with open(suspended_filename, 'r', encoding='utf-8') as fp_susp:
        lines = fp_susp.readlines()
    return any(line.strip('\n').strip('\r') == nickname
               for line in lines)


def get_followers_list(base_dir: str,
                       nickname: str, domain: str,
                       follow_file='following.txt') -> []:
    """Returns the lines of the given follow file for the given account,
    with surrounding whitespace removed from each.
    Note that by default this is following.txt
    An empty list is returned if the file doesn't exist
    """
    filename = acct_dir(base_dir, nickname, domain) + '/' + follow_file
    if not os.path.isfile(filename):
        return []

    with open(filename, 'r', encoding='utf-8') as fp_foll:
        return [line.strip() for line in fp_foll.readlines()]


def get_followers_of_person(base_dir: str,
                            nickname: str, domain: str,
                            follow_file='following.txt') -> []:
    """Returns a list containing the followers of the given person
    Used by the shared inbox to know who to send incoming mail to
    These are the accounts on this instance, other than the person
    themselves and the inbox, Actor and news accounts, whose follow
    file contains the handle of the person. An empty list is returned
    if the person has no account directory
    """
    followers = []
    handle = nickname + '@' + remove_domain_port(domain)
    if not os.path.isdir(acct_handle_dir(base_dir, handle)):
        return followers

    skipped_prefixes = ('inbox@', 'Actor@', 'news@')
    for subdir, dirs, _ in os.walk(base_dir + '/accounts'):
        for account in dirs:
            if account == handle or account.startswith(skipped_prefixes):
                continue
            filename = os.path.join(subdir, account) + '/' + follow_file
            if not os.path.isfile(filename):
                continue
            with open(filename, 'r', encoding='utf-8') as fp_following:
                is_following = any(remove_eol(line) == handle
                                   for line in fp_following)
            if is_following and account not in followers:
                followers.append(account)
        # only the top level of the accounts directory is examined
        break
    return followers


def remove_id_ending(id_str: str) -> str:
    """Removes endings such as /activity and /undo
    At most one path ending is removed, and then at most one
    hash section together with anything which follows it
    """
    path_endings = (
        '/activity', '/undo', '/event',
        '/replies', '/delete', '/update'
    )
    for ending in path_endings:
        if id_str.endswith(ending):
            id_str = id_str[:-len(ending)]
            break

    # marker, and whether it only counts at the end of the id
    hash_markers = (
        ('#Create', True),
        ('#delete', True),
        ('#update', False),
        ('#primary', False),
        ('#reciprocal', False)
    )
    for marker, at_end_only in hash_markers:
        if at_end_only:
            marker_found = id_str.endswith(marker)
        else:
            marker_found = marker in id_str
        if marker_found:
            id_str = id_str.split(marker)[0]
            break
    return id_str


def remove_hash_from_post_id(post_id: str) -> str:
    """Removes any hash from a post id, returning only the part
    which is before the first '#' character
    """
    return post_id.split('#', 1)[0]


def get_protocol_prefixes() -> []:
    """Returns the valid protocol prefixes, each including ://
    """
    protocol_prefixes = (
        'https://', 'http://', 'ftp://',
        'dat://', 'i2p://', 'gnunet://',
        'ipfs://', 'ipns://',
        'hyper://', 'gemini://', 'gopher://'
    )
    return protocol_prefixes


def get_link_prefixes() -> []:
    """Returns the valid prefixes with which a web link may begin
    """
    link_prefixes = (
        'https://', 'http://', 'ftp://',
        'dat://', 'i2p://', 'gnunet://', 'payto://',
        'hyper://', 'gemini://', 'gopher://', 'briar:'
    )
    return link_prefixes


def remove_avatar_from_cache(base_dir: str, actor_str: str) -> None:
    """Removes any existing avatar entries from the cache
    This avoids duplicate entries with differing extensions
    A cached avatar is looked for with each of the possible image
    extensions, and a failure to delete one is only reported
    """
    avatars_prefix = base_dir + '/cache/avatars/' + actor_str + '.'
    for extension in get_image_extensions():
        avatar_filename = avatars_prefix + extension
        if not os.path.isfile(avatar_filename):
            continue
        try:
            os.remove(avatar_filename)
        except OSError:
            print('EX: remove_avatar_from_cache ' +
                  'unable to delete cached avatar ' +
                  str(avatar_filename))


def save_json(json_object: {}, filename: str) -> bool:
    """Saves json to a file.
    Up to five attempts are made to write the file, one second apart.
    Returns true if the file was written, or false if every attempt
    failed with an OSError. If the object can't be converted to json
    then the exception from json.dumps is raised and the file
    is not touched
    """
    # Convert to text before opening the file. Opening with 'w+'
    # truncates, so a conversion failure after that point would
    # destroy the existing contents of the file
    json_str = json.dumps(json_object)

    tries = 1
    while tries <= 5:
        try:
            with open(filename, 'w+', encoding='utf-8') as json_file:
                json_file.write(json_str)
                return True
        except OSError:
            print('EX: save_json ' + str(tries) + ' ' + str(filename))
            time.sleep(1)
            tries += 1
    return False


def load_json(filename: str, delay_sec: int = 2, max_tries: int = 5) -> {}:
    """Makes a few attempts to load a json formatted file.
    Up to max_tries attempts are made, waiting delay_sec seconds after
    each failure. Returns the decoded json, or None if every attempt
    failed. Any /Actor@ within the filename is replaced by /inbox@
    """
    if '/Actor@' in filename:
        filename = filename.replace('/Actor@', '/inbox@')
    json_object = None
    tries = 1
    while tries <= max_tries:
        try:
            with open(filename, 'r', encoding='utf-8') as json_file:
                data = json_file.read()
                json_object = json.loads(data)
                break
        except Exception:
            # Loading is best effort, so any ordinary failure to read
            # or decode is retried. BaseException is not caught here,
            # so that KeyboardInterrupt and SystemExit can still stop
            # the retries
            print('EX: load_json exception ' +
                  str(tries) + ' ' + str(filename))
            if delay_sec > 0:
                time.sleep(delay_sec)
            tries += 1
    return json_object


def load_json_onionify(filename: str, domain: str, onion_domain: str,
                       delay_sec: int = 2, max_tries: int = 5) -> {}:
    """Makes a few attempts to load a json formatted file
    This also converts the domain name to the onion domain, and
    https: to http:, within the text of the file before it is decoded.
    Up to max_tries attempts are made, waiting delay_sec seconds after
    each failure. Returns the decoded json, or None if every attempt
    failed. Any /Actor@ within the filename is replaced by /inbox@
    """
    if '/Actor@' in filename:
        filename = filename.replace('/Actor@', '/inbox@')
    json_object = None
    tries = 0
    while tries < max_tries:
        try:
            with open(filename, 'r', encoding='utf-8') as json_file:
                data = json_file.read()
                if data:
                    data = data.replace(domain, onion_domain)
                    data = data.replace('https:', 'http:')
                json_object = json.loads(data)
                break
        except Exception:
            # Loading is best effort, so any ordinary failure to read
            # or decode is retried. BaseException is not caught here,
            # so that KeyboardInterrupt and SystemExit can still stop
            # the retries
            print('EX: load_json_onionify exception ' + str(filename))
            if delay_sec > 0:
                time.sleep(delay_sec)
            tries += 1
    return json_object


def get_status_number(published_str: str = None) -> (str, str):
    """Returns the status number and published date

    published_str: optional date in the format YYYY-MM-DDTHH:MM:SSZ.
        If it is not given then the current UTC time is used
    The status number is the number of milliseconds since epoch,
    shifted left by 16 bits, plus a sequence number
    """
    if published_str:
        when = \
            datetime.datetime.strptime(published_str, '%Y-%m-%dT%H:%M:%SZ')
    else:
        when = datetime.datetime.utcnow()
    since_epoch = when - datetime.datetime(1970, 1, 1)
    # whole milliseconds since epoch
    millisec_since_epoch = \
        (since_epoch.days * 24 * 60 * 60 + since_epoch.seconds) * 1000 + \
        since_epoch.microseconds // 1000
    # See https://github.com/tootsuite/mastodon/blob/
    # 995f8b389a66ab76ec92d9a240de376f1fc13a38/lib/mastodon/snowflake.rb
    # the leftover microseconds become the sequence number, which
    # occupies the lowest 16 bits
    sequence_id = when.microsecond % 1000
    status_number = str((millisec_since_epoch << 16) + sequence_id)
    return status_number, when.strftime("%Y-%m-%dT%H:%M:%SZ")


def evil_incarnate() -> []:
    """Returns the hardcoded blocked domains
    """
    hardcoded_blocked_domains = (
        'fedilist.com', 'gab.com', 'gabfed.com', 'spinster.xyz',
        'kiwifarms.cc', 'djitter.com'
    )
    return hardcoded_blocked_domains


def is_evil(domain: str) -> bool:
    """Is the given domain hostile?
    https://www.youtube.com/watch?v=5qw1hcevmdU
    Anything which is not a string is treated as hostile
    """
    if not isinstance(domain, str):
        print('WARN: Malformed domain ' + str(domain))
        return True
    # a domain containing any of these strings is
    # declaring itself to be hostile
    evil_emporium = (
        'nazi', 'extremis', 'extreemis', 'gendercritic',
        'kiwifarm', 'illegal', 'raplst', 'rapist',
        'rapl.st', 'rapi.st', 'antivax', 'plandemic', 'terror'
    )
    if any(hostile_str in domain for hostile_str in evil_emporium):
        return True
    # does the domain end with one of the hardcoded blocked domains?
    return any(domain.endswith(concentrated_evil)
               for concentrated_evil in evil_incarnate())


def contains_invalid_chars(json_str: str) -> bool:
    """Returns true if any entry of INVALID_CHARACTERS
    occurs within the given json string
    """
    return any(is_invalid in json_str for is_invalid in INVALID_CHARACTERS)


def contains_invalid_actor_url_chars(url: str) -> bool:
    """Returns true if the given actor url contains any entry of
    INVALID_ACTOR_URL_CHARACTERS, or otherwise fails the general
    contains_invalid_chars check
    """
    has_invalid_url_char = \
        any(is_invalid in url for is_invalid in INVALID_ACTOR_URL_CHARACTERS)
    return has_invalid_url_char or contains_invalid_chars(url)


def remove_invalid_chars(text: str) -> str:
    """Returns the given text with every occurrence of each
    INVALID_CHARACTERS entry removed
    """
    for unwanted in INVALID_CHARACTERS:
        if unwanted in text:
            text = text.replace(unwanted, '')
    return text


def create_person_dir(nickname: str, domain: str, base_dir: str,
                      dir_name: str) -> str:
    """Ensures that the subdirectory dir_name exists within the
    directory which acct_handle_dir gives for nickname@domain,
    creating that directory first if it is missing.
    Returns the path of the subdirectory
    """
    def _mkdir_if_missing(dir_path: str) -> None:
        if not os.path.isdir(dir_path):
            os.mkdir(dir_path)

    handle = nickname + '@' + domain
    _mkdir_if_missing(acct_handle_dir(base_dir, handle))
    box_dir = acct_handle_dir(base_dir, handle) + '/' + dir_name
    _mkdir_if_missing(box_dir)
    return box_dir


def create_outbox_dir(nickname: str, domain: str, base_dir: str) -> str:
    """Creates the 'outbox' directory for a person, if it does not
    already exist, and returns its path
    """
    outbox_dir = create_person_dir(nickname, domain, base_dir, 'outbox')
    return outbox_dir


def create_inbox_queue_dir(nickname: str, domain: str, base_dir: str) -> str:
    """Creates the 'queue' directory for a person, if it does not
    already exist, and returns its path
    """
    queue_dir = create_person_dir(nickname, domain, base_dir, 'queue')
    return queue_dir


def domain_permitted(domain: str, federation_list: []) -> bool:
    """Is the given domain permitted according to the federation list?

    An empty or missing federation list permits every domain.
    Otherwise the domain, after remove_domain_port has been applied
    to it, must be an entry within the list
    """
    # truthiness test, as used by url_permitted, so that None is
    # handled in the same way as an empty list
    if not federation_list:
        return True
    return remove_domain_port(domain) in federation_list


def url_permitted(url: str, federation_list: []):
    """Is the given url permitted?
    Anything which is_evil rejects is refused. Otherwise an empty
    federation list permits everything, and a non-empty one permits
    any url which contains one of its entries
    """
    if is_evil(url):
        return False
    if not federation_list:
        return True
    # NOTE(review): this is a substring match anywhere within the url,
    # not a comparison against the url's domain - confirm that this
    # is what is wanted
    return any(domain in url for domain in federation_list)


def get_local_network_addresses() -> []:
    """Returns the text patterns used to detect local network addresses
    """
    local_patterns = ('localhost', '127.0.', '192.168', '10.0.')
    return local_patterns


def is_local_network_address(ip_address: str) -> bool:
    """Returns true if the given ip address begins with one of the
    patterns from get_local_network_addresses
    """
    return any(ip_address.startswith(local_prefix)
               for local_prefix in get_local_network_addresses())


def _is_dangerous_string_tag(content: str, allow_local_network_access: bool,
                             separators: [], invalid_strings: []) -> bool:
    """Returns true if the text between any pair of separators within
    the given content is considered to be dangerous.

    separators: list of [start, end] pairs which delimit markup
    invalid_strings: strings which are not allowed within markup.
        An entry ending with '-' only matches at the beginning of the
        markup. Any other entry matches anywhere if the markup has no
        spaces, and otherwise only matches when followed by a space
    If local network access is not allowed then markup containing a
    local network address pattern is also dangerous
    """
    for separator_pair in separators:
        opener, closer = separator_pair[0], separator_pair[1]
        if opener not in content or closer not in content:
            continue
        blocked_partials = ()
        if not allow_local_network_access:
            blocked_partials = get_local_network_addresses()
        for fragment in content.split(opener):
            if closer not in fragment:
                continue
            tag_text = fragment.split(closer)[0].strip()
            if any(partial in tag_text for partial in blocked_partials):
                return True
            has_space = ' ' in tag_text
            for bad_str in invalid_strings:
                if bad_str.endswith('-'):
                    # prefix entries, such as amp-
                    found = tag_text.startswith(bad_str)
                elif has_space:
                    found = bad_str + ' ' in tag_text
                else:
                    found = bad_str in tag_text
                if found:
                    return True
    return False


def _is_dangerous_string_simple(content: str, allow_local_network_access: bool,
                                separators: [], invalid_strings: []) -> bool:
    """Returns true if the text between any pair of separators within
    the given content contains one of the invalid strings.

    separators: list of [start, end] pairs which delimit markup
    invalid_strings: strings which are not allowed anywhere in markup
    If local network access is not allowed then markup containing a
    local network address pattern is also dangerous
    """
    for separator_pair in separators:
        opener, closer = separator_pair[0], separator_pair[1]
        if opener not in content or closer not in content:
            continue
        blocked_partials = ()
        if not allow_local_network_access:
            blocked_partials = get_local_network_addresses()
        for fragment in content.split(opener):
            if closer not in fragment:
                continue
            tag_text = fragment.split(closer)[0].strip()
            if any(partial in tag_text for partial in blocked_partials):
                return True
            if any(bad_str in tag_text for bad_str in invalid_strings):
                return True
    return False


def html_tag_has_closing(tag_name: str, content: str) -> bool:
    """Returns true if every opening of the given tag within the
    content is followed by a closing tag, or if the tag is absent.
    The content is compared in lower case.
    For code and pre tags false is also returned if any line within
    the tag is 60 or more characters long
    """
    lowered = content.lower()
    open_tag = '<' + tag_name
    if open_tag not in lowered:
        return True
    close_tag = '</' + tag_name + '>'
    limit_line_length = tag_name in ('code', 'pre')
    # the first section is whatever comes before the first opening tag
    for section in lowered.split(open_tag)[1:]:
        if close_tag not in section:
            return False
        if not limit_line_length:
            continue
        inner = section.split(close_tag)[0].replace('<br>', '\n')
        if any(len(line) >= 60 for line in inner.split('\n')):
            print('<code> or <pre> line too long')
            return False
    return True


def dangerous_markup(content: str, allow_local_network_access: bool,
                     allow_tags: []) -> bool:
    """Returns true if the given content contains dangerous html markup

    allow_tags: entries of the invalid tag strings which should be
        permitted on this occasion
    Any content which mentions .svg is always considered dangerous
    """
    if '.svg' in content.lower():
        return True
    separators = [['<', '>'], ['&lt;', '&gt;']]
    # strings which may not appear anywhere within markup
    forbidden_anywhere = [
        'ampproject', 'googleapis', '_exec(', ' id=', ' name='
    ]
    if _is_dangerous_string_simple(content, allow_local_network_access,
                                   separators, forbidden_anywhere):
        return True
    # code and pre tags need to be properly closed
    if not all(html_tag_has_closing(closing_tag, content)
               for closing_tag in ('code', 'pre')):
        return True
    permitted = tuple(allow_tags)
    forbidden_tags = [
        tag_str for tag_str in (
            'script', 'noscript', 'canvas', 'style', 'abbr', 'input',
            'frame', 'iframe', 'html', 'body', 'hr', 'allow-popups',
            'allow-scripts', 'amp-', '?php', 'pre'
        ) if tag_str not in permitted
    ]
    return _is_dangerous_string_tag(content, allow_local_network_access,
                                    separators, forbidden_tags)


def dangerous_svg(content: str, allow_local_network_access: bool) -> bool:
    """Returns true if the given svg file content contains scripts,
    as detected by _is_dangerous_string_tag
    """
    tag_separators = [['<', '>'], ['&lt;', '&gt;']]
    return _is_dangerous_string_tag(content, allow_local_network_access,
                                    tag_separators, ['script'])


def _get_statuses_list() -> []:
    """Returns the url path strings which indicate a status post
    """
    status_paths = ('/statuses/', '/objects/', '/p/')
    return status_paths


def contains_statuses(url: str) -> bool:
    """Whether the given url contains /statuses/ or any of the other
    path strings returned by _get_statuses_list
    """
    return any(status_str in url for status_str in _get_statuses_list())


def get_actor_from_post_id(post_id: str) -> str:
    """Returns an actor url from a post id containing /statuses/ or equivalent
    eg. https://somedomain/users/nick/statuses/123 becomes
    https://somedomain/users/nick
    If no conversion applies then the post id is returned unchanged
    """
    pixelfed_style_statuses = ('/p/',)
    actor = post_id
    for status_str in _get_statuses_list():
        if status_str not in actor:
            continue
        url_sections = actor.split(status_str)
        if status_str in pixelfed_style_statuses:
            # pixelfed style post id, where the nickname
            # comes immediately after the status path
            nick = url_sections[1].split('/')[0]
            actor = url_sections[0] + '/users/' + nick
            break
        if has_users_path(actor):
            actor = url_sections[0]
            break
    return actor


def get_display_name(base_dir: str, actor: str, person_cache: {}) -> str:
    """Returns the display name for the given actor, or None if the
    actor is not within the person cache.
    The name is taken from the person cache if that holds the actor,
    and otherwise from the actor file within cache/actors.
    A name containing dangerous markup is replaced by *ADVERSARY*
    """
    actor = get_actor_from_post_id(actor)
    cached_person = person_cache.get(actor)
    if not cached_person:
        return None
    display_name = None
    cached_actor = cached_person.get('actor')
    if cached_actor:
        if cached_actor.get('name'):
            display_name = cached_actor['name']
    else:
        # Try to obtain from the cached actors
        actor_filename = \
            base_dir + '/cache/actors/' + (actor.replace('/', '#')) + '.json'
        if os.path.isfile(actor_filename):
            actor_json = load_json(actor_filename, 1)
            if actor_json and actor_json.get('name'):
                display_name = actor_json['name']
    if display_name and dangerous_markup(display_name, False, []):
        display_name = "*ADVERSARY*"
    return standardize_text(display_name)


def display_name_is_emoji(display_name: str) -> bool:
    """Returns true if the given display name consists only of
    emoji shortcodes, such as :smile: or :cat: :dog:
    """
    def _colon_wrapped(text: str) -> bool:
        return text.startswith(':') and text.endswith(':')

    if ' ' in display_name:
        # every word needs to be a shortcode
        return all(_colon_wrapped(wrd) for wrd in display_name.split(' '))
    return len(display_name) >= 2 and _colon_wrapped(display_name)


def _gender_from_string(translate: {}, text: str) -> str:
    """Given some text, does it contain a gender description?

    translate: translations dict, which needs to contain the keys
        'He/Him', 'boy', 'She/Her' and 'girl'
    text: the text to be searched
    Returns 'He/Him', 'She/Her', or None if no description was found
    """
    if not text:
        return None
    text_orig = text
    text = text.lower()
    # 'female' contains 'male', so it is masked out before looking
    # for 'male'. Otherwise "female" would be detected as He/Him
    text_without_female = text.replace('female', '')
    gender = None
    if translate['He/Him'].lower() in text or \
       translate['boy'].lower() in text:
        gender = 'He/Him'
    elif (translate['She/Her'].lower() in text or
          translate['girl'].lower() in text):
        gender = 'She/Her'
    elif 'him' in text or 'male' in text_without_female:
        gender = 'He/Him'
    elif 'her' in text or 'she' in text or \
         'fem' in text or 'woman' in text:
        gender = 'She/Her'
    elif 'man' in text or 'He' in text_orig:
        # 'woman' has already been handled above
        gender = 'He/Him'
    return gender


def get_gender_from_bio(base_dir: str, actor: str, person_cache: {},
                        translate: {}) -> str:
    """Tries to ascertain gender from bio description
    This is for use by text-to-speech for pitch setting

    The actor's attachment fields are examined first, and then the
    actor summary. 'They/Them' is returned if the actor is not known
    or if nothing could be ascertained
    """
    fallback_gender = 'They/Them'
    actor = get_actor_from_post_id(actor)
    cached_person = person_cache.get(actor)
    if not cached_person:
        return fallback_gender
    pronoun_str = 'pronoun'
    if translate:
        pronoun_str = translate['pronoun'].lower()

    # get the actor from the person cache, or failing that
    # from the cached actors
    actor_json = cached_person.get('actor')
    if not actor_json:
        cached_actor_filename = \
            base_dir + '/cache/actors/' + (actor.replace('/', '#')) + '.json'
        if os.path.isfile(cached_actor_filename):
            actor_json = load_json(cached_actor_filename, 1)
    if not actor_json:
        return fallback_gender

    # is gender defined as a profile tag?
    gender_description = None
    attachments = actor_json.get('attachment')
    if attachments and isinstance(attachments, list):
        # look for a gender or pronoun field name
        for tag in attachments:
            if not isinstance(tag, dict):
                continue
            # schema:name takes priority over name
            field_name = tag.get('schema:name') or tag.get('name')
            if not field_name:
                continue
            prop_value_name, _ = get_attachment_property_value(tag)
            if not prop_value_name:
                continue
            field_name_lower = field_name.lower()
            if field_name_lower == translate['gender'].lower() or \
               field_name_lower.startswith(pronoun_str):
                gender_description = tag[prop_value_name]
                break
        if not gender_description:
            # the field name could be anything,
            # so just look at the values
            for tag in attachments:
                if not isinstance(tag, dict):
                    continue
                if not (tag.get('name') or tag.get('schema:name')):
                    continue
                prop_value_name, _ = get_attachment_property_value(tag)
                if not prop_value_name:
                    continue
                gender = \
                    _gender_from_string(translate, tag[prop_value_name])
                if gender:
                    return gender

    # if there was no suitable profile tag then use the bio
    if not gender_description:
        gender_description = actor_json.get('summary')
    if not gender_description:
        return fallback_gender
    return _gender_from_string(translate, gender_description) or \
        fallback_gender


def get_nickname_from_actor(actor: str) -> str:
    """Returns the nickname from an actor url or handle,
    or None if no nickname could be found
    """
    if actor.startswith('@'):
        actor = actor[1:]
    # urls containing a known users path, eg. https://domain/users/nick
    for users_path in get_user_paths():
        if users_path not in actor:
            continue
        after_path = actor.split(users_path)[1].replace('@', '')
        return after_path.split('/')[0]
    if '/@/' not in actor:
        if '/@' in actor:
            # https://domain/@nick
            return actor.split('/@')[1].split('/')[0]
        if '@' in actor:
            # nick@domain
            return actor.split('@')[0]
    if '://' not in actor:
        return None
    # https://domain/nick
    domain = actor.split('://')[1].split('/')[0]
    domain_prefix = '://' + domain + '/'
    if domain_prefix not in actor:
        return None
    nick_str = actor.split(domain_prefix)[1]
    if '/' in nick_str or '.' in nick_str:
        return None
    return nick_str


def get_user_paths() -> []:
    """Returns the url paths which may come before a nickname
    e.g. /users/nickname, /channel/nickname
    """
    possible_user_paths = (
        '/users/', '/profile/', '/accounts/', '/channel/', '/u/',
        '/c/', '/m/', '/video-channels/', '/author/',
        '/activitypub/', '/actors/', '/snac/', '/@/', '/~/',
        '/fediverse/blog/', '/user/'
    )
    return possible_user_paths


def get_group_paths() -> []:
    """Returns the url paths which may come before a group name
    e.g. https://lemmy/c/groupname
    """
    possible_group_paths = ['/c/', '/video-channels/', '/m/']
    return possible_group_paths


def get_domain_from_actor(actor: str) -> (str, int):
    """Returns the domain name from an actor url

    A single leading '@' is removed from the actor before parsing.
    Returns a (domain, port) tuple, where the port is None unless
    the extracted domain contains a ':'
    """
    if actor.startswith('@'):
        actor = actor[1:]
    port = None
    prefixes = get_protocol_prefixes()
    users_paths = get_user_paths()
    # NOTE(review): the domain assigned within this loop is always
    # overwritten by the if/elif/else chain which follows it, so the
    # loop appears to have no effect on the result - confirm whether
    # the users path result was intended to take priority
    for possible_path in users_paths:
        if possible_path in actor:
            domain = actor.split(possible_path)[0]
            for prefix in prefixes:
                domain = domain.replace(prefix, '')
            break
    if '/@' in actor and '/@/' not in actor:
        # https://domain/@nick
        domain = actor.split('/@')[0]
        for prefix in prefixes:
            domain = domain.replace(prefix, '')
    elif '@' in actor and '/@/' not in actor:
        # nick@domain
        domain = actor.split('@')[1].strip()
    else:
        # remove the protocol prefix, then keep
        # whatever comes before the first slash
        domain = actor
        for prefix in prefixes:
            domain = domain.replace(prefix, '')
        if '/' in actor:
            domain = domain.split('/')[0]
    if ':' in domain:
        # separate the port number from the domain
        port = get_port_from_domain(domain)
        domain = remove_domain_port(domain)
    return domain, port


def _set_default_pet_name(base_dir: str, nickname: str, domain: str,
                          follow_nickname: str, follow_domain: str) -> None:
    """Sets a default petname
    This helps especially when using onion or i2p address

    An entry of the form "nickname nickname@domain" is appended to the
    petnames.txt file of the account, unless a line beginning with the
    followed nickname already exists there
    """
    domain = remove_domain_port(domain)
    petnames_filename = \
        acct_dir(base_dir, nickname, domain) + '/petnames.txt'

    entry_prefix = follow_nickname + ' '
    new_entry = \
        entry_prefix + follow_nickname + '@' + follow_domain + '\n'

    if not os.path.isfile(petnames_filename):
        # there is no petnames file yet, so begin one
        with open(petnames_filename, 'w+', encoding='utf-8') as fp_pet:
            fp_pet.write(new_entry)
        return

    with open(petnames_filename, 'r', encoding='utf-8') as fp_pet:
        existing_petnames = fp_pet.read()
    if any(pet.startswith(entry_prefix)
           for pet in existing_petnames.split('\n')):
        # petname already exists
        return

    # petname doesn't already exist
    with open(petnames_filename, 'a+', encoding='utf-8') as fp_pet:
        fp_pet.write(new_entry)


def follow_person(base_dir: str, nickname: str, domain: str,
                  follow_nickname: str, follow_domain: str,
                  federation_list: [], debug: bool,
                  group_account: bool,
                  follow_file: str = 'following.txt') -> bool:
    """Adds a person to the follow list

    nickname, domain: the account which is doing the following
    follow_nickname, follow_domain: the account being followed
    federation_list: passed to domain_permitted to decide whether
        follow_domain may be followed
    group_account: if true then the stored handle is prefixed with '!'
    follow_file: name of the file within the account directory to
        which the handle is added
    Returns False if the domain is not permitted or if the account
    directory does not exist, otherwise True
    """
    follow_domain_str_lower1 = follow_domain.lower()
    follow_domain_str_lower = remove_eol(follow_domain_str_lower1)
    if not domain_permitted(follow_domain_str_lower,
                            federation_list):
        if debug:
            print('DEBUG: follow of domain ' +
                  follow_domain + ' not permitted')
        return False
    if debug:
        print('DEBUG: follow of domain ' + follow_domain)

    # the account handle does not include any port number
    if ':' in domain:
        domain_only = remove_domain_port(domain)
        handle = nickname + '@' + domain_only
    else:
        handle = nickname + '@' + domain

    handle_dir = acct_handle_dir(base_dir, handle)
    if not os.path.isdir(handle_dir):
        print('WARN: account for ' + handle + ' does not exist')
        return False

    # handle without any port number, used when
    # checking the unfollowed file
    if ':' in follow_domain:
        follow_domain_only = remove_domain_port(follow_domain)
        handle_to_follow = follow_nickname + '@' + follow_domain_only
    else:
        handle_to_follow = follow_nickname + '@' + follow_domain

    if group_account:
        handle_to_follow = '!' + handle_to_follow

    # was this person previously unfollowed?
    unfollowed_filename = acct_handle_dir(base_dir, handle) + '/unfollowed.txt'
    if os.path.isfile(unfollowed_filename):
        if text_in_file(handle_to_follow, unfollowed_filename):
            # remove them from the unfollowed file
            # by rewriting it without any line containing the handle
            new_lines = ''
            with open(unfollowed_filename, 'r',
                      encoding='utf-8') as unfoll_file:
                lines = unfoll_file.readlines()
                for line in lines:
                    if handle_to_follow not in line:
                        new_lines += line
            with open(unfollowed_filename, 'w+',
                      encoding='utf-8') as unfoll_file:
                unfoll_file.write(new_lines)

    if not os.path.isdir(base_dir + '/accounts'):
        os.mkdir(base_dir + '/accounts')
    # NOTE(review): unlike the handle used for the unfollowed check
    # above, this one keeps any port number within follow_domain -
    # confirm that this is intended
    handle_to_follow = follow_nickname + '@' + follow_domain
    if group_account:
        handle_to_follow = '!' + handle_to_follow
    filename = acct_handle_dir(base_dir, handle) + '/' + follow_file
    if os.path.isfile(filename):
        if text_in_file(handle_to_follow, filename):
            if debug:
                print('DEBUG: follow already exists')
            return True
        # prepend to follow file
        try:
            with open(filename, 'r+', encoding='utf-8') as foll_file:
                content = foll_file.read()
                if handle_to_follow + '\n' not in content:
                    # return to the beginning of the file and write the
                    # new handle followed by the previous content
                    foll_file.seek(0, 0)
                    foll_file.write(handle_to_follow + '\n' + content)
                    # this is printed regardless of the debug flag
                    print('DEBUG: follow added')
        except OSError as ex:
            # a failed write is reported, but does not stop the
            # function from continuing and returning True
            print('WARN: Failed to write entry to follow file ' +
                  filename + ' ' + str(ex))
    else:
        # first follow
        if debug:
            print('DEBUG: ' + handle +
                  ' creating new following file to follow ' +
                  handle_to_follow +
                  ', filename is ' + filename)
        with open(filename, 'w+', encoding='utf-8') as foll_file:
            foll_file.write(handle_to_follow + '\n')

    if follow_file.endswith('following.txt'):
        # Default to adding new follows to the calendar.
        # Possibly this could be made optional
        # if following a person add them to the list of
        # calendar follows
        # this is printed regardless of the debug flag
        print('DEBUG: adding ' +
              follow_nickname + '@' + follow_domain + ' to calendar of ' +
              nickname + '@' + domain)
        add_person_to_calendar(base_dir, nickname, domain,
                               follow_nickname, follow_domain)
        # add a default petname
        _set_default_pet_name(base_dir, nickname, domain,
                              follow_nickname, follow_domain)
    return True


def votes_on_newswire_item(status: []) -> int:
    """Returns the number of votes on a newswire item, which is
    the number of status entries containing 'vote:'
    """
    return sum(1 for entry in status if 'vote:' in entry)


def locate_news_votes(base_dir: str, domain: str,
                      post_url: str) -> str:
    """Returns the votes filename for a news post
    within the outbox of the news account, or None if
    there is no such file
    """
    cleaned_url = remove_eol(post_url.strip())

    # turn the url into a filename
    votes_name = remove_id_ending(cleaned_url.strip()).replace('/', '#')
    if not votes_name.endswith('.json'):
        votes_name += '.json'
    votes_name += '.votes'

    news_account_dir = base_dir + '/accounts/news@' + domain + '/'
    votes_filename = news_account_dir + 'outbox/' + votes_name
    if not os.path.isfile(votes_filename):
        return None
    return votes_filename


def locate_news_arrival(base_dir: str, domain: str,
                        post_url: str) -> str:
    """Returns the arrival time for a news post
    within the outbox of the news account.
    The time is returned as a datetime, parsed from the content
    of the .arrived file in the format YYYY-MM-DDTHH:MM:SSZ.
    None is returned if the file does not exist or is empty
    """
    cleaned_url = remove_eol(post_url.strip())

    # turn the url into a filename
    arrival_name = remove_id_ending(cleaned_url.strip()).replace('/', '#')
    if not arrival_name.endswith('.json'):
        arrival_name += '.json'
    arrival_name += '.arrived'

    news_account_dir = base_dir + '/accounts/news@' + domain + '/'
    arrival_filename = news_account_dir + 'outbox/' + arrival_name
    if not os.path.isfile(arrival_filename):
        return None
    with open(arrival_filename, 'r', encoding='utf-8') as fp_arrival:
        arrival = fp_arrival.read()
    if not arrival:
        return None
    return datetime.datetime.strptime(arrival, "%Y-%m-%dT%H:%M:%SZ")


def clear_from_post_caches(base_dir: str, recent_posts_cache: {},
                           post_id: str) -> None:
    """Clears cached html for the given post, so that edits
    to news will appear.
    For each account directory, other than inbox@ and Actor@, the
    post's html file is removed from the postcache and the post is
    removed from the recent posts cache
    """
    accounts_dir = base_dir + '/accounts'
    cached_html_path = '/postcache/' + post_id + '.html'
    # only the top level of the accounts directory is examined
    _, account_names, _ = next(os.walk(accounts_dir), (None, [], None))
    for acct in account_names:
        if '@' not in acct:
            continue
        if acct.startswith(('inbox@', 'Actor@')):
            continue
        post_filename = os.path.join(accounts_dir, acct) + cached_html_path
        if os.path.isfile(post_filename):
            try:
                os.remove(post_filename)
            except OSError:
                print('EX: clear_from_post_caches file not removed ' +
                      str(post_filename))
        # if the post is in the recent posts cache then remove it
        cached_index = recent_posts_cache.get('index')
        if cached_index and post_id in cached_index:
            cached_index.remove(post_id)
        for cache_section in ('json', 'html'):
            cached_posts = recent_posts_cache.get(cache_section)
            if cached_posts and cached_posts.get(post_id):
                del cached_posts[post_id]


def locate_post(base_dir: str, nickname: str, domain: str,
                post_url: str, replies: bool = False) -> str:
    """Returns the filename for the given status post url,
    or None if it could not be found.
    If replies is true then the .replies file for the post is
    looked for, rather than the .json file
    """
    extension = 'replies' if replies else 'json'

    # turn the url into a filename
    post_file = \
        remove_id_ending(post_url.strip()).replace('/', '#') + \
        '.' + extension

    def _possible_filenames():
        # the boxes of the account
        account_dir = acct_dir(base_dir, nickname, domain) + '/'
        for box_name in ('inbox', 'outbox', 'tlblogs'):
            yield account_dir + box_name + '/' + post_file
        # news posts
        news_dir = base_dir + '/accounts/news' + '@' + domain + '/'
        yield news_dir + 'outbox/' + post_file
        # the announce cache
        yield base_dir + '/cache/announce/' + nickname + '/' + post_file

    for post_filename in _possible_filenames():
        if os.path.isfile(post_filename):
            return post_filename

    # print('WARN: unable to locate ' + nickname + ' ' + post_url)
    return None


def _get_published_date(post_json_object: {}) -> str:
    """Returns the published date on the given post, taken from the
    post itself or otherwise from its object.
    None is returned if there is no date or if it is not a string
    """
    published = post_json_object.get('published')
    if not published and has_object_dict(post_json_object):
        published = post_json_object['object'].get('published')
    if published and isinstance(published, str):
        return published
    return None


def get_reply_interval_hours(base_dir: str, nickname: str, domain: str,
                             default_reply_interval_hrs: int) -> int:
    """Returns the reply interval for the given account.
    The reply interval is the number of hours after a post being made
    during which replies are allowed.
    The default is returned if the account has no .reply_interval_hours
    file, or if the file content is not entirely digits
    """
    interval_filename = \
        acct_dir(base_dir, nickname, domain) + '/.reply_interval_hours'
    if not os.path.isfile(interval_filename):
        return default_reply_interval_hrs
    with open(interval_filename, 'r', encoding='utf-8') as fp_interval:
        hours_str = fp_interval.read()
    if not hours_str.isdigit():
        return default_reply_interval_hrs
    return int(hours_str)


def set_reply_interval_hours(base_dir: str, nickname: str, domain: str,
                             reply_interval_hours: int) -> bool:
    """Sets the reply interval for the given account.
    The reply interval is the number of hours after a post being made
    during which replies are allowed.
    Returns True if the .reply_interval_hours file was saved
    """
    interval_filename = \
        acct_dir(base_dir, nickname, domain) + '/.reply_interval_hours'
    try:
        with open(interval_filename, 'w+', encoding='utf-8') as fp_interval:
            fp_interval.write(str(reply_interval_hours))
    except OSError:
        print('EX: set_reply_interval_hours unable to save reply interval ' +
              str(interval_filename) + ' ' +
              str(reply_interval_hours))
        return False
    return True


def can_reply_to(base_dir: str, nickname: str, domain: str,
                 post_url: str, reply_interval_hours: int,
                 curr_date_str: str = None,
                 post_json_object: {} = None) -> bool:
    """Is replying to the given local post permitted?
    This is a spam mitigation feature, so that spammers can't
    add a lot of replies to old post which you don't notice.

    post_url: url of the post being replied to. Urls which do not
        contain /statuses/ can always be replied to
    reply_interval_hours: hours after publication during which
        replies are permitted
    curr_date_str: optional current date in the format
        YYYY-MM-DDTHH:MM:SSZ. The current UTC time is used if not given
    post_json_object: optional post, which is otherwise loaded from file
    Returns False if the post cannot be loaded, if its published date
    or the given current date cannot be parsed, or if the current
    date is outside of the reply interval
    """
    if '/statuses/' not in post_url:
        return True
    if not post_json_object:
        post_filename = locate_post(base_dir, nickname, domain, post_url)
        if not post_filename:
            # the post is not stored locally
            return True
        post_json_object = load_json(post_filename)
    if not post_json_object:
        return False
    published = _get_published_date(post_json_object)
    if not published:
        return False
    date_format = '%Y-%m-%dT%H:%M:%SZ'
    # strptime raises ValueError for an unrecognized format and
    # TypeError for a non-string. Anything broader would also
    # swallow KeyboardInterrupt and SystemExit
    try:
        pub_date = datetime.datetime.strptime(published, date_format)
    except (ValueError, TypeError):
        print('EX: can_reply_to unrecognized published date ' + str(published))
        return False
    if not curr_date_str:
        curr_date = datetime.datetime.utcnow()
    else:
        try:
            curr_date = \
                datetime.datetime.strptime(curr_date_str, date_format)
        except (ValueError, TypeError):
            print('EX: can_reply_to unrecognized current date ' +
                  str(curr_date_str))
            return False
    hours_since_publication = \
        int((curr_date - pub_date).total_seconds() / 3600)
    if hours_since_publication < 0 or \
       hours_since_publication >= reply_interval_hours:
        return False
    return True


def _remove_attachment(base_dir: str, http_prefix: str, domain: str,
                       post_json: {}):
    """Removes media files for an attachment
    """
    if not post_json.get('attachment'):
        return
    if not post_json['attachment'][0].get('url'):
        return
    attachment_url = post_json['attachment'][0]['url']
    if not attachment_url:
        return
    attachment_url = remove_html(attachment_url)
    media_filename = base_dir + '/' + \
        attachment_url.replace(http_prefix + '://' + domain + '/', '')
    if os.path.isfile(media_filename):
        try:
            os.remove(media_filename)
        except OSError:
            print('EX: _remove_attachment unable to delete media file ' +
                  str(media_filename))
    if os.path.isfile(media_filename + '.vtt'):
        try:
            os.remove(media_filename + '.vtt')
        except OSError:
            print('EX: _remove_attachment unable to delete media transcript ' +
                  str(media_filename) + '.vtt')
    etag_filename = media_filename + '.etag'
    if os.path.isfile(etag_filename):
        try:
            os.remove(etag_filename)
        except OSError:
            print('EX: _remove_attachment unable to delete etag file ' +
                  str(etag_filename))
    post_json['attachment'] = []


def remove_moderation_post_from_index(base_dir: str, post_url: str,
                                      debug: bool) -> None:
    """Rewrites accounts/moderation.txt without the line which
    matches the id of the given post url
    """
    index_filename = base_dir + '/accounts/moderation.txt'
    if not os.path.isfile(index_filename):
        return
    post_id = remove_id_ending(post_url)
    if not text_in_file(post_id, index_filename):
        return
    # read the whole index, then write back every line except the match
    with open(index_filename, 'r', encoding='utf-8') as fp_read:
        index_lines = fp_read.readlines()
    with open(index_filename, 'w+', encoding='utf-8') as fp_write:
        for index_line in index_lines:
            if index_line.strip("\n").strip("\r") == post_id:
                if debug:
                    print('DEBUG: removed ' + post_id +
                          ' from moderation index')
            else:
                fp_write.write(index_line)


def _is_reply_to_blog_post(base_dir: str, nickname: str, domain: str,
                           post_json_object: str):
    """Returns True if the inReplyTo of the given post appears within
    the tlblogs.index file of the account
    """
    if not has_object_dict(post_json_object):
        return False
    reply_to = post_json_object['object'].get('inReplyTo')
    if not reply_to or not isinstance(reply_to, str):
        return False
    blogs_index_filename = \
        acct_dir(base_dir, nickname, domain) + '/tlblogs.index'
    if not os.path.isfile(blogs_index_filename):
        return False
    # index entries use # in place of / within the post id
    index_entry = remove_id_ending(reply_to).replace('/', '#')
    return bool(text_in_file(index_entry, blogs_index_filename))


def _delete_post_remove_replies(base_dir: str, nickname: str, domain: str,
                                http_prefix: str, post_filename: str,
                                recent_posts_cache: {}, debug: bool,
                                manual: bool) -> None:
    """Removes replies when deleting a post
    """
    replies_filename = post_filename.replace('.json', '.replies')
    if not os.path.isfile(replies_filename):
        return
    if debug:
        print('DEBUG: removing replies to ' + post_filename)
    with open(replies_filename, 'r', encoding='utf-8') as replies_file:
        for reply_id in replies_file:
            reply_file = locate_post(base_dir, nickname, domain, reply_id)
            if not reply_file:
                continue
            if os.path.isfile(reply_file):
                delete_post(base_dir, http_prefix,
                            nickname, domain, reply_file, debug,
                            recent_posts_cache, manual)
    # remove the replies file
    try:
        os.remove(replies_filename)
    except OSError:
        print('EX: _delete_post_remove_replies ' +
              'unable to delete replies file ' + str(replies_filename))


def _is_bookmarked(base_dir: str, nickname: str, domain: str,
                   post_filename: str) -> bool:
    """Is the last path component of the given post filename listed
    within the bookmarks index of the account?
    """
    index_filename = \
        acct_dir(base_dir, nickname, domain) + '/bookmarks.index'
    if not os.path.isfile(index_filename):
        return False
    index_entry = post_filename.split('/')[-1] + '\n'
    return bool(text_in_file(index_entry, index_filename))


def remove_post_from_cache(post_json_object: {},
                           recent_posts_cache: {}) -> None:
    """Removes the given post from the index, json and html sections
    of the recent posts cache, if it is indexed there
    """
    if not recent_posts_cache or not post_json_object.get('id'):
        return

    cached_index = recent_posts_cache.get('index')
    if not cached_index:
        return

    # cache keys are post ids without any fragment or id ending,
    # and with / replaced by #
    cache_key = post_json_object['id']
    if '#' in cache_key:
        cache_key = cache_key.split('#', 1)[0]
    cache_key = remove_id_ending(cache_key).replace('/', '#')
    if cache_key not in cached_index:
        return

    cached_index.remove(cache_key)

    for section_name in ('json', 'html'):
        section = recent_posts_cache.get(section_name)
        if section and section.get(cache_key):
            del section[cache_key]


def delete_cached_html(base_dir: str, nickname: str, domain: str,
                       post_json_object: {}):
    """Deletes the cached html file for the given post, together with
    the matching .ssml file and the .ssml file within the outbox
    """
    html_filename = \
        get_cached_post_filename(base_dir, nickname, domain, post_json_object)
    if not html_filename:
        return

    ssml_filename = html_filename.replace('.html', '.ssml')
    outbox_ssml_filename = ssml_filename.replace('/postcache/', '/outbox/')
    # each cached file is paired with the text shown if removal fails
    cached_files = (
        (html_filename,
         'unable to delete cached post file '),
        (ssml_filename,
         'unable to delete cached ssml post file '),
        (outbox_ssml_filename,
         'unable to delete cached outbox ssml post file ')
    )
    for filename, failure_text in cached_files:
        if not os.path.isfile(filename):
            continue
        try:
            os.remove(filename)
        except OSError:
            print('EX: delete_cached_html ' +
                  failure_text +
                  str(filename))


def _remove_post_id_from_tag_index(tag_index_filename: str,
                                   post_id: str) -> None:
    """Remove post_id from the tag index file
    """
    lines = None
    with open(tag_index_filename, 'r', encoding='utf-8') as index_file:
        lines = index_file.readlines()
    if not lines:
        return
    newlines = ''
    for file_line in lines:
        if post_id in file_line:
            # skip over the deleted post
            continue
        newlines += file_line
    if not newlines.strip():
        # if there are no lines then remove the hashtag file
        try:
            os.remove(tag_index_filename)
        except OSError:
            print('EX: _delete_hashtags_on_post ' +
                  'unable to delete tag index ' + str(tag_index_filename))
    else:
        # write the new hashtag index without the given post in it
        with open(tag_index_filename, 'w+',
                  encoding='utf-8') as index_file:
            index_file.write(newlines)


def _delete_hashtags_on_post(base_dir: str, post_json_object: {}) -> None:
    """Removes the given post from the tagmaps and tags index files of
    each hashtag which it contains
    """
    if not has_object_dict(post_json_object):
        return
    post_obj = post_json_object['object']

    # without a # in the content there are no hashtag indexes to update
    content = post_obj.get('content')
    if not content or '#' not in content:
        return

    if not post_obj.get('id') or not post_obj.get('tag'):
        return

    # get the id of the post
    post_id = remove_id_ending(post_obj['id'])
    for tag in post_obj['tag']:
        if tag.get('type') != 'Hashtag':
            continue
        tag_name = tag.get('name')
        if not tag_name:
            continue
        # the index filenames omit the first character of the tag name
        hashtag = tag_name[1:]
        for index_dir in ('/tagmaps/', '/tags/'):
            index_filename = base_dir + index_dir + hashtag + '.txt'
            if os.path.isfile(index_filename):
                _remove_post_id_from_tag_index(index_filename, post_id)


def _delete_conversation_post(base_dir: str, nickname: str, domain: str,
                              post_json_object: {}) -> None:
    """Removes the id of the given post from its conversation file.
    The conversation is taken from the conversation field of the post
    object, or otherwise from its context field.
    Returns False if there was nothing to remove, otherwise None
    """
    if not has_object_dict(post_json_object):
        return False
    post_obj = post_json_object['object']
    conversation_id = post_obj.get('conversation')
    if not conversation_id:
        conversation_id = post_obj.get('context')
    if not conversation_id:
        return False
    post_id = post_obj.get('id')
    if not post_id:
        return False
    conversation_filename = \
        acct_dir(base_dir, nickname, domain) + '/conversation' + \
        '/' + conversation_id.replace('/', '#')
    if not os.path.isfile(conversation_filename):
        return False
    with open(conversation_filename, 'r', encoding='utf-8') as conv_file:
        conversation_text = conv_file.read()
    id_line = post_id + '\n'
    if id_line not in conversation_text:
        return False
    conversation_text = conversation_text.replace(id_line, '')
    if conversation_text:
        # other posts remain within the conversation
        with open(conversation_filename, 'w+', encoding='utf-8') as conv_file:
            conv_file.write(conversation_text)
        return
    # the conversation is now empty, so remove it and any muted marker
    muted_filename = conversation_filename + '.muted'
    if os.path.isfile(muted_filename):
        try:
            os.remove(muted_filename)
        except OSError:
            print('EX: _delete_conversation_post ' +
                  'unable to remove conversation ' +
                  str(conversation_filename) + '.muted')
    try:
        os.remove(conversation_filename)
    except OSError:
        print('EX: _delete_conversation_post ' +
              'unable to remove conversation ' +
              str(conversation_filename))


def is_dm(post_json_object: {}) -> bool:
    """Returns true if the given post is a DM

    A DM is a Create activity whose object is one of the message types
    below, has no moderationStatus, and has no public or followers
    address within its to or cc fields
    """
    # use get so that a post without a type is not a DM,
    # rather than raising KeyError
    if post_json_object.get('type') != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    post_obj = post_json_object['object']
    dm_object_types = (
        'ChatMessage', 'Note', 'Page', 'Patch',
        'EncryptedMessage', 'Article'
    )
    if post_obj.get('type') not in dm_object_types:
        return False
    if post_obj.get('moderationStatus'):
        return False
    for field_name in ('to', 'cc'):
        recipients = post_obj.get(field_name)
        if not recipients:
            continue
        if isinstance(recipients, str):
            # a single address rather than a list of addresses.
            # Iterating over it would test individual characters
            recipients = [recipients]
        for to_address in recipients:
            if not isinstance(to_address, str):
                continue
            if to_address.endswith('#Public') or \
               to_address == 'as:Public' or \
               to_address == 'Public':
                return False
            if to_address.endswith('followers'):
                return False
    return True


def is_reminder(post_json_object: {}) -> bool:
    """Returns true if the given post is a reminder

    A reminder is a DM with exactly one to address, which is the same
    as its attributedTo, and which has a tag of type Event
    """
    if not is_dm(post_json_object):
        return False
    post_obj = post_json_object['object']
    if not post_obj.get('to'):
        return False
    if not post_obj.get('attributedTo'):
        return False
    if not post_obj.get('tag'):
        return False
    if len(post_obj['to']) != 1:
        return False
    if post_obj['to'][0] != post_obj['attributedTo']:
        return False
    for tag in post_obj['tag']:
        # tags without a type, or which are not dicts, are skipped
        # rather than raising an exception
        if isinstance(tag, dict) and tag.get('type') == 'Event':
            return True
    return False


def _is_remote_dm(domain_full: str, post_json_object: {}) -> bool:
    """Returns True if the given post is a DM whose attributedTo is a
    string which does not contain ://domain_full
    """
    if not is_dm(post_json_object):
        return False
    if has_object_dict(post_json_object):
        message_json = post_json_object['object']
    else:
        message_json = post_json_object
    sender = message_json.get('attributedTo')
    if sender and isinstance(sender, str):
        return '://' + domain_full not in sender
    return False


def _delete_post_extension_files(post_filename: str) -> None:
    """Removes the extra files which accompany a post, such as votes.
    Each is looked for as post_filename.ext and, if that isn't a file
    and post_filename ends with .json, with the .json text removed
    """
    extensions = (
        'votes', 'arrived', 'muted', 'tts', 'reject', 'mitm', 'edits'
    )
    for ext in extensions:
        ext_filename = post_filename + '.' + ext
        if not os.path.isfile(ext_filename):
            if not post_filename.endswith('.json'):
                continue
            ext_filename = post_filename.replace('.json', '') + '.' + ext
            if not os.path.isfile(ext_filename):
                continue
        try:
            os.remove(ext_filename)
        except OSError:
            print('EX: delete_post unable to remove ext ' +
                  str(ext_filename))


def delete_post(base_dir: str, http_prefix: str,
                nickname: str, domain: str, post_filename: str,
                debug: bool, recent_posts_cache: {},
                manual: bool) -> None:
    """Recursively deletes a post and its replies and attachments.
    If the post can't be loaded then only its replies and the post file
    are removed. Nothing is deleted for a DM from another instance
    (unless manual is set), for a bookmarked post or for a reply to a
    blog post
    """
    post_json_object = load_json(post_filename, 1)
    if post_json_object:
        # don't allow DMs to be deleted if they came from a different
        # instance, otherwise this breaks expectations about how DMs
        # should operate
        # i.e. DMs should only be removed if they are manually deleted
        if not manual and _is_remote_dm(domain, post_json_object):
            return

        # don't allow deletion of bookmarked posts
        if _is_bookmarked(base_dir, nickname, domain, post_filename):
            return

        # don't remove replies to blog posts
        if _is_reply_to_blog_post(base_dir, nickname, domain,
                                  post_json_object):
            return

        # remove from recent posts cache in memory
        remove_post_from_cache(post_json_object, recent_posts_cache)

        # remove from conversation index
        _delete_conversation_post(base_dir, nickname, domain,
                                  post_json_object)

        # remove any attachment
        _remove_attachment(base_dir, http_prefix, domain, post_json_object)

        # remove votes, muted markers and other accompanying files
        _delete_post_extension_files(post_filename)

        # remove cached html version of the post
        delete_cached_html(base_dir, nickname, domain, post_json_object)

        has_object = bool(post_json_object.get('object'))

        # remove from moderation index file
        if has_object and \
           has_object_dict(post_json_object) and \
           post_json_object['object'].get('moderationStatus') and \
           post_json_object.get('id'):
            post_id = remove_id_ending(post_json_object['id'])
            remove_moderation_post_from_index(base_dir, post_id, debug)

        # remove any hashtags index entries
        if has_object:
            _delete_hashtags_on_post(base_dir, post_json_object)

    # remove any replies
    _delete_post_remove_replies(base_dir, nickname, domain,
                                http_prefix, post_filename,
                                recent_posts_cache, debug, manual)
    # finally, remove the post itself
    try:
        os.remove(post_filename)
    except OSError:
        if debug:
            print('EX: delete_post unable to delete post ' +
                  str(post_filename))


def _is_valid_language(text: str) -> bool:
    """Returns true if the given text contains a valid
    natural language string
    """
    natural_languages = {
        "Latin": [65, 866],
        "Greek": [880, 1280],
        "isArmenian": [1328, 1424],
        "isHebrew": [1424, 1536],
        "Arabic": [1536, 1792],
        "Syriac": [1792, 1872],
        "Thaan": [1920, 1984],
        "Devanagari": [2304, 2432],
        "Bengali": [2432, 2560],
        "Gurmukhi": [2560, 2688],
        "Gujarati": [2688, 2816],
        "Oriya": [2816, 2944],
        "Tamil": [2944, 3072],
        "Telugu": [3072, 3200],
        "Kannada": [3200, 3328],
        "Malayalam": [3328, 3456],
        "Sinhala": [3456, 3584],
        "Thai": [3584, 3712],
        "Lao": [3712, 3840],
        "Tibetan": [3840, 4096],
        "Myanmar": [4096, 4256],
        "Georgian": [4256, 4352],
        "HangulJamo": [4352, 4608],
        "Cherokee": [5024, 5120],
        "UCAS": [5120, 5760],
        "Ogham": [5760, 5792],
        "Runic": [5792, 5888],
        "Khmer": [6016, 6144],
        "Hangul Syllables": [44032, 55203],
        "Hangul Jamo": [4352, 4607],
        "Hangul Compatibility Jamo": [12592, 12687],
        "Hangul Jamo Extended-A": [43360, 43391],
        "Hangul Jamo Extended-B": [55216, 55295],
        "Mongolian": [6144, 6320],
        "Cyrillic": [1024, 1279],
        "Cyrillic Supplement": [1280, 1327],
        "Cyrillic Extended A": [11744, 11775],
        "Cyrillic Extended B": [42560, 42655],
        "Cyrillic Extended C": [7296, 7311],
        "Phonetic Extensions": [7467, 7544],
        "Combining Half Marks": [65070, 65071]
    }
    for _, lang_range in natural_languages.items():
        ok_lang = True
        for char in text:
            if char.isdigit() or char == '_':
                continue
            if ord(char) not in range(lang_range[0], lang_range[1]):
                ok_lang = False
                break
        if ok_lang:
            return True
    return False


def _get_reserved_words() -> str:
    return ('inbox', 'dm', 'outbox', 'following',
            'public', 'followers', 'category',
            'channel', 'calendar', 'video-channels',
            'tlreplies', 'tlmedia', 'tlblogs',
            'tlblogs', 'tlfeatures',
            'moderation', 'moderationaction',
            'activity', 'undo', 'pinned',
            'actor', 'Actor', 'instance.actor',
            'reply', 'replies', 'question', 'like',
            'likes', 'users', 'statuses', 'tags', 'author',
            'accounts', 'headers', 'snac',
            'channels', 'profile', 'u', 'c',
            'updates', 'repeat', 'announce',
            'shares', 'fonts', 'icons', 'avatars',
            'welcome', 'helpimages',
            'bookmark', 'bookmarks', 'tlbookmarks',
            'ignores', 'linksmobile', 'newswiremobile',
            'minimal', 'search', 'eventdelete',
            'searchemoji', 'catalog', 'conversationId',
            'mention', 'http', 'https', 'ipfs', 'ipns',
            'ontologies', 'data', 'postedit', 'moved',
            'inactive', 'activitypub', 'actors',
            'notes', 'offers', 'wanted')


def get_nickname_validation_pattern() -> str:
    """Returns a html text input validation pattern for nickname

    The pattern has one negative lookahead for each reserved word,
    followed by a length limit of between 1 and 30 characters
    """
    reserved_names = _get_reserved_words()
    lookaheads = \
        ''.join(['(?!.*\\b' + word + '\\b)' for word in reserved_names])
    if lookaheads:
        lookaheads = '^' + lookaheads
    # This previously ended with '.*${1,30}', which applies the {1,30}
    # quantifier to the $ anchor. That is not a valid regular
    # expression, so the length limit now quantifies the characters
    # NOTE(review): the pattern was previously invalid and so was
    # probably never enforced by browsers - confirm the lookaheads
    # behave as wanted now that it is valid
    return lookaheads + '.{1,30}$'


def _is_reserved_name(nickname: str) -> bool:
    """Returns True if the given nickname is one of the reserved words
    """
    return nickname in _get_reserved_words()


def valid_nickname(domain: str, nickname: str) -> bool:
    """Returns True if the given nickname has between 1 and 30
    characters, passes the language check, has no forbidden characters,
    differs from the domain and is not a reserved word
    """
    if not 0 < len(nickname) <= 30:
        return False
    if not _is_valid_language(nickname):
        return False
    forbidden_chars = ('.', ' ', '/', '?', ':', ';', '@', '#', '!')
    if any(char in nickname for char in forbidden_chars):
        return False
    # this should only apply for the shared inbox
    if nickname == domain:
        return False
    return not _is_reserved_name(nickname)


def no_of_accounts(base_dir: str) -> int:
    """Returns the number of accounts on the system

    This is the number of directories directly within base_dir/accounts
    which are account directories. It is zero if there is no accounts
    directory
    """
    account_ctr = 0
    for _, dirs, _ in os.walk(base_dir + '/accounts'):
        account_ctr = sum(1 for account in dirs if is_account_dir(account))
        # only the top level of the accounts directory is examined
        break
    return account_ctr


def no_of_active_accounts_monthly(base_dir: str, months: int) -> int:
    """Returns the number of accounts on the system which were used
    within the given number of months, with a month being 30 days

    The time when an account was last used is read from its .lastUsed
    file. Accounts where that file is missing, unreadable or doesn't
    contain only digits are not counted
    """
    account_ctr = 0
    curr_time = int(time.time())
    month_seconds = int(60*60*24*30*months)
    for _, dirs, _ in os.walk(base_dir + '/accounts'):
        for account in dirs:
            if not is_account_dir(account):
                continue
            last_used_filename = \
                base_dir + '/accounts/' + account + '/.lastUsed'
            if not os.path.isfile(last_used_filename):
                continue
            # one unreadable file should not prevent the other
            # accounts from being counted
            try:
                with open(last_used_filename, 'r',
                          encoding='utf-8') as last_used_file:
                    last_used = last_used_file.read()
            except OSError:
                print('EX: no_of_active_accounts_monthly unable to read ' +
                      str(last_used_filename))
                continue
            if last_used.isdigit():
                time_diff = curr_time - int(last_used)
                if time_diff < month_seconds:
                    account_ctr += 1
        # only the top level of the accounts directory is examined
        break
    return account_ctr


def is_public_post_from_url(base_dir: str, nickname: str, domain: str,
                            post_url: str) -> bool:
    """Locates and loads the post with the given url and returns
    whether it is public. Returns False if it can't be found or loaded
    """
    post_filename = locate_post(base_dir, nickname, domain, post_url)
    post_json_object = None
    if post_filename:
        post_json_object = load_json(post_filename, 1)
    if not post_json_object:
        return False
    return is_public_post(post_json_object)


def is_public_post(post_json_object: {}) -> bool:
    """Returns true if the given post is a Create activity whose
    object has a public address within its to field
    """
    if post_json_object.get('type') != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    recipients = post_json_object['object'].get('to')
    if not recipients:
        return False
    return any(address.endswith('#Public') or
               address in ('as:Public', 'Public')
               for address in recipients)


def is_followers_post(post_json_object: {}) -> bool:
    """Returns true if the given post is a Create activity whose
    object has an address ending with /followers within its to field
    """
    if post_json_object.get('type') != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    recipients = post_json_object['object'].get('to')
    if not recipients:
        return False
    return any(address.endswith('/followers') for address in recipients)


def is_unlisted_post(post_json_object: {}) -> bool:
    """Returns true if the given post is a Create activity whose
    object has a followers address within its to field and a public
    address within its cc field
    """
    if post_json_object.get('type') != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    post_obj = post_json_object['object']
    if not post_obj.get('to'):
        return False
    if not post_obj.get('cc'):
        return False
    if not any(address.endswith('/followers') for address in post_obj['to']):
        return False
    return any(address.endswith('#Public') or
               address in ('as:Public', 'Public')
               for address in post_obj['cc'])


def copytree(src: str, dst: str, symlinks: bool = False, ignore=None):
    """Copy a directory

    Each item within src is copied into dst, which is created if it
    doesn't already exist. Subdirectories are copied with
    shutil.copytree, which receives the symlinks and ignore arguments,
    and files are copied with shutil.copy2
    """
    # without this, copying a file into a missing dst directory fails
    os.makedirs(dst, exist_ok=True)
    for item in os.listdir(src):
        s_dir = os.path.join(src, item)
        d_dir = os.path.join(dst, item)
        if os.path.isdir(s_dir):
            shutil.copytree(s_dir, d_dir, symlinks, ignore)
        else:
            shutil.copy2(s_dir, d_dir)


def get_cached_post_directory(base_dir: str,
                              nickname: str, domain: str) -> str:
    """Returns the postcache directory of the given account,
    which is where the html post cache exists
    """
    return acct_dir(base_dir, nickname, domain) + '/postcache'


def get_cached_post_filename(base_dir: str, nickname: str, domain: str,
                             post_json_object: {}) -> str:
    """Returns the filename of the cached html for the given post,
    or None if the cache directory is missing or has no @ in its path
    """
    cache_dir = get_cached_post_directory(base_dir, nickname, domain)
    if not os.path.isdir(cache_dir) or '@' not in cache_dir:
        # print('ERROR: invalid html cache directory ' + cache_dir)
        return None
    # the filename is the post id with / replaced by #
    post_id = remove_id_ending(post_json_object['id'])
    return cache_dir + '/' + post_id.replace('/', '#') + '.html'


def update_recent_posts_cache(recent_posts_cache: {}, max_recent_posts: int,
                              post_json_object: {}, html_str: str) -> None:
    """Adds the json and html of the given post to the in-memory cache
    of recent posts, removing the oldest entries if the cache then
    holds more than max_recent_posts
    """
    if not post_json_object.get('id'):
        return
    # cache keys are post ids without any fragment or id ending,
    # and with / replaced by #
    cache_key = post_json_object['id']
    if '#' in cache_key:
        cache_key = cache_key.split('#', 1)[0]
    cache_key = remove_id_ending(cache_key).replace('/', '#')

    if not recent_posts_cache.get('index'):
        # this is the first post, so create the cache sections
        recent_posts_cache['index'] = [cache_key]
        recent_posts_cache['json'] = {}
        recent_posts_cache['html'] = {}
        recent_posts_cache['json'][cache_key] = json.dumps(post_json_object)
        recent_posts_cache['html'][cache_key] = html_str
        return

    if cache_key in recent_posts_cache['index']:
        return
    recent_posts_cache['index'].append(cache_key)
    post_json_object['muted'] = False
    recent_posts_cache['json'][cache_key] = json.dumps(post_json_object)
    recent_posts_cache['html'][cache_key] = html_str

    # remove the oldest posts until the cache is within its limit
    while len(recent_posts_cache['html']) > max_recent_posts:
        oldest_key = recent_posts_cache['index'].pop(0)
        if recent_posts_cache['json'].get(oldest_key):
            del recent_posts_cache['json'][oldest_key]
        if recent_posts_cache['html'].get(oldest_key):
            del recent_posts_cache['html'][oldest_key]


def file_last_modified(filename: str) -> str:
    """Returns the date when a file was last modified,
    as a UTC time in the format YYYY-MM-DDTHH:MM:SSZ
    """
    time_val = os.path.getmtime(filename)
    # the Z suffix denotes UTC, so convert the timestamp to UTC rather
    # than to the local timezone of the server
    modified_time = \
        datetime.datetime.fromtimestamp(time_val, datetime.timezone.utc)
    return modified_time.strftime("%Y-%m-%dT%H:%M:%SZ")


def get_css(base_dir: str, css_filename: str) -> str:
    """Returns the contents of the given css file, or None if the file
    doesn't exist or can't be read.
    The base_dir argument is not used
    """
    # does the css file exist?
    if not os.path.isfile(css_filename):
        return None

    try:
        with open(css_filename, 'r', encoding='utf-8') as fp_css:
            return fp_css.read()
    except OSError:
        print('EX: get_css unable to read ' + str(css_filename))
    return None


def is_blog_post(post_json_object: {}) -> bool:
    """Is the given post a blog post?

    A blog post is a Create activity whose object has content
    and is of type Article
    """
    # use get so that a post without a type is not a blog post,
    # rather than raising KeyError
    if post_json_object.get('type') != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    if not has_object_string_type(post_json_object, False):
        return False
    post_obj = post_json_object['object']
    if 'content' not in post_obj:
        return False
    return post_obj.get('type') == 'Article'


def is_news_post(post_json_object: {}) -> bool:
    """Is the given post a news post?
    This is the case if the post has a news field which is set
    """
    # convert to a boolean so that the result matches the declared
    # return type, rather than being None or the raw field value
    return bool(post_json_object.get('news'))


def _search_virtual_box_posts(base_dir: str, nickname: str, domain: str,
                              search_str: str, max_results: int,
                              box_name: str) -> []:
    """Searches the posts listed within the index file of a virtual
    box, returning the filenames of up to max_results posts which
    contain all of the search words. Words are separated by + and the
    comparison is made in lower case
    """
    account_dir = acct_dir(base_dir, nickname, domain)
    index_filename = account_dir + '/' + box_name + '.index'
    # the bookmarks index refers to posts within the inbox
    if box_name == 'bookmarks':
        box_name = 'inbox'
    path = acct_dir(base_dir, nickname, domain) + '/' + box_name
    if not os.path.isdir(path):
        return []

    search_str = search_str.lower().strip()

    if '+' in search_str:
        search_words = [word.strip() for word in search_str.split('+')]
        print('SEARCH: ' + str(search_words))
    else:
        search_words = [search_str]

    matches = []
    with open(index_filename, 'r', encoding='utf-8') as index_file:
        for index_line in index_file:
            # stop at the first line which isn't a post filename
            if '.json' not in index_line:
                break
            post_filename = path + '/' + index_line.strip()
            if not os.path.isfile(post_filename):
                continue
            with open(post_filename, 'r', encoding='utf-8') as post_file:
                post_text = post_file.read().lower()

            if not all(keyword in post_text for keyword in search_words):
                continue

            matches.append(post_filename)
            if len(matches) >= max_results:
                break
    return matches


def search_box_posts(base_dir: str, nickname: str, domain: str,
                     search_str: str, max_results: int,
                     box_name='outbox') -> []:
    """Searches the posts of an account within the given box and returns
    a list of the filenames which contain every search term.
    Terms are separated by '+' and are matched case insensitively.
    No more than max_results filenames are returned
    """
    box_dir = acct_dir(base_dir, nickname, domain) + '/' + box_name
    if not os.path.isdir(box_dir):
        # without a directory this might be a virtual box, such as
        # direct messages, which has an index file instead
        if not os.path.isfile(box_dir + '.index'):
            return []
        return _search_virtual_box_posts(base_dir, nickname, domain,
                                         search_str, max_results, box_name)

    search_str = search_str.lower().strip()
    if '+' not in search_str:
        search_words = [search_str]
    else:
        search_words = [word.strip() for word in search_str.split('+')]
        print('SEARCH: ' + str(search_words))

    matches = []
    # only the top level of the box directory gets searched
    top_level = next(os.walk(box_dir), None)
    if not top_level:
        return matches
    root, _, fnames = top_level
    for fname in fnames:
        file_path = os.path.join(root, fname)
        with open(file_path, 'r', encoding='utf-8') as post_file:
            data = post_file.read().lower()
        if any(keyword not in data for keyword in search_words):
            continue
        matches.append(file_path)
        if len(matches) >= max_results:
            break
    return matches


def get_file_case_insensitive(path: str) -> str:
    """Returns the filename as it exists on disk. This is the given path
    if it is a file, otherwise the lower case version of the path if that
    is a file. None is returned if neither exists
    """
    candidates = [path]
    lower_case_path = path.lower()
    if lower_case_path != path:
        candidates.append(lower_case_path)
    for candidate in candidates:
        if os.path.isfile(candidate):
            return candidate
    return None


def undo_likes_collection_entry(recent_posts_cache: {},
                                base_dir: str, post_filename: str,
                                object_url: str,
                                actor: str, domain: str, debug: bool,
                                post_json_object: {}) -> None:
    """Removes the like made by the given actor from the 'likes'
    collection of a post, then saves the post to post_filename.
    If post_json_object is not supplied then the post is loaded from
    post_filename. Any cached version of the post is removed first.
    object_url is not used
    """
    if not post_json_object:
        post_json_object = load_json(post_filename)
        if not post_json_object:
            return

    # the cached version of the post is removed so that the
    # like icon gets changed
    nickname = get_nickname_from_actor(actor)
    if not nickname:
        return
    cached_post_filename = \
        get_cached_post_filename(base_dir, nickname,
                                 domain, post_json_object)
    if cached_post_filename and os.path.isfile(cached_post_filename):
        try:
            os.remove(cached_post_filename)
        except OSError:
            print('EX: undo_likes_collection_entry ' +
                  'unable to delete cached post ' +
                  str(cached_post_filename))
    remove_post_from_cache(post_json_object, recent_posts_cache)

    if post_json_object.get('type') != 'Create':
        return

    # the likes are held on the object of the post if it has one
    if has_object_dict(post_json_object):
        post_obj = post_json_object['object']
    else:
        post_obj = post_json_object
    likes = post_obj.get('likes')
    if not likes or not isinstance(likes, dict):
        return
    like_items = likes.get('items')
    if not like_items:
        return
    previous_total = likes.get('totalItems') or 0

    # find the first like made by the actor
    actors_like = None
    for item in like_items:
        if item.get('actor') and item['actor'] == actor:
            actors_like = item
            break
    if actors_like is None:
        return
    if debug:
        print('DEBUG: like was removed for ' + actor)
    like_items.remove(actors_like)

    if previous_total == 1:
        # that was the only like, so drop the whole collection
        if debug:
            print('DEBUG: likes was removed from post')
        del post_obj['likes']
    else:
        likes['totalItems'] = len(like_items)

    save_json(post_json_object, post_filename)


def undo_reaction_collection_entry(recent_posts_cache: {},
                                   base_dir: str, post_filename: str,
                                   object_url: str,
                                   actor: str, domain: str, debug: bool,
                                   post_json_object: {},
                                   emoji_content: str) -> None:
    """Undoes an emoji reaction for a particular actor

    The first entry within the 'reactions' collection of the post which
    has the given actor and emoji content is removed, and the post is
    then saved to post_filename. If post_json_object is not supplied
    then the post is loaded from post_filename. Nothing is saved if the
    post is not a Create activity or if no matching reaction is found.
    object_url is not used
    """
    if not post_json_object:
        post_json_object = load_json(post_filename)
    if not post_json_object:
        return
    # remove any cached version of this post,
    # presumably so that the reaction is no longer shown
    nickname = get_nickname_from_actor(actor)
    if not nickname:
        return
    cached_post_filename = \
        get_cached_post_filename(base_dir, nickname,
                                 domain, post_json_object)
    if cached_post_filename:
        if os.path.isfile(cached_post_filename):
            try:
                os.remove(cached_post_filename)
            except OSError:
                print('EX: undo_reaction_collection_entry ' +
                      'unable to delete cached post ' +
                      str(cached_post_filename))
    remove_post_from_cache(post_json_object, recent_posts_cache)

    if not post_json_object.get('type'):
        return
    if post_json_object['type'] != 'Create':
        return
    # the reactions are held on the object of the post if it has one
    obj = post_json_object
    if has_object_dict(post_json_object):
        obj = post_json_object['object']
    if not obj.get('reactions'):
        return
    if not isinstance(obj['reactions'], dict):
        return
    if not obj['reactions'].get('items'):
        return
    total_items = 0
    if obj['reactions'].get('totalItems'):
        total_items = obj['reactions']['totalItems']
    item_found = False
    for reaction_item in obj['reactions']['items']:
        # ignore malformed entries rather than failing on them
        if not isinstance(reaction_item, dict):
            continue
        if not reaction_item.get('actor'):
            continue
        # a reaction without any content can't match, and
        # should not cause a KeyError
        if reaction_item['actor'] == actor and \
           reaction_item.get('content') == emoji_content:
            if debug:
                print('DEBUG: emoji reaction was removed for ' + actor)
            obj['reactions']['items'].remove(reaction_item)
            item_found = True
            break
    if not item_found:
        return
    if total_items == 1:
        # that was the only reaction, so drop the whole collection
        if debug:
            print('DEBUG: emoji reaction was removed from post')
        del obj['reactions']
    else:
        itlen = len(obj['reactions']['items'])
        obj['reactions']['totalItems'] = itlen

    save_json(post_json_object, post_filename)


def undo_announce_collection_entry(recent_posts_cache: {},
                                   base_dir: str, post_filename: str,
                                   actor: str, domain: str,
                                   debug: bool) -> None:
    """Undoes an announce for a particular actor by removing it from
    the "shares" collection within a post. Note that the "shares"
    collection has no relation to shared items in shares.py. It's
    shares of posts, not shares of physical objects.

    The post is loaded from post_filename and saved back to it after
    the announce has been removed. Nothing is saved if the post is not
    a Create activity, has no embedded shares collection or contains
    no announce by the given actor.
    """
    post_json_object = load_json(post_filename)
    if not post_json_object:
        return
    # remove any cached version of this announce so that the announce
    # icon is changed
    nickname = get_nickname_from_actor(actor)
    if not nickname:
        return
    cached_post_filename = \
        get_cached_post_filename(base_dir, nickname, domain,
                                 post_json_object)
    if cached_post_filename:
        if os.path.isfile(cached_post_filename):
            try:
                os.remove(cached_post_filename)
            except OSError:
                if debug:
                    print('EX: undo_announce_collection_entry ' +
                          'unable to delete cached post ' +
                          str(cached_post_filename))
    remove_post_from_cache(post_json_object, recent_posts_cache)

    if not post_json_object.get('type'):
        return
    if post_json_object['type'] != 'Create':
        return
    if not has_object_dict(post_json_object):
        if debug:
            pprint(post_json_object)
            print('DEBUG: post has no object')
        return
    shares = post_json_object['object'].get('shares')
    if not shares:
        return
    # shares might not be an embedded collection (eg. it could be a
    # url string), in which case there are no items to be edited
    if not isinstance(shares, dict):
        return
    if not shares.get('items'):
        return
    total_items = 0
    if shares.get('totalItems'):
        total_items = shares['totalItems']
    item_found = False
    for announce_item in shares['items']:
        # ignore malformed entries rather than failing on them
        if not isinstance(announce_item, dict):
            continue
        if announce_item.get('actor'):
            if announce_item['actor'] == actor:
                if debug:
                    print('DEBUG: Announce was removed for ' + actor)
                shares['items'].remove(announce_item)
                item_found = True
                break
    if not item_found:
        return
    if total_items == 1:
        # that was the only announce, so drop the whole collection
        if debug:
            print('DEBUG: shares (announcements) ' +
                  'was removed from post')
        del post_json_object['object']['shares']
    else:
        shares['totalItems'] = len(shares['items'])

    save_json(post_json_object, post_filename)


def update_announce_collection(recent_posts_cache: {},
                               base_dir: str, post_filename: str,
                               actor: str, nickname: str, domain: str,
                               debug: bool) -> None:
    """Updates the announcements collection within a post
    Confusingly this is known as "shares", but isn't the
    same as shared items within shares.py
    It's shares of posts, not shares of physical objects.

    The post is loaded from post_filename, an Announce by the given
    actor is added to the shares collection of its object (creating
    the collection if needed) and the post is saved back to
    post_filename. Nothing is saved if the actor has already announced
    the post, or if shares is not an embedded collection.
    """
    post_json_object = load_json(post_filename)
    if not post_json_object:
        return
    # remove any cached version of this announce so that the announce
    # icon is changed
    cached_post_filename = \
        get_cached_post_filename(base_dir, nickname, domain,
                                 post_json_object)
    if cached_post_filename:
        if os.path.isfile(cached_post_filename):
            try:
                os.remove(cached_post_filename)
            except OSError:
                if debug:
                    print('EX: update_announce_collection ' +
                          'unable to delete cached post ' +
                          str(cached_post_filename))
    remove_post_from_cache(post_json_object, recent_posts_cache)

    if not has_object_dict(post_json_object):
        if debug:
            pprint(post_json_object)
            print('DEBUG: post ' + post_filename + ' has no object')
        return
    post_url = remove_id_ending(post_json_object['id']) + '/shares'
    shares = post_json_object['object'].get('shares')
    if not shares:
        if debug:
            print('DEBUG: Adding initial shares (announcements) to ' +
                  post_url)
        announcements_json = {
            "@context": "https://www.w3.org/ns/activitystreams",
            'id': post_url,
            'type': 'Collection',
            "totalItems": 1,
            'items': [{
                'type': 'Announce',
                'actor': actor
            }]
        }
        post_json_object['object']['shares'] = announcements_json
    elif not isinstance(shares, dict):
        # shares might not be an embedded collection (eg. it could be
        # a url string), so there is no items list to append to
        if debug:
            print('DEBUG: shares (announcements) section of post ' +
                  'is not a collection')
        return
    elif shares.get('items'):
        for announce_item in shares['items']:
            # ignore malformed entries rather than failing on them
            if not isinstance(announce_item, dict):
                continue
            if announce_item.get('actor'):
                if announce_item['actor'] == actor:
                    # this actor has already announced the post
                    return
        new_announce = {
            'type': 'Announce',
            'actor': actor
        }
        shares['items'].append(new_announce)
        shares['totalItems'] = len(shares['items'])
    else:
        if debug:
            print('DEBUG: shares (announcements) section of post ' +
                  'has no items list')

    if debug:
        print('DEBUG: saving post with shares (announcements) added')
        pprint(post_json_object)
    save_json(post_json_object, post_filename)


def week_day_of_month_start(month_number: int, year: int) -> int:
    """Returns the day of the week on which the given month begins,
    numbered from 1=sun through to 7=sat
    """
    month_start = datetime.datetime(year, month_number, 1, 0, 0)
    # isoweekday has mon=1 ... sun=7, so wrap sunday around to the start
    return month_start.isoweekday() % 7 + 1


def media_file_mime_type(filename: str) -> str:
    """Given a media filename return its mime type

    The mime type is chosen from the file extension, ignoring its case.
    image/png is returned if the filename has no extension or if the
    extension is not recognized
    """
    default_mime_type = 'image/png'
    if '.' not in filename:
        return default_mime_type
    extensions = {
        'json': 'application/json',
        'png': 'image/png',
        'jpg': 'image/jpeg',
        'jxl': 'image/jxl',
        'jpeg': 'image/jpeg',
        'gif': 'image/gif',
        'svg': 'image/svg+xml',
        'webp': 'image/webp',
        'avif': 'image/avif',
        'heic': 'image/heic',
        'ico': 'image/x-icon',
        'mp3': 'audio/mpeg',
        'ogg': 'audio/ogg',
        'wav': 'audio/vnd.wave',
        'opus': 'audio/opus',
        'spx': 'audio/speex',
        'flac': 'audio/flac',
        'mp4': 'video/mp4',
        'ogv': 'video/ogv'
    }
    # extensions are matched without regard to case, eg. photo.JPG
    file_ext = filename.rsplit('.', 1)[-1].lower()
    return extensions.get(file_ext, default_mime_type)


def is_recent_post(post_json_object: {}, max_days: int) -> bool:
    """ Is the given post recent?

    Returns True if the published date of the post's object is no more
    than max_days days before the current UTC date. False is returned
    if the post has no object dict, has no published date string or
    if the date can't be parsed
    """
    if not has_object_dict(post_json_object):
        return False
    published_date_str = post_json_object['object'].get('published')
    if not published_date_str:
        return False
    if not isinstance(published_date_str, str):
        return False
    epoch = datetime.datetime(1970, 1, 1)
    curr_time = datetime.datetime.utcnow()
    recently = (curr_time - epoch).days - max_days

    # drop any fractional seconds, which the date format doesn't accept
    if '.' in published_date_str:
        published_date_str = published_date_str.split('.')[0] + 'Z'
    try:
        published_date = \
            datetime.datetime.strptime(published_date_str,
                                       "%Y-%m-%dT%H:%M:%SZ")
    except ValueError:
        # only a parse failure is handled here, so that
        # KeyboardInterrupt and SystemExit are not swallowed
        print('EX: is_recent_post unrecognized published date ' +
              str(published_date_str))
        return False

    published_days_since_epoch = (published_date - epoch).days
    return published_days_since_epoch >= recently


def camel_case_split(text: str) -> str:
    """Inserts a space at each word boundary within CamelCase text,
    such that "CamelCase" becomes "Camel Case"
    """
    word_pattern = '.+?(?:(?<=[a-z])(?=[A-Z])|' + \
        '(?<=[A-Z])(?=[A-Z][a-z])|$)'
    words = [match.group(0) for match in re.finditer(word_pattern, text)]
    return ' '.join(words).strip()


def convert_to_snake_case(text: str) -> str:
    """Converts CamelCase text into lower case words
    which are joined by underscores
    """
    spaced_words = camel_case_split(text)
    return '_'.join(spaced_words.lower().split(' '))


def _convert_to_camel_case(text: str) -> str:
    """Converts a snake case string to camel case
    Text without any underscores is returned unchanged
    """
    first_word, *other_words = text.split('_')
    if not other_words:
        # there were no underscores, so there is nothing to convert
        return text
    return first_word.lower() + ''.join(wrd.title() for wrd in other_words)


def reject_post_id(base_dir: str, nickname: str, domain: str,
                   post_id: str, recent_posts_cache: {}) -> None:
    """ Marks the given post as rejected, for example an announce
    which is too old. A file with the '.reject' extension is created
    next to the post, and any json or html held for the post within
    the recent posts cache is removed
    """
    post_filename = locate_post(base_dir, nickname, domain, post_id)
    if not post_filename:
        return

    cache_index = recent_posts_cache.get('index')
    if cache_index:
        # The cache entry for a post should correspond to its filename
        # without any directories or extension
        cache_key = remove_eol(post_filename.rsplit('/', 1)[-1])
        cache_key = cache_key.replace('.json', '').strip()

        if cache_key in cache_index:
            for section in ('json', 'html'):
                if recent_posts_cache[section].get(cache_key):
                    del recent_posts_cache[section][cache_key]

    reject_filename = post_filename + '.reject'
    with open(reject_filename, 'w+', encoding='utf-8') as reject_file:
        reject_file.write('\n')


def is_chat_message(post_json_object: {}) -> bool:
    """Returns true if the given post is a Create activity
    whose object has the ChatMessage type
    Note that is_dm should be checked before calling this
    """
    if post_json_object['type'] == 'Create' and \
       has_object_dict(post_json_object):
        return post_json_object['object']['type'] == 'ChatMessage'
    return False


def is_reply(post_json_object: {}, actor: str) -> bool:
    """Returns true if the given post is a reply to the given actor,
    which means that either its inReplyTo begins with the actor url
    or the actor appears within the href of one of its Mention tags
    """
    if post_json_object['type'] != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    post_obj = post_json_object['object']
    if post_obj.get('moderationStatus'):
        return False
    reply_types = (
        'Note', 'Page', 'EncryptedMessage', 'ChatMessage', 'Article'
    )
    if post_obj['type'] not in reply_types:
        return False

    # direct reply to a post made by the actor
    in_reply_to = post_obj.get('inReplyTo')
    if in_reply_to and isinstance(in_reply_to, str):
        if in_reply_to.startswith(actor):
            return True

    # otherwise look for a mention of the actor
    tags = post_obj.get('tag')
    if not tags or not isinstance(tags, list):
        return False
    for tag in tags:
        if tag.get('type') != 'Mention':
            continue
        mention_href = tag.get('href')
        if mention_href and actor in mention_href:
            return True
    return False


def contains_pgp_public_key(content: str) -> bool:
    """Returns true if the given content has both the begin and end
    markers of a PGP public key block
    """
    key_markers = (
        '--BEGIN PGP PUBLIC KEY BLOCK--',
        '--END PGP PUBLIC KEY BLOCK--'
    )
    return all(marker in content for marker in key_markers)


def is_pgp_encrypted(content: str) -> bool:
    """Returns true if the given content has both the begin and end
    markers of a PGP message
    """
    message_markers = ('--BEGIN PGP MESSAGE--', '--END PGP MESSAGE--')
    return all(marker in content for marker in message_markers)


def invalid_ciphertext(content: str) -> bool:
    """Returns true if the given content has a begin or end marker
    but is neither a PGP public key nor a PGP encrypted message
    """
    if '----BEGIN ' not in content and '----END ' not in content:
        return False
    if contains_pgp_public_key(content):
        return False
    if is_pgp_encrypted(content):
        return False
    return True


def load_translations_from_file(base_dir: str, language: str) -> ({}, str):
    """Loads the translations for the given language, returning the
    translations dictionary together with the language code used.
    The system default locale is used if no language is given, and
    English is the fallback when there is no matching translations file.
    Returns None, None if the translations directory doesn't exist
    """
    translations_dir = base_dir + '/translations'
    if not os.path.isdir(translations_dir):
        print('ERROR: translations directory not found')
        return None, None

    system_language = language
    if not system_language:
        system_language = locale.getdefaultlocale()[0]
    if not system_language:
        system_language = 'en'

    # reduce the language down to its leading code,
    # dropping any region, path or encoding parts
    if '_' in system_language:
        system_language = system_language.split('_')[0]
    if '/' in system_language:
        # the second field never contains a separator,
        # so one pass is enough
        system_language = system_language.split('/')[1]
    if '.' in system_language:
        system_language = system_language.split('.')[0]

    translations_file = translations_dir + '/' + system_language + '.json'
    if not os.path.isfile(translations_file):
        system_language = 'en'
        translations_file = translations_dir + '/' + system_language + '.json'
    return load_json(translations_file), system_language


def dm_allowed_from_domain(base_dir: str,
                           nickname: str, domain: str,
                           sending_actor_domain: str) -> bool:
    """Returns true if the sending domain is listed within the
    dmAllowedInstances.txt file of the account.
    When a DM is received and the .followDMs flag file exists
    then some domains can optionally be allowed regardless of
    individual follows, i.e. mostly you only want DMs from followers
    but there are a few particular instances that you trust
    """
    dm_allowed_instances_file = \
        acct_dir(base_dir, nickname, domain) + '/dmAllowedInstances.txt'
    if os.path.isfile(dm_allowed_instances_file) and \
       text_in_file(sending_actor_domain + '\n', dm_allowed_instances_file):
        return True
    return False


def get_occupation_skills(actor_json: {}) -> []:
    """Returns the skills list from the first Occupation of an actor
    which has any skills. A single skill string is returned as a list
    of one item, and an empty list is returned if there are no skills
    """
    if 'hasOccupation' not in actor_json:
        return []
    occupations = actor_json['hasOccupation']
    if not isinstance(occupations, list):
        return []
    for occupation in occupations:
        if not isinstance(occupation, dict):
            continue
        if occupation.get('@type') != 'Occupation':
            continue
        skills = occupation.get('skills')
        if not skills:
            continue
        if isinstance(skills, list):
            return skills
        if isinstance(skills, str):
            return [skills]
        # skills of some other type end the search
        return []
    return []


def get_occupation_name(actor_json: {}) -> str:
    """Returns the name of the first Occupation of an actor which
    has a name, or an empty string if there isn't one
    """
    occupations = actor_json.get('hasOccupation')
    if not occupations or not isinstance(occupations, list):
        return ""
    for occupation in occupations:
        if not isinstance(occupation, dict):
            continue
        if occupation.get('@type') != 'Occupation':
            continue
        occupation_name = occupation.get('name')
        if not occupation_name:
            continue
        if isinstance(occupation_name, str):
            return occupation_name
        # a name which isn't a string ends the search
        return ""
    return ""


def set_occupation_name(actor_json: {}, name: str) -> bool:
    """Sets the name on the first Occupation of an actor
    Returns true if an Occupation was found and updated
    """
    occupations = actor_json.get('hasOccupation')
    if not occupations or not isinstance(occupations, list):
        return False
    for occupation in occupations:
        if not isinstance(occupation, dict):
            continue
        if occupation.get('@type') != 'Occupation':
            continue
        occupation['name'] = name
        return True
    return False


def set_occupation_skills_list(actor_json: {}, skills_list: []) -> bool:
    """Sets the skills on the first Occupation of an actor
    Returns true if an Occupation was found and updated
    """
    if 'hasOccupation' not in actor_json:
        return False
    occupations = actor_json['hasOccupation']
    if not isinstance(occupations, list):
        return False
    for occupation in occupations:
        if not isinstance(occupation, dict):
            continue
        if occupation.get('@type') != 'Occupation':
            continue
        occupation['skills'] = skills_list
        return True
    return False


def is_account_dir(dir_name: str) -> bool:
    """Is the given directory an account within /accounts ?
    Account directories contain an @ character, but the inbox@, news@
    and Actor@ directories are not counted as accounts
    """
    if '@' not in dir_name:
        return False
    non_accounts = ('inbox@', 'news@', 'Actor@')
    return not any(excluded in dir_name for excluded in non_accounts)


def permitted_dir(path: str) -> bool:
    """Returns false for the special paths which should not be
       accessible directly via GET or POST
    """
    forbidden_prefixes = ('/wfendpoints', '/keys', '/accounts')
    return not path.startswith(forbidden_prefixes)


def user_agent_domain(user_agent: str, debug: bool) -> str:
    """Returns the domain of the first url within the User-Agent string
    None is returned if there is no http(s) url, or if
    what follows the url prefix doesn't contain a dot
    """
    # a https url takes priority over a http one
    if 'https://' in user_agent:
        url_prefix = 'https://'
    elif 'http://' in user_agent:
        url_prefix = 'http://'
    else:
        return None
    agent_domain = user_agent.split(url_prefix)[1].strip()
    # discard any path after the domain
    agent_domain = agent_domain.split('/')[0]
    if ')' in agent_domain:
        agent_domain = agent_domain.split(')')[0].strip()
    agent_domain = agent_domain.replace(' ', '').replace(';', '')
    if '.' not in agent_domain:
        return None
    if debug:
        print('User-Agent Domain: ' + agent_domain)
    return agent_domain


def get_alt_path(actor: str, domain_full: str, calling_domain: str) -> str:
    """Returns the actor url as seen from an onion or i2p calling domain
    eg. https://clearnetdomain/path becomes http://oniondomain/path
    The actor is returned unchanged in all other cases
    """
    if calling_domain in actor or domain_full not in actor:
        return actor
    if not calling_domain.endswith(('.onion', '.i2p')):
        return actor
    post_actor = 'http://' + calling_domain + actor.split(domain_full)[1]
    print('Changed POST domain from ' + actor + ' to ' + post_actor)
    return post_actor


def get_actor_property_url(actor_json: {}, property_name: str) -> str:
    """Returns the url of the first PropertyValue attachment of an actor
    whose name begins with the given property name, ignoring case.
    The url has to begin with a known protocol prefix, contain a dot
    and have no spaces or commas. An empty string is returned if no
    such attachment exists
    """
    if not actor_json.get('attachment'):
        return ''
    property_name = property_name.lower()
    for property_value in actor_json['attachment']:
        name_value = \
            property_value.get('name') or property_value.get('schema:name')
        if not name_value:
            continue
        if not name_value.lower().startswith(property_name):
            continue
        if not property_value.get('type'):
            continue
        prop_value_name, _ = \
            get_attachment_property_value(property_value)
        if not prop_value_name:
            continue
        if not property_value['type'].endswith('PropertyValue'):
            continue
        # note that this stores a stripped copy under the 'value' key
        property_value['value'] = property_value[prop_value_name].strip()
        url = property_value[prop_value_name]
        prefixes = get_protocol_prefixes()
        if not any(url.startswith(prefix) for prefix in prefixes):
            continue
        if '.' not in url or ' ' in url or ',' in url:
            continue
        return url
    return ''


def remove_domain_port(domain: str) -> str:
    """Returns the domain without any port number appended to it
    eg. mydomain.com:80 becomes mydomain.com
    Domains beginning with did: are returned unchanged
    """
    if ':' not in domain or domain.startswith('did:'):
        return domain
    return domain.split(':')[0]


def get_port_from_domain(domain: str) -> int:
    """Returns the port number appended to the domain
    eg. mydomain.com:80 returns 80
    None is returned if there is no numeric port, or if
    the domain begins with did:
    """
    if ':' not in domain or domain.startswith('did:'):
        return None
    port_str = domain.split(':')[1]
    return int(port_str) if port_str.isdigit() else None


def valid_url_prefix(url: str) -> bool:
    """Returns true if the url contains a slash and
    begins with one of the accepted protocol prefixes
    """
    prefixes = ('https:', 'http:', 'hyper:', 'i2p:', 'gnunet:')
    return '/' in url and url.startswith(prefixes)


def valid_password(password: str) -> bool:
    """Returns true if the given password is valid,
    which means having at least 8 characters
    """
    return len(password) >= 8


def is_float(value) -> bool:
    """Is the given value a float?

    Returns True if float(value) succeeds, otherwise False. Values
    which can't be converted at all, such as None or a list, and
    integers too large to be represented also give False
    """
    try:
        float(value)
    except (ValueError, TypeError, OverflowError):
        # ValueError: unparseable string
        # TypeError: unsupported type, eg. None
        # OverflowError: integer too large for a float
        return False
    return True


def date_string_to_seconds(date_str: str) -> int:
    """Converts a date string (eg "published") into seconds since epoch

    The string has to be in the format YYYY-MM-DDTHH:MM:SSZ
    None is returned if it can't be parsed
    """
    try:
        expiry_time = \
            datetime.datetime.strptime(date_str, '%Y-%m-%dT%H:%M:%SZ')
    except (ValueError, TypeError):
        # ValueError: the string doesn't match the format
        # TypeError: not a string at all, eg. None
        # Nothing broader is caught, so that KeyboardInterrupt and
        # SystemExit are not swallowed
        print('EX: date_string_to_seconds unable to parse date ' +
              str(date_str))
        return None
    # NOTE: the parsed datetime is naive, so timestamp() interprets it
    # as local time, which pairs with the use of fromtimestamp()
    # within date_seconds_to_string
    return int(datetime.datetime.timestamp(expiry_time))


def date_seconds_to_string(date_sec: int) -> str:
    """Converts a number of seconds since epoch into
    a date string having the format YYYY-MM-DDTHH:MM:SSZ
    """
    date_format = "%Y-%m-%dT%H:%M:%SZ"
    return datetime.datetime.fromtimestamp(date_sec).strftime(date_format)


def has_group_type(base_dir: str, actor: str, person_cache: {},
                   debug: bool = False) -> bool:
    """Returns true if the given actor url is that of a group
    """
    # a group path within the actor url clearly indicates a group
    # eg. https://lemmy/c/groupname
    for grp_path in get_group_paths():
        if grp_path not in actor:
            continue
        if debug:
            print('grpPath ' + grp_path + ' in ' + actor)
        return True
    # otherwise examine any cached actor for the Group type
    return is_group_actor(base_dir, actor, person_cache, debug)


def is_group_actor(base_dir: str, actor: str, person_cache: {},
                   debug: bool = False) -> bool:
    """Returns true if the given actor has the Group type, using the
    actor held within the person cache if there is one and otherwise
    the actor file cached under base_dir
    """
    cached_entry = person_cache.get(actor) if person_cache else None
    cached_actor_json = cached_entry.get('actor') if cached_entry else None
    if cached_actor_json:
        # the in-memory actor decides, without looking at any file
        if cached_actor_json.get('type') == 'Group':
            if debug:
                print('Cached actor ' + actor + ' has Group type')
            return True
        return False

    if debug:
        print('Actor ' + actor + ' not in cache')
    cached_actor_filename = \
        base_dir + '/cache/actors/' + actor.replace('/', '#') + '.json'
    if not os.path.isfile(cached_actor_filename):
        if debug:
            print('Cached actor file not found ' + cached_actor_filename)
        return False
    if not text_in_file('"type": "Group"', cached_actor_filename):
        return False
    if debug:
        print('Group type found in ' + cached_actor_filename)
    return True


def is_group_account(base_dir: str, nickname: str, domain: str) -> bool:
    """Returns true if the json file of the given account
    exists and contains the Group type
    """
    account_filename = acct_dir(base_dir, nickname, domain) + '.json'
    if os.path.isfile(account_filename) and \
       text_in_file('"type": "Group"', account_filename):
        return True
    return False


def get_currencies() -> {}:
    """Returns a dictionary of currencies.
    Each key is a currency symbol as it might be typed within a price
    and each value is the corresponding three letter currency code
    """
    return {
        "CA$": "CAD",
        "J$": "JMD",
        "£": "GBP",
        "€": "EUR",
        "؋": "AFN",
        "ƒ": "AWG",
        "₼": "AZN",
        "Br": "BYN",
        "BZ$": "BZD",
        "$b": "BOB",
        "KM": "BAM",
        "P": "BWP",
        "лв": "BGN",
        "R$": "BRL",
        "៛": "KHR",
        "$U": "UYU",
        "RD$": "DOP",
        "$": "USD",
        "₡": "CRC",
        "kn": "HRK",
        "₱": "CUP",
        "Kč": "CZK",
        "kr": "NOK",
        "¢": "GHS",
        "Q": "GTQ",
        "L": "HNL",
        "Ft": "HUF",
        "Rp": "IDR",
        "₹": "INR",
        "﷼": "IRR",
        "₪": "ILS",
        "¥": "JPY",
        "₩": "KRW",
        "₭": "LAK",
        "ден": "MKD",
        "RM": "MYR",
        "₨": "MUR",
        "₮": "MNT",
        "MT": "MZN",
        "C$": "NIO",
        "₦": "NGN",
        "Gs": "PYG",
        "zł": "PLN",
        "lei": "RON",
        "₽": "RUB",
        "Дин": "RSD",
        "S": "SOS",
        "R": "ZAR",
        "CHF": "CHF",
        "NT$": "TWD",
        "฿": "THB",
        "TT$": "TTD",
        "₴": "UAH",
        "Bs": "VEB",
        "₫": "VND",
        # Zimbabwe dollar. This was previously ZQD, which is not a
        # currency code
        "Z$": "ZWD"
    }


def get_supported_languages(base_dir: str) -> []:
    """Returns the two letter language codes for which a json file
    exists directly within the translations directory
    """
    # only the top level of the translations directory is examined
    _, _, filenames = \
        next(os.walk(base_dir + '/translations'), (None, [], []))
    return [fname.split('.')[0] for fname in filenames
            if fname.endswith('.json') and len(fname.split('.')[0]) == 2]


def get_category_types(base_dir: str) -> []:
    """Returns the names of the ontologies found directly within the
    ontology directory, with the Types part of each filename removed
    """
    # only the top level of the ontology directory is examined
    _, _, filenames = next(os.walk(base_dir + '/ontology'), (None, [], []))
    found = []
    for fname in filenames:
        if not fname.endswith('.json') or fname.startswith('custom'):
            continue
        # skip filenames containing a hash or tilde
        if '#' in fname or '~' in fname:
            continue
        ontology_name = fname.split('.')[0]
        if 'Types' not in ontology_name:
            continue
        found.append(ontology_name.replace('Types', ''))
    return found


def get_shares_files_list() -> []:
    """Returns the names of the files in which shared items
    may be stored
    """
    shares_file_types = ('shares', 'wanted')
    return shares_file_types


def replace_users_with_at(actor: str) -> str:
    """Converts an actor url into its @ form
    eg. https://domain/users/nick becomes https://domain/@nick
    """
    for users_path in get_user_paths():
        if users_path not in actor:
            continue
        # only the first matching path is considered, and urls
        # containing /@/ are returned unchanged
        if '/@/' in actor:
            return actor
        return actor.replace(users_path, '/@')
    return actor


def has_actor(post_json_object: {}, debug: bool) -> bool:
    """Returns true if the given post has an actor field whose
    value does not contain a hash character
    """
    actor = post_json_object.get('actor')
    if actor:
        return '#' not in actor
    if debug and post_json_object.get('type'):
        msg = post_json_object['type'] + ' has missing actor'
        post_id = post_json_object.get('id')
        if post_id:
            msg = msg + ' ' + post_id
        print(msg)
    return False


def has_object_string_type(post_json_object: {}, debug: bool) -> bool:
    """Does the given post have a type field within an object dict?
    Returns true only if the post contains an object dict which has a
    type field whose value is a string.
    Diagnostics are only printed when debug is true
    """
    if not has_object_dict(post_json_object):
        if debug:
            print('has_object_string_type no object found')
        return False
    object_type = post_json_object['object'].get('type')
    if object_type:
        if isinstance(object_type, str):
            return True
        # like the other has_object_ functions, only report
        # this when debugging
        if debug and post_json_object.get('type'):
            print('DEBUG: ' + str(post_json_object['type']) +
                  ' type within object is not a string ' +
                  str(post_json_object))
    if debug:
        # the post may have no id, so don't index it directly
        print('No type field within object ' +
              str(post_json_object.get('id', '')))
    return False


def has_object_string_object(post_json_object: {}, debug: bool) -> bool:
    """Does the given post have an object string field within an object dict?
    Returns true only if the post contains an object dict which itself
    has an object field whose value is a string.
    Diagnostics are only printed when debug is true
    """
    if not has_object_dict(post_json_object):
        if debug:
            print('has_object_string_object no object found')
        return False
    inner_object = post_json_object['object'].get('object')
    if inner_object:
        if isinstance(inner_object, str):
            return True
        if debug and post_json_object.get('type'):
            print('DEBUG: ' + str(post_json_object['type']) +
                  ' object within dict is not a string')
    if debug:
        # the post may have no id, so don't index it directly
        print('No object field within dict ' +
              str(post_json_object.get('id', '')))
    return False


def has_object_string(post_json_object: {}, debug: bool) -> bool:
    """Does the given post have an object string field?
    Returns true only if the post has an object field whose value
    is a string.
    Diagnostics are only printed when debug is true
    """
    post_object = post_json_object.get('object')
    if post_object:
        if isinstance(post_object, str):
            return True
        if debug and post_json_object.get('type'):
            print('DEBUG: ' + str(post_json_object['type']) +
                  ' object is not a string')
    if debug:
        # the post may have no id, so don't index it directly
        print('No object field within post ' +
              str(post_json_object.get('id', '')))
    return False


def get_new_post_endpoints() -> []:
    """Returns the names of the endpoints which can be used
    to create or edit posts
    """
    endpoints = (
        'newpost', 'newblog', 'newunlisted', 'newfollowers',
        'newdm', 'newreminder', 'newreport', 'newquestion',
        'newshare', 'newwanted', 'editblogpost'
    )
    return endpoints


def get_fav_filename_from_url(base_dir: str, favicon_url: str) -> str:
    """Returns the filename within the favicons directory at which
    the favicon having the given url is cached
    """
    url_path = favicon_url
    if '://' in url_path:
        # drop the protocol prefix
        url_path = url_path.split('://')[1]
    # domain/favicon.ext becomes domain.ext and any remaining
    # slashes are flattened into dashes
    flattened = url_path.replace('/favicon.', '.').replace('/', '-')
    return base_dir + '/favicons/' + flattened


def valid_hash_tag(hashtag: str) -> bool:
    """Returns true if the given hashtag is short enough, is not just
    a number and contains only valid characters
    """
    # long hashtags and numbers are not valid
    if len(hashtag) >= 32 or hashtag.isdigit():
        return False
    if all(tag_ch in VALID_HASHTAG_CHARS for tag_ch in hashtag):
        return True
    # otherwise fall back to the language check
    if _is_valid_language(hashtag):
        return True
    return False


def convert_published_to_local_timezone(published, timezone: str) -> str:
    """Converts a post published time into local time.
    published is a datetime which is taken to be UTC. Any tzinfo
    which it already has is overwritten rather than converted.
    timezone is the name of the timezone to convert to.
    Returns the datetime within the given timezone, or published
    unchanged if no timezone was given or if it could not be resolved
    """
    if not timezone:
        return published

    try:
        to_zone = tz.gettz(timezone)
    except Exception as ex:
        print('EX: convert_published_to_local_timezone ' +
              'unable to resolve timezone ' + str(timezone) + ' ' + str(ex))
        to_zone = None
    if to_zone is None:
        # Unknown timezone name. Converting with a tz of None would
        # silently use the timezone of the server instead
        return published

    utc = published.replace(tzinfo=tz.gettz('UTC'))
    return utc.astimezone(to_zone)


def load_account_timezones(base_dir: str) -> {}:
    """Returns a dictionary mapping the nickname of each account to
    the contents of its timezone.txt file, where that file exists
    and is not empty
    """
    accounts_dir = base_dir + '/accounts'
    # only the immediate subdirectories of accounts are of interest
    _, acct_names, _ = next(os.walk(accounts_dir), (None, [], []))
    timezones = {}
    for acct in acct_names:
        if '@' not in acct or acct.startswith(('inbox@', 'Actor@')):
            continue
        tz_filename = os.path.join(accounts_dir, acct) + '/timezone.txt'
        if not os.path.isfile(tz_filename):
            continue
        with open(tz_filename, 'r', encoding='utf-8') as fp_timezone:
            preferred = fp_timezone.read().strip()
        if preferred:
            timezones[acct.split('@')[0]] = preferred
    return timezones


def load_bold_reading(base_dir: str) -> {}:
    """Returns a dictionary whose keys are the nicknames of the
    accounts which have a .boldReading file
    """
    accounts_dir = base_dir + '/accounts'
    # only the immediate subdirectories of accounts are of interest
    _, acct_names, _ = next(os.walk(accounts_dir), (None, [], []))
    flagged = {}
    for acct in acct_names:
        if '@' not in acct or acct.startswith(('inbox@', 'Actor@')):
            continue
        if os.path.isfile(accounts_dir + '/' + acct + '/.boldReading'):
            flagged[acct.split('@')[0]] = True
    return flagged


def get_account_timezone(base_dir: str, nickname: str, domain: str) -> str:
    """Returns the contents of the timezone.txt file for the given
    account with surrounding whitespace removed, or None if the
    file does not exist
    """
    tz_filename = \
        acct_dir(base_dir, nickname, domain) + '/timezone.txt'
    if os.path.isfile(tz_filename):
        with open(tz_filename, 'r', encoding='utf-8') as fp_timezone:
            return fp_timezone.read().strip()
    return None


def set_account_timezone(base_dir: str, nickname: str, domain: str,
                         timezone: str) -> None:
    """Stores the given timezone, with surrounding whitespace removed,
    within the timezone.txt file for the given account
    """
    account_directory = acct_dir(base_dir, nickname, domain)
    tz_filename = account_directory + '/timezone.txt'
    stripped_timezone = timezone.strip()
    with open(tz_filename, 'w+', encoding='utf-8') as fp_timezone:
        fp_timezone.write(stripped_timezone)


def is_onion_request(calling_domain: str, referer_domain: str,
                     domain: str, onion_domain: str) -> bool:
    """Returns true if this instance has an onion domain and the
    given domains indicate that the request came via an onion address
    """
    if not onion_domain:
        return False
    if domain == onion_domain or calling_domain.endswith('.onion'):
        return True
    # the referer is optional
    return bool(referer_domain) and referer_domain.endswith('.onion')


def is_i2p_request(calling_domain: str, referer_domain: str,
                   domain: str, i2p_domain: str) -> bool:
    """Returns true if this instance has an i2p domain and the
    given domains indicate that the request came via an i2p address
    """
    if not i2p_domain:
        return False
    if domain == i2p_domain or calling_domain.endswith('.i2p'):
        return True
    # the referer is optional
    return bool(referer_domain) and referer_domain.endswith('.i2p')


def disallow_announce(content: str, attachment: [], capabilities: {}) -> bool:
    """Returns true if the given post should not be announced/boosted.
    This is the case if its announce capability is not public, if its
    content contains a no boost marker, or if it has an attached image
    without a description
    """
    # pixelfed style capabilities
    announce_capability = capabilities.get('announce')
    if announce_capability and isinstance(announce_capability, str) and \
       not announce_capability.endswith('#Public'):
        # TODO handle non-public announce permissions
        print('CAPABILITIES: announce ' + announce_capability)
        return True

    # emoji names and phrases asking for the post not to be boosted
    no_boost_markers = (
        ':boost_no:', ':noboost:', ':noboosts:',
        ':no_boost:', ':no_boosts:', ':boosts_no:',
        'dont_repeat', 'dont_announce', 'dont_boost',
        'do not boost', "don't boost",
        'boost_denied', 'boosts_denied',
        'boostdenied', 'boostsdenied'
    )
    lowered_content = content.lower()
    if any(marker in lowered_content for marker in no_boost_markers):
        return True

    # check for attached images without descriptions
    if not isinstance(attachment, list):
        return False
    for attached in attachment:
        if not isinstance(attached, dict):
            continue
        if not (attached.get('mediaType') and attached.get('url')):
            continue
        if attached['mediaType'].startswith('image/') and \
           not attached.get('name'):
            # no image description
            return True
    return False


def disallow_reply(content: str) -> bool:
    """Returns true if the given post content contains an emoji name
    or phrase asking for there to be no replies
    """
    no_reply_markers = (
        ':reply_no:', ':noreply:', ':noreplies:',
        ':no_reply:', ':no_replies:', ':replies_no:',
        'dont_at_me', 'do not reply', "don't reply",
        "don't @ me", 'dont@me', 'dontatme'
    )
    lowered_content = content.lower()
    return any(marker in lowered_content for marker in no_reply_markers)


def get_attachment_property_value(property_value: {}) -> (str, str):
    """Returns the name of the field containing the value of an
    attachment property together with the value itself.
    Both are None if none of the known fields has a value
    """
    # in order of preference
    candidate_fields = (
        'value',
        'http://schema.org#value',
        'https://schema.org#value',
        'href'
    )
    for field_name in candidate_fields:
        field_value = property_value.get(field_name)
        if field_value:
            return field_name, field_value
    return None, None


def safe_system_string(text: str) -> str:
    """Returns a safe version of a string which can be used within a
    system command.
    Backticks are removed and every $( is reduced to ( so that the
    returned string contains neither form of command substitution
    """
    # remove backticks first, since doing so can bring a $ and a (
    # together, eg. $`(
    text = text.replace('`', '')
    # a single replacement pass is not enough, because $$( becomes $(
    while '$(' in text:
        text = text.replace('$(', '(')
    return text


def get_json_content_from_accept(accept: str) -> str:
    """Returns the json content type to use for the given Accept
    header value, which is ld+json only if that was asked for
    """
    if accept and 'application/ld+json' in accept:
        return 'application/ld+json'
    return 'application/json'


def remove_inverted_text(text: str, system_language: str) -> str:
    """Replaces upside down characters with ordinary letters, and
    reverses any paragraph in which more than two different upside
    down characters were found.
    The text is only altered if the system language is English
    """
    if system_language != 'en':
        return text

    # The glyph at position N within each table is the upside down
    # form of the letter which is N places before z or Z.
    # Underscores mark letters having no upside down form
    glyph_tables = (
        (ord('z'), "_ʎ_ʍʌ_ʇ_ɹ____ɯʃʞɾıɥƃɟǝ_ɔ_ɐ"),
        (ord('Z'), "_⅄__ᴧ∩⊥_ᴚΌԀ_ᴎ_⅂⋊ſ__⅁ℲƎ◖Ↄ𐐒∀")
    )

    if '</p>' in text:
        # html paragraphs
        text = text.replace('<p>', '')
        prefix, separator = '<p>', '</p>'
    else:
        # plain text lines
        prefix, separator = '', '\n'
    append_separator = separator in text

    pieces = []
    for para in text.split(separator):
        glyphs_found = 0
        for last_letter, glyphs in glyph_tables:
            for position, glyph in enumerate(glyphs):
                if glyph == '_' or glyph not in para:
                    continue
                para = para.replace(glyph, chr(last_letter - position))
                glyphs_found += 1

        # upside down text is also written backwards
        if glyphs_found > 2:
            para = para[::-1]
        if not para:
            continue
        pieces.append(prefix + para)
        if append_separator:
            pieces.append(separator)

    return ''.join(pieces)


def remove_square_capitals(text: str, system_language: str) -> str:
    """Removes any square capital text from the given string.
    Each of the 26 characters beginning at the squared letter A is
    replaced by the corresponding ordinary capital letter, and all
    other characters are left as they are.
    The text is only altered if the system language is English
    """
    if system_language != 'en':
        return text
    offset = ord('A')
    start_value = ord('🅰')
    # exclusive upper bound. Previously the character after squared Z
    # was also converted, into an open square bracket
    end_value = start_value + 26
    return ''.join(
        chr(offset + ord(text_ch) - start_value)
        if start_value <= ord(text_ch) < end_value else text_ch
        for text_ch in text)


def dont_speak_hashtags(content: str) -> str:
    """Wraps the hash character of each hashtag link within an
    aria-hidden span, so that screen readers don't announce it
    """
    if content:
        return content.replace('>#<span',
                               '><span aria-hidden="true">#</span><span')
    return content


def load_min_images_for_accounts(base_dir: str) -> []:
    """Returns the nicknames of the accounts which have a
    .minimize_all_images file, indicating that all images should
    be minimized by default
    """
    accounts_dir = base_dir + '/accounts'
    # only the immediate subdirectories of accounts are of interest
    top_dir, acct_names, _ = \
        next(os.walk(accounts_dir), (accounts_dir, [], []))
    nicknames = []
    for account in acct_names:
        if not is_account_dir(account):
            continue
        flag_filename = \
            os.path.join(top_dir, account) + '/.minimize_all_images'
        if os.path.isfile(flag_filename):
            nicknames.append(account.split('@')[0])
    return nicknames


def set_minimize_all_images(base_dir: str,
                            nickname: str, domain: str,
                            minimize: bool,
                            min_images_for_accounts: []) -> None:
    """Adds or removes the file indicating that all images for an
    account should be minimized by default, and updates the given
    list of nicknames to match
    """
    flag_filename = \
        acct_dir(base_dir, nickname, domain) + '/.minimize_all_images'

    if not minimize:
        if nickname in min_images_for_accounts:
            min_images_for_accounts.remove(nickname)
        if os.path.isfile(flag_filename):
            try:
                os.remove(flag_filename)
            except OSError:
                print('EX: unable to delete ' + flag_filename)
        return

    if nickname not in min_images_for_accounts:
        min_images_for_accounts.append(nickname)
    if os.path.isfile(flag_filename):
        return
    try:
        with open(flag_filename, 'w+', encoding='utf-8') as fp_min:
            fp_min.write('\n')
    except OSError:
        print('EX: unable to write ' + flag_filename)


def load_reverse_timeline(base_dir: str) -> []:
    """Returns the nicknames of the accounts which have a
    .reverse_timeline file, indicating that they prefer to see
    reversed timelines
    """
    # only the immediate subdirectories of accounts are of interest
    _, acct_names, _ = \
        next(os.walk(base_dir + '/accounts'), (None, [], []))
    nicknames = []
    for acct in acct_names:
        if not is_account_dir(acct):
            continue
        acct_parts = acct.split('@')
        nickname = acct_parts[0]
        domain = acct_parts[1]
        flag_filename = \
            acct_dir(base_dir, nickname, domain) + '/.reverse_timeline'
        if not os.path.isfile(flag_filename):
            continue
        if nickname not in nicknames:
            nicknames.append(nickname)
    return nicknames


def save_reverse_timeline(base_dir: str, reverse_sequence: []) -> []:
    """Creates a .reverse_timeline file for each account whose
    nickname is within the given list, and deletes that file for
    every other account
    """
    # only the immediate subdirectories of accounts are of interest
    _, acct_names, _ = \
        next(os.walk(base_dir + '/accounts'), (None, [], []))
    for acct in acct_names:
        if not is_account_dir(acct):
            continue
        acct_parts = acct.split('@')
        nickname = acct_parts[0]
        domain = acct_parts[1]
        flag_filename = \
            acct_dir(base_dir, nickname, domain) + '/.reverse_timeline'
        if nickname in reverse_sequence:
            if os.path.isfile(flag_filename):
                continue
            try:
                with open(flag_filename, 'w+',
                          encoding='utf-8') as fp_reverse:
                    fp_reverse.write('\n')
            except OSError:
                print('EX: failed to save reverse ' + flag_filename)
        elif os.path.isfile(flag_filename):
            try:
                os.remove(flag_filename)
            except OSError:
                print('EX: failed to delete reverse ' +
                      flag_filename)


def is_quote_toot(post_json_object: str, content: str) -> bool:
    """Returns true if the given post is a quote toot / quote tweet.
    The object of the post is checked for quote fields and for quote
    tags, and the given content is checked for a QT: prefix
    """
    post_object = post_json_object['object']

    # Pleroma/Misskey implementations
    quote_fields = (
        'quoteUri', 'quoteUrl', 'quoteReply',
        'toot:quoteReply', '_misskey_quote'
    )
    if any(post_object.get(field_name) for field_name in quote_fields):
        return True

    # More correct ActivityPub implementation - adding a Link tag
    tags = post_object.get('tag')
    if tags and isinstance(tags, list):
        for tag in tags:
            if not isinstance(tag, dict):
                continue
            rel = tag.get('rel')
            if rel:
                if isinstance(rel, list):
                    if any(isinstance(rel_str, str) and
                           '_misskey_quote' in rel_str
                           for rel_str in rel):
                        return True
                elif isinstance(rel, str) and '_misskey_quote' in rel:
                    return True
            # otherwise look for a Link tag having a json media type
            tag_type = tag.get('type')
            media_type = tag.get('mediaType')
            if not tag_type or not media_type:
                continue
            if not isinstance(tag_type, str) or tag_type != 'Link':
                continue
            if isinstance(media_type, str) and 'json' in media_type:
                return True

    # Twitter-style indicator
    if content and 'QT: ' in content:
        return True
    return False


def license_link_from_name(license: str) -> str:
    """Returns the license link from its name.
    If the given license is already a link then it is returned as it is.
    The name is matched without regard to case, and the Creative Commons
    public domain dedication is returned if the name isn't recognized
    """
    if '://' in license:
        return license
    value_upper = license.upper()

    # These are checked in order, so the more specific names need to
    # appear before the names which they contain
    license_links = (
        (('CC-BY-NC-ND', 'CC-BY-ND-NC', 'CC BY NC ND', 'CC BY ND NC'),
         'https://creativecommons.org/licenses/by-nc-nd/4.0'),
        (('CC-BY-SA-NC', 'CC-BY-NC-SA', 'CC BY SA NC', 'CC BY NC SA'),
         'https://creativecommons.org/licenses/by-nc-sa/4.0'),
        (('CC-BY-SA', 'CC-SA-BY', 'CC BY SA', 'CC SA BY'),
         'https://creativecommons.org/licenses/by-sa/4.0'),
        (('CC-BY-NC', 'CC BY NC'),
         'https://creativecommons.org/licenses/by-nc/4.0'),
        # no derivatives, without the non-commercial restriction
        (('CC-BY-ND', 'CC BY ND'),
         'https://creativecommons.org/licenses/by-nd/4.0'),
        (('CC-BY', 'CC BY'),
         'https://creativecommons.org/licenses/by/4.0'),
        (('GFDL', 'GNU FREE DOC'),
         'https://www.gnu.org/licenses/fdl-1.3.html'),
        (('OPL', 'OPEN PUBLICATION LIC'),
         'https://opencontent.org/openpub'),
        (('PDDL', 'OPEN DATA COMMONS PUBLIC'),
         'https://opendatacommons.org/licenses/pddl'),
        (('ODBL', 'OPEN DATA COMMONS OPEN'),
         'https://opendatacommons.org/licenses/odbl'),
        (('ODC', 'OPEN DATA COMMONS ATTR'),
         'https://opendatacommons.org/licenses/by'),
        (('OGL', 'OPEN GOVERNMENT LIC'),
         'https://www.nationalarchives.gov.uk/doc/open-government-licence'),
        (('PDL', 'PUBLIC DOCUMENTATION LIC'),
         'http://www.openoffice.org/licenses/PDL.html'),
        (('FREEBSD',),
         'https://www.freebsd.org/copyright/freebsd-doc-license'),
        (('WTF',),
         'http://www.wtfpl.net/txt/copying'),
        (('UNLICENSE',),
         'https://unlicense.org')
    )
    for names, link in license_links:
        if any(name in value_upper for name in names):
            return link
    return 'https://creativecommons.org/publicdomain/zero/1.0'


def _get_escaped_chars() -> {}:
    """Returns escaped characters
    """
    return {
        "&": "&amp;",
        "<": "&lt;",
        ">": "&gt;",
        '"': "&quot;",
        "'": "&apos;"
    }


def escape_text(txt: str) -> str:
    """Returns the given text with special characters replaced by
    entities, for inclusion in xml/rss
    """
    escaped = txt
    for special_char, entity in _get_escaped_chars().items():
        escaped = escaped.replace(special_char, entity)
    return escaped


def unescaped_text(txt: str) -> str:
    """Reverses escape_text, replacing the entities used within
    xml/rss with the characters which they represent
    """
    escaped_chars = _get_escaped_chars()
    for orig, replacement in escaped_chars.items():
        if orig == '&':
            continue
        txt = txt.replace(replacement, orig)
    # The ampersand entity has to be handled last. If it is replaced
    # first then &amp;lt; becomes &lt; and is then unescaped a second
    # time into <
    if '&' in escaped_chars:
        txt = txt.replace(escaped_chars['&'], '&')
    return txt


def harmless_markup(post_json_object: {}) -> None:
    """Renders harmless any dangerous markup within the content and
    summary of the given post, including their language maps.
    The object of the post is altered in place
    """
    post_object = post_json_object['object']
    for field_name in ('content', 'summary'):
        field_text = post_object.get(field_name)
        if field_text:
            if dangerous_markup(field_text, False, ['pre']):
                field_text = remove_html(field_text)
            post_object[field_name] = remove_markup_tag(field_text, 'pre')

        # the same again for each language within the map
        map_name = field_name + 'Map'
        lang_map = post_object.get(map_name)
        if not lang_map:
            continue
        for lang, lang_text in lang_map.items():
            if not isinstance(lang_text, str):
                continue
            if dangerous_markup(lang_text, False, ['pre']):
                lang_text = remove_html(lang_text)
            lang_map[lang] = remove_markup_tag(lang_text, 'pre')


def ap_proxy_type(json_object: {}) -> str:
    """Returns a string indicating the proxy for an activitypub post
    or None if not proxied
    See https://codeberg.org/fediverse/fep/src/branch/main/feps/fep-fffd.md
    The string returned is the first protocol within the proxyOf list
    which is a non-empty string
    """
    proxy_of = json_object.get('proxyOf')
    if not proxy_of:
        return None
    if not isinstance(proxy_of, list):
        return None
    for proxy_dict in proxy_of:
        # this arrives from other servers, so the list
        # could contain anything
        if not isinstance(proxy_dict, dict):
            continue
        protocol = proxy_dict.get('protocol')
        if protocol and isinstance(protocol, str):
            return protocol
    return None
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
+								__filename__ = "utils.py"
 								__author__ = "Bob Mottram"
 								__license__ = "AGPL3+"
-												v1.4.0

											
										
										
											2023-01-21 23:03:30 +00:00
+								__version__ = "1.4.0"
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
+								__maintainer__ = "Bob Mottram"
-												Change domain to libreserver.org

											
										
										
											2021-09-10 16:14:50 +00:00
+								__email__ = "bob@libreserver.org"
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
+								__status__ = "Production"
-												Module groups

											
										
										
											2021-06-26 11:16:41 +00:00
+								__module_group__ = "Core"
-												Announce function

											
										
										
											2019-07-02 09:25:29 +00:00
 								import os
-												Split camelcase display names for speaker clarity

											
										
										
											2021-03-03 20:34:55 +00:00
+								import re
-												Add some retries

											
										
										
											2019-10-11 18:03:58 +00:00
+								import time
-												Unit test for emoji

											
										
										
											2019-09-29 18:48:34 +00:00
+								import shutil
-												Announce function

											
										
										
											2019-07-02 09:25:29 +00:00
+								import datetime
-												Use dumps to save json

											
										
										
											2019-11-23 10:20:30 +00:00
+								import json
-												Don't do idna conversion for local network addresses

											
										
										
											2021-01-25 11:38:12 +00:00
+								import idna
-												Add speakable text for desktop client

											
										
										
											2021-03-18 17:27:46 +00:00
+								import locale
-												Unit test for time zone

											
										
										
											2022-02-25 21:00:53 +00:00
+								from dateutil.tz import tz
-												Fix circular dependency

											
										
										
											2020-06-06 18:16:16 +00:00
+								from pprint import pprint
-												Move jsonld signatures to python3-cryptography

											
										
										
											2021-02-04 18:18:31 +00:00
+								from cryptography.hazmat.backends import default_backend
 								from cryptography.hazmat.primitives import hashes
-												Snake case

											
										
										
											2021-12-27 16:18:52 +00:00
+								from followingCalendar import add_person_to_calendar
-												Move jsonld signatures to python3-cryptography

											
										
										
											2021-02-04 18:18:31 +00:00
-												Get categories from podcast feeds

											
										
										
											2022-01-13 15:10:41 +00:00
+								VALID_HASHTAG_CHARS = \
-												Allow underscores in hashtags

											
										
										
											2022-03-02 15:13:59 +00:00
+								    set('_0123456789' +
-												Get categories from podcast feeds

											
										
										
											2022-01-13 15:10:41 +00:00
+								        'abcdefghijklmnopqrstuvwxyz' +
 								        'ABCDEFGHIJKLMNOPQRSTUVWXYZ' +
 								        '¡¿ÄäÀàÁáÂâÃãÅåǍǎĄąĂăÆæĀā' +
 								        'ÇçĆćĈĉČčĎđĐďðÈèÉéÊêËëĚěĘęĖėĒē' +
 								        'ĜĝĢģĞğĤĥÌìÍíÎîÏïıĪīĮįĴĵĶķ' +
 								        'ĹĺĻļŁłĽľĿŀÑñŃńŇňŅņÖöÒòÓóÔôÕõŐőØøŒœ' +
 								        'ŔŕŘřẞßŚśŜŝŞşŠšȘșŤťŢţÞþȚțÜüÙùÚúÛûŰűŨũŲųŮůŪū' +
 								        'ŴŵÝýŸÿŶŷŹźŽžŻż')
-												Screen for outgoing abusive posts

											
										
										
											2021-02-11 10:33:56 +00:00
+								# posts containing these strings will always get screened out,
 								# both incoming and outgoing.
 								# Could include dubious clacks or admin dogwhistles
-												Snake case

											
										
										
											2021-12-26 10:11:18 +00:00
+								INVALID_CHARACTERS = (
-												Filter out posts containing zero width spaces

											
										
										
											2023-01-01 22:28:13 +00:00
+								    '卐', '卍', '࿕', '࿖', '࿗', '࿘', 'ϟϟ', '🏳️‍🌈🚫', '⚡⚡', ''
-												Screen for outgoing abusive posts

											
										
										
											2021-02-11 10:33:56 +00:00
+								)
-												Extra actor url validation

											
										
										
											2022-12-26 10:49:41 +00:00
+								INVALID_ACTOR_URL_CHARACTERS = (
 								    ' ', '', '<', '>', '%', '{', '}', '|', '\\', '^', '`',
-												Validate actor url from webfinger

											
										
										
											2022-12-26 15:41:21 +00:00
+								    '?', '#', '[', ']', '!', '$', '&', "'", '(', ')', '*',
 								    '+', ',', ';', '='
-												Extra actor url validation

											
										
										
											2022-12-26 10:49:41 +00:00
+								)
-												Move jsonld signatures to python3-cryptography

											
										
										
											2021-02-04 18:18:31 +00:00
-												Convert fancy characters to ordinary ones

This will help screen readers

											
										
										
											2022-07-09 10:54:05 +00:00
+								def _standardize_text_range(text: str,
 								                            range_start: int, range_end: int,
 								                            offset: str) -> str:
 								    """Convert any fancy characters within the given range into ordinary ones
 								    """
 								    offset = ord(offset)
 								    ctr = 0
 								    text = list(text)
 								    while ctr < len(text):
 								        val = ord(text[ctr])
 								        if val in range(range_start, range_end):
 								            text[ctr] = chr(val - range_start + offset)
 								        ctr += 1
 								    return "".join(text)
 								def standardize_text(text: str) -> str:
 								    """Converts fancy unicode text to ordinary letters
 								    """
-												Check for none case

											
										
										
											2022-07-09 22:56:33 +00:00
+								    if not text:
 								        return text
-												Tidying

											
										
										
											2022-07-09 11:03:12 +00:00
+								    char_ranges = (
-												Tidying

											
										
										
											2022-07-09 11:09:29 +00:00
+								        [65345, 'a'],
-												Tidying

											
										
										
											2022-07-09 11:03:12 +00:00
+								        [119886, 'a'],
 								        [119990, 'a'],
 								        [120042, 'a'],
 								        [120094, 'a'],
-												Tidying

											
										
										
											2022-07-09 11:09:29 +00:00
+								        [120146, 'a'],
 								        [120198, 'a'],
-												More fancy unicode character ranges

											
										
										
											2022-07-09 11:24:11 +00:00
+								        [120302, 'a'],
 								        [120354, 'a'],
 								        [120406, 'a'],
-												Tidying

											
										
										
											2022-07-09 11:03:12 +00:00
+								        [65313, 'A'],
-												Tidying

											
										
										
											2022-07-09 11:09:29 +00:00
+								        [119912, 'A'],
 								        [119964, 'A'],
 								        [120016, 'A'],
 								        [120068, 'A'],
 								        [120120, 'A'],
 								        [120172, 'A'],
-												More fancy unicode character ranges

											
										
										
											2022-07-09 11:24:11 +00:00
+								        [120224, 'A'],
 								        [120328, 'A'],
 								        [120380, 'A'],
-												Additional unicode alphabets

											
										
										
											2023-07-19 09:14:36 +00:00
+								        [120432, 'A'],
 								        [127344, 'A'],
 								        [127312, 'A'],
 								        [127280, 'A'],
 								        [127248, 'A']
-												Convert fancy characters to ordinary ones

This will help screen readers

											
										
										
											2022-07-09 10:54:05 +00:00
+								    )
-												Tidying

											
										
										
											2022-07-09 11:03:12 +00:00
+								    for char_range in char_ranges:
 								        range_start = char_range[0]
-												Convert fancy characters to ordinary ones

This will help screen readers

											
										
										
											2022-07-09 10:54:05 +00:00
+								        range_end = range_start + 26
-												Tidying

											
										
										
											2022-07-09 11:03:12 +00:00
+								        offset = char_range[1]
 								        text = _standardize_text_range(text, range_start, range_end, offset)
-												Convert fancy characters to ordinary ones

This will help screen readers

											
										
										
											2022-07-09 10:54:05 +00:00
 								    return text
-												Function for line ending characters

											
										
										
											2022-06-21 11:58:50 +00:00
def remove_eol(line: str):
    """Returns the given line with every newline and
    carriage return character taken out
    """
    eol_table = str.maketrans('', '', '\n\r')
    return line.translate(eol_table)
-												Replacing open statements

											
										
										
											2022-06-10 13:01:39 +00:00
+								def text_in_file(text: str, filename: str,
 								                 case_sensitive: bool = True) -> bool:
-												Function for checking text in a file

											
										
										
											2022-06-10 09:24:11 +00:00
+								    """is the given text in the given file?
 								    """
-												Function for finding text in file

											
										
										
											2022-06-10 11:43:33 +00:00
+								    if not case_sensitive:
 								        text = text.lower()
-												Function for checking text in a file

											
										
										
											2022-06-10 09:24:11 +00:00
+								    try:
 								        with open(filename, 'r', encoding='utf-8') as file:
 								            content = file.read()
 								            if content:
-												Function for finding text in file

											
										
										
											2022-06-10 11:43:33 +00:00
+								                if not case_sensitive:
 								                    content = content.lower()
-												Function for checking text in a file

											
										
										
											2022-06-10 09:24:11 +00:00
+								                if text in content:
 								                    return True
 								    except OSError:
-												Exception for text in file

											
										
										
											2022-06-10 10:40:47 +00:00
+								        print('EX: unable to find text in missing file ' + filename)
-												Function for checking text in a file

											
										
										
											2022-06-10 09:24:11 +00:00
+								    return False
-												Snake case

											
										
										
											2021-12-26 10:19:59 +00:00
+								def local_actor_url(http_prefix: str, nickname: str, domain_full: str) -> str:
-												Tidying of actor urls

											
										
										
											2021-08-14 11:13:39 +00:00
+								    """Returns the url for an actor on this instance
 								    """
-												Snake case

											
										
										
											2021-12-26 10:00:46 +00:00
+								    return http_prefix + '://' + domain_full + '/users/' + nickname
-												Tidying of actor urls

											
										
										
											2021-08-14 11:13:39 +00:00
-												Snake case

											
										
										
											2021-12-26 10:29:52 +00:00
+								def get_actor_languages_list(actor_json: {}) -> []:
-												Handling of understood languages prior to automatic translation

											
										
										
											2021-07-20 13:33:27 +00:00
+								    """Returns a list containing languages used by the given actor
 								    """
-												Snake case

											
										
										
											2021-12-26 10:29:52 +00:00
+								    if not actor_json.get('attachment'):
-												Handling of understood languages prior to automatic translation

											
										
										
											2021-07-20 13:33:27 +00:00
+								        return []
-												Snake case

											
										
										
											2021-12-26 10:32:45 +00:00
+								    for property_value in actor_json['attachment']:
-												Prepare for alternative property names

											
										
										
											2022-05-11 16:10:38 +00:00
+								        name_value = None
 								        if property_value.get('name'):
 								            name_value = property_value['name']
 								        elif property_value.get('schema:name'):
 								            name_value = property_value['schema:name']
 								        if not name_value:
-												Handling of understood languages prior to automatic translation

											
										
										
											2021-07-20 13:33:27 +00:00
+								            continue
-												Prepare for alternative property names

											
										
										
											2022-05-11 16:10:38 +00:00
+								        if not name_value.lower().startswith('languages'):
-												Handling of understood languages prior to automatic translation

											
										
										
											2021-07-20 13:33:27 +00:00
+								            continue
-												Snake case

											
										
										
											2021-12-26 10:32:45 +00:00
+								        if not property_value.get('type'):
-												Handling of understood languages prior to automatic translation

											
										
										
											2021-07-20 13:33:27 +00:00
+								            continue
-												Prepare for alternative value field within attachments

											
										
										
											2022-05-11 17:17:23 +00:00
+								        prop_value_name, _ = \
 								            get_attachment_property_value(property_value)
 								        if not prop_value_name:
-												Handling of understood languages prior to automatic translation

											
										
										
											2021-07-20 13:33:27 +00:00
+								            continue
-												Prepare for alternative property value

											
										
										
											2022-05-11 16:16:34 +00:00
+								        if not property_value['type'].endswith('PropertyValue'):
-												Handling of understood languages prior to automatic translation

											
										
										
											2021-07-20 13:33:27 +00:00
+								            continue
-												Prepare for alternative value field within attachments

											
										
										
											2022-05-11 17:17:23 +00:00
+								        if isinstance(property_value[prop_value_name], list):
 								            lang_list = property_value[prop_value_name]
-												Snake case

											
										
										
											2021-12-26 10:35:37 +00:00
+								            lang_list.sort()
 								            return lang_list
-												Prepare for alternative value field within attachments

											
										
										
											2022-05-11 17:17:23 +00:00
+								        if isinstance(property_value[prop_value_name], str):
 								            lang_str = property_value[prop_value_name]
-												Snake case

											
										
										
											2021-12-26 10:40:24 +00:00
+								            lang_list_temp = []
-												Snake case

											
										
										
											2021-12-26 10:38:02 +00:00
+								            if ',' in lang_str:
-												Snake case

											
										
										
											2021-12-26 10:40:24 +00:00
+								                lang_list_temp = lang_str.split(',')
-												Snake case

											
										
										
											2021-12-26 10:38:02 +00:00
+								            elif ';' in lang_str:
-												Snake case

											
										
										
											2021-12-26 10:40:24 +00:00
+								                lang_list_temp = lang_str.split(';')
-												Snake case

											
										
										
											2021-12-26 10:38:02 +00:00
+								            elif '/' in lang_str:
-												Snake case

											
										
										
											2021-12-26 10:40:24 +00:00
+								                lang_list_temp = lang_str.split('/')
-												Snake case

											
										
										
											2021-12-26 10:38:02 +00:00
+								            elif '+' in lang_str:
-												Snake case

											
										
										
											2021-12-26 10:40:24 +00:00
+								                lang_list_temp = lang_str.split('+')
-												Snake case

											
										
										
											2021-12-26 10:38:02 +00:00
+								            elif ' ' in lang_str:
-												Snake case

											
										
										
											2021-12-26 10:40:24 +00:00
+								                lang_list_temp = lang_str.split(' ')
-												Returning single language understood as a list

											
										
										
											2022-02-25 15:20:15 +00:00
+								            else:
 								                return [lang_str]
-												Snake case

											
										
										
											2021-12-26 10:35:37 +00:00
+								            lang_list = []
-												Snake case

											
										
										
											2021-12-26 10:40:24 +00:00
+								            for lang in lang_list_temp:
-												Handle languages list as a string

											
										
										
											2021-08-11 09:00:17 +00:00
+								                lang = lang.strip()
-												Snake case

											
										
										
											2021-12-26 10:35:37 +00:00
+								                if lang not in lang_list:
 								                    lang_list.append(lang)
 								            lang_list.sort()
 								            return lang_list
-												Handling of understood languages prior to automatic translation

											
										
										
											2021-07-20 13:33:27 +00:00
+								    return []
-												Don't clear down DMs from other instances

											
										
										
											2022-05-01 13:23:32 +00:00
def has_object_dict(post_json_object: {}) -> bool:
    """Does the given post have a non-empty 'object' field
    which is a dictionary?
    """
    post_object = post_json_object.get('object')
    if not post_object:
        return False
    return isinstance(post_object, dict)
-												Allow pre tag through dangerous markup filter in some cases, then remove it when rendering

											
										
										
											2023-05-18 11:15:18 +00:00
def remove_markup_tag(html: str, tag: str) -> str:
    """Remove the given tag from the given html markup

    Opening tags (together with any attributes) and closing tags are
    removed, while the text between them is kept.
    Only complete tags are removed. An unterminated tag such as a
    trailing '<pre' is left in place rather than causing an exception.
    If there is no opening tag then the markup is returned unchanged.
    """
    if '<' + tag not in html:
        return html
    # The tag name must be followed by whitespace, '/' or '>' so that
    # removing 'p' does not also remove 'pre'
    tag_pattern = \
        re.compile(r'</?' + re.escape(tag) + r'(?=[\s/>])[^>]*>')
    return tag_pattern.sub('', html)
-												Snake case

											
										
										
											2021-12-26 10:50:49 +00:00
+								def get_content_from_post(post_json_object: {}, system_language: str,
-												Handle post summary translations

											
										
										
											2022-01-28 10:07:35 +00:00
+								                          languages_understood: [],
-												Replacing open statements

											
										
										
											2022-06-10 13:01:39 +00:00
+								                          content_type: str = "content") -> str:
-												Support for contentMap when creating html posts

											
										
										
											2021-07-18 11:48:29 +00:00
+								    """Returns the content from the post in the given language
-												Support for libretranslate

											
										
										
											2021-07-19 19:40:04 +00:00
+								    including searching for a matching entry within contentMap
-												Support for contentMap when creating html posts

											
										
										
											2021-07-18 11:48:29 +00:00
+								    """
-												Snake case

											
										
										
											2021-12-26 10:54:58 +00:00
+								    this_post_json = post_json_object
-												Snake case

											
										
										
											2021-12-26 10:57:03 +00:00
+								    if has_object_dict(post_json_object):
-												Snake case

											
										
										
											2021-12-26 10:54:58 +00:00
+								        this_post_json = post_json_object['object']
-												cwlists in a separate module

											
										
										
											2023-03-20 14:50:19 +00:00
+								    map_dict = content_type + 'Map'
 								    if not this_post_json.get(content_type) and \
 								       not this_post_json.get(map_dict):
-												Support for contentMap when creating html posts

											
										
										
											2021-07-18 11:48:29 +00:00
+								        return ''
-												Getting post content

											
										
										
											2021-07-20 12:28:56 +00:00
+								    content = ''
-												Replacing open statements

											
										
										
											2022-06-10 13:01:39 +00:00
+								    map_dict = content_type + 'Map'
 								    if this_post_json.get(map_dict):
 								        if isinstance(this_post_json[map_dict], dict):
 								            if this_post_json[map_dict].get(system_language):
 								                sys_lang = this_post_json[map_dict][system_language]
-												Snake case

											
										
										
											2021-12-25 23:03:28 +00:00
+								                if isinstance(sys_lang, str):
-												Tidying

											
										
										
											2023-07-14 12:11:12 +00:00
+								                    content = sys_lang
-												Allow pre tag through dangerous markup filter in some cases, then remove it when rendering

											
										
										
											2023-05-18 11:15:18 +00:00
+								                    content = remove_markup_tag(content, 'pre')
-												Tidying

											
										
										
											2023-07-14 12:11:12 +00:00
+								                    content = content.replace('&amp;', '&')
-												Convert fancy characters to ordinary ones

This will help screen readers

											
										
										
											2022-07-09 10:54:05 +00:00
+								                    return standardize_text(content)
-												Handling of understood languages prior to automatic translation

											
										
										
											2021-07-20 13:33:27 +00:00
+								            else:
-												Handle post summary translations

											
										
										
											2022-01-28 10:07:35 +00:00
+								                # is there a contentMap/summaryMap entry for one of
-												Handling of understood languages prior to automatic translation

											
										
										
											2021-07-20 13:33:27 +00:00
+								                # the understood languages?
-												Snake case

											
										
										
											2021-12-26 10:52:54 +00:00
+								                for lang in languages_understood:
-												Replacing open statements

											
										
										
											2022-06-10 13:01:39 +00:00
+								                    if this_post_json[map_dict].get(lang):
-												Tidying

											
										
										
											2023-07-14 12:11:12 +00:00
+								                        map_lang = this_post_json[map_dict][lang]
 								                        if isinstance(map_lang, str):
 								                            content = map_lang
 								                            content = remove_markup_tag(content, 'pre')
 								                            content = content.replace('&amp;', '&')
 								                            return standardize_text(content)
-												Getting post content

											
										
										
											2021-07-20 12:28:56 +00:00
+								    else:
-												Replacing open statements

											
										
										
											2022-06-10 13:01:39 +00:00
+								        if isinstance(this_post_json[content_type], str):
 								            content = this_post_json[content_type]
-												Tidying

											
										
										
											2023-07-14 12:11:12 +00:00
+								            content = content.replace('&amp;', '&')
-												Allow pre tag through dangerous markup filter in some cases, then remove it when rendering

											
										
										
											2023-05-18 11:15:18 +00:00
+								            content = remove_markup_tag(content, 'pre')
-												Convert fancy characters to ordinary ones

This will help screen readers

											
										
										
											2022-07-09 10:54:05 +00:00
+								    return standardize_text(content)
-												Support for contentMap when creating html posts

											
										
										
											2021-07-18 11:48:29 +00:00
-												Message text direction for certain languages

											
										
										
											2022-12-16 21:43:34 +00:00
def get_language_from_post(post_json_object: {}, system_language: str,
                           languages_understood: [],
                           content_type: str = "content") -> str:
    """Returns the content language from the post
    including searching for a matching entry within contentMap

    The map consulted is content_type + 'Map', eg. contentMap or
    summaryMap. If that map has an entry for system_language then
    system_language is returned. Otherwise the first of
    languages_understood having a non-empty string entry is returned.
    When there is no usable map, or nothing matches, system_language
    is returned.
    """
    this_post_json = post_json_object
    if has_object_dict(post_json_object):
        this_post_json = post_json_object['object']
    map_dict = content_type + 'Map'
    # The map is checked even if the plain content field is absent,
    # which is how get_content_from_post selects the text to show
    lang_map = this_post_json.get(map_dict)
    if not lang_map or not isinstance(lang_map, dict):
        return system_language
    if lang_map.get(system_language):
        return system_language
    # is there a contentMap/summaryMap entry for one of
    # the understood languages?
    for lang in languages_understood:
        map_lang = lang_map.get(lang)
        # non-string entries are skipped, as when getting the content
        if map_lang and isinstance(map_lang, str):
            return lang
    return system_language
-												Filtering include image descriptions and urls

											
										
										
											2022-06-02 18:07:07 +00:00
def get_media_descriptions_from_post(post_json_object: {}) -> str:
    """Returns all attached media descriptions as a single text.
    This is used for filtering

    For each attachment having a name, the name and then its url
    (if there is one) are added, separated by spaces.
    Attachments which are not dictionaries, and names or urls which
    are not strings, are skipped rather than raising an exception,
    since posts may arrive from other instances in unexpected forms.
    """
    this_post_json = post_json_object
    if has_object_dict(post_json_object):
        this_post_json = post_json_object['object']
    attachments = this_post_json.get('attachment')
    if not attachments:
        return ''
    if isinstance(attachments, dict):
        # a single attachment which was not wrapped in a list
        attachments = [attachments]
    if not isinstance(attachments, list):
        return ''
    descriptions = []
    for attach in attachments:
        if not isinstance(attach, dict):
            continue
        name = attach.get('name')
        if not name or not isinstance(name, str):
            continue
        descriptions.append(name)
        url = attach.get('url')
        if url and isinstance(url, str):
            descriptions.append(url)
    return ' '.join(descriptions).strip()
-												Handle post summary translations

											
										
										
											2022-01-28 10:07:35 +00:00
def get_summary_from_post(post_json_object: {}, system_language: str,
                          languages_understood: []) -> str:
    """Returns the post summary in the given language,
    which includes looking for a matching entry within summaryMap.
    This is get_content_from_post applied to the summary field
    """
    summary_field = "summary"
    return get_content_from_post(post_json_object, system_language,
                                 languages_understood, summary_field)
-												Snake case

											
										
										
											2021-12-26 11:29:40 +00:00
+								def get_base_content_from_post(post_json_object: {},
 								                               system_language: str) -> str:
-												Support for libretranslate

											
										
										
											2021-07-19 19:40:04 +00:00
+								    """Returns the content from the post in the given language
 								    """
-												Snake case

											
										
										
											2021-12-26 10:54:58 +00:00
+								    this_post_json = post_json_object
-												Snake case

											
										
										
											2021-12-26 10:57:03 +00:00
+								    if has_object_dict(post_json_object):
-												Snake case

											
										
										
											2021-12-26 10:54:58 +00:00
+								        this_post_json = post_json_object['object']
-												Improve checking for content

											
										
										
											2023-01-08 22:23:02 +00:00
+								    if 'content' not in this_post_json:
-												Support for libretranslate

											
										
										
											2021-07-19 19:40:04 +00:00
+								        return ''
-												Snake case

											
										
										
											2021-12-26 10:54:58 +00:00
+								    return this_post_json['content']
-												Support for libretranslate

											
										
										
											2021-07-19 19:40:04 +00:00
-												Snake case

											
										
										
											2021-12-26 12:02:29 +00:00
+								def acct_dir(base_dir: str, nickname: str, domain: str) -> str:
-												Snake case

											
										
										
											2021-12-25 16:17:53 +00:00
+								    return base_dir + '/accounts/' + nickname + '@' + domain
-												Function for account directory

											
										
										
											2021-07-13 21:59:53 +00:00
-												Tidying

											
										
										
											2022-12-18 15:29:54 +00:00
def acct_handle_dir(base_dir: str, handle: str) -> str:
    """Returns the directory for the account having the given handle,
    located within the accounts directory beneath base_dir
    """
    return ''.join((base_dir, '/accounts/', handle))
-												Snake case

											
										
										
											2021-12-26 12:07:40 +00:00
+								def is_featured_writer(base_dir: str, nickname: str, domain: str) -> bool:
-												Featured writers

											
										
										
											2021-02-13 11:37:02 +00:00
+								    """Is the given account a featured writer, appearing in the features
 								    timeline on news instances?
 								    """
-												Snake case

											
										
										
											2021-12-26 12:10:21 +00:00
+								    features_blocked_filename = \
-												Snake case

											
										
										
											2021-12-26 12:02:29 +00:00
+								        acct_dir(base_dir, nickname, domain) + '/.nofeatures'
-												Snake case

											
										
										
											2021-12-26 12:10:21 +00:00
+								    return not os.path.isfile(features_blocked_filename)
-												Featured writers

											
										
										
											2021-02-13 11:37:02 +00:00
-												Snake case

											
										
										
											2021-12-26 12:10:21 +00:00
+								def refresh_newswire(base_dir: str):
-												Refresh newswire after removing or suspending an account

											
										
										
											2021-02-13 10:01:04 +00:00
+								    """Causes the newswire to be updates after a change to user accounts
 								    """
-												Snake case

											
										
										
											2021-12-26 12:13:46 +00:00
+								    refresh_newswire_filename = base_dir + '/accounts/.refresh_newswire'
 								    if os.path.isfile(refresh_newswire_filename):
-												Refresh newswire after removing or suspending an account

											
										
										
											2021-02-13 10:01:04 +00:00
+								        return
-												Explicitly set file encoding

											
										
										
											2022-06-09 14:46:30 +00:00
+								    with open(refresh_newswire_filename, 'w+',
 								              encoding='utf-8') as refresh_file:
-												Snake case

											
										
										
											2021-12-26 12:13:46 +00:00
+								        refresh_file.write('\n')
-												Refresh newswire after removing or suspending an account

											
										
										
											2021-02-13 10:01:04 +00:00
-												Snake case

											
										
										
											2021-12-26 12:13:46 +00:00
+								def get_sha_256(msg: str):
-												Move jsonld signatures to python3-cryptography

											
										
										
											2021-02-04 18:18:31 +00:00
+								    """Returns a SHA256 hash of the given string
 								    """
 								    digest = hashes.Hash(hashes.SHA256(), backend=default_backend())
 								    digest.update(msg)
 								    return digest.finalize()
-												Signing GET requests

											
										
										
											2021-09-08 10:05:45 +00:00
-												Snake case

											
										
										
											2021-12-26 12:13:46 +00:00
+								def get_sha_512(msg: str):
-												Signing GET requests

											
										
										
											2021-09-08 10:05:45 +00:00
+								    """Returns a SHA512 hash of the given string
 								    """
 								    digest = hashes.Hash(hashes.SHA512(), backend=default_backend())
 								    digest.update(msg)
 								    return digest.finalize()
-												Announce function

											
										
										
											2019-07-02 09:25:29 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Extra checks for nodeinfo calling domain

											
										
										
											2022-01-30 17:21:28 +00:00
+								def local_network_host(host: str) -> bool:
-												Don't do idna conversion for local network addresses

											
										
										
											2021-01-25 11:38:12 +00:00
+								    """Returns true if the given host is on the local network
 								    """
-												Check for localhost

											
										
										
											2021-01-25 11:51:42 +00:00
+								    if host.startswith('localhost') or \
 								       host.startswith('192.') or \
-												Don't do idna conversion for local network addresses

											
										
										
											2021-01-25 11:38:12 +00:00
+								       host.startswith('127.') or \
 								       host.startswith('10.'):
 								        return True
 								    return False
-												Snake case

											
										
										
											2021-12-26 12:21:31 +00:00
+								def decoded_host(host: str) -> str:
-												Don't do idna conversion for local network addresses

											
										
										
											2021-01-25 11:38:12 +00:00
+								    """Convert hostname to internationalized domain
 								    https://en.wikipedia.org/wiki/Internationalized_domain_name
 								    """
 								    if ':' not in host:
-												Tests for international domain handling

											
										
										
											2021-01-25 12:24:40 +00:00
+								        # eg. mydomain:8000
-												Extra checks for nodeinfo calling domain

											
										
										
											2022-01-30 17:21:28 +00:00
+								        if not local_network_host(host):
-												Tests for international domain handling

											
										
										
											2021-01-25 12:24:40 +00:00
+								            if not host.endswith('.onion'):
 								                if not host.endswith('.i2p'):
 								                    return idna.decode(host)
-												Don't do idna conversion for local network addresses

											
										
										
											2021-01-25 11:38:12 +00:00
+								    return host
-												Snake case

											
										
										
											2021-12-26 12:16:36 +00:00
+								def get_locked_account(actor_json: {}) -> bool:
-												Show locked account status after search for handle

											
										
										
											2021-01-02 11:18:43 +00:00
+								    """Returns whether the given account requires follower approval
 								    """
-												Snake case

											
										
										
											2021-12-26 10:29:52 +00:00
+								    if not actor_json.get('manuallyApprovesFollowers'):
-												Show locked account status after search for handle

											
										
										
											2021-01-02 11:18:43 +00:00
+								        return False
-												Snake case

											
										
										
											2021-12-26 10:29:52 +00:00
+								    if actor_json['manuallyApprovesFollowers'] is True:
-												Show locked account status after search for handle

											
										
										
											2021-01-02 11:18:43 +00:00
+								        return True
 								    return False
-												Snake case

											
										
										
											2021-12-26 12:31:47 +00:00
def has_users_path(path_str: str) -> bool:
    """Whether the given string contains a /users/ path or equivalent.
    A url of the form scheme://domain/nickname, where the nickname part
    contains no further slashes or dots, also counts
    """
    # any of the known users path markers is sufficient
    if any(marker in path_str for marker in get_user_paths()):
        return True

    # otherwise only a url can qualify
    if '://' not in path_str:
        return False

    # the domain is whatever follows the scheme, up to the first slash
    host = path_str.split('://')[1].split('/')[0]
    url_prefix = '://' + host + '/'
    if url_prefix not in path_str:
        return False

    # what follows the domain must look like a bare nickname
    remainder = path_str.split(url_prefix)[1]
    return not ('/' in remainder or '.' in remainder)
-												Snake case

											
										
										
											2021-12-26 12:37:53 +00:00
def valid_post_date(published: str, max_age_days: int, debug: bool) -> bool:
    """Returns true if the published date is recent and is not in the future

    published is expected to be in the form YYYY-MM-DDTHH:MM:SSZ.
    Anything which cannot be parsed in that format, including a
    non-string value, is treated as invalid and gives False.
    The comparison has whole day granularity: a post is too old when
    it was published max_age_days or more days before today (UTC).
    If debug is True then the reason for rejection is printed.
    """
    baseline_time = datetime.datetime(1970, 1, 1)

    # naive UTC time, so that it can be compared with the naive baseline.
    # datetime.utcnow() is deprecated from Python 3.12
    curr_time = \
        datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None)
    now_days_since_epoch = (curr_time - baseline_time).days

    try:
        post_time_object = \
            datetime.datetime.strptime(published, "%Y-%m-%dT%H:%M:%SZ")
    except (ValueError, TypeError):
        # ValueError: wrong format, TypeError: not a string.
        # BaseException is deliberately not caught here, so that
        # KeyboardInterrupt and SystemExit are not swallowed
        if debug:
            print('EX: valid_post_date invalid published date ' +
                  str(published))
        return False

    post_days_since_epoch = (post_time_object - baseline_time).days

    if post_days_since_epoch > now_days_since_epoch:
        if debug:
            print("Inbox post has a published date in the future!")
        return False

    if now_days_since_epoch - post_days_since_epoch >= max_age_days:
        if debug:
            print("Inbox post is not recent enough")
        return False
    return True
-												Snake case

											
										
										
											2021-12-26 12:45:03 +00:00
def get_full_domain(domain: str, port: int) -> str:
    """Returns the domain with the port number appended as domain:port.
    The domain is returned unchanged if no port is given, if the domain
    already contains a colon, or if the port is 80 or 443
    """
    port_not_needed = not port or ':' in domain or port in (80, 443)
    if port_not_needed:
        return domain
    return domain + ':' + str(port)
-												Snake case

											
										
										
											2021-12-26 12:54:51 +00:00
def is_dormant(base_dir: str, nickname: str, domain: str, actor: str,
               dormant_months: int) -> bool:
    """Is the given followed actor dormant, from the standpoint
    of the given account

    The last seen file for the actor, within the lastseen directory of
    the account, is read as a number of days since the epoch.
    The actor is dormant if that is dormant_months or more months ago,
    where a month is counted as 30 days.
    Returns False if there is no last seen file, or if it is empty,
    can't be read or doesn't contain a number.
    """
    last_seen_filename = acct_dir(base_dir, nickname, domain) + \
        '/lastseen/' + actor.replace('/', '#') + '.txt'

    if not os.path.isfile(last_seen_filename):
        return False

    days_since_epoch_str = None
    try:
        with open(last_seen_filename, 'r',
                  encoding='utf-8') as last_seen_file:
            days_since_epoch_str = last_seen_file.read()
    except OSError:
        print('EX: failed to read last seen ' + last_seen_filename)
        return False

    if not days_since_epoch_str:
        return False

    try:
        days_since_epoch = int(days_since_epoch_str)
    except ValueError:
        # a damaged file should not raise an exception in the caller
        print('EX: invalid last seen value within ' + last_seen_filename)
        return False

    # naive UTC time, so that it can be compared with the naive epoch.
    # datetime.utcnow() is deprecated from Python 3.12
    curr_time = \
        datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None)
    curr_days_since_epoch = \
        (curr_time - datetime.datetime(1970, 1, 1)).days
    time_diff_months = \
        int((curr_days_since_epoch - days_since_epoch) / 30)
    return time_diff_months >= dormant_months
-												Snake case

											
										
										
											2021-12-26 13:27:57 +00:00
def is_editor(base_dir: str, nickname: str) -> bool:
    """Returns true if the given nickname is listed, one per line,
    within accounts/editors.txt. If that file is missing or has no
    lines then only the admin account counts as an editor
    """
    editors_filename = base_dir + '/accounts/editors.txt'

    if os.path.isfile(editors_filename):
        with open(editors_filename, 'r', encoding='utf-8') as fp_editors:
            editor_lines = fp_editors.readlines()
        if editor_lines:
            return any(line.strip('\n').strip('\r') == nickname
                       for line in editor_lines)

    # no editors are defined, so fall back to the admin
    admin_nickname = get_config_param(base_dir, 'admin')
    return bool(admin_nickname) and admin_nickname == nickname
-												Snake case

											
										
										
											2021-12-26 14:17:13 +00:00
def is_artist(base_dir: str, nickname: str) -> bool:
    """Returns true if the given nickname is listed, one per line,
    within accounts/artists.txt. If that file is missing or has no
    lines then only the admin account counts as an artist
    """
    artists_filename = base_dir + '/accounts/artists.txt'

    if os.path.isfile(artists_filename):
        with open(artists_filename, 'r', encoding='utf-8') as fp_artists:
            artist_lines = fp_artists.readlines()
        if artist_lines:
            return any(line.strip('\n').strip('\r') == nickname
                       for line in artist_lines)

    # no artists are defined, so fall back to the admin
    admin_nickname = get_config_param(base_dir, 'admin')
    return bool(admin_nickname) and admin_nickname == nickname
-												Snake case

											
										
										
											2021-12-26 14:20:09 +00:00
def get_video_extensions() -> []:
    """Returns the file extensions, without a leading dot,
    of the supported video formats
    """
    video_extensions = ('mp4', 'webm', 'ogv')
    return video_extensions
-												Snake case

											
										
										
											2021-12-26 14:24:03 +00:00
def get_audio_extensions() -> []:
    """Returns the file extensions, without a leading dot,
    of the supported audio formats
    """
    audio_extensions = ('mp3', 'ogg', 'flac', 'opus', 'spx', 'wav')
    return audio_extensions
-												Tidying of mime types

											
										
										
											2021-08-03 09:09:04 +00:00
-												Snake case

											
										
										
											2021-12-26 14:26:16 +00:00
def get_image_extensions() -> []:
    """Returns the file extensions, without a leading dot,
    of the supported image formats
    """
    image_extensions = (
        'jpg', 'jpeg', 'gif', 'webp', 'avif', 'heic',
        'svg', 'ico', 'jxl', 'png'
    )
    return image_extensions
-												Move image format functions to utils

											
										
										
											2020-11-21 11:21:05 +00:00
-												Snake case

											
										
										
											2021-12-26 14:42:21 +00:00
def get_image_mime_type(image_filename: str) -> str:
    """Returns the mime type for the given image filename, such as
    image/jpeg, based upon its file extension.
    The match is case sensitive, and image/png is returned for any
    extension which isn't recognised
    """
    extensions_to_mime = {
        'png': 'png',
        'jpg': 'jpeg',
        # the jpeg extension is accepted for image uploads, so it needs
        # to map to image/jpeg rather than fall through to the default
        'jpeg': 'jpeg',
        'jxl': 'jxl',
        'gif': 'gif',
        'avif': 'avif',
        'heic': 'heic',
        'svg': 'svg+xml',
        'webp': 'webp',
        'ico': 'x-icon'
    }
    for ext, mime_ext in extensions_to_mime.items():
        if image_filename.endswith('.' + ext):
            return 'image/' + mime_ext
    return 'image/png'
-												Snake case

											
										
										
											2021-12-27 16:02:54 +00:00
def get_image_extension_from_mime_type(content_type: str) -> str:
    """Returns the image file extension, without a leading dot, for a
    mime type such as image/jpeg. The mime type is matched by its
    ending, and png is returned if nothing matches
    """
    mime_to_extension = (
        ('png', 'png'),
        ('jpeg', 'jpg'),
        ('jxl', 'jxl'),
        ('gif', 'gif'),
        ('svg+xml', 'svg'),
        ('webp', 'webp'),
        ('avif', 'avif'),
        ('heic', 'heic'),
        ('x-icon', 'ico')
    )
    matches = (extension for mime_ending, extension in mime_to_extension
               if content_type.endswith(mime_ending))
    return next(matches, 'png')
-												Snake case

											
										
										
											2021-12-26 14:39:49 +00:00
def get_media_extensions() -> []:
    """Returns the file extensions of every supported media format:
    images first, then video, then audio
    """
    image_extensions = get_image_extensions()
    video_extensions = get_video_extensions()
    audio_extensions = get_audio_extensions()
    return image_extensions + video_extensions + audio_extensions
-												Tidy up the handling of media formats

											
										
										
											2020-11-21 11:54:29 +00:00
-												Snake case

											
										
										
											2021-12-26 15:44:28 +00:00
def get_image_formats() -> str:
    """Returns a string of permissible image formats, as a comma
    separated list of dotted extensions,
    used when selecting an image for a new post
    """
    return ', '.join('.' + ext for ext in get_image_extensions())
-												Move image format functions to utils

											
										
										
											2020-11-21 11:21:05 +00:00
-												Snake case

											
										
										
											2021-12-27 15:58:46 +00:00
def is_image_file(filename: str) -> bool:
    """Does the given filename end with one of the supported
    image extensions? The comparison is case sensitive
    """
    return any(filename.endswith('.' + ext)
               for ext in get_image_extensions())
-												Snake case

											
										
										
											2021-12-27 15:56:15 +00:00
def get_media_formats() -> str:
    """Returns a string of permissible media formats, as a comma
    separated list of dotted extensions,
    used when selecting an attachment for a new post
    """
    return ', '.join('.' + ext for ext in get_media_extensions())
-												Tidy up the handling of media formats

											
										
										
											2020-11-21 11:54:29 +00:00
-												Snake case

											
										
										
											2021-12-27 15:43:22 +00:00
def remove_html(content: str) -> str:
    """Strips html markup from the given content, returning plain text.
    Quotation tags become double quote characters, paragraph endings
    and line breaks become newlines, and a space is inserted after any
    full stop which is directly followed by a capital letter.
    Content without any < character is returned unchanged
    """
    if '<' not in content:
        return content

    # convert the markup which carries meaning into its text equivalent
    substitutions = (
        ('<a href', ' <a href'),
        ('<q>', '"'),
        ('</q>', '"'),
        ('</p>', '\n\n'),
        ('<br>', '\n')
    )
    for markup, plain in substitutions:
        content = content.replace(markup, plain)

    # drop everything between angle brackets. The brackets themselves
    # are never kept, including a > which appears outside of any tag
    inside_tag = False
    kept = []
    for char in content:
        if char == '<':
            inside_tag = True
        elif char == '>':
            inside_tag = False
        elif not inside_tag:
            kept.append(char)
    plain_text = ''.join(kept).replace('  ', ' ')

    # insert spaces after full stops
    spaced = []
    for idx, char in enumerate(plain_text):
        spaced.append(char)
        if char != '.':
            continue
        # empty when the full stop is the final character
        following = plain_text[idx + 1:idx + 2]
        if following and 'A' <= following <= 'Z':
            spaced.append(' ')

    return ''.join(spaced).replace('  ', ' ').strip()
-												Remove css style from post content

This could otherwise mess up the UI

											
										
										
											2023-02-19 11:36:35 +00:00
def remove_style_within_html(content: str) -> str:
    """Removes style="something" within html post content.
    Used to ensure that styles set within a post can't alter
    the appearance of the user interface.
    Content without any < character, or without any style attribute,
    is returned unchanged. If a style attribute has no closing quote
    then everything after its opening quote, up to the next style
    attribute, is dropped
    """
    if '<' not in content:
        return content
    if ' style="' not in content:
        return content

    first_section, *styled_sections = content.split(' style="')

    # Each subsequent section begins with the value of a style attribute.
    # Keep only what follows its closing quote. partition gives an empty
    # remainder when the quote is missing, rather than raising an
    # IndexError on malformed content
    return first_section + \
        ''.join(section.partition('"')[2] for section in styled_sections)
-												Snake case

											
										
										
											2021-12-27 15:52:08 +00:00
def first_paragraph_from_string(content: str) -> str:
    """Returns the first paragraph of a blog post as plain text,
    to be used as a summary in the newswire feed.
    If the content has no complete paragraph markup then all of it
    is returned as plain text
    """
    if '<p>' in content and '</p>' in content:
        # text after the first opening tag, up to any closing tag
        after_opening_tag = content.split('<p>')[1]
        return remove_html(after_opening_tag.split('</p>')[0])
    return remove_html(content)
-												Function sequence

											
										
										
											2020-11-08 10:52:07 +00:00
-												Snake case

											
										
										
											2021-12-27 15:41:04 +00:00
def is_system_account(nickname: str) -> bool:
    """Returns true if the given nickname is one of the system
    accounts, which are news and inbox
    """
    system_nicknames = ('news', 'inbox')
    return nickname in system_nicknames
-												Snake case

											
										
										
											2021-12-26 14:37:28 +00:00
def _create_config(base_dir: str) -> None:
    """Creates an empty configuration file, config.json, within the
    base directory if one doesn't already exist
    """
    config_filename = base_dir + '/config.json'
    if not os.path.isfile(config_filename):
        save_json({}, config_filename)
-												Tidying

											
										
										
											2020-10-06 08:58:44 +00:00
-												Snake case

											
										
										
											2021-12-27 20:38:02 +00:00
def set_config_param(base_dir: str, variable_name: str,
                     variable_value) -> None:
    """Sets a configuration value and saves it to config.json within
    the base directory. The variable name is converted to camel case
    before being stored
    """
    _create_config(base_dir)
    filename = base_dir + '/config.json'
    settings = load_json(filename) if os.path.isfile(filename) else {}
    camel_case_name = _convert_to_camel_case(variable_name)
    settings[camel_case_name] = variable_value
    save_json(settings, filename)
-												Tidying

											
										
										
											2020-10-06 08:58:44 +00:00
-												Snake case

											
										
										
											2021-12-27 15:41:04 +00:00
def get_config_param(base_dir: str, variable_name: str):
    """Returns the value stored within config.json for the given
    variable name, or None if the config could not be loaded or
    does not contain that variable
    """
    _create_config(base_dir)
    config_json = load_json(base_dir + '/config.json')
    if not config_json:
        return None
    config_key = _convert_to_camel_case(variable_name)
    if config_key not in config_json:
        return None
    return config_json[config_key]
-												Snake case

											
										
										
											2021-12-27 15:37:31 +00:00
def is_suspended(base_dir: str, nickname: str) -> bool:
    """Returns true if the given nickname appears within
    accounts/suspended.txt
    """
    admin_nickname = get_config_param(base_dir, 'admin')
    # nobody is suspended when no admin is defined,
    # and the admin themselves is never suspended
    if not admin_nickname or nickname == admin_nickname:
        return False

    suspended_filename = base_dir + '/accounts/suspended.txt'
    if not os.path.isfile(suspended_filename):
        return False
    with open(suspended_filename, 'r', encoding='utf-8') as susp_file:
        suspended_lines = susp_file.readlines()
    return any(entry.strip('\n').strip('\r') == nickname
               for entry in suspended_lines)
-												Snake case

											
										
										
											2021-12-27 13:58:17 +00:00
def get_followers_list(base_dir: str,
                       nickname: str, domain: str,
                       follow_file='following.txt') -> []:
    """Returns the lines of the given follow file for an account,
    with surrounding whitespace removed from each line.
    An empty list is returned if the file does not exist
    """
    filename = acct_dir(base_dir, nickname, domain) + '/' + follow_file
    if not os.path.isfile(filename):
        return []
    with open(filename, 'r', encoding='utf-8') as foll_file:
        return [line.strip() for line in foll_file.readlines()]
-												Snake case

											
										
										
											2021-12-27 11:31:04 +00:00
def get_followers_of_person(base_dir: str,
                            nickname: str, domain: str,
                            follow_file='following.txt') -> []:
    """Returns the names of the account directories whose follow file
    contains the handle of the given person.
    Used by the shared inbox to know who to send incoming mail to
    """
    followers = []
    domain = remove_domain_port(domain)
    handle = nickname + '@' + domain
    if not os.path.isdir(acct_handle_dir(base_dir, handle)):
        return followers

    # directories which are never counted as followers
    skipped_prefixes = ('inbox@', 'Actor@', 'news@')
    for subdir, dirs, _ in os.walk(base_dir + '/accounts'):
        for account in dirs:
            if account == handle or account.startswith(skipped_prefixes):
                continue
            filename = os.path.join(subdir, account) + '/' + follow_file
            if not os.path.isfile(filename):
                continue
            with open(filename, 'r', encoding='utf-8') as followingfile:
                # stops reading at the first matching line
                is_following = any(remove_eol(line) == handle
                                   for line in followingfile)
            if is_following and account not in followers:
                followers.append(account)
        # only the top level of the accounts directory is examined
        break
    return followers
-												Snake case

											
										
										
											2021-12-27 11:31:04 +00:00
def remove_id_ending(id_str: str) -> str:
    """Removes endings such as /activity and /undo, followed by
    fragments such as #Create or #update, from an id
    """
    # at most one path style ending is removed
    path_endings = ('/activity', '/undo', '/event',
                    '/replies', '/delete', '/update')
    for ending in path_endings:
        if id_str.endswith(ending):
            id_str = id_str[:-len(ending)]
            break

    # these fragments only count when they terminate the id
    for fragment in ('#Create', '#delete'):
        if id_str.endswith(fragment):
            return id_str.split(fragment)[0]

    # these fragments may appear anywhere within the id
    for fragment in ('#update', '#primary', '#reciprocal'):
        if fragment in id_str:
            return id_str.split(fragment)[0]
    return id_str
-												Remove id endings in a better way

											
										
										
											2020-08-23 11:13:35 +00:00
-												Snake case

											
										
										
											2021-12-27 17:16:57 +00:00
def remove_hash_from_post_id(post_id: str) -> str:
    """Removes any hash, and whatever follows it, from a post id
    """
    before_hash, _, _ = post_id.partition('#')
    return before_hash
-												Tidying

											
										
										
											2021-12-06 12:42:05 +00:00
-												Snake case

											
										
										
											2021-12-27 17:20:01 +00:00
def get_protocol_prefixes() -> []:
    """Returns the url prefixes which are recognised as valid protocols
    """
    prefixes = (
        'https://', 'http://', 'ftp://',
        'dat://', 'i2p://', 'gnunet://',
        'ipfs://', 'ipns://',
        'hyper://', 'gemini://', 'gopher://'
    )
    return prefixes
-												Snake case

											
										
										
											2021-12-27 17:32:34 +00:00
def get_link_prefixes() -> []:
    """Returns the prefixes which are recognised as valid web links
    """
    prefixes = (
        'https://', 'http://', 'ftp://',
        'dat://', 'i2p://', 'gnunet://', 'payto://',
        'hyper://', 'gemini://', 'gopher://', 'briar:'
    )
    return prefixes
-												Snake case

											
										
										
											2021-12-27 20:43:15 +00:00
def remove_avatar_from_cache(base_dir: str, actor_str: str) -> None:
    """Deletes any cached avatar files for the given actor,
    trying each of the image extensions in turn.
    This avoids duplicate entries with differing extensions
    """
    avatar_prefix = base_dir + '/cache/avatars/' + actor_str + '.'
    for extension in get_image_extensions():
        avatar_filename = avatar_prefix + extension
        if not os.path.isfile(avatar_filename):
            continue
        try:
            os.remove(avatar_filename)
        except OSError:
            # failure to delete is reported but otherwise ignored
            print('EX: remove_avatar_from_cache ' +
                  'unable to delete cached avatar ' +
                  str(avatar_filename))
-												Clearing avatar images from cache before storing updated ones

											
										
										
											2020-02-04 19:34:52 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-26 15:13:34 +00:00
def save_json(json_object: {}, filename: str) -> bool:
    """Saves json to a file, making up to five attempts
    Returns True if the file was written, or False if every attempt
    failed with an OSError.
    If the object cannot be serialised then the exception from
    json.dumps propagates and the existing file is left untouched
    """
    # Serialise before opening the file. Opening with 'w+' truncates it,
    # so a serialisation failure after opening would destroy whatever
    # had previously been saved
    json_str = json.dumps(json_object)

    max_tries = 5
    tries = 1
    while tries <= max_tries:
        try:
            with open(filename, 'w+', encoding='utf-8') as json_file:
                json_file.write(json_str)
                return True
        except OSError:
            print('EX: save_json ' + str(tries) + ' ' + str(filename))
            # wait before retrying, but not after the final attempt
            if tries < max_tries:
                time.sleep(1)
            tries += 1
    return False
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-26 15:28:08 +00:00
def load_json(filename: str, delay_sec: int = 2, max_tries: int = 5) -> {}:
    """Makes a few attempts to load a json formatted file
    filename: path of the file to be read
    delay_sec: seconds to wait between failed attempts
    max_tries: maximum number of attempts
    Returns the parsed json, or None if every attempt failed
    """
    # paths containing /Actor@ are read from the matching /inbox@ path
    if '/Actor@' in filename:
        filename = filename.replace('/Actor@', '/inbox@')
    json_object = None
    tries = 1
    while tries <= max_tries:
        try:
            with open(filename, 'r', encoding='utf-8') as json_file:
                data = json_file.read()
                json_object = json.loads(data)
                break
        except Exception:
            # Exception rather than BaseException, so that
            # KeyboardInterrupt and SystemExit are not swallowed
            print('EX: load_json exception ' +
                  str(tries) + ' ' + str(filename))
            # wait before retrying, but not after the final attempt
            if delay_sec > 0 and tries < max_tries:
                time.sleep(delay_sec)
            tries += 1
    return json_object
-												Tidying the loading and saving of json

											
										
										
											2019-10-22 11:55:06 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-26 15:13:34 +00:00
def load_json_onionify(filename: str, domain: str, onion_domain: str,
                       delay_sec: int = 2, max_tries: int = 5) -> {}:
    """Makes a few attempts to load a json formatted file
    This also converts the domain name to the onion domain
    and replaces https: with http: within the file content
    filename: path of the file to be read
    domain: text to be replaced within the file content
    onion_domain: replacement for the domain
    delay_sec: seconds to wait between failed attempts
    max_tries: maximum number of attempts
    Returns the parsed json, or None if every attempt failed
    """
    # paths containing /Actor@ are read from the matching /inbox@ path
    if '/Actor@' in filename:
        filename = filename.replace('/Actor@', '/inbox@')
    json_object = None
    tries = 0
    while tries < max_tries:
        try:
            with open(filename, 'r', encoding='utf-8') as json_file:
                data = json_file.read()
                if data:
                    data = data.replace(domain, onion_domain)
                    data = data.replace('https:', 'http:')
                json_object = json.loads(data)
                break
        except Exception:
            # Exception rather than BaseException, so that
            # KeyboardInterrupt and SystemExit are not swallowed
            print('EX: load_json_onionify exception ' + str(filename))
            tries += 1
            # wait before retrying, but not after the final attempt
            if delay_sec > 0 and tries < max_tries:
                time.sleep(delay_sec)
    return json_object
-												Onion webfinger requests

											
										
										
											2020-03-02 14:35:44 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-27 17:46:27 +00:00
def get_status_number(published_str: str = None) -> (str, str):
    """Returns the status number and published date
    published_str: optional time formatted as YYYY-MM-DDTHH:MM:SSZ.
    If it is not given then the current UTC time is used
    Returns the status number as a string of digits, together with
    the published time formatted as YYYY-MM-DDTHH:MM:SSZ
    """
    if not published_str:
        # naive UTC time. utcnow() is deprecated from Python 3.12
        curr_time = \
            datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None)
    else:
        curr_time = \
            datetime.datetime.strptime(published_str, '%Y-%m-%dT%H:%M:%SZ')
    days_since_epoch = (curr_time - datetime.datetime(1970, 1, 1)).days
    # the number of milliseconds since epoch
    milliseconds_since_epoch = \
        ((days_since_epoch * 24 * 60 * 60) +
         (curr_time.hour * 60 * 60) +
         (curr_time.minute * 60) +
         curr_time.second) * 1000 + \
        curr_time.microsecond // 1000
    # See https://github.com/tootsuite/mastodon/blob/
    # 995f8b389a66ab76ec92d9a240de376f1fc13a38/lib/mastodon/snowflake.rb
    # use the leftover microseconds as the sequence number
    sequence_id = curr_time.microsecond % 1000
    # shift by 16bits "sequence data"
    status_number = str((milliseconds_since_epoch << 16) + sequence_id)
    published = curr_time.strftime("%Y-%m-%dT%H:%M:%SZ")
    return status_number, published
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Announce function

											
										
										
											2019-07-02 09:25:29 +00:00
-												Snake case

											
										
										
											2021-12-27 17:46:27 +00:00
def evil_incarnate() -> []:
    """Returns the domains which are always blocked
    """
    blocked_domains = (
        'fedilist.com', 'gab.com', 'gabfed.com', 'spinster.xyz',
        'kiwifarms.cc', 'djitter.com'
    )
    return blocked_domains
-												Faster checking for blocked domains

											
										
										
											2020-03-28 10:33:04 +00:00
-												Snake case

											
										
										
											2021-12-27 17:49:35 +00:00
def is_evil(domain: str) -> bool:
    """Returns true if the domain is not a string, contains a
    hostile string or ends with one of the hardcoded blocked domains
    """
    if not isinstance(domain, str):
        print('WARN: Malformed domain ' + str(domain))
        return True
    # if a domain contains any of these strings then it is
    # declaring itself to be hostile
    evil_emporium = (
        'nazi', 'extremis', 'extreemis', 'gendercritic',
        'kiwifarm', 'illegal', 'raplst', 'rapist',
        'rapl.st', 'rapi.st', 'antivax', 'plandemic', 'terror'
    )
    if any(hostile_str in domain for hostile_str in evil_emporium):
        return True
    return any(domain.endswith(concentrated_evil)
               for concentrated_evil in evil_incarnate())
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-27 17:53:41 +00:00
def contains_invalid_chars(json_str: str) -> bool:
    """Returns true if the given json string contains any of
    the invalid characters
    """
    return any(invalid_str in json_str
               for invalid_str in INVALID_CHARACTERS)
-												Extra actor url validation

											
										
										
											2022-12-26 10:49:41 +00:00
def contains_invalid_actor_url_chars(url: str) -> bool:
    """Returns true if the given actor url contains any characters
    which are invalid for actor urls, or invalid in general
    """
    if any(invalid_str in url
           for invalid_str in INVALID_ACTOR_URL_CHARACTERS):
        return True
    return contains_invalid_chars(url)
-												Snake case

											
										
										
											2021-12-27 19:33:45 +00:00
def remove_invalid_chars(text: str) -> str:
    """Removes any invalid characters from a string
    Every occurrence of each INVALID_CHARACTERS entry is deleted
    and the resulting string is returned
    """
    for is_invalid in INVALID_CHARACTERS:
        # replace is a no-op when the entry is absent,
        # so no membership test is needed beforehand
        text = text.replace(is_invalid, '')
    return text
-												Snake case

											
										
										
											2021-12-27 19:26:54 +00:00
def create_person_dir(nickname: str, domain: str, base_dir: str,
                      dir_name: str) -> str:
    """Create a directory for a person
    The account directory for nickname@domain is created if it does not
    exist, then the dir_name subdirectory is created within it.
    Returns the path of the subdirectory
    """
    handle = nickname + '@' + domain
    handle_dir = acct_handle_dir(base_dir, handle)
    if not os.path.isdir(handle_dir):
        os.mkdir(handle_dir)
    # reuse the account directory path rather than recalculating it
    box_dir = handle_dir + '/' + dir_name
    if not os.path.isdir(box_dir):
        os.mkdir(box_dir)
    return box_dir
-												Save posts to inbox to a queue

											
										
										
											2019-07-04 10:02:56 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-27 17:57:27 +00:00
def create_outbox_dir(nickname: str, domain: str, base_dir: str) -> str:
    """Create an outbox for a person
    Returns the path of the 'outbox' directory for the account
    """
    return create_person_dir(nickname, domain, base_dir, 'outbox')
-												Save posts to inbox to a queue

											
										
										
											2019-07-04 10:02:56 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-27 18:00:51 +00:00
def create_inbox_queue_dir(nickname: str, domain: str, base_dir: str) -> str:
    """Create an inbox queue for a person
    Returns the path of the 'queue' directory for the account
    """
    return create_person_dir(nickname, domain, base_dir, 'queue')
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Consolidate permissions functions

											
										
										
											2019-07-02 10:39:55 +00:00
-												Snake case

											
										
										
											2021-12-27 19:26:54 +00:00
def domain_permitted(domain: str, federation_list: []) -> bool:
    """Is the given domain permitted according to the federation list?
    An empty (or missing) federation list permits every domain.
    Otherwise the domain, with any port removed, must be in the list
    """
    # truthiness test matches url_permitted and tolerates None
    if not federation_list:
        return True
    domain = remove_domain_port(domain)
    return domain in federation_list
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-27 20:47:05 +00:00
def url_permitted(url: str, federation_list: []) -> bool:
    """Is the given url permitted according to the federation list?
    Urls which is_evil flags are never permitted.
    An empty federation list permits every other url
    """
    if is_evil(url):
        return False
    if not federation_list:
        return True
    # NOTE: this is a substring match, so a federated domain appearing
    # anywhere within the url is enough to permit it
    return any(domain in url for domain in federation_list)
-												Receive follow accept

											
										
										
											2019-07-06 15:17:21 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-27 20:43:15 +00:00
def get_local_network_addresses() -> []:
    """Returns patterns for local network address detection
    The patterns are returned as a tuple of strings
    """
    return ('localhost', '127.0.', '192.168', '10.0.')
-												Snake case

											
										
										
											2021-12-27 21:42:08 +00:00
def is_local_network_address(ip_address: str) -> bool:
    """Is the given ip address local?
    Returns True if the address begins with any of the patterns
    from get_local_network_addresses
    """
    # str.startswith accepts a tuple of candidate prefixes
    return ip_address.startswith(tuple(get_local_network_addresses()))
-												Check html for spyware

											
										
										
											2022-03-22 18:22:09 +00:00
def _is_dangerous_string_tag(content: str, allow_local_network_access: bool,
                             separators: [], invalid_strings: []) -> bool:
    """Returns true if the given string is dangerous
    Each separator is a [start, end] pair, such as ['<', '>'].
    The text between each start and end is treated as markup and is
    checked against the invalid strings, and also against local network
    address patterns if local network access is not allowed.
    Invalid strings ending with '-' only match the beginning of the markup.
    Other invalid strings match anywhere within markup which has no spaces,
    or must be followed by a space within markup which contains spaces
    """
    # the local network patterns do not depend on the separator
    invalid_partials = ()
    if not allow_local_network_access:
        invalid_partials = get_local_network_addresses()

    for separator_style in separators:
        start_char = separator_style[0]
        end_char = separator_style[1]
        if start_char not in content:
            continue
        if end_char not in content:
            continue
        for markup in content.split(start_char):
            if end_char not in markup:
                continue
            markup = markup.split(end_char)[0].strip()
            for partial_match in invalid_partials:
                if partial_match in markup:
                    return True
            has_space = ' ' in markup
            for bad_str in invalid_strings:
                if bad_str.endswith('-'):
                    # prefix style match, eg. 'amp-'
                    if markup.startswith(bad_str):
                        return True
                elif has_space:
                    # markup has attributes, so match the string
                    # followed by a space
                    if bad_str + ' ' in markup:
                        return True
                elif bad_str in markup:
                    return True
    return False
 								def _is_dangerous_string_simple(content: str, allow_local_network_access: bool,
 								                                separators: [], invalid_strings: []) -> bool:
 								    """Returns true if the given string is dangerous
 								    """
 								    for separator_style in separators:
 								        start_char = separator_style[0]
 								        end_char = separator_style[1]
 								        if start_char not in content:
 								            continue
 								        if end_char not in content:
 								            continue
 								        content_sections = content.split(start_char)
 								        invalid_partials = ()
 								        if not allow_local_network_access:
 								            invalid_partials = get_local_network_addresses()
 								        for markup in content_sections:
 								            if end_char not in markup:
 								                continue
 								            markup = markup.split(end_char)[0].strip()
 								            for partial_match in invalid_partials:
 								                if partial_match in markup:
 								                    return True
 								            for bad_str in invalid_strings:
 								                if bad_str in markup:
 								                    return True
-												Check for dangerous markup in display name and clearly indicate adversaries

											
										
										
											2021-01-31 11:05:17 +00:00
+								    return False
-												Fix checking of closing markup

											
										
										
											2023-01-19 15:17:20 +00:00
def html_tag_has_closing(tag_name: str, content: str) -> bool:
    """Does the given tag have opening and closing labels?
    Returns True if the tag does not appear within the content, or if
    every opening tag is followed by a closing tag.
    For code and pre tags False is also returned if any line between
    the opening and closing tags is 60 or more characters long.
    The content is converted to lower case before matching
    """
    content_lower = content.lower()
    start_tag = '<' + tag_name
    end_tag = '</' + tag_name + '>'
    # the first section is the text before the first opening tag
    for section in content_lower.split(start_tag)[1:]:
        # check that an ending tag exists
        if end_tag not in section:
            return False
        if tag_name in ('code', 'pre'):
            # check that lines are not too long
            section = section.split(end_tag)[0]
            section = section.replace('<br>', '\n')
            for line in section.split('\n'):
                if len(line) >= 60:
                    print('<code> or <pre> line too long')
                    return False
    return True
-												Allow pre tag through dangerous markup filter in some cases, then remove it when rendering

											
										
										
											2023-05-18 11:15:18 +00:00
def dangerous_markup(content: str, allow_local_network_access: bool,
                     allow_tags: []) -> bool:
    """Returns true if the given content contains dangerous html markup
    allow_tags is a list of tag strings which are removed from the
    list of invalid tags before the content is checked
    """
    # avoid svg image links within content
    if '.svg' in content.lower():
        return True
    separators = [['<', '>'], ['&lt;', '&gt;']]
    # strings which are not permitted anywhere within markup
    invalid_strings = [
        'ampproject', 'googleapis', '_exec(', ' id=', ' name='
    ]
    if _is_dangerous_string_simple(content, allow_local_network_access,
                                   separators, invalid_strings):
        return True
    # code and pre tags must be closed and have short lines
    for closing_tag in ('code', 'pre'):
        if not html_tag_has_closing(closing_tag, content):
            return True
    allowed = allow_tags or ()
    invalid_strings = [
        tag for tag in (
            'script', 'noscript', 'canvas', 'style', 'abbr', 'input',
            'frame', 'iframe', 'html', 'body', 'hr', 'allow-popups',
            'allow-scripts', 'amp-', '?php', 'pre'
        ) if tag not in allowed
    ]
    return _is_dangerous_string_tag(content, allow_local_network_access,
                                    separators, invalid_strings)
-												Don't allow svg files containing scripts

											
										
										
											2021-09-13 17:51:33 +00:00
-												Snake case

											
										
										
											2021-12-27 21:44:48 +00:00
def dangerous_svg(content: str, allow_local_network_access: bool) -> bool:
    """Returns true if the given svg file content contains dangerous scripts
    Markup within either <> or &lt;&gt; is checked for 'script'
    """
    separators = [['<', '>'], ['&lt;', '&gt;']]
    invalid_strings = [
        'script'
    ]
    return _is_dangerous_string_tag(content, allow_local_network_access,
                                    separators, invalid_strings)
-												Don't allow svg files containing scripts

											
										
										
											2021-09-13 17:51:33 +00:00
-												More general

											
										
										
											2023-08-14 19:01:15 +00:00
def _get_statuses_list() -> []:
    """Returns a list of statuses path strings
    These are the url path sections which indicate a post,
    returned as a tuple of strings
    """
    return ('/statuses/', '/objects/', '/p/')
 								def contains_statuses(url: str) -> bool:
 								    """Whether the given url contains /statuses/
 								    """
 								    statuses_list = _get_statuses_list()
 								    for status_str in statuses_list:
 								        if status_str in url:
 								            return True
 								    return False
-												Tidying

											
										
										
											2023-08-03 17:31:47 +00:00
def get_actor_from_post_id(post_id: str) -> str:
    """Returns an actor url from a post id containing /statuses/ or equivalent
    eg. https://somedomain/users/nick/statuses/123 becomes
    https://somedomain/users/nick
    If no statuses path is found then the post id is returned unchanged
    """
    actor = post_id
    pixelfed_style_statuses = ['/p/']
    for status_str in _get_statuses_list():
        if status_str not in actor:
            continue
        if status_str in pixelfed_style_statuses:
            # pixelfed style post id, where the nickname is the first
            # path section after the statuses string
            sections = actor.split(status_str)
            nick = sections[1].split('/')[0]
            actor = sections[0] + '/users/' + nick
            break
        if has_users_path(actor):
            actor = actor.split(status_str)[0]
            break
    return actor
-												Snake case

											
										
										
											2021-12-27 21:59:07 +00:00
def get_display_name(base_dir: str, actor: str, person_cache: {}) -> str:
    """Returns the display name for the given actor
    The actor may also be given as a post id.
    None is returned if the actor is not within the person cache
    or if no name was found.
    Names containing dangerous markup are replaced by *ADVERSARY*
    """
    actor = get_actor_from_post_id(actor)
    cached_person = person_cache.get(actor)
    if not cached_person:
        return None
    name_found = None
    if cached_person.get('actor'):
        if cached_person['actor'].get('name'):
            name_found = cached_person['actor']['name']
    else:
        # Try to obtain from the cached actors
        cached_actor_filename = \
            base_dir + '/cache/actors/' + (actor.replace('/', '#')) + '.json'
        if os.path.isfile(cached_actor_filename):
            actor_json = load_json(cached_actor_filename, 1)
            if actor_json:
                if actor_json.get('name'):
                    name_found = actor_json['name']
    if name_found:
        if dangerous_markup(name_found, False, []):
            name_found = "*ADVERSARY*"
    # remove fancy unicode characters from the name
    return standardize_text(name_found)
-												Use preferred names in posts

											
										
										
											2019-08-22 12:41:16 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Show handle if display name is a single emoji

											
										
										
											2022-05-02 19:22:00 +00:00
def display_name_is_emoji(display_name: str) -> bool:
    """Returns true if the given display name is an emoji
    The name is an emoji if every space separated word within it
    is at least two characters long and both begins and ends with ':'
    """
    # a name without spaces is handled as a single word, so that the
    # same rules apply to single and multiple emoji names
    for wrd in display_name.split(' '):
        # a lone ':' is not an emoji
        if len(wrd) < 2:
            return False
        if not wrd.startswith(':'):
            return False
        if not wrd.endswith(':'):
            return False
    return True
-												Snake case

											
										
										
											2021-12-27 22:12:29 +00:00
def _gender_from_string(translate: {}, text: str) -> str:
    """Given some text, does it contain a gender description?
    Returns 'He/Him', 'She/Her' or None if no description was found.
    The translate dictionary needs to contain the keys
    'He/Him', 'boy', 'She/Her' and 'girl'
    """
    if not text:
        return None
    text_orig = text
    text = text.lower()
    # 'male' is a substring of 'female', so ignore any occurrences
    # of 'female' when looking for 'male'
    has_male = 'male' in text.replace('female', '')
    gender = None
    if translate['He/Him'].lower() in text or \
       translate['boy'].lower() in text:
        gender = 'He/Him'
    elif (translate['She/Her'].lower() in text or
          translate['girl'].lower() in text):
        gender = 'She/Her'
    elif 'him' in text or has_male:
        gender = 'He/Him'
    elif 'her' in text or 'she' in text or \
         'fem' in text or 'woman' in text:
        gender = 'She/Her'
    elif 'man' in text or 'He' in text_orig:
        # capitalised He is matched within the original text
        gender = 'He/Him'
    return gender
-												Snake case

											
										
										
											2021-12-27 22:12:29 +00:00
+								def get_gender_from_bio(base_dir: str, actor: str, person_cache: {},
 								                        translate: {}) -> str:
-												Gender detaction for SSML

											
										
										
											2021-03-03 13:02:47 +00:00
+								    """Tries to ascertain gender from bio description
-												Tidying

											
										
										
											2021-06-24 19:25:39 +00:00
+								    This is for use by text-to-speech for pitch setting
-												Gender detaction for SSML

											
										
										
											2021-03-03 13:02:47 +00:00
+								    """
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								    default_gender = 'They/Them'
-												Tidying

											
										
										
											2023-08-03 17:31:47 +00:00
+								    actor = get_actor_from_post_id(actor)
-												Snake case

											
										
										
											2021-12-25 22:17:49 +00:00
+								    if not person_cache.get(actor):
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								        return default_gender
 								    bio_found = None
-												Fix unit tests

											
										
										
											2021-03-03 19:15:32 +00:00
+								    if translate:
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								        pronoun_str = translate['pronoun'].lower()
-												Fix unit tests

											
										
										
											2021-03-03 19:15:32 +00:00
+								    else:
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								        pronoun_str = 'pronoun'
-												Snake case

											
										
										
											2021-12-26 10:29:52 +00:00
+								    actor_json = None
-												Snake case

											
										
										
											2021-12-25 22:17:49 +00:00
+								    if person_cache[actor].get('actor'):
-												Snake case

											
										
										
											2021-12-26 10:29:52 +00:00
+								        actor_json = person_cache[actor]['actor']
-												Gender detaction for SSML

											
										
										
											2021-03-03 13:02:47 +00:00
+								    else:
 								        # Try to obtain from the cached actors
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								        cached_actor_filename = \
-												Snake case

											
										
										
											2021-12-25 16:17:53 +00:00
+								            base_dir + '/cache/actors/' + (actor.replace('/', '#')) + '.json'
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								        if os.path.isfile(cached_actor_filename):
 								            actor_json = load_json(cached_actor_filename, 1)
-												Snake case

											
										
										
											2021-12-26 10:29:52 +00:00
+								    if not actor_json:
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								        return default_gender
-												Tidying

											
										
										
											2021-06-24 19:10:23 +00:00
+								    # is gender defined as a profile tag?
-												Snake case

											
										
										
											2021-12-26 10:29:52 +00:00
+								    if actor_json.get('attachment'):
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								        tags_list = actor_json['attachment']
 								        if isinstance(tags_list, list):
-												Tidying

											
										
										
											2021-06-24 19:25:39 +00:00
+								            # look for a gender field name
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								            for tag in tags_list:
-												Tidying

											
										
										
											2021-06-24 19:10:23 +00:00
+								                if not isinstance(tag, dict):
 								                    continue
-												Supporting alternative name and value properties in attachments

											
										
										
											2022-05-11 18:04:58 +00:00
+								                name_value = None
 								                if tag.get('name'):
 								                    name_value = tag['name']
 								                if tag.get('schema:name'):
 								                    name_value = tag['schema:name']
 								                if not name_value:
-												Tidying

											
										
										
											2021-06-24 19:10:23 +00:00
+								                    continue
-												Supporting alternative name and value properties in attachments

											
										
										
											2022-05-11 18:04:58 +00:00
+								                prop_value_name, _ = get_attachment_property_value(tag)
 								                if not prop_value_name:
 								                    continue
 								                if name_value.lower() == \
-												Tidying

											
										
										
											2021-06-24 19:10:23 +00:00
+								                   translate['gender'].lower():
-												Tidying

											
										
										
											2022-05-11 18:16:20 +00:00
+								                    bio_found = tag[prop_value_name]
-												Tidying

											
										
										
											2021-06-24 19:10:23 +00:00
+								                    break
-												Supporting alternative name and value properties in attachments

											
										
										
											2022-05-11 18:04:58 +00:00
+								                if name_value.lower().startswith(pronoun_str):
-												Tidying

											
										
										
											2022-05-11 18:16:20 +00:00
+								                    bio_found = tag[prop_value_name]
-												Tidying

											
										
										
											2021-06-24 19:10:23 +00:00
+								                    break
-												Tidying

											
										
										
											2021-06-24 19:25:39 +00:00
+								            # the field name could be anything,
 								            # just look at the value
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								            if not bio_found:
 								                for tag in tags_list:
-												Tidying

											
										
										
											2021-06-24 19:25:39 +00:00
+								                    if not isinstance(tag, dict):
 								                        continue
-												Supporting alternative name and value properties in attachments

											
										
										
											2022-05-11 18:04:58 +00:00
+								                    if not tag.get('name') and not tag.get('schema:name'):
 								                        continue
 								                    prop_value_name, _ = get_attachment_property_value(tag)
 								                    if not prop_value_name:
-												Tidying

											
										
										
											2021-06-24 19:25:39 +00:00
+								                        continue
-												Supporting alternative name and value properties in attachments

											
										
										
											2022-05-11 18:04:58 +00:00
+								                    gender = \
 								                        _gender_from_string(translate, tag[prop_value_name])
-												Tidying

											
										
										
											2021-06-24 19:25:39 +00:00
+								                    if gender:
 								                        return gender
-												Tidying

											
										
										
											2021-06-24 19:10:23 +00:00
+								    # if not then use the bio
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								    if not bio_found and actor_json.get('summary'):
 								        bio_found = actor_json['summary']
 								    if not bio_found:
 								        return default_gender
 								    gender = _gender_from_string(translate, bio_found)
-												Tidying

											
										
										
											2021-06-24 19:25:39 +00:00
+								    if not gender:
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
+								        gender = default_gender
-												Gender detaction for SSML

											
										
										
											2021-03-03 13:02:47 +00:00
+								    return gender
-												Snake case

											
										
										
											2021-12-27 22:19:18 +00:00
def get_nickname_from_actor(actor: str) -> str:
    """Extracts the account nickname from an actor url or handle

    A leading '@' is ignored. The forms tried, in order, are:
    a url containing one of the known users paths
    (e.g. https://domain/users/nick), https://domain/@nick,
    nick@domain and finally https://domain/nick.
    Returns None if no nickname could be extracted
    """
    if actor.startswith('@'):
        actor = actor[1:]

    # urls which contain one of the known users paths
    for users_path in get_user_paths():
        if users_path not in actor:
            continue
        after_path = actor.split(users_path)[1].replace('@', '')
        # anything after the nickname is dropped
        return after_path.split('/')[0]

    if '/@/' not in actor:
        if '/@' in actor:
            # https://domain/@nick
            return actor.split('/@')[1].split('/')[0]
        if '@' in actor:
            # nick@domain
            return actor.split('@')[0]

    if '://' not in actor:
        return None

    # https://domain/nick
    domain = actor.split('://')[1].split('/')[0]
    domain_prefix = '://' + domain + '/'
    if domain_prefix not in actor:
        return None
    nickname = actor.split(domain_prefix)[1]
    # further path sections or a file extension mean this isn't a nickname
    if '/' in nickname or '.' in nickname:
        return None
    return nickname
-												Receive follow accept

											
										
										
											2019-07-06 15:17:21 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-26 12:24:40 +00:00
def get_user_paths() -> []:
    """Returns the url path sections which can precede a nickname
    within an actor url
    e.g. /users/nickname, /channel/nickname
    """
    user_paths = (
        '/users/', '/profile/', '/accounts/', '/channel/', '/u/',
        '/c/', '/m/', '/video-channels/', '/author/',
        '/activitypub/', '/actors/', '/snac/', '/@/', '/~/',
        '/fediverse/blog/', '/user/'
    )
    return user_paths
-												Function to return user paths

											
										
										
											2021-07-04 22:58:01 +00:00
-												Snake case

											
										
										
											2021-12-26 17:53:07 +00:00
def get_group_paths() -> []:
    """Returns the url path sections which can precede a group name
    e.g. https://lemmy/c/groupname
    """
    group_paths = ['/c/', '/video-channels/', '/m/']
    return group_paths
-												Detecting group handle

											
										
										
											2021-07-30 13:00:23 +00:00
-												Snake case

											
										
										
											2021-12-27 19:05:25 +00:00
def get_domain_from_actor(actor: str) -> (str, int):
    """Returns the domain name and port from an actor url or handle

    A leading '@' is ignored. Three forms are recognised:
    https://domain/@nick, nick@domain, and any other url, for which
    the domain is the text before the first '/' once every protocol
    prefix has been removed.
    The returned port is None when the domain contains no ':',
    otherwise it is whatever get_port_from_domain returns
    """
    if actor.startswith('@'):
        actor = actor[1:]
    port = None
    prefixes = get_protocol_prefixes()
    # '/@/' is a users path rather than an '@nick' marker
    at_is_users_path = '/@/' in actor
    # NOTE: urls containing a known users path need no special handling,
    # because every branch below assigns the domain itself
    if '/@' in actor and not at_is_users_path:
        # https://domain/@nick
        domain = actor.split('/@')[0]
        for prefix in prefixes:
            domain = domain.replace(prefix, '')
    elif '@' in actor and not at_is_users_path:
        # nick@domain
        domain = actor.split('@')[1].strip()
    else:
        # https://domain/users/nick, or anything else
        domain = actor
        for prefix in prefixes:
            domain = domain.replace(prefix, '')
        # a no-op when there is no '/' present
        domain = domain.split('/')[0]
    if ':' in domain:
        port = get_port_from_domain(domain)
        domain = remove_domain_port(domain)
    return domain, port
-												Snake case

											
										
										
											2021-12-27 19:26:54 +00:00
def _set_default_pet_name(base_dir: str, nickname: str, domain: str,
                          follow_nickname: str, follow_domain: str) -> None:
    """Adds a default petname for a followed account to petnames.txt
    within the account directory, unless a line beginning with the
    followed nickname is already there.
    This helps especially when using onion or i2p address
    """
    domain = remove_domain_port(domain)
    petnames_filename = \
        acct_dir(base_dir, nickname, domain) + '/petnames.txt'

    petname_prefix = follow_nickname + ' '
    new_entry = \
        petname_prefix + follow_nickname + '@' + follow_domain + '\n'

    if os.path.isfile(petnames_filename):
        with open(petnames_filename, 'r', encoding='utf-8') as fp_pet:
            existing_petnames = fp_pet.read()
        for existing_line in existing_petnames.split('\n'):
            if existing_line.startswith(petname_prefix):
                # petname already exists
                return
        # petname doesn't already exist, so add it to the end
        write_mode = 'a+'
    else:
        # there is no existing petnames lookup file
        write_mode = 'w+'

    with open(petnames_filename, write_mode, encoding='utf-8') as fp_pet:
        fp_pet.write(new_entry)
-												Create default petname when following

											
										
										
											2020-11-23 15:07:55 +00:00
-												Snake case

											
										
										
											2021-12-27 17:08:19 +00:00
def follow_person(base_dir: str, nickname: str, domain: str,
                  follow_nickname: str, follow_domain: str,
                  federation_list: [], debug: bool,
                  group_account: bool,
                  follow_file: str = 'following.txt') -> bool:
    """Adds follow_nickname@follow_domain to the follow file of the
    account nickname@domain

    The followed handle is first removed from the unfollowed.txt file of
    the account, if it appears there. When follow_file ends with
    following.txt the followed account is also added to the calendar
    and is given a default petname.
    Returns False if the followed domain is not permitted or if the
    account directory does not exist, otherwise True
    """
    permitted_check_domain = remove_eol(follow_domain.lower())
    if not domain_permitted(permitted_check_domain, federation_list):
        if debug:
            print('DEBUG: follow of domain ' +
                  follow_domain + ' not permitted')
        return False
    if debug:
        print('DEBUG: follow of domain ' + follow_domain)

    # handle of the account doing the following, without any port
    local_domain = domain
    if ':' in domain:
        local_domain = remove_domain_port(domain)
    handle = nickname + '@' + local_domain

    if not os.path.isdir(acct_handle_dir(base_dir, handle)):
        print('WARN: account for ' + handle + ' does not exist')
        return False

    # group handles are marked with a leading exclamation mark
    group_prefix = '!' if group_account else ''

    # the handle looked up within the unfollowed file has no port
    followed_domain = follow_domain
    if ':' in follow_domain:
        followed_domain = remove_domain_port(follow_domain)
    handle_to_follow = group_prefix + follow_nickname + '@' + followed_domain

    # was this person previously unfollowed?
    unfollowed_filename = acct_handle_dir(base_dir, handle) + '/unfollowed.txt'
    if os.path.isfile(unfollowed_filename) and \
       text_in_file(handle_to_follow, unfollowed_filename):
        # remove them from the unfollowed file
        with open(unfollowed_filename, 'r',
                  encoding='utf-8') as fp_unfoll:
            remaining = ''.join(
                line for line in fp_unfoll.readlines()
                if handle_to_follow not in line)
        with open(unfollowed_filename, 'w+',
                  encoding='utf-8') as fp_unfoll:
            fp_unfoll.write(remaining)

    accounts_dir = base_dir + '/accounts'
    if not os.path.isdir(accounts_dir):
        os.mkdir(accounts_dir)

    # the handle stored within the follow file keeps the domain as given
    handle_to_follow = group_prefix + follow_nickname + '@' + follow_domain
    follow_entry = handle_to_follow + '\n'
    filename = acct_handle_dir(base_dir, handle) + '/' + follow_file
    if not os.path.isfile(filename):
        # first follow
        if debug:
            print('DEBUG: ' + handle +
                  ' creating new following file to follow ' +
                  handle_to_follow +
                  ', filename is ' + filename)
        with open(filename, 'w+', encoding='utf-8') as fp_foll:
            fp_foll.write(follow_entry)
    else:
        if text_in_file(handle_to_follow, filename):
            if debug:
                print('DEBUG: follow already exists')
            return True
        # prepend to follow file
        try:
            with open(filename, 'r+', encoding='utf-8') as fp_foll:
                existing = fp_foll.read()
                if follow_entry not in existing:
                    fp_foll.seek(0, 0)
                    fp_foll.write(follow_entry + existing)
                    print('DEBUG: follow added')
        except OSError as ex:
            print('WARN: Failed to write entry to follow file ' +
                  filename + ' ' + str(ex))

    if follow_file.endswith('following.txt'):
        # Default to adding new follows to the calendar.
        # Possibly this could be made optional
        # if following a person add them to the list of
        # calendar follows
        print('DEBUG: adding ' +
              follow_nickname + '@' + follow_domain + ' to calendar of ' +
              nickname + '@' + domain)
        add_person_to_calendar(base_dir, nickname, domain,
                               follow_nickname, follow_domain)
        # add a default petname
        _set_default_pet_name(base_dir, nickname, domain,
                              follow_nickname, follow_domain)
    return True
-												Move shared inbox account into daemon

											
										
										
											2019-07-11 12:29:31 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-27 22:32:59 +00:00
def votes_on_newswire_item(status: []) -> int:
    """Counts the entries within the status list of a newswire item
    which contain the text 'vote:'
    """
    return sum(1 for entry in status if 'vote:' in entry)
-												Apply voting threshold to timeline

											
										
										
											2020-10-08 19:47:23 +00:00
-												Snake case

											
										
										
											2021-12-27 22:38:48 +00:00
def locate_news_votes(base_dir: str, domain: str,
                      post_url: str) -> str:
    """Finds the votes file belonging to a news post.
    The file is looked for within the outbox of the news account.
    Returns its filename, or None if there is no such file
    """
    url_no_eol = remove_eol(post_url.strip())

    # convert the url into the name used for the stored post
    post_id = remove_id_ending(url_no_eol.strip()).replace('/', '#')

    if post_id.endswith('.json'):
        votes_name = post_id + '.votes'
    else:
        votes_name = post_id + '.json.votes'

    news_dir = base_dir + '/accounts/news@' + domain + '/'
    votes_filename = news_dir + 'outbox/' + votes_name
    if not os.path.isfile(votes_filename):
        return None
    return votes_filename
-												Snake case

											
										
										
											2021-12-27 22:46:10 +00:00
def locate_news_arrival(base_dir: str, domain: str,
                        post_url: str) -> str:
    """Returns the arrival time for a news post
    within the news user account.
    The time is read from the .arrived file which accompanies the post
    within the outbox of the news account, and is expected to have
    the format YYYY-MM-DDTHH:MM:SSZ.
    NOTE: despite the str return annotation the value returned is a
    datetime object. None is returned if the file doesn't exist,
    can't be read, is empty or doesn't contain a valid date
    """
    post_url1 = post_url.strip()
    post_url = remove_eol(post_url1)

    # convert the url into the name used for the stored post
    post_url = remove_id_ending(post_url.strip()).replace('/', '#')

    if post_url.endswith('.json'):
        post_url = post_url + '.arrived'
    else:
        post_url = post_url + '.json.arrived'

    account_dir = base_dir + '/accounts/news@' + domain + '/'
    post_filename = account_dir + 'outbox/' + post_url
    if not os.path.isfile(post_filename):
        return None

    try:
        with open(post_filename, 'r', encoding='utf-8') as arrival_file:
            arrival = arrival_file.read()
    except OSError:
        print('EX: locate_news_arrival unable to read ' +
              str(post_filename))
        return None

    # tolerate a trailing newline or other surrounding whitespace,
    # which strptime would otherwise reject
    arrival = arrival.strip()
    if not arrival:
        return None

    try:
        return datetime.datetime.strptime(arrival, "%Y-%m-%dT%H:%M:%SZ")
    except ValueError:
        # a damaged arrival file should not stop the caller
        print('EX: locate_news_arrival unrecognized arrival date ' +
              str(arrival))
    return None
-												Snake case

											
										
										
											2021-12-28 10:17:58 +00:00
def clear_from_post_caches(base_dir: str, recent_posts_cache: {},
                           post_id: str) -> None:
    """Clears cached html for the given post, so that edits
    to news will appear.
    The cached html file is removed from the postcache directory of
    every account directory (those containing '@', other than the
    inbox@ and Actor@ directories), and the post is also removed from
    the index, json and html sections of recent_posts_cache.
    Files which can't be deleted are reported and otherwise ignored
    """
    filename = '/postcache/' + post_id + '.html'
    accounts_dir = base_dir + '/accounts'
    for _, dirs, _ in os.walk(accounts_dir):
        for acct in dirs:
            if '@' not in acct:
                continue
            if acct.startswith(('inbox@', 'Actor@')):
                continue
            post_filename = os.path.join(accounts_dir, acct) + filename
            if not os.path.isfile(post_filename):
                continue
            try:
                os.remove(post_filename)
            except OSError:
                print('EX: clear_from_post_caches file not removed ' +
                      str(post_filename))
        # only the top level of the accounts directory is of interest
        break

    # if the post is in the recent posts cache then remove it.
    # This doesn't depend upon the account, so it's done once here
    # rather than for each account directory, and also happens when
    # there are no account directories
    if not recent_posts_cache:
        return
    index = recent_posts_cache.get('index')
    if index:
        while post_id in index:
            index.remove(post_id)
    for section in ('json', 'html'):
        cached = recent_posts_cache.get(section)
        if cached:
            # pop also evicts entries whose cached value is empty
            cached.pop(post_id, None)
-												Clear post from caches before updating

											
										
										
											2020-10-18 16:19:28 +00:00
-												Snake case

											
										
										
											2021-12-26 20:36:08 +00:00
def locate_post(base_dir: str, nickname: str, domain: str,
                post_url: str, replies: bool = False) -> str:
    """Finds the file in which the post with the given url is stored.
    The inbox, outbox and tlblogs of the account are searched first,
    then the outbox of the news account and finally the announce cache.
    If replies is True then the .replies file is located rather
    than the .json file. Returns None if nothing was found
    """
    extension = 'replies' if replies else 'json'

    # convert the url into the name used for stored posts
    post_name = remove_id_ending(post_url.strip()).replace('/', '#')
    post_name = post_name + '.' + extension

    # look within the boxes of the account
    acct_path = acct_dir(base_dir, nickname, domain) + '/'
    for box in ('inbox', 'outbox', 'tlblogs'):
        candidate = acct_path + box + '/' + post_name
        if os.path.isfile(candidate):
            return candidate

    # is it a news post?
    news_path = base_dir + '/accounts/news' + '@' + domain + '/'
    candidate = news_path + 'outbox/' + post_name
    if os.path.isfile(candidate):
        return candidate

    # is it within the announce cache?
    candidate = base_dir + '/cache/announce/' + nickname + '/' + post_name
    if os.path.isfile(candidate):
        return candidate

    return None
-												Recursive delete

											
										
										
											2019-07-14 16:37:01 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-28 10:25:50 +00:00
def _get_published_date(post_json_object: {}) -> str:
    """Extracts the published date from the given post.
    The date on the post itself is preferred, falling back to
    the date on its object. Returns None if there is no date
    or if the date is not a string
    """
    published = post_json_object.get('published')
    if not published:
        published = None
        if has_object_dict(post_json_object):
            published = post_json_object['object'].get('published')
    if published and isinstance(published, str):
        return published
    return None
-												Snake case

											
										
										
											2021-12-28 10:25:50 +00:00
def get_reply_interval_hours(base_dir: str, nickname: str, domain: str,
                             default_reply_interval_hrs: int) -> int:
    """Returns the reply interval for the given account.
    The reply interval is the number of hours after a post being made
    during which replies are allowed.
    The value is read from the .reply_interval_hours file within the
    account directory. If that file doesn't exist, can't be read or
    doesn't contain a whole number then default_reply_interval_hrs
    is returned
    """
    reply_interval_filename = \
        acct_dir(base_dir, nickname, domain) + '/.reply_interval_hours'
    if not os.path.isfile(reply_interval_filename):
        return default_reply_interval_hrs

    try:
        with open(reply_interval_filename, 'r',
                  encoding='utf-8') as interval_file:
            hours_str = interval_file.read()
    except OSError:
        print('EX: get_reply_interval_hours unable to read ' +
              str(reply_interval_filename))
        return default_reply_interval_hrs

    # a trailing newline, such as from manual editing of the file,
    # should not cause the stored value to be ignored
    hours_str = hours_str.strip()

    # isdecimal rather than isdigit, because isdigit also accepts
    # characters such as superscript digits which int() rejects
    if hours_str.isdecimal():
        return int(hours_str)
    return default_reply_interval_hrs
-												Implement reply interval in hours

The time after publication of a post during which replies are permitted

											
										
										
											2021-09-08 18:37:04 +00:00
-												Snake case

											
										
										
											2021-12-28 12:15:46 +00:00
def set_reply_interval_hours(base_dir: str, nickname: str, domain: str,
                             reply_interval_hours: int) -> bool:
    """Stores the reply interval for the given account.
    This is the number of hours after a post is made during which
    replies to it are allowed.
    Returns True if the interval was saved, or False if the
    file could not be written
    """
    interval_path = \
        acct_dir(base_dir, nickname, domain) + '/.reply_interval_hours'
    try:
        with open(interval_path, 'w+', encoding='utf-8') as fp_interval:
            fp_interval.write(str(reply_interval_hours))
    except OSError:
        print('EX: set_reply_interval_hours unable to save reply interval ' +
              str(interval_path) + ' ' +
              str(reply_interval_hours))
        return False
    return True
-												Snake case

											
										
										
											2021-12-28 12:15:46 +00:00
def can_reply_to(base_dir: str, nickname: str, domain: str,
                 post_url: str, reply_interval_hours: int,
                 curr_date_str: str = None,
                 post_json_object: {} = None) -> bool:
    """Is replying to the given local post permitted?
    This is a spam mitigation feature, so that spammers can't
    add a lot of replies to old post which you don't notice.

    Replies are always permitted if post_url doesn't contain /statuses/
    or if the post is not stored locally. Otherwise the number of whole
    hours since the post was published must be at least zero and less
    than reply_interval_hours.
    curr_date_str optionally supplies the current time in the format
    YYYY-MM-DDTHH:MM:SSZ, otherwise the current UTC time is used.
    post_json_object optionally supplies the post, which avoids
    needing to load it from file.
    Returns False if the post can't be loaded or if either date
    can't be parsed
    """
    if '/statuses/' not in post_url:
        return True
    if not post_json_object:
        post_filename = locate_post(base_dir, nickname, domain, post_url)
        if not post_filename:
            # the post is not stored locally
            return True
        post_json_object = load_json(post_filename)
    if not post_json_object:
        return False
    published = _get_published_date(post_json_object)
    if not published:
        return False

    date_format = '%Y-%m-%dT%H:%M:%SZ'

    # only catch parsing failures, so that KeyboardInterrupt and
    # SystemExit are not swallowed
    try:
        pub_date = datetime.datetime.strptime(published, date_format)
    except (ValueError, TypeError):
        print('EX: can_reply_to unrecognized published date ' + str(published))
        return False

    if not curr_date_str:
        # naive UTC time, so that it can be compared with the
        # naive published date
        curr_date = \
            datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None)
    else:
        try:
            curr_date = \
                datetime.datetime.strptime(curr_date_str, date_format)
        except (ValueError, TypeError):
            print('EX: can_reply_to unrecognized current date ' +
                  str(curr_date_str))
            return False

    hours_since_publication = \
        int((curr_date - pub_date).total_seconds() / 3600)
    if hours_since_publication < 0 or \
       hours_since_publication >= reply_interval_hours:
        return False
    return True
-												Snake case

											
										
										
											2021-12-28 13:49:44 +00:00
def _remove_attachment(base_dir: str, http_prefix: str, domain: str,
                       post_json: {}):
    """Removes media files for an attachment.
    Only the first attachment of the post is considered. Its url is
    converted into a filename beneath base_dir, then that file together
    with any accompanying .vtt transcript and .etag file is deleted,
    and the attachment list of the post is emptied.
    Nothing is done if the post has no attachment with a url.
    Files which can't be deleted are reported and otherwise ignored
    """
    attachments = post_json.get('attachment')
    if not attachments or not isinstance(attachments, list):
        return
    first_attachment = attachments[0]
    if not isinstance(first_attachment, dict):
        return
    attachment_url = first_attachment.get('url')
    if not attachment_url or not isinstance(attachment_url, str):
        return
    attachment_url = remove_html(attachment_url)
    media_filename = base_dir + '/' + \
        attachment_url.replace(http_prefix + '://' + domain + '/', '')

    # The url comes from the post, so make sure that ../ sequences
    # can't be used to delete files outside of the base directory.
    # abspath is used rather than realpath so that a symlinked
    # media directory continues to work
    base_path = os.path.join(os.path.abspath(base_dir), '')
    if not os.path.abspath(media_filename).startswith(base_path):
        print('EX: _remove_attachment media file is outside of ' +
              'the base directory ' + str(media_filename))
        post_json['attachment'] = []
        return

    removals = (
        (media_filename, 'media file'),
        (media_filename + '.vtt', 'media transcript'),
        (media_filename + '.etag', 'etag file')
    )
    for filename, description in removals:
        if not os.path.isfile(filename):
            continue
        # this can fail if the file is deleted manually or
        # by another thread
        try:
            os.remove(filename)
        except OSError:
            print('EX: _remove_attachment unable to delete ' +
                  description + ' ' + str(filename))
    post_json['attachment'] = []
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Tidying

											
										
										
											2019-07-14 16:57:06 +00:00
-												Snake case

											
										
										
											2021-12-28 13:12:10 +00:00
def remove_moderation_post_from_index(base_dir: str, post_url: str,
                                      debug: bool) -> None:
    """Removes a url from the moderation index.
    The index is the file accounts/moderation.txt within base_dir,
    with one post id on each line. Every line which exactly matches
    the id of the given post is removed and the other lines are kept.
    If debug is True then each removal is reported.
    Failure to read or write the index is reported and the
    function then returns without raising
    """
    moderation_index_file = base_dir + '/accounts/moderation.txt'
    if not os.path.isfile(moderation_index_file):
        return
    post_id = remove_id_ending(post_url)
    if not text_in_file(post_id, moderation_index_file):
        return

    # read the whole index and close it before it gets rewritten
    try:
        with open(moderation_index_file, 'r',
                  encoding='utf-8') as file1:
            lines = file1.readlines()
    except OSError:
        print('EX: remove_moderation_post_from_index unable to read ' +
              str(moderation_index_file))
        return

    kept_lines = [line for line in lines
                  if line.strip("\n").strip("\r") != post_id]
    removed = len(lines) - len(kept_lines)
    if not removed:
        # the id only appeared as part of another line,
        # so there is nothing to rewrite
        return

    try:
        with open(moderation_index_file, 'w+',
                  encoding='utf-8') as file2:
            file2.writelines(kept_lines)
    except OSError:
        print('EX: remove_moderation_post_from_index unable to write ' +
              str(moderation_index_file))
        return

    if debug:
        for _ in range(removed):
            print('DEBUG: removed ' + post_id +
                  ' from moderation index')
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Deletion of moderation reports

											
										
										
											2019-08-12 18:02:29 +00:00
-												Snake case

											
										
										
											2021-12-26 19:36:40 +00:00
def _is_reply_to_blog_post(base_dir: str, nickname: str, domain: str,
                           post_json_object: {}) -> bool:
    """Is the given post a reply to a blog post?

    Returns True only when the post has an object dict whose inReplyTo
    is a string and the corresponding id (with '/' replaced by '#') is
    found within the tlblogs.index file of the given account.
    """
    if not has_object_dict(post_json_object):
        return False
    in_reply_to = post_json_object['object'].get('inReplyTo')
    if not in_reply_to:
        return False
    # only a plain string inReplyTo can be looked up within the index
    if not isinstance(in_reply_to, str):
        return False
    blogs_index_filename = \
        acct_dir(base_dir, nickname, domain) + '/tlblogs.index'
    if not os.path.isfile(blogs_index_filename):
        return False
    # the index is searched using the id with slashes replaced by hashes
    post_id = remove_id_ending(in_reply_to).replace('/', '#')
    return bool(text_in_file(post_id, blogs_index_filename))
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
def _delete_post_remove_replies(base_dir: str, nickname: str, domain: str,
                                http_prefix: str, post_filename: str,
                                recent_posts_cache: {}, debug: bool,
                                manual: bool) -> None:
    """Removes replies when deleting a post

    The replies file has the same name as the post file, but with a
    .replies extension, and contains one reply id per line. Each reply
    which can be located is deleted via delete_post, then the replies
    file itself is removed.
    """
    replies_filename = post_filename.replace('.json', '.replies')
    if not os.path.isfile(replies_filename):
        return
    if debug:
        print('DEBUG: removing replies to ' + post_filename)

    # Read all of the ids first so that the replies file is closed
    # before any deletion happens. Line endings are stripped and
    # blank lines ignored so that only real ids are looked up.
    reply_ids = []
    try:
        with open(replies_filename, 'r', encoding='utf-8') as replies_file:
            for line in replies_file:
                reply_id = line.strip()
                if reply_id:
                    reply_ids.append(reply_id)
    except OSError:
        print('EX: _delete_post_remove_replies ' +
              'unable to read replies file ' + str(replies_filename))

    for reply_id in reply_ids:
        reply_file = locate_post(base_dir, nickname, domain, reply_id)
        if not reply_file:
            continue
        if os.path.isfile(reply_file):
            delete_post(base_dir, http_prefix,
                        nickname, domain, reply_file, debug,
                        recent_posts_cache, manual)

    # remove the replies file
    # This can fail if the file was deleted manually or by another thread
    try:
        os.remove(replies_filename)
    except OSError:
        print('EX: _delete_post_remove_replies ' +
              'unable to delete replies file ' + str(replies_filename))
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
-												Snake case

											
										
										
											2021-12-28 13:12:10 +00:00
def _is_bookmarked(base_dir: str, nickname: str, domain: str,
                   post_filename: str) -> bool:
    """Returns True if the given post is bookmarked

    The final path component of post_filename, followed by a newline,
    is searched for within the bookmarks.index file of the account.
    """
    index_path = acct_dir(base_dir, nickname, domain) + '/bookmarks.index'
    if not os.path.isfile(index_path):
        # no bookmarks index means nothing is bookmarked
        return False
    index_entry = post_filename.split('/')[-1] + '\n'
    if text_in_file(index_entry, index_path):
        return True
    return False
-												Snake case

											
										
										
											2021-12-27 11:05:24 +00:00
def remove_post_from_cache(post_json_object: {},
                           recent_posts_cache: {}) -> None:
    """If the post exists in the recent posts cache then remove it

    The cache is a dict which may contain an 'index' list of post ids
    together with 'json' and 'html' dicts keyed by post id. Cache ids
    are the post id without any '#' fragment, with the id ending
    removed and with '/' replaced by '#'.
    """
    if not recent_posts_cache:
        return
    if not post_json_object.get('id'):
        return
    if not recent_posts_cache.get('index'):
        return

    post_id = post_json_object['id']
    if '#' in post_id:
        post_id = post_id.split('#', 1)[0]
    post_id = remove_id_ending(post_id).replace('/', '#')
    if post_id not in recent_posts_cache['index']:
        return

    # membership within the index was established above
    recent_posts_cache['index'].remove(post_id)

    # pop rather than testing truthiness, so that an entry holding an
    # empty value is also removed instead of being left behind
    for section in ('json', 'html'):
        cached_entries = recent_posts_cache.get(section)
        if cached_entries:
            cached_entries.pop(post_id, None)
-												Tidying of post deletion

											
										
										
											2021-07-05 09:45:55 +00:00
-												Handle incoming edited posts

											
										
										
											2022-04-09 15:11:22 +00:00
def delete_cached_html(base_dir: str, nickname: str, domain: str,
                       post_json_object: {}):
    """Removes cached html file for the given post

    Also removes the matching .ssml file, and the copy of that ssml
    file whose path has /postcache/ replaced by /outbox/.
    """
    html_filename = \
        get_cached_post_filename(base_dir, nickname, domain, post_json_object)
    if not html_filename:
        return

    ssml_filename = html_filename.replace('.html', '.ssml')
    outbox_ssml_filename = \
        ssml_filename.replace('/postcache/', '/outbox/')

    # each candidate file, with the text shown if it can't be deleted
    candidates = (
        (html_filename,
         'unable to delete cached post file '),
        (ssml_filename,
         'unable to delete cached ssml post file '),
        (outbox_ssml_filename,
         'unable to delete cached outbox ssml post file ')
    )
    for filename, failure_text in candidates:
        if not os.path.isfile(filename):
            continue
        # This can fail if the file is deleted manually
        # or within another thread
        try:
            os.remove(filename)
        except OSError:
            print('EX: delete_cached_html ' +
                  failure_text +
                  str(filename))
-												Tidying of post deletion

											
										
										
											2021-07-05 09:45:55 +00:00
-												Remove map links from tags when posts are deleted

											
										
										
											2022-08-22 10:58:55 +00:00
def _remove_post_id_from_tag_index(tag_index_filename: str,
                                   post_id: str) -> None:
    """Remove post_id from the tag index file

    Every line containing post_id is dropped. If nothing other than
    whitespace remains then the index file is deleted, otherwise it is
    rewritten without the matching lines.
    """
    if not post_id:
        # an empty id is contained within every line,
        # which would wipe the whole index
        return
    # The file can disappear between the caller checking for it and
    # it being opened here, for example if removed by another thread
    try:
        with open(tag_index_filename, 'r', encoding='utf-8') as index_file:
            lines = index_file.readlines()
    except OSError:
        print('EX: _remove_post_id_from_tag_index ' +
              'unable to read tag index ' + str(tag_index_filename))
        return
    if not lines:
        return

    # keep every line which doesn't mention the deleted post
    newlines = ''.join(file_line for file_line in lines
                       if post_id not in file_line)

    if not newlines.strip():
        # if there are no lines then remove the hashtag file
        try:
            os.remove(tag_index_filename)
        except OSError:
            print('EX: _remove_post_id_from_tag_index ' +
                  'unable to delete tag index ' + str(tag_index_filename))
        return

    # write the new hashtag index without the given post in it
    try:
        with open(tag_index_filename, 'w+',
                  encoding='utf-8') as index_file:
            index_file.write(newlines)
    except OSError:
        print('EX: _remove_post_id_from_tag_index ' +
              'unable to write tag index ' + str(tag_index_filename))
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
def _delete_hashtags_on_post(base_dir: str, post_json_object: {}) -> None:
    """Removes hashtags when a post is deleted

    For each Hashtag within the tag list of the post the post id is
    removed from the corresponding files within the tagmaps and tags
    directories under base_dir. Nothing happens unless the post content
    contains a '#' character and the post has both an id and tags.
    """
    if not has_object_dict(post_json_object):
        return
    post_obj = post_json_object['object']
    content = post_obj.get('content')
    if not content:
        return
    if '#' not in content:
        return
    if not post_obj.get('id') or \
       not post_obj.get('tag'):
        return

    # get the id of the post
    post_id = remove_id_ending(post_obj['id'])

    tags = post_obj['tag']
    if isinstance(tags, dict):
        # a single tag which isn't wrapped within a list
        tags = [tags]

    for tag in tags:
        # tag entries arrive from other servers and may be malformed
        if not isinstance(tag, dict):
            continue
        if tag.get('type') != 'Hashtag':
            continue
        tag_name = tag.get('name')
        if not tag_name or not isinstance(tag_name, str):
            continue
        # remove the leading # character
        hashtag = tag_name[1:]
        if not hashtag:
            continue
        # The name becomes part of a filename, so don't allow it
        # to refer to anything outside of the tag directories
        if '/' in hashtag or '\\' in hashtag or '..' in hashtag:
            continue
        # find the map links file for this tag
        tag_map_filename = base_dir + '/tagmaps/' + hashtag + '.txt'
        if os.path.isfile(tag_map_filename):
            _remove_post_id_from_tag_index(tag_map_filename, post_id)
        # find the index file for this tag
        tag_index_filename = base_dir + '/tags/' + hashtag + '.txt'
        if os.path.isfile(tag_index_filename):
            _remove_post_id_from_tag_index(tag_index_filename, post_id)
-												Tidying of post deletion

											
										
										
											2021-07-05 09:45:55 +00:00
-												Moving to snake case

											
										
										
											2021-12-29 21:55:09 +00:00
def _delete_conversation_post(base_dir: str, nickname: str, domain: str,
                              post_json_object: {}) -> bool:
    """Deletes a post from a conversation

    The conversation file is located within the conversation directory
    of the account and is named after the conversation id with '/'
    replaced by '#'. The line containing the post id is removed from
    it. If no content remains then the conversation file, and any
    accompanying .muted file, is deleted.

    Returns True if the post id was found within the conversation file
    and its removal was attempted, otherwise False.
    """
    if not has_object_dict(post_json_object):
        return False
    post_obj = post_json_object['object']

    # 'context' is sometimes used to mean the same thing as
    # 'conversation'. This does not appear to be part of the AP spec,
    # but is used in the wild
    conversation_id = post_obj.get('conversation')
    if not conversation_id:
        conversation_id = post_obj.get('context')
    if not conversation_id:
        return False
    post_id = post_obj.get('id')
    if not post_id:
        return False
    # both ids are used for string operations below
    if not isinstance(conversation_id, str) or \
       not isinstance(post_id, str):
        return False

    conversation_dir = \
        acct_dir(base_dir, nickname, domain) + '/conversation'
    conversation_filename = \
        conversation_dir + '/' + conversation_id.replace('/', '#')
    if not os.path.isfile(conversation_filename):
        return False

    # This can fail if the file is deleted manually
    # or within another thread
    conversation_str = ''
    try:
        with open(conversation_filename, 'r',
                  encoding='utf-8') as conv_file:
            conversation_str = conv_file.read()
    except OSError:
        print('EX: _delete_conversation_post ' +
              'unable to read conversation ' +
              str(conversation_filename))
        return False

    post_line = post_id + '\n'
    if post_line not in conversation_str:
        return False
    conversation_str = conversation_str.replace(post_line, '')

    if conversation_str:
        # other posts remain, so save the conversation without this one
        try:
            with open(conversation_filename, 'w+',
                      encoding='utf-8') as conv_file:
                conv_file.write(conversation_str)
        except OSError:
            print('EX: _delete_conversation_post ' +
                  'unable to write conversation ' +
                  str(conversation_filename))
            return False
        return True

    # nothing remains, so remove the conversation and its muted state
    if os.path.isfile(conversation_filename + '.muted'):
        try:
            os.remove(conversation_filename + '.muted')
        except OSError:
            print('EX: _delete_conversation_post ' +
                  'unable to remove conversation ' +
                  str(conversation_filename) + '.muted')
    try:
        os.remove(conversation_filename)
    except OSError:
        print('EX: _delete_conversation_post ' +
              'unable to remove conversation ' +
              str(conversation_filename))
    return True
-												Muting by conversation ID

											
										
										
											2021-08-12 10:22:04 +00:00
-												Don't clear down DMs from other instances

											
										
										
											2022-05-01 13:23:32 +00:00
def is_dm(post_json_object: {}) -> bool:
    """Returns true if the given post is a DM

    A DM is a Create activity whose object is a ChatMessage, Note,
    Page, Patch, EncryptedMessage or Article, which has no
    moderationStatus and which is not addressed, via 'to' or 'cc', to
    the public collection or to a followers collection.
    """
    # use get so that an activity without a type is simply not a DM
    if post_json_object.get('type') != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    post_obj = post_json_object['object']
    dm_object_types = (
        'ChatMessage', 'Note', 'Page', 'Patch',
        'EncryptedMessage', 'Article'
    )
    if post_obj.get('type') not in dm_object_types:
        return False
    if post_obj.get('moderationStatus'):
        return False
    fields = ('to', 'cc')
    for field_name in fields:
        recipients = post_obj.get(field_name)
        if not recipients:
            continue
        if isinstance(recipients, str):
            # A single recipient may be given as a string rather than
            # a list. Without this its characters would be iterated
            # and a public address would never be detected
            recipients = [recipients]
        for to_address in recipients:
            if not isinstance(to_address, str):
                continue
            # three representations of a public post
            if to_address.endswith('#Public') or \
               to_address == 'as:Public' or \
               to_address == 'Public':
                return False
            if to_address.endswith('followers'):
                return False
    return True
-												Edit reminder

											
										
										
											2022-12-09 10:18:26 +00:00
def is_reminder(post_json_object: {}) -> bool:
    """Returns true if the given post is a reminder

    A reminder is a DM which is addressed to exactly one recipient,
    that recipient being the same as attributedTo, and which has at
    least one tag of type Event.
    """
    if not is_dm(post_json_object):
        return False
    post_obj = post_json_object['object']
    recipients = post_obj.get('to')
    if not recipients:
        return False
    if not post_obj.get('attributedTo'):
        return False
    if not post_obj.get('tag'):
        return False
    if isinstance(recipients, str):
        # a single recipient given as a string rather than a list
        recipients = [recipients]
    if len(recipients) != 1:
        return False
    # a reminder is a message sent to yourself
    if recipients[0] != post_obj['attributedTo']:
        return False
    for tag in post_obj['tag']:
        # skip malformed tags rather than raising on a missing type
        if not isinstance(tag, dict):
            continue
        if tag.get('type') == 'Event':
            return True
    return False
-												Don't clear down DMs from other instances

											
										
										
											2022-05-01 13:23:32 +00:00
def _is_remote_dm(domain_full: str, post_json_object: {}) -> bool:
    """Is the given post a DM from a different domain?

    Returns True when the post is a DM whose attributedTo is a string
    which does not contain '://' followed by domain_full.
    """
    if not is_dm(post_json_object):
        return False
    # attributedTo is read from the object dict when there is one
    if has_object_dict(post_json_object):
        message_json = post_json_object['object']
    else:
        message_json = post_json_object
    author = message_json.get('attributedTo')
    if not author:
        return False
    if not isinstance(author, str):
        return False
    local_prefix = '://' + domain_full
    return local_prefix not in author
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
+								def delete_post(base_dir: str, http_prefix: str,
 								                nickname: str, domain: str, post_filename: str,
-												Only prevent remote DM deletions during archive

											
										
										
											2022-05-01 17:14:29 +00:00
+								                debug: bool, recent_posts_cache: {},
 								                manual: bool) -> None:
-												Recursive delete

											
										
										
											2019-07-14 16:37:01 +00:00
+								    """Recursively deletes a post and its replies and attachments
 								    """
-												Snake case

											
										
										
											2021-12-26 23:41:34 +00:00
+								    post_json_object = load_json(post_filename, 1)
-												Snake case

											
										
										
											2021-12-25 22:09:19 +00:00
+								    if not post_json_object:
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
+								        # remove any replies
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
+								        _delete_post_remove_replies(base_dir, nickname, domain,
 								                                    http_prefix, post_filename,
-												Only prevent remote DM deletions during archive

											
										
										
											2022-05-01 17:14:29 +00:00
+								                                    recent_posts_cache, debug, manual)
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
+								        # finally, remove the post itself
-												Exception handling when deleting files

This can fail if a file is manually deleted or deleted in another thread

											
										
										
											2021-09-05 10:17:43 +00:00
+								        try:
-												Snake case

											
										
										
											2021-12-26 23:41:34 +00:00
+								            os.remove(post_filename)
-												More specific exceptions

											
										
										
											2021-11-25 18:42:38 +00:00
+								        except OSError:
-												Show warnings for exceptions

											
										
										
											2021-10-29 14:33:52 +00:00
+								            if debug:
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
+								                print('EX: delete_post unable to delete post ' +
-												Snake case

											
										
										
											2021-12-26 23:41:34 +00:00
+								                      str(post_filename))
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
+								        return
-												When deleting a post also remove it from the recent posts cache in memory

											
										
										
											2020-06-24 13:30:50 +00:00
-												Don't clear down DMs from other instances

											
										
										
											2022-05-01 13:23:32 +00:00
+								    # don't allow DMs to be deleted if they came from a different instance
 								    # otherwise this breaks expectations about how DMs should operate
-												Only prevent remote DM deletions during archive

											
										
										
											2022-05-01 17:14:29 +00:00
+								    # i.e. DMs should only be removed if they are manually deleted
 								    if not manual:
 								        if _is_remote_dm(domain, post_json_object):
 								            return
-												Don't clear down DMs from other instances

											
										
										
											2022-05-01 13:23:32 +00:00
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
+								    # don't allow deletion of bookmarked posts
-												Snake case

											
										
										
											2021-12-28 13:12:10 +00:00
+								    if _is_bookmarked(base_dir, nickname, domain, post_filename):
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
+								        return
 								    # don't remove replies to blog posts
-												Snake case

											
										
										
											2021-12-26 19:36:40 +00:00
+								    if _is_reply_to_blog_post(base_dir, nickname, domain,
 								                              post_json_object):
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
+								        return
 								    # remove from recent posts cache in memory
-												Snake case

											
										
										
											2021-12-27 11:05:24 +00:00
+								    remove_post_from_cache(post_json_object, recent_posts_cache)
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
-												Muting by conversation ID

											
										
										
											2021-08-12 10:22:04 +00:00
+								    # remove from conversation index
-												Moving to snake case

											
										
										
											2021-12-29 21:55:09 +00:00
+								    _delete_conversation_post(base_dir, nickname, domain, post_json_object)
-												Muting by conversation ID

											
										
										
											2021-08-12 10:22:04 +00:00
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
+								    # remove any attachment
-												Snake case

											
										
										
											2021-12-28 13:49:44 +00:00
+								    _remove_attachment(base_dir, http_prefix, domain, post_json_object)
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
-												Store history of edited posts

											
										
										
											2022-04-09 16:02:18 +00:00
+								    extensions = (
 								        'votes', 'arrived', 'muted', 'tts', 'reject', 'mitm', 'edits'
 								    )
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
+								    for ext in extensions:
-												Snake case

											
										
										
											2021-12-28 12:15:46 +00:00
+								        ext_filename = post_filename + '.' + ext
 								        if os.path.isfile(ext_filename):
-												Exception handling when deleting files

This can fail if a file is manually deleted or deleted in another thread

											
										
										
											2021-09-05 10:17:43 +00:00
+								            try:
-												Snake case

											
										
										
											2021-12-28 12:15:46 +00:00
+								                os.remove(ext_filename)
-												More specific exceptions

											
										
										
											2021-11-25 18:42:38 +00:00
+								            except OSError:
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
+								                print('EX: delete_post unable to remove ext ' +
-												Snake case

											
										
										
											2021-12-28 12:15:46 +00:00
+								                      str(ext_filename))
-												Store history of edited posts

											
										
										
											2022-04-09 16:02:18 +00:00
+								        elif post_filename.endswith('.json'):
 								            ext_filename = post_filename.replace('.json', '') + '.' + ext
 								            if os.path.isfile(ext_filename):
 								                try:
 								                    os.remove(ext_filename)
 								                except OSError:
 								                    print('EX: delete_post unable to remove ext ' +
 								                          str(ext_filename))
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
 								    # remove cached html version of the post
-												Handle incoming edited posts

											
										
										
											2022-04-09 15:11:22 +00:00
+								    delete_cached_html(base_dir, nickname, domain, post_json_object)
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
-												Snake case

											
										
										
											2021-12-26 23:53:16 +00:00
+								    has_object = False
-												Snake case

											
										
										
											2021-12-25 22:09:19 +00:00
+								    if post_json_object.get('object'):
-												Snake case

											
										
										
											2021-12-26 23:53:16 +00:00
+								        has_object = True
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
 								    # remove from moderation index file
-												Snake case

											
										
										
											2021-12-26 23:53:16 +00:00
+								    if has_object:
-												Snake case

											
										
										
											2021-12-26 10:57:03 +00:00
+								        if has_object_dict(post_json_object):
-												Snake case

											
										
										
											2021-12-25 22:09:19 +00:00
+								            if post_json_object['object'].get('moderationStatus'):
 								                if post_json_object.get('id'):
-												Snake case

											
										
										
											2021-12-27 11:20:57 +00:00
+								                    post_id = remove_id_ending(post_json_object['id'])
-												Snake case

											
										
										
											2021-12-28 13:12:10 +00:00
+								                    remove_moderation_post_from_index(base_dir, post_id, debug)
-												Tidying of post deletion

											
										
										
											2021-07-05 09:24:29 +00:00
 								    # remove any hashtags index entries
-												Snake case

											
										
										
											2021-12-26 23:53:16 +00:00
+								    if has_object:
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
+								        _delete_hashtags_on_post(base_dir, post_json_object)
-												Remove hashtag index entry when a post is deleted

											
										
										
											2019-08-09 11:39:53 +00:00
-												Remove attachments for deleted posts

											
										
										
											2019-07-14 17:02:41 +00:00
+								    # remove any replies
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
+								    _delete_post_remove_replies(base_dir, nickname, domain,
 								                                http_prefix, post_filename,
-												Only prevent remote DM deletions during archive

											
										
										
											2022-05-01 17:14:29 +00:00
+								                                recent_posts_cache, debug, manual)
-												Remove attachments for deleted posts

											
										
										
											2019-07-14 17:02:41 +00:00
+								    # finally, remove the post itself
-												Exception handling when deleting files

This can fail if a file is manually deleted or deleted in another thread

											
										
										
											2021-09-05 10:17:43 +00:00
+								    try:
-												Snake case

											
										
										
											2021-12-26 23:41:34 +00:00
+								        os.remove(post_filename)
-												More specific exceptions

											
										
										
											2021-11-25 18:42:38 +00:00
+								    except OSError:
-												Show warnings for exceptions

											
										
										
											2021-10-29 14:33:52 +00:00
+								        if debug:
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
+								            print('EX: delete_post unable to delete post ' +
 								                  str(post_filename))
-												Connect new posts to web interface

											
										
										
											2019-07-27 22:48:34 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Get categories from podcast feeds

											
										
										
											2022-01-13 15:10:41 +00:00
def _is_valid_language(text: str) -> bool:
    """Returns true if the given text contains a valid
    natural language string

    The text is accepted when every character, other than digits and
    underscores which are always permitted, falls within one single
    range of the table below. Text which mixes characters from
    different ranges is rejected. Empty text is accepted.
    """
    # Every entry is [first code point, last code point + 1], so that
    # it can be passed directly to range(), whose end is exclusive
    natural_languages = {
        "Latin": [65, 866],
        "Greek": [880, 1280],
        "isArmenian": [1328, 1424],
        "isHebrew": [1424, 1536],
        "Arabic": [1536, 1792],
        "Syriac": [1792, 1872],
        "Thaan": [1920, 1984],
        "Devanagari": [2304, 2432],
        "Bengali": [2432, 2560],
        "Gurmukhi": [2560, 2688],
        "Gujarati": [2688, 2816],
        "Oriya": [2816, 2944],
        "Tamil": [2944, 3072],
        "Telugu": [3072, 3200],
        "Kannada": [3200, 3328],
        "Malayalam": [3328, 3456],
        "Sinhala": [3456, 3584],
        "Thai": [3584, 3712],
        "Lao": [3712, 3840],
        "Tibetan": [3840, 4096],
        "Myanmar": [4096, 4256],
        "Georgian": [4256, 4352],
        "HangulJamo": [4352, 4608],
        "Cherokee": [5024, 5120],
        "UCAS": [5120, 5760],
        "Ogham": [5760, 5792],
        "Runic": [5792, 5888],
        "Khmer": [6016, 6144],
        # The entries below were previously written with an inclusive
        # final code point, which range() then excluded. Their ends
        # are now one past the final character of each range.
        "Hangul Syllables": [44032, 55204],
        "Hangul Compatibility Jamo": [12592, 12688],
        "Hangul Jamo Extended-A": [43360, 43392],
        "Hangul Jamo Extended-B": [55216, 55296],
        "Mongolian": [6144, 6320],
        "Cyrillic": [1024, 1280],
        "Cyrillic Supplement": [1280, 1328],
        "Cyrillic Extended A": [11744, 11776],
        "Cyrillic Extended B": [42560, 42656],
        "Cyrillic Extended C": [7296, 7312],
        "Phonetic Extensions": [7467, 7545],
        "Combining Half Marks": [65070, 65072]
    }
    for lang_range in natural_languages.values():
        code_points = range(lang_range[0], lang_range[1])
        ok_lang = True
        for char in text:
            # digits and underscores are valid within any language
            if char.isdigit() or char == '_':
                continue
            if ord(char) not in code_points:
                ok_lang = False
                break
        if ok_lang:
            return True
    return False
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
def _get_reserved_words() -> tuple:
    """Returns the words which may not be used as a nickname

    Each word appears only once within the returned tuple
    """
    return ('inbox', 'dm', 'outbox', 'following',
            'public', 'followers', 'category',
            'channel', 'calendar', 'video-channels',
            'tlreplies', 'tlmedia', 'tlblogs',
            'tlfeatures',
            'moderation', 'moderationaction',
            'activity', 'undo', 'pinned',
            'actor', 'Actor', 'instance.actor',
            'reply', 'replies', 'question', 'like',
            'likes', 'users', 'statuses', 'tags', 'author',
            'accounts', 'headers', 'snac',
            'channels', 'profile', 'u', 'c',
            'updates', 'repeat', 'announce',
            'shares', 'fonts', 'icons', 'avatars',
            'welcome', 'helpimages',
            'bookmark', 'bookmarks', 'tlbookmarks',
            'ignores', 'linksmobile', 'newswiremobile',
            'minimal', 'search', 'eventdelete',
            'searchemoji', 'catalog', 'conversationId',
            'mention', 'http', 'https', 'ipfs', 'ipns',
            'ontologies', 'data', 'postedit', 'moved',
            'inactive', 'activitypub', 'actors',
            'notes', 'offers', 'wanted')
-												Validation pattern for nickname on login screen

											
										
										
											2021-07-29 12:18:12 +00:00
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
def get_nickname_validation_pattern() -> str:
    """Returns a html text input validation pattern for nickname

    The pattern consists of one negative lookahead for each reserved
    word, so that text containing a reserved word as a whole word is
    rejected, followed by a restriction to between 1 and 30 characters
    """
    reserved_names = _get_reserved_words()
    pattern = '^'
    for word in reserved_names:
        pattern += '(?!.*\\b' + word + '\\b)'
    # The quantifier has to follow the wildcard rather than the end
    # anchor. The previous ending '.*${1,30}' tried to repeat '$',
    # which is not a valid regular expression, so the pattern could
    # not be compiled and the length limit was never applied.
    return pattern + '.{1,30}$'
-												Validation pattern for nickname on login screen

											
										
										
											2021-07-29 12:18:12 +00:00
-												Snake case

											
										
										
											2021-12-28 14:55:45 +00:00
def _is_reserved_name(nickname: str) -> bool:
    """Returns true if the nickname is one of the reserved words,
    which are set aside for some special function
    """
    return nickname in _get_reserved_words()
-												Snake case

											
										
										
											2021-12-28 14:41:10 +00:00
def valid_nickname(domain: str, nickname: str) -> bool:
    """Returns true if the nickname is acceptable: between 1 and 30
    characters, written in a valid language, free of forbidden
    characters, different from the domain and not a reserved word
    """
    nickname_length = len(nickname)
    if nickname_length == 0 or nickname_length > 30:
        return False
    if not _is_valid_language(nickname):
        return False
    forbidden_chars = ('.', ' ', '/', '?', ':', ';', '@', '#', '!')
    if any(char in nickname for char in forbidden_chars):
        return False
    # this should only apply for the shared inbox
    if nickname == domain:
        return False
    return not _is_reserved_name(nickname)
-												Register button

											
										
										
											2019-08-08 11:24:26 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-28 14:41:10 +00:00
def no_of_accounts(base_dir: str) -> int:
    """Returns the number of accounts on the system

    Counts the directories immediately inside base_dir/accounts
    which is_account_dir recognises as account directories
    """
    account_ctr = 0
    for _, dirs, _ in os.walk(base_dir + '/accounts'):
        for account in dirs:
            if is_account_dir(account):
                account_ctr += 1
        # only the top level of the accounts directory is examined
        break
    return account_ctr
-												Tidying

											
										
										
											2019-08-10 11:31:42 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-28 14:41:10 +00:00
def no_of_active_accounts_monthly(base_dir: str, months: int) -> int:
    """Returns the number of accounts on the system which were
    used within the given number of months

    An account is counted if its .lastUsed file contains a time in
    seconds which is less than months * 30 days before the current time
    """
    account_ctr = 0
    curr_time = int(time.time())
    month_seconds = int(60*60*24*30*months)
    for _, dirs, _ in os.walk(base_dir + '/accounts'):
        for account in dirs:
            if not is_account_dir(account):
                continue
            last_used_filename = \
                base_dir + '/accounts/' + account + '/.lastUsed'
            if not os.path.isfile(last_used_filename):
                continue
            # the file can vanish or become unreadable after the check
            # above, and that should not abort the whole count
            try:
                with open(last_used_filename, 'r',
                          encoding='utf-8') as last_used_file:
                    # tolerate a trailing newline or other whitespace
                    last_used = last_used_file.read().strip()
            except OSError:
                print('EX: no_of_active_accounts_monthly unable to read ' +
                      str(last_used_filename))
                continue
            if last_used.isdigit():
                time_diff = (curr_time - int(last_used))
                if time_diff < month_seconds:
                    account_ctr += 1
        # only the top level of the accounts directory is examined
        break
    return account_ctr
-												Function for monthly active accounts

											
										
										
											2019-11-13 15:15:08 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-28 14:41:10 +00:00
def is_public_post_from_url(base_dir: str, nickname: str, domain: str,
                            post_url: str) -> bool:
    """Locates the post with the given url, loads it and returns
    true if it is public. Returns false if the post cannot be
    located or loaded
    """
    post_filename = locate_post(base_dir, nickname, domain, post_url)
    if post_filename:
        post_json_object = load_json(post_filename, 1)
        if post_json_object:
            return is_public_post(post_json_object)
    return False
-												Make replies to non-public posts non-public

											
										
										
											2019-12-10 17:19:53 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-28 14:41:10 +00:00
def is_public_post(post_json_object: {}) -> bool:
    """Returns true if the given post is a Create activity whose
    object is addressed to the public collection
    """
    if post_json_object.get('type') != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    recipients = post_json_object['object'].get('to')
    if not recipients:
        return False
    # the public collection can be represented in three ways
    return any(recipient.endswith('#Public') or
               recipient == 'as:Public' or
               recipient == 'Public'
               for recipient in recipients)
-												Unit test for emoji

											
										
										
											2019-09-29 18:48:34 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Initial code for edit button

											
										
										
											2022-11-15 19:22:00 +00:00
def is_followers_post(post_json_object: {}) -> bool:
    """Returns true if the given post is a Create activity whose
    object is addressed to a followers collection
    """
    if post_json_object.get('type') != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    recipients = post_json_object['object'].get('to')
    if not recipients:
        return False
    return any(recipient.endswith('/followers')
               for recipient in recipients)
-												Handle replying to unlisted posts

											
										
										
											2022-03-12 14:09:36 +00:00
def is_unlisted_post(post_json_object: {}) -> bool:
    """Returns true if the given post is a Create activity whose
    object is sent to a followers collection, with the public
    collection only appearing within cc
    """
    if post_json_object.get('type') != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    post_object = post_json_object['object']
    to_recipients = post_object.get('to')
    if not to_recipients:
        return False
    cc_recipients = post_object.get('cc')
    if not cc_recipients:
        return False
    if not any(recipient.endswith('/followers')
               for recipient in to_recipients):
        return False
    # the public collection can be represented in three ways
    return any(recipient.endswith('#Public') or
               recipient == 'as:Public' or
               recipient == 'Public'
               for recipient in cc_recipients)
-												Argument types

											
										
										
											2021-06-20 11:28:35 +00:00
def copytree(src: str, dst: str, symlinks: bool = False, ignore=None):
    """Copy the contents of the directory src into the directory dst

    src: directory whose entries are copied
    dst: destination directory, which is created if it does not exist
    symlinks: passed to shutil.copytree when copying subdirectories
    ignore: optional callable passed to shutil.copytree when copying
            subdirectories. It is not applied to the top level entries
    """
    items = os.listdir(src)
    # without this, copying a plain file into a destination which
    # does not exist yet fails
    os.makedirs(dst, exist_ok=True)
    for item in items:
        s_path = os.path.join(src, item)
        d_path = os.path.join(dst, item)
        if os.path.isdir(s_path):
            shutil.copytree(s_path, d_path, symlinks, ignore)
        else:
            shutil.copy2(s_path, d_path)
-												Remove cached post on like update

											
										
										
											2019-10-19 17:50:05 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-26 23:53:16 +00:00
def get_cached_post_directory(base_dir: str,
                              nickname: str, domain: str) -> str:
    """Returns the html post cache directory for the given account,
    which is the 'postcache' subdirectory of the account directory
    """
    account_dir = acct_dir(base_dir, nickname, domain)
    return account_dir + '/postcache'
-												Remove cached post on like update

											
										
										
											2019-10-19 17:50:05 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-26 23:41:34 +00:00
def get_cached_post_filename(base_dir: str, nickname: str, domain: str,
                             post_json_object: {}) -> str:
    """Returns the filename of the cached html for the given post.
    None is returned if the html cache directory for the account
    does not exist or its path does not contain '@'
    """
    cache_dir = get_cached_post_directory(base_dir, nickname, domain)
    # the directory existence check comes first, as in the path check
    # only being reached for directories which exist
    if not os.path.isdir(cache_dir) or '@' not in cache_dir:
        return None
    # slashes within the post id are replaced so that it can be
    # used as a single filename
    flattened_id = remove_id_ending(post_json_object['id']).replace('/', '#')
    return cache_dir + '/' + flattened_id + '.html'
-												Update announce posts in cache

											
										
										
											2019-11-24 13:46:28 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Snake case

											
										
										
											2021-12-28 14:24:14 +00:00
def update_recent_posts_cache(recent_posts_cache: {}, max_recent_posts: int,
                              post_json_object: {}, html_str: str) -> None:
    """Store recent posts in memory so that they can be quickly recalled

    recent_posts_cache: dict holding an 'index' list of post ids,
        a 'json' dict of serialized posts and an 'html' dict of
        rendered posts, both keyed by post id
    max_recent_posts: maximum number of html entries to keep
    post_json_object: the post to be cached. Posts without an id
        are not cached
    html_str: the html to be stored for the post
    """
    if not post_json_object.get('id'):
        return
    post_id = post_json_object['id']
    if '#' in post_id:
        post_id = post_id.split('#', 1)[0]
    post_id = remove_id_ending(post_id).replace('/', '#')

    if not recent_posts_cache.get('index'):
        # no posts have been cached yet, so start from scratch
        recent_posts_cache['index'] = [post_id]
        recent_posts_cache['json'] = {}
        recent_posts_cache['html'] = {}
        recent_posts_cache['json'][post_id] = json.dumps(post_json_object)
        recent_posts_cache['html'][post_id] = html_str
        return

    index = recent_posts_cache['index']
    if post_id in index:
        return
    index.append(post_id)
    # NOTE(review): the muted flag is only reset on this path and not
    # when the cache is first created above - confirm that is intended
    post_json_object['muted'] = False
    recent_posts_cache['json'][post_id] = json.dumps(post_json_object)
    recent_posts_cache['html'][post_id] = html_str

    # Evict the oldest posts until the cache is within its limit.
    # Entries are removed by key rather than by truthiness, otherwise
    # a post cached with empty html would never be deleted and the
    # loop would run until the index was exhausted.
    # Stopping on an empty index avoids an IndexError if the index
    # and the html entries are out of step.
    while index and len(recent_posts_cache['html']) > max_recent_posts:
        oldest_id = index.pop(0)
        recent_posts_cache['json'].pop(oldest_id, None)
        recent_posts_cache['html'].pop(oldest_id, None)
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Extra emoji fields

											
										
										
											2020-02-21 10:19:02 +00:00
-												Snake case

											
										
										
											2021-12-28 14:01:37 +00:00
def file_last_modified(filename: str) -> str:
    """Returns the date when a file was last modified,
    as a UTC timestamp in the format YYYY-MM-DDTHH:MM:SSZ

    Raises OSError if the file does not exist or is inaccessible
    """
    time_val = os.path.getmtime(filename)
    # The trailing Z in the format means UTC, so the conversion must be
    # to UTC rather than to the local timezone of the server
    modified_time = \
        datetime.datetime.fromtimestamp(time_val, datetime.timezone.utc)
    return modified_time.strftime("%Y-%m-%dT%H:%M:%SZ")
-												Function to get weekly events

											
										
										
											2020-02-22 16:00:27 +00:00
-												flake8 format

											
										
										
											2020-04-04 13:44:49 +00:00
-												Remove old css cache

											
										
										
											2022-07-12 19:03:30 +00:00
def get_css(base_dir: str, css_filename: str) -> str:
    """Returns the contents of the given css file,
    or None if the file does not exist.
    The base_dir argument is not used here
    """
    if os.path.isfile(css_filename):
        with open(css_filename, 'r', encoding='utf-8') as fp_css:
            return fp_css.read()
    return None
-												Snake case

											
										
										
											2021-12-28 13:49:44 +00:00
def is_blog_post(post_json_object: {}) -> bool:
    """Is the given post a blog post?

    Returns true for a 'Create' post which passes has_object_dict and
    has_object_string_type, and whose object has a 'content' field
    and the type 'Article'.
    A post without any type is not a blog post
    """
    # using get avoids a KeyError for posts without a type,
    # in the same way as the other post type checks
    if post_json_object.get('type') != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    if not has_object_string_type(post_json_object, False):
        return False
    post_obj = post_json_object['object']
    if 'content' not in post_obj:
        return False
    return post_obj['type'] == 'Article'
-												Search function

											
										
										
											2020-04-11 10:19:35 +00:00
-												Snake case

											
										
										
											2021-12-28 12:20:18 +00:00
def is_news_post(post_json_object: {}) -> bool:
    """Is the given post a news post?
    This is indicated by a 'news' field on the post having a true value.
    A missing field gives False rather than None
    """
    return bool(post_json_object.get('news'))
-												Indicate that imported posts contain news

											
										
										
											2020-10-08 09:07:45 +00:00
-												Snake case

											
										
										
											2021-12-28 13:07:02 +00:00
def _search_virtual_box_posts(base_dir: str, nickname: str, domain: str,
                              search_str: str, max_results: int,
                              box_name: str) -> []:
    """Searches the posts listed within the index file of a virtual box
    and returns the filenames of those containing every search word.
    Search words are separated by '+' and matching is case insensitive.
    No more than max_results filenames are returned
    """
    account_dir = acct_dir(base_dir, nickname, domain)
    index_filename = account_dir + '/' + box_name + '.index'
    # posts listed in the bookmarks index are read from the inbox
    if box_name == 'bookmarks':
        box_name = 'inbox'
    path = account_dir + '/' + box_name
    if not os.path.isdir(path):
        return []

    search_str = search_str.lower().strip()
    if '+' in search_str:
        search_words = [word.strip() for word in search_str.split('+')]
        print('SEARCH: ' + str(search_words))
    else:
        search_words = [search_str]

    matches = []
    with open(index_filename, 'r', encoding='utf-8') as index_file:
        for index_line in index_file:
            # the first line which is not a json filename ends the search
            if '.json' not in index_line:
                break
            post_filename = path + '/' + index_line.strip()
            if not os.path.isfile(post_filename):
                continue
            with open(post_filename, 'r', encoding='utf-8') as post_file:
                data = post_file.read().lower()
            if not all(keyword in data for keyword in search_words):
                continue
            matches.append(post_filename)
            if len(matches) >= max_results:
                return matches
    return matches
-												Snake case

											
										
										
											2021-12-28 13:07:02 +00:00
def search_box_posts(base_dir: str, nickname: str, domain: str,
                     search_str: str, max_results: int,
                     box_name='outbox') -> []:
    """Searches the posts within a box and returns a list of the
    filenames of those containing every search word.
    Search words are separated by '+' and matching is case insensitive.
    No more than max_results filenames are returned
    """
    path = acct_dir(base_dir, nickname, domain) + '/' + box_name
    if not os.path.isdir(path):
        # is this a virtual box, such as direct messages?
        if not os.path.isfile(path + '.index'):
            return []
        return _search_virtual_box_posts(base_dir, nickname, domain,
                                         search_str, max_results, box_name)

    search_str = search_str.lower().strip()
    if '+' in search_str:
        search_words = [word.strip() for word in search_str.split('+')]
        print('SEARCH: ' + str(search_words))
    else:
        search_words = [search_str]

    matches = []
    # only the files directly within the box directory are searched
    top_level = next(os.walk(path), None)
    if top_level is None:
        return matches
    root, _, fnames = top_level
    for fname in fnames:
        file_path = os.path.join(root, fname)
        with open(file_path, 'r', encoding='utf-8') as post_file:
            data = post_file.read().lower()
        if any(keyword not in data for keyword in search_words):
            continue
        matches.append(file_path)
        if len(matches) >= max_results:
            return matches
    return matches
-												Case insensitive avatar image search

											
										
										
											2020-05-04 18:24:30 +00:00
-												Moving to snake case

											
										
										
											2021-12-29 21:55:09 +00:00
def get_file_case_insensitive(path: str) -> str:
    """Returns the given path if it is an existing file, otherwise
    the lower case version of the path if that is an existing file.
    None is returned if neither exists
    """
    candidates = [path]
    lowered = path.lower()
    if lowered != path:
        candidates.append(lowered)
    for candidate in candidates:
        if os.path.isfile(candidate):
            return candidate
    return None
-												Fix circular dependency

											
										
										
											2020-06-06 18:16:16 +00:00
-												Snake case

											
										
										
											2021-12-27 23:23:07 +00:00
def undo_likes_collection_entry(recent_posts_cache: {},
                                base_dir: str, post_filename: str,
                                object_url: str,
                                actor: str, domain: str, debug: bool,
                                post_json_object: {}) -> None:
    """Removes the like made by the given actor from a post.
    The post is loaded from post_filename if post_json_object is not
    supplied, any cached version of it is removed, and the post is
    saved back to post_filename if a like was removed.
    The object_url argument is not used here
    """
    if not post_json_object:
        post_json_object = load_json(post_filename)
        if not post_json_object:
            return

    # remove any cached version of this post so that the
    # like icon is changed
    nickname = get_nickname_from_actor(actor)
    if not nickname:
        return
    cached_post_filename = \
        get_cached_post_filename(base_dir, nickname,
                                 domain, post_json_object)
    if cached_post_filename and os.path.isfile(cached_post_filename):
        try:
            os.remove(cached_post_filename)
        except OSError:
            print('EX: undo_likes_collection_entry ' +
                  'unable to delete cached post ' +
                  str(cached_post_filename))
    remove_post_from_cache(post_json_object, recent_posts_cache)

    # a missing or empty type can never equal 'Create'
    if post_json_object.get('type') != 'Create':
        return

    # the likes collection is on the wrapped object if there is one,
    # otherwise on the post itself
    if has_object_dict(post_json_object):
        obj = post_json_object['object']
    else:
        obj = post_json_object
    likes = obj.get('likes')
    if not likes or not isinstance(likes, dict):
        return
    if not likes.get('items'):
        return
    # the count recorded before the like is removed
    total_items = likes.get('totalItems') or 0

    for like_item in likes['items']:
        if like_item.get('actor') and like_item['actor'] == actor:
            if debug:
                print('DEBUG: like was removed for ' + actor)
            likes['items'].remove(like_item)
            break
    else:
        # this actor has not liked the post
        return

    if total_items == 1:
        # the only like was removed, so remove the whole collection
        if debug:
            print('DEBUG: likes was removed from post')
        del obj['likes']
    else:
        likes['totalItems'] = len(likes['items'])

    save_json(post_json_object, post_filename)
-												Fix circular dependency

											
										
										
											2020-06-06 18:16:16 +00:00
-												Snake case

											
										
										
											2021-12-27 23:02:50 +00:00
def undo_reaction_collection_entry(recent_posts_cache: {},
                                   base_dir: str, post_filename: str,
                                   object_url: str,
                                   actor: str, domain: str, debug: bool,
                                   post_json_object: {},
                                   emoji_content: str) -> None:
    """Undoes an emoji reaction for a particular actor

    Removes the first entry within the "reactions" collection of the
    post whose actor and content match the given actor and emoji_content,
    then saves the post to post_filename.
    If post_json_object is not supplied then it is loaded from
    post_filename. Any cached version of the post is removed, even if
    no matching reaction is subsequently found.
    The object_url parameter is not used by this function.
    """
    if not post_json_object:
        post_json_object = load_json(post_filename)
    if not post_json_object:
        return

    # remove any cached version of this post so that the
    # reaction icon is changed
    nickname = get_nickname_from_actor(actor)
    if not nickname:
        return
    cached_post_filename = \
        get_cached_post_filename(base_dir, nickname,
                                 domain, post_json_object)
    if cached_post_filename:
        if os.path.isfile(cached_post_filename):
            try:
                os.remove(cached_post_filename)
            except OSError:
                print('EX: undo_reaction_collection_entry ' +
                      'unable to delete cached post ' +
                      str(cached_post_filename))
    remove_post_from_cache(post_json_object, recent_posts_cache)

    if not post_json_object.get('type'):
        return
    if post_json_object['type'] != 'Create':
        return

    # the reactions collection may be on the post itself or
    # on the object which it contains
    obj = post_json_object
    if has_object_dict(post_json_object):
        obj = post_json_object['object']
    if not obj.get('reactions'):
        return
    if not isinstance(obj['reactions'], dict):
        return
    if not obj['reactions'].get('items'):
        return

    # the count is read before removal, to decide below whether
    # the whole collection should be deleted
    total_items = 0
    if obj['reactions'].get('totalItems'):
        total_items = obj['reactions']['totalItems']

    item_found = False
    for reaction_item in obj['reactions']['items']:
        if not reaction_item.get('actor'):
            continue
        # an item without content cannot match, and reading it
        # directly would raise a KeyError
        if 'content' not in reaction_item:
            continue
        if reaction_item['actor'] != actor:
            continue
        if reaction_item['content'] != emoji_content:
            continue
        if debug:
            print('DEBUG: emoji reaction was removed for ' + actor)
        obj['reactions']['items'].remove(reaction_item)
        item_found = True
        break
    if not item_found:
        return

    if total_items == 1:
        if debug:
            print('DEBUG: emoji reaction was removed from post')
        del obj['reactions']
    else:
        itlen = len(obj['reactions']['items'])
        obj['reactions']['totalItems'] = itlen

    save_json(post_json_object, post_filename)
-												Handle emoji reactions

											
										
										
											2021-11-10 12:16:03 +00:00
-												Snake case

											
										
										
											2021-12-27 10:55:48 +00:00
def undo_announce_collection_entry(recent_posts_cache: {},
                                   base_dir: str, post_filename: str,
                                   actor: str, domain: str,
                                   debug: bool) -> None:
    """Undoes an announce for a particular actor by removing it from
    the "shares" collection within a post. Note that the "shares"
    collection has no relation to shared items in shares.py. It's
    shares of posts, not shares of physical objects.

    The post is loaded from post_filename and is saved back to it
    if an announce by the given actor was removed. Any cached version
    of the post is removed, even if no matching announce is found.
    """
    post_json_object = load_json(post_filename)
    if not post_json_object:
        return

    # remove any cached version of this announce so that the announce
    # icon is changed
    nickname = get_nickname_from_actor(actor)
    if not nickname:
        return
    cached_post_filename = \
        get_cached_post_filename(base_dir, nickname, domain,
                                 post_json_object)
    if cached_post_filename:
        if os.path.isfile(cached_post_filename):
            try:
                os.remove(cached_post_filename)
            except OSError:
                if debug:
                    print('EX: undo_announce_collection_entry ' +
                          'unable to delete cached post ' +
                          str(cached_post_filename))
    remove_post_from_cache(post_json_object, recent_posts_cache)

    if not post_json_object.get('type'):
        return
    if post_json_object['type'] != 'Create':
        return
    if not has_object_dict(post_json_object):
        if debug:
            pprint(post_json_object)
            print('DEBUG: post has no object')
        return

    post_obj = post_json_object['object']
    if not post_obj.get('shares'):
        return
    # shares might not be an embedded collection,
    # in which case there are no items to remove
    if not isinstance(post_obj['shares'], dict):
        return
    if not post_obj['shares'].get('items'):
        return

    # the count is read before removal, to decide below whether
    # the whole collection should be deleted
    total_items = 0
    if post_obj['shares'].get('totalItems'):
        total_items = post_obj['shares']['totalItems']

    item_found = False
    for announce_item in post_obj['shares']['items']:
        if not announce_item.get('actor'):
            continue
        if announce_item['actor'] != actor:
            continue
        if debug:
            print('DEBUG: Announce was removed for ' + actor)
        post_obj['shares']['items'].remove(announce_item)
        item_found = True
        break
    if not item_found:
        return

    if total_items == 1:
        if debug:
            print('DEBUG: shares (announcements) ' +
                  'was removed from post')
        del post_obj['shares']
    else:
        itlen = len(post_obj['shares']['items'])
        post_obj['shares']['totalItems'] = itlen

    save_json(post_json_object, post_filename)
-												Avoid race condition when repeating post

											
										
										
											2020-06-06 18:34:39 +00:00
-												Snake case

											
										
										
											2021-12-26 23:41:34 +00:00
def update_announce_collection(recent_posts_cache: {},
                               base_dir: str, post_filename: str,
                               actor: str, nickname: str, domain: str,
                               debug: bool) -> None:
    """Updates the announcements collection within a post
    Confusingly this is known as "shares", but isn't the
    same as shared items within shares.py
    It's shares of posts, not shares of physical objects.

    The post is loaded from post_filename. An Announce by the given
    actor is added to the "shares" collection of the post object,
    creating the collection if it does not exist, and the post is
    then saved. If the actor has already announced the post then
    nothing is saved.
    """
    post_json_object = load_json(post_filename)
    if not post_json_object:
        return

    # remove any cached version of this announce so that the announce
    # icon is changed
    cached_post_filename = \
        get_cached_post_filename(base_dir, nickname, domain,
                                 post_json_object)
    if cached_post_filename:
        if os.path.isfile(cached_post_filename):
            try:
                os.remove(cached_post_filename)
            except OSError:
                if debug:
                    print('EX: update_announce_collection ' +
                          'unable to delete cached post ' +
                          str(cached_post_filename))
    remove_post_from_cache(post_json_object, recent_posts_cache)

    if not has_object_dict(post_json_object):
        if debug:
            pprint(post_json_object)
            print('DEBUG: post ' + post_filename + ' has no object')
        return

    post_url = remove_id_ending(post_json_object['id']) + '/shares'
    post_obj = post_json_object['object']
    if not post_obj.get('shares'):
        if debug:
            print('DEBUG: Adding initial shares (announcements) to ' +
                  post_url)
        announcements_json = {
            "@context": "https://www.w3.org/ns/activitystreams",
            'id': post_url,
            'type': 'Collection',
            "totalItems": 1,
            'items': [{
                'type': 'Announce',
                'actor': actor
            }]
        }
        post_obj['shares'] = announcements_json
    elif not isinstance(post_obj['shares'], dict):
        # shares is not an embedded collection, so there is no
        # items list which could be updated. Leave the post unaltered
        if debug:
            print('DEBUG: shares (announcements) section of post ' +
                  'is not a collection')
        return
    else:
        if post_obj['shares'].get('items'):
            shares_items = post_obj['shares']['items']
            # don't add the same announce twice
            for announce_item in shares_items:
                if announce_item.get('actor'):
                    if announce_item['actor'] == actor:
                        return
            new_announce = {
                'type': 'Announce',
                'actor': actor
            }
            shares_items.append(new_announce)
            post_obj['shares']['totalItems'] = len(shares_items)
        else:
            if debug:
                print('DEBUG: shares (announcements) section of post ' +
                      'has no items list')

    if debug:
        print('DEBUG: saving post with shares (announcements) added')
        pprint(post_json_object)
    save_json(post_json_object, post_filename)
-												qrcode dependencies on parabola

											
										
										
											2020-06-22 16:55:19 +00:00
-												Snake case

											
										
										
											2021-12-26 20:52:11 +00:00
def week_day_of_month_start(month_number: int, year: int) -> int:
    """Gets the day number of the first day of the month
    1=sun, 7=sat
    """
    month_start = datetime.datetime(year, month_number, 1, 0, 0)
    # isoweekday gives 1=mon .. 7=sun, so wrap sunday around to zero
    # and then shift into the range 1..7
    days_after_sunday = month_start.isoweekday() % 7
    return days_after_sunday + 1
-												Detect media mime types

											
										
										
											2020-11-13 13:34:14 +00:00
-												Snake case

											
										
										
											2021-12-26 20:48:15 +00:00
def media_file_mime_type(filename: str) -> str:
    """Given a media filename return its mime type

    The type is decided from the text after the final dot within the
    filename, ignoring case. If there is no extension, or if it is
    not recognized, then image/png is returned.
    """
    default_mime_type = 'image/png'
    if '.' not in filename:
        return default_mime_type
    # keys are file extensions without the dot, in lower case
    extensions = {
        'json': 'application/json',
        'png': 'image/png',
        'jpg': 'image/jpeg',
        'jxl': 'image/jxl',
        'jpeg': 'image/jpeg',
        'gif': 'image/gif',
        'svg': 'image/svg+xml',
        'webp': 'image/webp',
        'avif': 'image/avif',
        'heic': 'image/heic',
        'ico': 'image/x-icon',
        'mp3': 'audio/mpeg',
        'ogg': 'audio/ogg',
        'wav': 'audio/vnd.wave',
        'opus': 'audio/opus',
        'spx': 'audio/speex',
        'flac': 'audio/flac',
        'mp4': 'video/mp4',
        'ogv': 'video/ogv'
    }
    # lower case so that names such as PHOTO.JPG are recognized
    file_ext = filename.rsplit('.', 1)[-1].lower()
    return extensions.get(file_ext, default_mime_type)
-												Check post recency before creating speaker endpoint

											
										
										
											2021-03-03 20:16:53 +00:00
-												Snake case

											
										
										
											2021-12-26 20:48:15 +00:00
def is_recent_post(post_json_object: {}, max_days: int) -> bool:
    """ Is the given post recent?

    Returns True if the published date of the post object is no more
    than max_days days before the current UTC date. Returns False if
    the post has no object dict, if it has no published date string,
    or if that date is not in the format YYYY-MM-DDTHH:MM:SSZ
    (any fraction of a second is ignored).
    """
    if not has_object_dict(post_json_object):
        return False
    published_date_str = post_json_object['object'].get('published')
    if not published_date_str:
        return False
    if not isinstance(published_date_str, str):
        return False

    epoch = datetime.datetime(1970, 1, 1)
    # naive UTC time, without using the deprecated utcnow
    curr_time = \
        datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None)
    days_since_epoch = (curr_time - epoch).days
    recently = days_since_epoch - max_days

    # remove any fraction of a second from the published time
    if '.' in published_date_str:
        published_date_str = published_date_str.split('.')[0] + 'Z'
    try:
        published_date = \
            datetime.datetime.strptime(published_date_str,
                                       "%Y-%m-%dT%H:%M:%SZ")
    except ValueError:
        # strptime raises ValueError when the text does not match
        print('EX: is_recent_post unrecognized published date ' +
              str(published_date_str))
        return False

    published_days_since_epoch = (published_date - epoch).days
    return published_days_since_epoch >= recently
-												Split camelcase display names for speaker clarity

											
										
										
											2021-03-03 20:34:55 +00:00
-												Snake case

											
										
										
											2021-12-26 20:39:35 +00:00
def camel_case_split(text: str) -> str:
    """Splits CamelCase into "Camel Case"

    A space is inserted between a lowercase letter and a following
    uppercase letter, and before the last capital of an uppercase run
    which is followed by a lowercase letter, so that "HTTPServer"
    becomes "HTTP Server". Empty text results in an empty string.
    """
    # re.finditer always returns an iterator, which is never falsy,
    # so there is no need to test for "no matches" before iterating
    matches = re.finditer(r'.+?(?:(?<=[a-z])(?=[A-Z])|'
                          r'(?<=[A-Z])(?=[A-Z][a-z])|$)', text)
    return ' '.join(word.group(0) for word in matches).strip()
-												Tidying

											
										
										
											2021-03-05 19:00:37 +00:00
-												snake case conversion script

											
										
										
											2021-12-29 10:39:46 +00:00
def convert_to_snake_case(text: str) -> str:
    """Returns the snake case equivalent of camel case text,
    for example "CamelCase" becomes "camel_case"
    """
    spaced_words = camel_case_split(text)
    lowercase_words = spaced_words.lower()
    return lowercase_words.replace(' ', '_')
-												Convert config variable names to camel case

											
										
										
											2021-12-28 15:13:51 +00:00
def _convert_to_camel_case(text: str) -> str:
    """Converts a snake case string to camel case

    Text without any underscore is returned unchanged. Otherwise the
    first word is lowercased and every following word is title cased,
    for example "some_config_name" becomes "someConfigName"
    """
    if '_' not in text:
        return text
    first_word, *other_words = text.split('_')
    return first_word.lower() + ''.join(wrd.title() for wrd in other_words)
-												Snake case

											
										
										
											2021-12-26 20:20:36 +00:00
def reject_post_id(base_dir: str, nickname: str, domain: str,
                   post_id: str, recent_posts_cache: {}) -> None:
    """Flags the given post as rejected, such as an announce which
    is too old. Any json or html held for the post within the recent
    posts cache is dropped, and a .reject file is created alongside
    the post file
    """
    post_filename = locate_post(base_dir, nickname, domain, post_id)
    if not post_filename:
        return

    if recent_posts_cache.get('index'):
        # Remove any directories and the json extension from the
        # filename. What remains should correspond to any index
        # entry within the posts cache
        cache_id = remove_eol(post_filename.rsplit('/', 1)[-1])
        cache_id = cache_id.replace('.json', '').strip()

        if cache_id in recent_posts_cache['index']:
            for cache_section in ('json', 'html'):
                if recent_posts_cache[cache_section].get(cache_id):
                    del recent_posts_cache[cache_section][cache_id]

    reject_filename = post_filename + '.reject'
    with open(reject_filename, 'w+', encoding='utf-8') as fp_reject:
        fp_reject.write('\n')
-												Add dm and reply notifications to speaker endpoint

											
										
										
											2021-03-09 13:52:02 +00:00
-												Replying to a chat message has a different path

											
										
										
											2022-02-08 10:52:03 +00:00
def is_chat_message(post_json_object: {}) -> bool:
    """Is the given post a Create activity whose object is a ChatMessage?
    Note that is_dm should be checked before calling this
    """
    if post_json_object['type'] == 'Create':
        if has_object_dict(post_json_object):
            return post_json_object['object']['type'] == 'ChatMessage'
    return False
-												Snake case

											
										
										
											2021-12-26 19:36:40 +00:00
def is_reply(post_json_object: {}, actor: str) -> bool:
    """Returns true if the given post is a reply to the given actor

    The post must be a Create activity with an object dictionary of
    type Note, Page, EncryptedMessage, ChatMessage or Article, and
    without a moderationStatus. It counts as a reply if its inReplyTo
    string begins with the actor, or if any Mention tag has a href
    containing the actor.
    """
    if post_json_object['type'] != 'Create':
        return False
    if not has_object_dict(post_json_object):
        return False
    post_obj = post_json_object['object']
    if post_obj.get('moderationStatus'):
        return False
    if post_obj['type'] not in ('Note', 'Page', 'EncryptedMessage',
                                'ChatMessage', 'Article'):
        return False
    in_reply_to = post_obj.get('inReplyTo')
    if in_reply_to:
        if isinstance(in_reply_to, str):
            if in_reply_to.startswith(actor):
                return True
    tags = post_obj.get('tag')
    if not tags:
        return False
    if not isinstance(tags, list):
        return False
    for tag in tags:
        # a malformed tag entry, such as a plain string, has no get
        # method, so skip it rather than raising an AttributeError
        if not isinstance(tag, dict):
            continue
        if not tag.get('type'):
            continue
        if tag['type'] == 'Mention':
            if not tag.get('href'):
                continue
            if actor in tag['href']:
                return True
    return False
-												Tidying of encrypted message detection

											
										
										
											2021-03-12 12:04:34 +00:00
-												Snake case

											
										
										
											2021-12-26 19:15:36 +00:00
def contains_pgp_public_key(content: str) -> bool:
    """Does the given content include both the begin and the end
    markers of a PGP public key block?
    """
    key_markers = ('--BEGIN PGP PUBLIC KEY BLOCK--',
                   '--END PGP PUBLIC KEY BLOCK--')
    return all(marker in content for marker in key_markers)
-												Snake case

											
										
										
											2021-12-26 19:15:36 +00:00
def is_pgp_encrypted(content: str) -> bool:
    """Does the given content include both the begin and the end
    markers of a PGP message?
    """
    message_markers = ('--BEGIN PGP MESSAGE--',
                       '--END PGP MESSAGE--')
    return all(marker in content for marker in message_markers)
-												Add speakable text for desktop client

											
										
										
											2021-03-18 17:27:46 +00:00
-												Snake case

											
										
										
											2021-12-26 19:15:36 +00:00
def invalid_ciphertext(content: str) -> bool:
    """Returns true if the given content has a begin or end marker
    but is recognised neither as containing a PGP public key
    nor as being PGP encrypted
    """
    has_marker = '----BEGIN ' in content or '----END ' in content
    if not has_marker:
        return False
    if contains_pgp_public_key(content):
        return False
    return not is_pgp_encrypted(content)
-												Snake case

											
										
										
											2021-12-26 19:12:02 +00:00
def load_translations_from_file(base_dir: str, language: str) -> ({}, str):
    """Loads translations from the translations directory within
    base_dir, returning them together with the language code used.
    If no language is given then the system locale is tried, and if
    there is no translations file for the language then 'en' is used.
    Returns None, None if the translations directory does not exist
    """
    translations_dir = base_dir + '/translations'
    if not os.path.isdir(translations_dir):
        print('ERROR: translations directory not found')
        return None, None

    # NOTE(review): locale.getdefaultlocale is marked as deprecated
    # by recent python versions - confirm before upgrading
    system_language = language
    if not language:
        system_language = locale.getdefaultlocale()[0]
    if not system_language:
        system_language = 'en'

    # reduce the likes of en_GB or en.UTF-8 to the part before
    # the separator
    if '_' in system_language:
        system_language = system_language.split('_')[0]
    while '/' in system_language:
        system_language = system_language.split('/')[1]
    if '.' in system_language:
        system_language = system_language.split('.')[0]

    translations_file = translations_dir + '/' + system_language + '.json'
    if not os.path.isfile(translations_file):
        system_language = 'en'
        translations_file = translations_dir + '/' + system_language + '.json'
    return load_json(translations_file), system_language
-												Instance allow list for receiving DMs

											
										
										
											2021-04-22 09:27:20 +00:00
-												Snake case

											
										
										
											2021-12-26 19:09:04 +00:00
def dm_allowed_from_domain(base_dir: str,
                           nickname: str, domain: str,
                           sending_actor_domain: str) -> bool:
    """When a DM is received and the .followDMs flag file exists
    then some domains can optionally be specified as allowed,
    regardless of individual follows.
    i.e. Mostly you only want DMs from followers, but there are
    a few particular instances that you trust.
    Returns true if the sending domain appears as a line within
    the dmAllowedInstances.txt file of the account
    """
    account_dir = acct_dir(base_dir, nickname, domain)
    allowed_filename = account_dir + '/dmAllowedInstances.txt'
    if os.path.isfile(allowed_filename):
        if text_in_file(sending_actor_domain + '\n', allowed_filename):
            return True
    return False
-												Change how roles are represented

											
										
										
											2021-05-16 15:10:39 +00:00
-												Snake case

											
										
										
											2021-12-26 19:01:36 +00:00
def get_occupation_skills(actor_json: {}) -> []:
    """Returns the skills of the first Occupation item, within the
    hasOccupation list of an actor, which has any skills.
    A single skill given as a string is returned as a one item list.
    An empty list is returned if no skills can be found
    """
    occupations = None
    if 'hasOccupation' in actor_json:
        occupations = actor_json['hasOccupation']
    if not isinstance(occupations, list):
        return []

    for item in occupations:
        if not isinstance(item, dict):
            continue
        if item.get('@type') != 'Occupation':
            continue
        skills = item.get('skills')
        if not skills:
            continue
        if isinstance(skills, list):
            return skills
        if isinstance(skills, str):
            return [skills]
        # skills exist but have an unexpected type, so stop looking
        break
    return []
-												Snake case

											
										
										
											2021-12-26 18:58:06 +00:00
def get_occupation_name(actor_json: {}) -> str:
    """Returns the name of the first Occupation item, within the
    hasOccupation list of an actor, which has a name.
    An empty string is returned if no name can be found
    """
    occupations = actor_json.get('hasOccupation')
    if not occupations:
        return ""
    if not isinstance(occupations, list):
        return ""

    for item in occupations:
        if not isinstance(item, dict):
            continue
        if item.get('@type') != 'Occupation':
            continue
        occupation_name = item.get('name')
        if not occupation_name:
            continue
        if isinstance(occupation_name, str):
            return occupation_name
        # a name exists but it isn't a string, so stop looking
        break
    return ""
-												Snake case

											
										
										
											2021-12-26 18:55:07 +00:00
def set_occupation_name(actor_json: {}, name: str) -> bool:
    """Sets the occupation name of an actor

    The name is assigned, in place, to the first dictionary within
    the hasOccupation list whose @type is Occupation.
    Returns true if the name was set, or false if hasOccupation is
    missing, empty, not a list or contains no Occupation item
    """
    if not actor_json.get('hasOccupation'):
        return False
    if not isinstance(actor_json['hasOccupation'], list):
        return False
    # list items are references, so iterating directly still updates
    # the dictionary held within actor_json
    for occupation_item in actor_json['hasOccupation']:
        if not isinstance(occupation_item, dict):
            continue
        if occupation_item.get('@type') != 'Occupation':
            continue
        occupation_item['name'] = name
        return True
    return False
-												Snake case

											
										
										
											2021-12-26 18:50:59 +00:00
def set_occupation_skills_list(actor_json: {}, skills_list: []) -> bool:
    """Sets the occupation skills for an actor

    The skills list is assigned, in place, to the first dictionary
    within the hasOccupation list whose @type is Occupation.
    Returns true if the skills were set, or false if hasOccupation is
    missing, not a list or contains no Occupation item
    """
    if 'hasOccupation' not in actor_json:
        return False
    if not isinstance(actor_json['hasOccupation'], list):
        return False
    # list items are references, so iterating directly still updates
    # the dictionary held within actor_json
    for occupation_item in actor_json['hasOccupation']:
        if not isinstance(occupation_item, dict):
            continue
        if occupation_item.get('@type') != 'Occupation':
            continue
        occupation_item['skills'] = skills_list
        return True
    return False
-												Function to test for account directories

											
										
										
											2021-06-07 09:10:52 +00:00
-												Snake case

											
										
										
											2021-12-26 18:50:59 +00:00
def is_account_dir(dir_name: str) -> bool:
    """Is the given directory an account within /accounts ?
    It needs to contain an @ character and not be one of the
    inbox@, news@ or Actor@ directories
    """
    if '@' not in dir_name:
        return False
    non_account_names = ('inbox@', 'news@', 'Actor@')
    return not any(name in dir_name for name in non_account_names)
-												Move function out of daemon

											
										
										
											2021-06-07 19:18:13 +00:00
-												Snake case

											
										
										
											2021-12-26 18:40:10 +00:00
def permitted_dir(path: str) -> bool:
    """Returns false for the special paths which should not be
       accessible directly via GET or POST
    """
    blocked_prefixes = ('/wfendpoints', '/keys', '/accounts')
    return not path.startswith(blocked_prefixes)
-												Unit test for user agent domain

											
										
										
											2021-06-20 15:45:29 +00:00
-												Snake case

											
										
										
											2021-12-26 18:37:07 +00:00
def user_agent_domain(user_agent: str, debug: bool) -> str:
    """Extracts the domain from a url embedded in a User-Agent string.
    Returns None if there is no http(s) url, or if the text following
    the scheme does not contain a dot
    """
    # https takes priority when both schemes appear
    if 'https://' in user_agent:
        scheme = 'https://'
    elif 'http://' in user_agent:
        scheme = 'http://'
    else:
        return None

    # the text following the first occurrence of the scheme
    candidate = user_agent.split(scheme)[1].strip()
    # discard any url path
    candidate = candidate.split('/')[0]
    # discard a closing bracket and whatever follows it
    if ')' in candidate:
        candidate = candidate.split(')')[0].strip()
    candidate = candidate.replace(' ', '').replace(';', '')

    if '.' not in candidate:
        return None
    if debug:
        print('User-Agent Domain: ' + candidate)
    return candidate
-												Function to check that activitypub posts have an object dictionary

											
										
										
											2021-06-22 15:45:59 +00:00
-												Snake case

											
										
										
											2021-12-26 18:32:02 +00:00
def get_alt_path(actor: str, domain_full: str, calling_domain: str) -> str:
    """Returns the actor url rewritten for an onion or i2p calling domain
    eg. https://clearnetdomain/path becomes http://oniondomain/path
    The actor is returned unaltered in all other cases
    """
    if calling_domain in actor or domain_full not in actor:
        return actor
    if not calling_domain.endswith(('.onion', '.i2p')):
        return actor
    # keep whatever follows the first occurrence of the clearnet domain
    path_after_domain = actor.split(domain_full)[1]
    alt_actor = 'http://' + calling_domain + path_after_domain
    print('Changed POST domain from ' + actor + ' to ' + alt_actor)
    return alt_actor
-												Module groups

											
										
										
											2021-06-26 11:16:41 +00:00
-												Snake case

											
										
										
											2021-12-26 18:22:20 +00:00
def get_actor_property_url(actor_json: {}, property_name: str) -> str:
    """Searches the actor attachments for a PropertyValue whose name
    begins with the given property name (case insensitive) and whose
    value looks like a url. Returns that url, or an empty string
    """
    attachments = actor_json.get('attachment')
    if not attachments:
        return ''
    wanted_name = property_name.lower()
    for attach in attachments:
        # the name may be stored under either of two keys
        attach_name = attach.get('name') or attach.get('schema:name')
        if not attach_name:
            continue
        if not attach_name.lower().startswith(wanted_name):
            continue
        if not attach.get('type'):
            continue
        value_key, _ = get_attachment_property_value(attach)
        if not value_key:
            continue
        if not attach['type'].endswith('PropertyValue'):
            continue
        # the stripped text is always stored under 'value', whichever
        # key the text was actually read from
        attach['value'] = attach[value_key].strip()
        url = attach[value_key]
        known_prefixes = get_protocol_prefixes()
        if not any(url.startswith(prefix) for prefix in known_prefixes):
            continue
        # reject anything which does not resemble a single url
        if '.' not in url or ' ' in url or ',' in url:
            continue
        return url
    return ''
-												Extra architecture graphs

											
										
										
											2021-06-26 14:21:24 +00:00
-												Snake case

											
										
										
											2021-12-26 18:17:37 +00:00
def remove_domain_port(domain: str) -> str:
    """Returns the domain with any appended port removed
    eg. mydomain.com:80 becomes mydomain.com
    Anything beginning with did: is returned unaltered
    """
    if ':' not in domain or domain.startswith('did:'):
        return domain
    host, _, _ = domain.partition(':')
    return host
-												Snake case

											
										
										
											2021-12-26 18:14:21 +00:00
def get_port_from_domain(domain: str) -> int:
    """Returns the port number appended to the domain
    eg. mydomain.com:80 returns 80
    None is returned if there is no numeric port, or for did: values
    """
    if ':' not in domain or domain.startswith('did:'):
        return None
    # the text between the first and second colons
    candidate = domain.split(':')[1]
    return int(candidate) if candidate.isdigit() else None
-												Function for checking url prefixes

											
										
										
											2021-07-06 09:44:45 +00:00
-												Snake case

											
										
										
											2021-12-26 18:10:53 +00:00
def valid_url_prefix(url: str) -> bool:
    """Returns true if the url contains a slash and begins with one
    of the recognised scheme prefixes
    """
    allowed_schemes = ('https:', 'http:', 'hyper:', 'i2p:', 'gnunet:')
    return '/' in url and url.startswith(allowed_schemes)
-												Ensure that line endings are removed from changed password

											
										
										
											2021-07-20 14:39:43 +00:00
-												Snake case

											
										
										
											2021-12-26 18:05:54 +00:00
def valid_password(password: str) -> bool:
    """Returns true if the given password has at least 8 characters
    """
    return len(password) >= 8
-												Authorized access to catalog

											
										
										
											2021-07-25 13:09:39 +00:00
-												Snake case

											
										
										
											2021-12-28 12:15:46 +00:00
def is_float(value) -> bool:
    """Is the given value convertible to a float?

    Returns True if float(value) succeeds, otherwise False.
    """
    try:
        float(value)
    except (ValueError, TypeError, OverflowError):
        # ValueError: text which isn't a number
        # TypeError: None, lists, dicts and other non-numeric types
        # OverflowError: an integer too large to be represented
        return False
    return True
-												Unit test for date conversion

											
										
										
											2021-07-28 09:35:21 +00:00
-												Snake case

											
										
										
											2021-12-26 18:01:02 +00:00
def date_string_to_seconds(date_str: str) -> int:
    """Converts a date string (eg "published") into seconds since epoch

    The string must have the format YYYY-MM-DDTHH:MM:SSZ.
    Returns None if the string cannot be parsed.
    """
    try:
        expiry_time = \
            datetime.datetime.strptime(date_str, '%Y-%m-%dT%H:%M:%SZ')
    except (ValueError, TypeError):
        # ValueError: the text doesn't match the expected format
        # TypeError: the value given is not a string
        print('EX: date_string_to_seconds unable to parse date ' +
              str(date_str))
        return None
    # NOTE(review): the parsed datetime is naive, so timestamp() treats
    # it as local time even though the text ends with Z - confirm that
    # this is what callers expect
    return int(expiry_time.timestamp())
-												Unit test for date conversion

											
										
										
											2021-07-28 09:35:21 +00:00
-												Snake case

											
										
										
											2021-12-26 17:55:38 +00:00
def date_seconds_to_string(date_sec: int) -> str:
    """Returns the given seconds since epoch as a date string
    having the format YYYY-MM-DDTHH:MM:SSZ
    """
    return datetime.datetime.fromtimestamp(date_sec).strftime(
        "%Y-%m-%dT%H:%M:%SZ")
-												Unfollowing group handles

											
										
										
											2021-07-30 16:06:34 +00:00
-												Snake case

											
										
										
											2021-12-26 17:53:07 +00:00
def has_group_type(base_dir: str, actor: str, person_cache: {},
                   debug: bool = False) -> bool:
    """Returns true if the given actor url belongs to a group
    """
    # a group path within the url is enough to decide
    # eg. https://lemmy/c/groupname
    matching_path = next(
        (gpath for gpath in get_group_paths() if gpath in actor), None)
    if matching_path is not None:
        if debug:
            print('grpPath ' + matching_path + ' in ' + actor)
        return True

    # otherwise look for a cached actor having Group type
    return is_group_actor(base_dir, actor, person_cache, debug)
-												Unit test for following a group

											
										
										
											2021-07-31 11:56:28 +00:00
-												Snake case

											
										
										
											2021-12-26 17:41:07 +00:00
def is_group_actor(base_dir: str, actor: str, person_cache: {},
                   debug: bool = False) -> bool:
    """Returns true if the given actor is a group, according to the
    in-memory person cache or the cached actor file
    """
    cache_entry = person_cache.get(actor) if person_cache else None
    cached_actor = cache_entry.get('actor') if cache_entry else None
    if cached_actor:
        # an actor held in memory is decisive either way
        if cached_actor.get('type') == 'Group':
            if debug:
                print('Cached actor ' + actor + ' has Group type')
            return True
        return False

    if debug:
        print('Actor ' + actor + ' not in cache')
    actor_filename = \
        base_dir + '/cache/actors/' + actor.replace('/', '#') + '.json'
    if not os.path.isfile(actor_filename):
        if debug:
            print('Cached actor file not found ' + actor_filename)
        return False
    if not text_in_file('"type": "Group"', actor_filename):
        return False
    if debug:
        print('Group type found in ' + actor_filename)
    return True
-												Currency field as dropdown

											
										
										
											2021-08-07 17:44:25 +00:00
-												Snake case

											
										
										
											2021-12-26 17:33:24 +00:00
def is_group_account(base_dir: str, nickname: str, domain: str) -> bool:
    """Is the given account a group? This is decided by looking for
    the Group type within the account's json file
    """
    account_filename = acct_dir(base_dir, nickname, domain) + '.json'
    return os.path.isfile(account_filename) and \
        bool(text_in_file('"type": "Group"', account_filename))
-												Snake case

											
										
										
											2021-12-26 17:29:09 +00:00
def get_currencies() -> {}:
    """Returns a dictionary which maps currency symbols
    to their three letter currency codes
    """
    symbol_code_pairs = (
        ("CA$", "CAD"), ("J$", "JMD"), ("£", "GBP"), ("€", "EUR"),
        ("؋", "AFN"), ("ƒ", "AWG"), ("₼", "AZN"), ("Br", "BYN"),
        ("BZ$", "BZD"), ("$b", "BOB"), ("KM", "BAM"), ("P", "BWP"),
        ("лв", "BGN"), ("R$", "BRL"), ("៛", "KHR"), ("$U", "UYU"),
        ("RD$", "DOP"), ("$", "USD"), ("₡", "CRC"), ("kn", "HRK"),
        ("₱", "CUP"), ("Kč", "CZK"), ("kr", "NOK"), ("¢", "GHS"),
        ("Q", "GTQ"), ("L", "HNL"), ("Ft", "HUF"), ("Rp", "IDR"),
        ("₹", "INR"), ("﷼", "IRR"), ("₪", "ILS"), ("¥", "JPY"),
        ("₩", "KRW"), ("₭", "LAK"), ("ден", "MKD"), ("RM", "MYR"),
        ("₨", "MUR"), ("₮", "MNT"), ("MT", "MZN"), ("C$", "NIO"),
        ("₦", "NGN"), ("Gs", "PYG"), ("zł", "PLN"), ("lei", "RON"),
        ("₽", "RUB"), ("Дин", "RSD"), ("S", "SOS"), ("R", "ZAR"),
        ("CHF", "CHF"), ("NT$", "TWD"), ("฿", "THB"), ("TT$", "TTD"),
        ("₴", "UAH"), ("Bs", "VEB"), ("₫", "VND"), ("Z$", "ZQD")
    )
    return dict(symbol_code_pairs)
-												Translations for ontology

											
										
										
											2021-08-08 11:16:18 +00:00
-												Snake case

											
										
										
											2021-12-26 17:26:55 +00:00
def get_supported_languages(base_dir: str) -> []:
    """Returns the two letter language codes for which there is a
    json file at the top level of the translations directory
    """
    translations_dir = base_dir + '/translations'
    # only the first directory level is examined. A missing
    # directory results in an empty list
    _, _, filenames = next(os.walk(translations_dir), (None, None, []))
    return [
        fname.split('.')[0] for fname in filenames
        if fname.endswith('.json') and len(fname.split('.')[0]) == 2
    ]
-												More general list of shared item categories

											
										
										
											2021-08-08 18:39:03 +00:00
-												Snake case

											
										
										
											2021-12-26 17:18:34 +00:00
def get_category_types(base_dir: str) -> []:
    """Returns the category names derived from the *Types json files
    at the top level of the ontology directory
    """
    ontology_dir = base_dir + '/ontology'
    # only the first directory level is examined. A missing
    # directory results in an empty list
    _, _, filenames = next(os.walk(ontology_dir), (None, None, []))
    categories = []
    for fname in filenames:
        if not fname.endswith('.json'):
            continue
        # ignore editor backup files and custom ontologies
        is_backup = '#' in fname or '~' in fname
        if is_backup or fname.startswith('custom'):
            continue
        stem = fname.split('.')[0]
        if 'Types' in stem:
            categories.append(stem.replace('Types', ''))
    return categories
-												Generalize the shares file so that there can be separate shares and wanted items

											
										
										
											2021-08-09 13:07:32 +00:00
-												Snake case

											
										
										
											2021-12-26 17:24:00 +00:00
def get_shares_files_list() -> []:
    """Returns the names of the files in which shared items
    and wanted items may be stored
    """
    shares_file_types = ('shares', 'wanted')
    return shares_file_types
-												Replace /users/ with other possible paths

											
										
										
											2021-08-22 18:38:02 +00:00
-												Snake case

											
										
										
											2021-12-26 17:21:37 +00:00
def replace_users_with_at(actor: str) -> str:
    """ Converts the users path within an actor url into @ format
    eg. https://domain/users/nick becomes https://domain/@nick
    """
    # only the first user path found within the actor is considered
    matched_path = next(
        (upath for upath in get_user_paths() if upath in actor), None)
    if matched_path is None or '/@/' in actor:
        return actor
    return actor.replace(matched_path, '/@')
-												Function to check for presence of actor in activity

											
										
										
											2021-10-13 09:33:15 +00:00
-												Snake case

											
										
										
											2021-12-26 17:15:04 +00:00
def has_actor(post_json_object: {}, debug: bool) -> bool:
    """Returns true if the given post has an actor
    which does not contain a hash character
    """
    actor = post_json_object.get('actor')
    if actor:
        return '#' not in actor
    if debug and post_json_object.get('type'):
        msg = post_json_object['type'] + ' has missing actor'
        post_id = post_json_object.get('id')
        if post_id:
            msg += ' ' + post_id
        print(msg)
    return False
-												Tidying

											
										
										
											2021-10-13 10:11:02 +00:00
-												Handle incoming edited posts

											
										
										
											2022-04-09 15:11:22 +00:00
def has_object_string_type(post_json_object: {}, debug: bool) -> bool:
    """Does the given post have a type field within an object dict?

    Returns True only if the post has an object dict whose type field
    is a non-empty string. If debug is true then the reason for
    returning False is printed.
    """
    if not has_object_dict(post_json_object):
        if debug:
            print('has_object_string_type no object found')
        return False
    object_type = post_json_object['object'].get('type')
    if object_type:
        if isinstance(object_type, str):
            return True
        # this is printed whether or not debug is set
        if post_json_object.get('type'):
            print('DEBUG: ' + str(post_json_object['type']) +
                  ' type within object is not a string ' +
                  str(post_json_object))
    if debug:
        # the post may have no id, so avoid indexing it directly
        print('No type field within object ' +
              str(post_json_object.get('id', '')))
    return False
-												Tidying

											
										
										
											2021-10-13 10:37:52 +00:00
-												Snake case

											
										
										
											2021-12-26 15:54:46 +00:00
def has_object_string_object(post_json_object: {}, debug: bool) -> bool:
    """Does the given post have an object string field within an object dict?

    Returns True when has_object_dict accepts the post and
    post_json_object['object']['object'] is a non-empty string.
    Otherwise returns False, printing the reason when debug is set.
    """
    if not has_object_dict(post_json_object):
        if debug:
            print('has_object_string_object no object found')
        return False
    inner_object = post_json_object['object'].get('object')
    if inner_object:
        if isinstance(inner_object, str):
            return True
        if debug:
            if post_json_object.get('type'):
                # str() because the type of a malformed post may not
                # be a string
                print('DEBUG: ' + str(post_json_object['type']) +
                      ' object within dict is not a string')
    if debug:
        # the id may be missing, so avoid indexing it directly
        print('No object field within dict ' +
              str(post_json_object.get('id')))
    return False
-												Tidying

											
										
										
											2021-10-13 11:15:06 +00:00
-												Snake case

											
										
										
											2021-12-26 17:12:07 +00:00
def has_object_string(post_json_object: {}, debug: bool) -> bool:
    """Does the given post have an object string field?

    Returns True when post_json_object['object'] is a non-empty string.
    Otherwise returns False, printing the reason when debug is set.
    """
    post_object = post_json_object.get('object')
    if post_object:
        if isinstance(post_object, str):
            return True
        if debug:
            if post_json_object.get('type'):
                # str() because the type of a malformed post may not
                # be a string
                print('DEBUG: ' + str(post_json_object['type']) +
                      ' object is not a string')
    if debug:
        # the id may be missing, so avoid indexing it directly
        print('No object field within post ' +
              str(post_json_object.get('id')))
    return False
-												Tidying

											
										
										
											2021-11-03 11:25:26 +00:00
-												Snake case

											
										
										
											2021-12-26 16:59:38 +00:00
def get_new_post_endpoints() -> []:
    """Returns the names of the endpoints through which posts are
    created or edited
    """
    post_endpoints = (
        'newpost',
        'newblog',
        'newunlisted',
        'newfollowers',
        'newdm',
        'newreminder',
        'newreport',
        'newquestion',
        'newshare',
        'newwanted',
        'editblogpost'
    )
    return post_endpoints
-												Shorter cached favicon filename

											
										
										
											2021-12-17 12:01:54 +00:00
-												Snake case

											
										
										
											2021-12-26 16:59:38 +00:00
def get_fav_filename_from_url(base_dir: str, favicon_url: str) -> str:
    """Returns the filename under base_dir/favicons in which the favicon
    at the given url is cached
    """
    url_path = favicon_url
    # drop the protocol prefix
    if '://' in url_path:
        url_path = url_path.split('://')[1]
    # shorten domain/favicon.ext to domain.ext
    if '/favicon.' in url_path:
        url_path = url_path.replace('/favicon.', '.')
    # flatten any remaining path into a single filename
    flat_name = url_path.replace('/', '-')
    return base_dir + '/favicons/' + flat_name
-												Get categories from podcast feeds

											
										
										
											2022-01-13 15:10:41 +00:00
 								def valid_hash_tag(hashtag: str) -> bool:
 								    """Returns true if the given hashtag is acceptable.
 								    It must be shorter than 32 characters, must not be a plain number,
 								    and must either consist only of VALID_HASHTAG_CHARS or be accepted
 								    by _is_valid_language
 								    """
 								    # long hashtags and plain numbers are never valid
 								    if len(hashtag) >= 32 or hashtag.isdigit():
 								        return False
 								    # hashtags made only from the permitted character set
 								    if set(hashtag).issubset(VALID_HASHTAG_CHARS):
 								        return True
 								    # anything else is decided by the language check
 								    return bool(_is_valid_language(hashtag))
-												Add timezone per account

											
										
										
											2022-02-25 19:12:40 +00:00
 								def convert_published_to_local_timezone(published, timezone: str) -> str:
 								    """Converts a post published time into local time
 								    published is a datetime which is treated as UTC: its tzinfo is
 								    replaced with UTC rather than converted.
 								    timezone is a timezone name which is passed to tz.gettz.
 								    Returns the datetime expressed in that timezone, or published
 								    unchanged if no timezone is given or it cannot be resolved.
 								    """
 								    if not timezone:
 								        return published
 								    to_zone = None
 								    try:
 								        to_zone = tz.gettz(timezone)
 								    except Exception:
 								        # best effort: an unusable name leaves the time unconverted
 								        to_zone = None
 								    if not to_zone:
 								        # tz.gettz gives None for a name which it cannot resolve, and
 								        # astimezone(None) would silently use the system timezone
 								        return published
 								    from_zone = tz.gettz('UTC')
 								    utc = published.replace(tzinfo=from_zone)
 								    return utc.astimezone(to_zone)
 								def load_account_timezones(base_dir: str) -> {}:
 								    """Returns a dictionary containing the preferred timezone for each account
 								    Each nickname@domain directory directly under base_dir/accounts is
 								    checked for a timezone.txt file. The result maps the nickname to the
 								    stripped contents of that file. Accounts whose file is missing,
 								    unreadable or empty are left out.
 								    """
 								    account_timezone = {}
 								    accounts_dir = base_dir + '/accounts'
 								    for _, dirs, _ in os.walk(accounts_dir):
 								        for acct in dirs:
 								            if '@' not in acct:
 								                continue
 								            if acct.startswith(('inbox@', 'Actor@')):
 								                continue
 								            tz_filename = \
 								                os.path.join(accounts_dir, acct) + '/timezone.txt'
 								            if not os.path.isfile(tz_filename):
 								                continue
 								            timezone = None
 								            try:
 								                with open(tz_filename, 'r',
 								                          encoding='utf-8') as fp_timezone:
 								                    timezone = fp_timezone.read().strip()
 								            except OSError:
 								                # one unreadable file should not stop the other accounts
 								                print('EX: load_account_timezones unable to read ' +
 								                      tz_filename)
 								            if timezone:
 								                nickname = acct.split('@')[0]
 								                account_timezone[nickname] = timezone
 								        # only the top level of the accounts directory is examined
 								        break
 								    return account_timezone
-												Bold reading accessibility feature

											
										
										
											2022-03-24 13:14:41 +00:00
def load_bold_reading(base_dir: str) -> {}:
    """Returns a dictionary of nicknames, each set to True, for the
    accounts under base_dir/accounts which contain a .boldReading file
    """
    accounts_dir = base_dir + '/accounts'
    bold_reading = {}
    for _, acct_names, _ in os.walk(accounts_dir):
        for acct in acct_names:
            # only nickname@domain directories, excluding shared ones
            if '@' not in acct or \
               acct.startswith(('inbox@', 'Actor@')):
                continue
            if os.path.isfile(accounts_dir + '/' + acct + '/.boldReading'):
                bold_reading[acct.split('@')[0]] = True
        # only the top level of the accounts directory is examined
        break
    return bold_reading
-												Add timezone per account

											
										
										
											2022-02-25 19:12:40 +00:00
def get_account_timezone(base_dir: str, nickname: str, domain: str) -> str:
    """Returns the timezone for the given account

    The value is the stripped contents of timezone.txt within the
    account directory. None is returned if that file does not exist
    or cannot be read.
    """
    tz_filename = \
        acct_dir(base_dir, nickname, domain) + '/timezone.txt'
    if not os.path.isfile(tz_filename):
        return None
    timezone = None
    try:
        with open(tz_filename, 'r', encoding='utf-8') as fp_timezone:
            timezone = fp_timezone.read().strip()
    except OSError:
        # the file can vanish or be unreadable after the isfile check
        print('EX: get_account_timezone unable to read ' + tz_filename)
    return timezone
-												Setting time zone within profile

											
										
										
											2022-02-25 19:57:31 +00:00
 								def set_account_timezone(base_dir: str, nickname: str, domain: str,
 								                         timezone: str) -> None:
 								    """Sets the timezone for the given account
 								    The stripped timezone string is written to timezone.txt within
 								    the account directory, replacing any previous contents. A failure
 								    to write is reported rather than raised.
 								    """
 								    tz_filename = \
 								        acct_dir(base_dir, nickname, domain) + '/timezone.txt'
 								    timezone = timezone.strip()
 								    try:
 								        with open(tz_filename, 'w+', encoding='utf-8') as fp_timezone:
 								            fp_timezone.write(timezone)
 								    except OSError:
 								        print('EX: set_account_timezone unable to write ' + tz_filename)
-												Change actor domain for non-clearnet lookups

											
										
										
											2022-03-12 19:46:47 +00:00
 								def is_onion_request(calling_domain: str, referer_domain: str,
 								                     domain: str, onion_domain: str) -> bool:
 								    """Returns true if the given domains show that a request came
 								    from an onion instance. Always false when this instance has
 								    no onion domain
 								    """
 								    if not onion_domain:
 								        return False
 								    if domain == onion_domain or calling_domain.endswith('.onion'):
 								        return True
 								    # lastly fall back to the referer, if there is one
 								    return bool(referer_domain) and referer_domain.endswith('.onion')
 								def is_i2p_request(calling_domain: str, referer_domain: str,
 								                   domain: str, i2p_domain: str) -> bool:
 								    """Returns true if the given domains show that a request came
 								    from an i2p instance. Always false when this instance has
 								    no i2p domain
 								    """
 								    if not i2p_domain:
 								        return False
 								    if domain == i2p_domain or calling_domain.endswith('.i2p'):
 								        return True
 								    # lastly fall back to the referer, if there is one
 								    return bool(referer_domain) and referer_domain.endswith('.i2p')
-												Use reply and announce inhibitors in desktop client

											
										
										
											2022-05-08 17:15:48 +00:00
-												Apply pixelfed style capabilities for announce permission

											
										
										
											2023-08-04 09:38:48 +00:00
def disallow_announce(content: str, attachment: [], capabilities: {}) -> bool:
    """Are announces/boosts not allowed for the given post?

    Returns True if any of the following applies:
    - capabilities['announce'] is a string which does not end
      with '#Public'
    - content contains one of the no-boost markers, ignoring case
    - attachment lists an image having a url but no description (name)
    """
    # pixelfed style capabilities
    if capabilities.get('announce'):
        if isinstance(capabilities['announce'], str):
            if not capabilities['announce'].endswith('#Public'):
                # TODO handle non-public announce permissions
                print('CAPABILITIES: announce ' + capabilities['announce'])
                return True
    # emojis
    disallow_strings = (
        ':boost_no:',
        ':noboost:',
        ':noboosts:',
        ':no_boost:',
        ':no_boosts:',
        ':boosts_no:',
        'dont_repeat',
        'dont_announce',
        'dont_boost',
        'do not boost',
        "don't boost",
        'boost_denied',
        'boosts_denied',
        'boostdenied',
        'boostsdenied'
    )
    content_lower = content.lower()
    if any(diss in content_lower for diss in disallow_strings):
        return True
    # check for attached images without descriptions
    if isinstance(attachment, list):
        for item in attachment:
            if not isinstance(item, dict):
                continue
            media_type = item.get('mediaType')
            # a malformed attachment may carry a mediaType which is not
            # a string, and so cannot be identified as an image
            if not media_type or not isinstance(media_type, str):
                continue
            if not item.get('url'):
                continue
            if not media_type.startswith('image/'):
                continue
            if not item.get('name'):
                # no image description
                return True
    return False
 								def disallow_reply(content: str) -> bool:
 								    """Returns true if the post content contains, ignoring case,
 								    any marker asking that the post is not replied to
 								    """
 								    no_reply_markers = (
 								        ':reply_no:',
 								        ':noreply:',
 								        ':noreplies:',
 								        ':no_reply:',
 								        ':no_replies:',
 								        ':replies_no:',
 								        'dont_at_me',
 								        'do not reply',
 								        "don't reply",
 								        "don't @ me",
 								        'dont@me',
 								        'dontatme'
 								    )
 								    content_lower = content.lower()
 								    return any(marker in content_lower for marker in no_reply_markers)
-												Prepare for alternative value field within attachments

											
										
										
											2022-05-11 17:17:23 +00:00
 								def get_attachment_property_value(property_value: {}) -> (str, str):
 								    """Returns the fieldname and value of the first non-empty value
 								    field found within an attachment property, or None for both
 								    if there is no such field
 								    """
 								    # listed in order of preference
 								    value_fieldnames = (
 								        'value',
 								        'http://schema.org#value',
 								        'https://schema.org#value',
 								        'href'
 								    )
 								    for prop_value_name in value_fieldnames:
 								        if property_value.get(prop_value_name):
 								            return prop_value_name, property_value[prop_value_name]
 								    return None, None
-												Check that strings passed to system commands are safe

											
										
										
											2022-07-22 10:54:57 +00:00
 								def safe_system_string(text: str) -> str:
 								    """Returns a safe version of a string which can be used within a
 								    system command
 								    Backticks are removed and every '$(' is reduced to '(' so that
 								    neither form of command substitution remains in the result.
 								    NOTE(review): other shell metacharacters, such as ; | and &,
 								    are left in place
 								    """
 								    # backticks go first, since removing one can join a '$' to a '('
 								    text = text.replace('`', '')
 								    # repeat until stable, because a single pass turns '$$(' into '$('
 								    while '$(' in text:
 								        text = text.replace('$(', '(')
 								    return text
-												Tidying

											
										
										
											2022-09-13 09:27:43 +00:00
 								def get_json_content_from_accept(accept: str) -> str:
 								    """Returns the json content type to use for the given accept
 								    string: application/ld+json if it is mentioned, and otherwise
 								    application/json
 								    """
 								    if accept and 'application/ld+json' in accept:
 								        return 'application/ld+json'
 								    return 'application/json'
-												Check for inverted text

											
										
										
											2022-09-25 17:26:11 +00:00
 								def remove_inverted_text(text: str, system_language: str) -> str:
 								    """Removes any inverted text from the given string
 								    Only applied when the system language is 'en'. Within each
 								    paragraph the upside-down look-alike characters are replaced by
 								    the letters which they imitate, and a paragraph in which more
 								    than two different look-alikes were found is also reversed.
 								    """
 								    if system_language != 'en':
 								        return text
 								    # position N within each list is the look-alike for the letter
 								    # N places before z (or Z). '_' marks a letter without one
 								    inverted_lower = [*"_ʎ_ʍʌ_ʇ_ɹ____ɯʃʞɾıɥƃɟǝ_ɔ_ɐ"]
 								    inverted_upper = [*"_⅄__ᴧ∩⊥_ᴚΌԀ_ᴎ_⅂⋊ſ__⅁ℲƎ◖Ↄ𐐒∀"]
 								    alphabets = (
 								        (inverted_lower, ord('z')),
 								        (inverted_upper, ord('Z'))
 								    )
 								    if '</p>' in text:
 								        # html paragraphs
 								        text = text.replace('<p>', '')
 								        start_separator = '<p>'
 								        separator = '</p>'
 								    else:
 								        # plain text lines
 								        start_separator = ''
 								        separator = '\n'
 								    new_text = ''
 								    for para in text.split(separator):
 								        replaced_chars = 0
 								        for inverted_chars, last_letter in alphabets:
 								            for index, test_ch in enumerate(inverted_chars):
 								                if test_ch == '_' or test_ch not in para:
 								                    continue
 								                para = para.replace(test_ch, chr(last_letter - index))
 								                replaced_chars += 1
 								        if replaced_chars > 2:
 								            # enough look-alikes to conclude the text is upside down
 								            para = para[::-1]
 								        if not para:
 								            continue
 								        new_text += start_separator + para
 								        if separator in text:
 								            new_text += separator
 								    return new_text
-												Remove square capitals when filtering

											
										
										
											2022-10-05 17:55:24 +00:00
 								def remove_square_capitals(text: str, system_language: str) -> str:
 								    """Removes any square capital text from the given string
 								    Only applied when the system language is 'en'. Each of the 26
 								    characters beginning at '🅰' is replaced by the ordinary capital
 								    letter at the same position in the alphabet, and every other
 								    character is kept as it is.
 								    """
 								    if system_language != 'en':
 								        return text
 								    offset = ord('A')
 								    start_value = ord('🅰')
 								    # 26 letters, so the last one is 25 code points after the first
 								    end_value = start_value + 25
 								    return ''.join(
 								        chr(offset + ord(text_ch) - start_value)
 								        if start_value <= ord(text_ch) <= end_value else text_ch
 								        for text_ch in text)
-												Screen readers don't announce hashes

											
										
										
											2022-11-11 11:26:17 +00:00
 								def dont_speak_hashtags(content: str) -> str:
 								    """Wraps the hash character of each hashtag within the content
 								    in an aria-hidden span, so that screen readers don't announce it
 								    """
 								    if content:
 								        hidden_hash = '><span aria-hidden="true">#</span><span'
 								        return content.replace('>#<span', hidden_hash)
 								    return content
-												Minimize all images on edit profile screen

											
										
										
											2022-11-13 19:45:34 +00:00
 								def load_min_images_for_accounts(base_dir: str) -> []:
 								    """Returns the nicknames of the accounts under base_dir/accounts
 								    which contain a .minimize_all_images file, these being the
 								    accounts where all images should be minimized by default
 								    """
 								    min_images_for_accounts = []
 								    for subdir, dirs, _ in os.walk(base_dir + '/accounts'):
 								        min_images_for_accounts = [
 								            account.split('@')[0] for account in dirs
 								            if is_account_dir(account) and
 								            os.path.isfile(os.path.join(subdir, account) +
 								                           '/.minimize_all_images')
 								        ]
 								        # only the top level of the accounts directory is examined
 								        break
 								    return min_images_for_accounts
 								def set_minimize_all_images(base_dir: str,
 								                            nickname: str, domain: str,
 								                            minimize: bool,
 								                            min_images_for_accounts: []) -> None:
 								    """Adds or removes the file indicating that all images for an
 								    account should be minimized by default, and keeps the given
 								    list of nicknames in step with it
 								    """
 								    filename = acct_dir(base_dir, nickname, domain) + '/.minimize_all_images'
 								    if not minimize:
 								        # switch off: forget the nickname and remove the marker file
 								        if nickname in min_images_for_accounts:
 								            min_images_for_accounts.remove(nickname)
 								        if os.path.isfile(filename):
 								            try:
 								                os.remove(filename)
 								            except OSError:
 								                print('EX: unable to delete ' + filename)
 								        return
 								    # switch on: remember the nickname and create the marker file
 								    if nickname not in min_images_for_accounts:
 								        min_images_for_accounts.append(nickname)
 								    if os.path.isfile(filename):
 								        return
 								    try:
 								        with open(filename, 'w+', encoding='utf-8') as fp_min:
 								            fp_min.write('\n')
 								    except OSError:
 								        print('EX: unable to write ' + filename)
-												Read reverse sequence flags from file

											
										
										
											2022-11-26 15:39:36 +00:00
 								def load_reverse_timeline(base_dir: str) -> []:
 								    """Returns the nicknames of the accounts which have a
 								    .reverse_timeline file, showing that they prefer to see
 								    reversed timelines
 								    """
 								    reverse_sequence = []
 								    for _, dirs, _ in os.walk(base_dir + '/accounts'):
 								        for acct in dirs:
 								            if not is_account_dir(acct):
 								                continue
 								            acct_parts = acct.split('@')
 								            nickname = acct_parts[0]
 								            domain = acct_parts[1]
 								            reverse_filename = \
 								                acct_dir(base_dir, nickname, domain) + '/.reverse_timeline'
 								            if not os.path.isfile(reverse_filename):
 								                continue
 								            # the same nickname is only listed once
 								            if nickname not in reverse_sequence:
 								                reverse_sequence.append(nickname)
 								        # only the top level of the accounts directory is examined
 								        break
 								    return reverse_sequence
-												Option to reverse the sequence of timelines

											
										
										
											2022-11-26 16:27:01 +00:00
 								def save_reverse_timeline(base_dir: str, reverse_sequence: []) -> []:
 								    """Creates a .reverse_timeline file for every account whose
 								    nickname is within the given list, and deletes that file for
 								    every other account. Nothing is returned
 								    """
 								    for _, dirs, _ in os.walk(base_dir + '/accounts'):
 								        for acct in dirs:
 								            if not is_account_dir(acct):
 								                continue
 								            acct_parts = acct.split('@')
 								            nickname = acct_parts[0]
 								            domain = acct_parts[1]
 								            reverse_filename = \
 								                acct_dir(base_dir, nickname, domain) + '/.reverse_timeline'
 								            flag_exists = os.path.isfile(reverse_filename)
 								            if nickname in reverse_sequence:
 								                if flag_exists:
 								                    continue
 								                try:
 								                    with open(reverse_filename, 'w+',
 								                              encoding='utf-8') as fp_reverse:
 								                        fp_reverse.write('\n')
 								                except OSError:
 								                    print('EX: failed to save reverse ' + reverse_filename)
 								                continue
 								            if not flag_exists:
 								                continue
 								            try:
 								                os.remove(reverse_filename)
 								            except OSError:
 								                print('EX: failed to delete reverse ' +
 								                      reverse_filename)
 								        # only the top level of the accounts directory is examined
 								        break
-												Reject quote toots

											
										
										
											2022-12-24 15:33:26 +00:00
-												Reject quote toot based upon content

											
										
										
											2023-01-03 15:43:52 +00:00
+								def is_quote_toot(post_json_object: str, content: str) -> bool:
-												Buy links

											
										
										
											2023-01-13 15:04:48 +00:00
+								    """Returns true if the given post is a quote toot / quote tweet
-												Reject quote toots

											
										
										
											2022-12-24 15:33:26 +00:00
+								    """
-												Comments

											
										
										
											2023-01-08 13:16:54 +00:00
+								    # Pleroma/Misskey implementations
-												Quote toot detection

											
										
										
											2022-12-24 16:52:16 +00:00
+								    if post_json_object['object'].get('quoteUri') or \
-												Not duplicate

											
										
										
											2023-02-13 09:29:01 +00:00
+								       post_json_object['object'].get('quoteUrl') or \
-												Additional quote toot style

											
										
										
											2023-07-19 09:59:34 +00:00
+								       post_json_object['object'].get('quoteReply') or \
 								       post_json_object['object'].get('toot:quoteReply') or \
-												Extra QT field

											
										
										
											2023-01-08 13:14:36 +00:00
+								       post_json_object['object'].get('_misskey_quote'):
-												Reject quote toots

											
										
										
											2022-12-24 15:33:26 +00:00
+								        return True
-												Comments

											
										
										
											2023-01-08 13:16:54 +00:00
+								    # More correct ActivityPub implementation - adding a Link tag
-												Alternate quote tweet formats

											
										
										
											2022-12-24 17:07:24 +00:00
+								    if post_json_object['object'].get('tag'):
 								        if isinstance(post_json_object['object']['tag'], list):
 								            for item in post_json_object['object']['tag']:
 								                if not isinstance(item, dict):
 								                    continue
-												Extra quote toot style

											
										
										
											2023-04-26 15:07:03 +00:00
+								                if item.get('rel'):
 								                    if isinstance(item['rel'], list):
 								                        for rel_str in item['rel']:
 								                            if not isinstance(rel_str, str):
 								                                continue
 								                            if '_misskey_quote' in rel_str:
 								                                return True
 								                    elif isinstance(item['rel'], str):
 								                        if '_misskey_quote' in item['rel']:
 								                            return True
-												Alternate quote tweet formats

											
										
										
											2022-12-24 17:07:24 +00:00
+								                if not item.get('type'):
 								                    continue
 								                if not item.get('mediaType'):
 								                    continue
-												Check field types

											
										
										
											2022-12-24 17:48:09 +00:00
+								                if not isinstance(item['type'], str):
 								                    continue
-												Alternate quote tweet formats

											
										
										
											2022-12-24 17:07:24 +00:00
+								                if item['type'] != 'Link':
 								                    continue
-												Check field types

											
										
										
											2022-12-24 17:48:09 +00:00
+								                if not isinstance(item['mediaType'], str):
 								                    continue
-												Alternate quote tweet formats

											
										
										
											2022-12-24 17:07:24 +00:00
+								                if 'json' not in item['mediaType']:
 								                    continue
 								                return True
-												Comments

											
										
										
											2023-01-08 13:16:54 +00:00
+								    # Twitter-style indicator
-												Reject quote toot based upon content

											
										
										
											2023-01-03 15:43:52 +00:00
+								    if content:
 								        if 'QT: ' in content:
 								            return True
-												Reject quote toots

											
										
										
											2022-12-24 15:33:26 +00:00
+								    return False
-												Set license link from name

											
										
										
											2022-12-27 21:30:20 +00:00
 								def license_link_from_name(license: str) -> str:
 								    """Returns the license link from its name.
 								    If the given text already contains a url then it is returned
 								    unchanged. Otherwise the name is matched without regard to case
 								    against known license names, with the more specific names being
 								    tested first. Creative Commons links are always for version 4.0.
 								    Unrecognised names give the CC0 public domain dedication link
 								    """
 								    if '://' in license:
 								        return license
 								    value_upper = license.upper()
 								    # Creative Commons names are usually written with mixed separators,
 								    # such as "CC BY-NC-SA 4.0", so compare them with hyphens as spaces
 								    cc_name = value_upper.replace('-', ' ')
 								    if 'CC BY SA NC' in cc_name or 'CC BY NC SA' in cc_name:
 								        value = 'https://creativecommons.org/licenses/by-nc-sa/4.0'
 								    elif 'CC BY NC ND' in cc_name or 'CC BY ND NC' in cc_name:
 								        # must be tested before the shorter BY-NC and BY-ND names
 								        value = 'https://creativecommons.org/licenses/by-nc-nd/4.0'
 								    elif 'CC BY SA' in cc_name or 'CC SA BY' in cc_name:
 								        value = 'https://creativecommons.org/licenses/by-sa/4.0'
 								    elif 'CC BY NC' in cc_name:
 								        value = 'https://creativecommons.org/licenses/by-nc/4.0'
 								    elif 'CC BY ND' in cc_name:
 								        value = 'https://creativecommons.org/licenses/by-nd/4.0'
 								    elif 'CC BY' in cc_name:
 								        value = 'https://creativecommons.org/licenses/by/4.0'
 								    elif 'GFDL' in value_upper or 'GNU FREE DOC' in value_upper:
 								        value = 'https://www.gnu.org/licenses/fdl-1.3.html'
 								    elif 'OPL' in value_upper or 'OPEN PUBLICATION LIC' in value_upper:
 								        value = 'https://opencontent.org/openpub'
 								    elif 'PDDL' in value_upper or 'OPEN DATA COMMONS PUBLIC' in value_upper:
 								        value = 'https://opendatacommons.org/licenses/pddl'
 								    elif 'ODBL' in value_upper or 'OPEN DATA COMMONS OPEN' in value_upper:
 								        value = 'https://opendatacommons.org/licenses/odbl'
 								    elif 'ODC' in value_upper or 'OPEN DATA COMMONS ATTR' in value_upper:
 								        value = 'https://opendatacommons.org/licenses/by'
 								    elif 'OGL' in value_upper or 'OPEN GOVERNMENT LIC' in value_upper:
 								        value = \
 								            'https://www.nationalarchives.gov.uk/doc/open-government-licence'
 								    elif 'PDL' in value_upper or \
 								         'PUBLIC DOCUMENTATION LIC' in value_upper:
 								        value = 'http://www.openoffice.org/licenses/PDL.html'
 								    elif 'FREEBSD' in value_upper:
 								        value = 'https://www.freebsd.org/copyright/freebsd-doc-license'
 								    elif 'WTF' in value_upper:
 								        value = 'http://www.wtfpl.net/txt/copying'
 								    elif 'UNLICENSE' in value_upper:
 								        value = 'https://unlicense.org'
 								    else:
 								        value = 'https://creativecommons.org/publicdomain/zero/1.0'
 								    return value
-												Escape text within blog rss feed

											
										
										
											2023-01-02 09:55:41 +00:00
-												Tidying

											
										
										
											2023-01-02 11:41:48 +00:00
+								def _get_escaped_chars() -> {}:
 								    """Returns escaped characters
-												Escape text within blog rss feed

											
										
										
											2023-01-02 09:55:41 +00:00
+								    """
-												Tidying

											
										
										
											2023-01-02 11:41:48 +00:00
+								    return {
-												Escape text within blog rss feed

											
										
										
											2023-01-02 09:55:41 +00:00
+								        "&": "&amp;",
 								        "<": "&lt;",
 								        ">": "&gt;",
 								        '"': "&quot;",
 								        "'": "&apos;"
 								    }
-												Tidying

											
										
										
											2023-01-02 11:41:48 +00:00
 								def escape_text(txt: str) -> str:
 								    """Returns the given text with each of the characters listed by
 								    _get_escaped_chars replaced by its entity, so that the text
 								    can be included within xml/rss
 								    """
 								    escaped = txt
 								    for plain_char, entity in _get_escaped_chars().items():
 								        escaped = escaped.replace(plain_char, entity)
 								    return escaped
-												Escape rss titles and descriptions

											
										
										
											2023-01-02 10:24:35 +00:00
 								def unescaped_text(txt: str) -> str:
 								    """Reverses escape_text, converting the xml/rss entities listed
 								    by _get_escaped_chars back into their original characters
 								    """
 								    # _get_escaped_chars lists the ampersand first, so go through the
 								    # entities in reverse order to convert "&amp;" last. Otherwise
 								    # "&amp;lt;" would become "&lt;" and then wrongly become "<"
 								    for orig, replacement in reversed(list(_get_escaped_chars().items())):
 								        txt = txt.replace(replacement, orig)
 								    return txt
-												Tidying

											
										
										
											2023-01-07 11:45:19 +00:00
 								def harmless_markup(post_json_object: {}) -> None:
 								    """Renders harmless any dangerous markup within the content and
 								    summary of the given post, together with their per-language maps.
 								    Text which dangerous_markup flags, with the pre tag being allowed,
 								    has its html removed. The pre tag is then removed from the text
 								    in every case. The post is altered in place
 								    """
 								    post_obj = post_json_object['object']
 								    for field_name in ('content', 'summary'):
 								        field_text = post_obj.get(field_name)
 								        if field_text:
 								            if dangerous_markup(field_text, False, ['pre']):
 								                field_text = remove_html(field_text)
 								                post_obj[field_name] = field_text
 								            post_obj[field_name] = remove_markup_tag(field_text, 'pre')
 								        # the same treatment for each language within the map
 								        map_name = field_name + 'Map'
 								        lang_map = post_obj.get(map_name)
 								        if not lang_map:
 								            continue
 								        for lang, lang_text in lang_map.items():
 								            # entries which are not text are left as they are
 								            if not isinstance(lang_text, str):
 								                continue
 								            if dangerous_markup(lang_text, False, ['pre']):
 								                lang_text = remove_html(lang_text)
 								                lang_map[lang] = lang_text
 								            lang_map[lang] = remove_markup_tag(lang_text, 'pre')
-												Show proxied actors

											
										
										
											2023-05-12 13:47:28 +00:00
-												More general

											
										
										
											2023-05-12 14:39:26 +00:00
+								def ap_proxy_type(json_object: {}) -> str:
 								    """Returns a string indicating the proxy for an activitypub post
-												Show proxied actors

											
										
										
											2023-05-12 13:47:28 +00:00
+								    or None if not proxied
-												Comment

											
										
										
											2023-05-12 17:13:33 +00:00
+								    See https://codeberg.org/fediverse/fep/src/branch/main/feps/fep-fffd.md
-												Show proxied actors

											
										
										
											2023-05-12 13:47:28 +00:00
+								    """
-												More general

											
										
										
											2023-05-12 14:39:26 +00:00
+								    if not json_object.get('proxyOf'):
-												Show proxied actors

											
										
										
											2023-05-12 13:47:28 +00:00
+								        return None
-												More general

											
										
										
											2023-05-12 14:39:26 +00:00
+								    if not isinstance(json_object['proxyOf'], list):
-												Show proxied actors

											
										
										
											2023-05-12 13:47:28 +00:00
+								        return None
-												More general

											
										
										
											2023-05-12 14:39:26 +00:00
+								    for proxy_dict in json_object['proxyOf']:
-												Show proxied actors

											
										
										
											2023-05-12 13:47:28 +00:00
+								        if proxy_dict.get('protocol'):
 								            if isinstance(proxy_dict['protocol'], str):
 								                return proxy_dict['protocol']
 								    return None