epicyon/speaker.py

547 lines
19 KiB
Python
Raw Normal View History

2021-03-01 19:16:33 +00:00
__filename__ = "speaker.py"
__author__ = "Bob Mottram"
__license__ = "AGPL3+"
__version__ = "1.2.0"
__maintainer__ = "Bob Mottram"
__email__ = "bob@freedombone.net"
__status__ = "Production"
2021-03-02 12:39:18 +00:00
import os
2021-03-03 19:06:18 +00:00
import html
2021-03-01 19:16:33 +00:00
import random
2021-03-03 19:06:18 +00:00
import urllib.parse
2021-03-01 19:16:33 +00:00
from auth import createBasicAuthHeader
from session import getJson
from utils import isDM
from utils import camelCaseSplit
2021-03-03 19:06:18 +00:00
from utils import getDomainFromActor
from utils import getNicknameFromActor
from utils import getGenderFromBio
from utils import getDisplayName
from utils import removeHtml
2021-03-03 12:34:46 +00:00
from utils import loadJson
2021-03-03 19:06:18 +00:00
from utils import saveJson
2021-03-01 19:16:33 +00:00
from utils import getFullDomain
2021-03-12 12:04:34 +00:00
from utils import isPGPEncrypted
2021-03-03 19:06:18 +00:00
from content import htmlReplaceQuoteMarks
2021-03-01 19:16:33 +00:00
2021-03-03 12:34:46 +00:00
speakerRemoveChars = ('.\n', '. ', ',', ';', '?', '!')
2021-03-01 19:16:33 +00:00
def getSpeakerPitch(displayName: str, screenreader: str, gender) -> int:
2021-03-01 19:16:33 +00:00
"""Returns the speech synthesis pitch for the given name
"""
random.seed(displayName)
rangeMin = 1
rangeMax = 100
if 'She' in gender:
rangeMin = 50
elif 'Him' in gender:
rangeMax = 50
2021-03-02 15:13:10 +00:00
if screenreader == 'picospeaker':
2021-03-03 20:19:56 +00:00
rangeMin = -6
rangeMax = 3
if 'She' in gender:
rangeMin = -1
elif 'Him' in gender:
rangeMax = -1
return random.randint(rangeMin, rangeMax)
2021-03-01 19:16:33 +00:00
2021-03-02 15:13:10 +00:00
def getSpeakerRate(displayName: str, screenreader: str) -> int:
2021-03-01 19:16:33 +00:00
"""Returns the speech synthesis rate for the given name
"""
random.seed(displayName)
2021-03-02 15:13:10 +00:00
if screenreader == 'picospeaker':
2021-03-03 21:21:17 +00:00
return random.randint(-40, -20)
2021-03-01 19:16:33 +00:00
return random.randint(50, 120)
def getSpeakerRange(displayName: str) -> int:
"""Returns the speech synthesis range for the given name
"""
random.seed(displayName)
return random.randint(300, 800)
2021-03-03 19:06:18 +00:00
def _speakerPronounce(baseDir: str, sayText: str, translate: {}) -> str:
2021-03-02 12:39:18 +00:00
"""Screen readers may not always pronounce correctly, so you
can have a file which specifies conversions. File should contain
line items such as:
Epicyon -> Epi-cyon
"""
pronounceFilename = baseDir + '/accounts/speaker_pronounce.txt'
2021-03-03 19:15:32 +00:00
convertDict = {}
if translate:
convertDict = {
"Epicyon": "Epi-cyon",
"espeak": "e-speak",
"emoji": "emowji",
"clearnet": "clear-net",
"https": "H-T-T-P-S",
"HTTPS": "H-T-T-P-S",
2021-03-03 20:41:22 +00:00
"XMPP": "X-M-P-P",
"xmpp": "X-M-P-P",
2021-03-03 22:26:54 +00:00
"sql": "S-Q-L",
2021-03-08 22:02:54 +00:00
".js": " dot J-S",
2021-03-04 11:51:30 +00:00
"PSQL": "Postgres S-Q-L",
2021-03-03 22:26:54 +00:00
"SQL": "S-Q-L",
2021-03-11 12:44:47 +00:00
"gdpr": "G-D-P-R",
2021-03-13 10:07:57 +00:00
"kde": "K-D-E",
2021-03-14 11:17:37 +00:00
"AGPL": "Affearo G-P-L",
"agpl": "Affearo G-P-L",
"GPL": "G-P-L",
"gpl": "G-P-L",
2021-03-04 15:54:52 +00:00
"coop": "co-op",
2021-03-04 11:51:30 +00:00
"KMail": "K-Mail",
2021-03-13 10:10:02 +00:00
"kmail": "K-Mail",
2021-03-04 11:51:30 +00:00
"gmail": "G-mail",
"Gmail": "G-mail",
"OpenPGP": "Open P-G-P",
2021-03-03 19:15:32 +00:00
"Tor": "Toor",
2021-03-10 18:44:44 +00:00
"memes": "meemes",
"Memes": "Meemes",
2021-03-10 20:43:02 +00:00
"rofl": "roll on the floor laughing",
"ROFL": "roll on the floor laughing",
2021-03-10 13:45:34 +00:00
"fwiw": "for what it's worth",
"fyi": "for your information",
2021-03-10 21:08:18 +00:00
"irl": "in real life",
"IRL": "in real life",
2021-03-10 13:45:34 +00:00
"imho": "in my opinion",
2021-03-09 20:06:26 +00:00
"fediverse": "fediiverse",
"Fediverse": "Fediiverse",
2021-03-04 16:46:21 +00:00
" foss ": " free and open source software ",
" floss ": " free libre and open source software ",
" FOSS ": "free and open source software",
" FLOSS ": "free libre and open source software",
" oss ": " open source software ",
" OSS ": " open source software ",
2021-03-03 19:15:32 +00:00
"🤔": ". " + translate["thinking emoji"],
"RT @": "Re-Tweet ",
2021-03-03 20:56:35 +00:00
"#nowplaying": translate["hashtag"] + " now-playing",
"#NowPlaying": translate["hashtag"] + " now-playing",
2021-03-03 20:59:21 +00:00
"#": translate["hashtag"] + ' ',
2021-03-03 19:15:32 +00:00
":D": '. ' + translate["laughing"],
":-D": '. ' + translate["laughing"],
":)": '. ' + translate["smile"],
";)": '. ' + translate["wink"],
":(": '. ' + translate["sad face"],
":-)": '. ' + translate["smile"],
":-(": '. ' + translate["sad face"],
";-)": '. ' + translate["wink"],
2021-03-10 10:43:53 +00:00
":O": '. ' + translate['shocked'],
2021-03-04 15:54:52 +00:00
"?": "? ",
2021-03-04 16:20:24 +00:00
'"': "'",
2021-03-03 21:30:01 +00:00
"*": "",
"(": ",",
")": ","
2021-03-03 19:15:32 +00:00
}
2021-03-02 12:39:18 +00:00
if os.path.isfile(pronounceFilename):
with open(pronounceFilename, 'r') as fp:
pronounceList = fp.readlines()
for conversion in pronounceList:
separator = None
if '->' in conversion:
separator = '->'
elif ';' in conversion:
separator = ';'
elif ':' in conversion:
separator = ':'
elif ',' in conversion:
separator = ','
if not separator:
continue
text = conversion.split(separator)[0].strip()
converted = conversion.split(separator)[1].strip()
convertDict[text] = converted
for text, converted in convertDict.items():
if text in sayText:
sayText = sayText.replace(text, converted)
return sayText
def speakerReplaceLinks(sayText: str, translate: {},
detectedLinks: []) -> str:
"""Replaces any links in the given text with "link to [domain]".
Instead of reading out potentially very long and meaningless links
"""
text = sayText
2021-03-03 12:34:46 +00:00
for ch in speakerRemoveChars:
text = text.replace(ch, ' ')
replacements = {}
wordsList = text.split(' ')
2021-03-03 19:15:32 +00:00
if translate.get('Linked'):
linkedStr = translate['Linked']
else:
linkedStr = 'Linked'
2021-03-02 14:05:43 +00:00
prevWord = ''
for word in wordsList:
2021-03-11 11:35:03 +00:00
if word.startswith('v='):
2021-03-11 12:24:20 +00:00
replacements[word] = ''
2021-03-02 16:50:32 +00:00
if word.startswith(':'):
if word.endswith(':'):
2021-03-02 17:18:47 +00:00
replacements[word] = ', emowji ' + word.replace(':', '') + ','
2021-03-02 16:50:32 +00:00
continue
2021-03-02 14:09:51 +00:00
if word.startswith('@') and not prevWord.endswith('RT'):
2021-03-11 11:35:03 +00:00
# replace mentions, but not re-tweets
2021-03-03 19:15:32 +00:00
if translate.get('mentioning'):
replacements[word] = \
2021-03-04 11:52:22 +00:00
translate['mentioning'] + ' ' + word[1:] + ', '
2021-03-02 14:05:43 +00:00
prevWord = word
domain = None
domainFull = None
if 'https://' in word:
domain = word.split('https://')[1]
domainFull = 'https://' + domain
elif 'http://' in word:
domain = word.split('http://')[1]
domainFull = 'http://' + domain
if not domain:
continue
if '/' in domain:
domain = domain.split('/')[0]
if domain.startswith('www.'):
domain = domain.replace('www.', '')
replacements[domainFull] = '. ' + linkedStr + ' ' + domain + '.'
detectedLinks.append(domainFull)
for replaceStr, newStr in replacements.items():
sayText = sayText.replace(replaceStr, newStr)
return sayText.replace('..', '.')
2021-03-03 12:34:46 +00:00
def _addSSMLemphasis(sayText: str) -> str:
"""Adds emphasis to *emphasised* text
"""
if '*' not in sayText:
return sayText
text = sayText
for ch in speakerRemoveChars:
text = text.replace(ch, ' ')
wordsList = text.split(' ')
replacements = {}
for word in wordsList:
if word.startswith('*'):
if word.endswith('*'):
replacements[word] = \
'<emphasis level="strong">' + \
word.replace('*', '') + \
'</emphasis>'
for replaceStr, newStr in replacements.items():
sayText = sayText.replace(replaceStr, newStr)
return sayText
2021-03-03 19:06:18 +00:00
def _removeEmojiFromText(sayText: str) -> str:
2021-03-03 18:24:37 +00:00
"""Removes :emoji: from the given text
"""
2021-03-03 20:18:14 +00:00
if ':' not in sayText:
2021-03-03 18:24:37 +00:00
return sayText
text = sayText
for ch in speakerRemoveChars:
text = text.replace(ch, ' ')
wordsList = text.split(' ')
replacements = {}
for word in wordsList:
if word.startswith(':'):
if word.endswith(':'):
2021-03-03 22:05:56 +00:00
replacements[word] = ''
2021-03-03 18:24:37 +00:00
for replaceStr, newStr in replacements.items():
sayText = sayText.replace(replaceStr, newStr)
return sayText.replace(' ', ' ').strip()
2021-03-01 19:16:33 +00:00
def getSpeakerFromServer(baseDir: str, session,
nickname: str, password: str,
domain: str, port: int,
httpPrefix: str,
debug: bool, projectVersion: str) -> {}:
"""Returns some json which contains the latest inbox
entry in a minimal format suitable for a text-to-speech reader
"""
if not session:
print('WARN: No session for getSpeakerFromServer')
return 6
domainFull = getFullDomain(domain, port)
authHeader = createBasicAuthHeader(nickname, password)
headers = {
'host': domain,
'Content-type': 'application/json',
'Authorization': authHeader
}
url = \
httpPrefix + '://' + \
domainFull + '/users/' + nickname + '/speaker'
speakerJson = \
getJson(session, url, headers, None,
2021-03-10 15:47:12 +00:00
__version__, httpPrefix, domain, 20, True)
2021-03-01 19:16:33 +00:00
return speakerJson
2021-03-03 12:34:46 +00:00
2021-03-03 19:06:18 +00:00
def _speakerEndpointJson(displayName: str, summary: str,
2021-03-11 10:10:56 +00:00
content: str, sayContent: str,
imageDescription: str,
links: [], gender: str, postId: str,
2021-03-09 15:01:35 +00:00
postDM: bool, postReply: bool,
followRequestsExist: bool,
likedBy: str, published: str, postCal: bool,
postShare: bool, themeName: str,
isDirect: bool) -> {}:
2021-03-03 12:34:46 +00:00
"""Returns a json endpoint for the TTS speaker
"""
2021-03-03 13:02:47 +00:00
speakerJson = {
2021-03-03 12:34:46 +00:00
"name": displayName,
"summary": summary,
2021-03-11 10:10:56 +00:00
"content": content,
"say": sayContent,
"published": published,
2021-03-03 12:34:46 +00:00
"imageDescription": imageDescription,
"detectedLinks": links,
"id": postId,
"direct": isDirect,
"notify": {
2021-03-09 19:52:10 +00:00
"theme": themeName,
"dm": postDM,
2021-03-09 15:01:35 +00:00
"reply": postReply,
"followRequests": followRequestsExist,
"likedBy": likedBy,
"calendar": postCal,
"share": postShare
}
2021-03-03 12:34:46 +00:00
}
2021-03-03 13:02:47 +00:00
if gender:
speakerJson['gender'] = gender
return speakerJson
2021-03-03 12:34:46 +00:00
2021-03-04 10:25:36 +00:00
def _SSMLheader(systemLanguage: str, instanceTitle: str) -> str:
"""Returns a header for an SSML document
"""
return '<?xml version="1.0"?>\n' + \
'<speak xmlns="http://www.w3.org/2001/10/synthesis"\n' + \
' xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"\n' + \
' xsi:schemaLocation="http://www.w3.org/2001/10/synthesis\n' + \
' http://www.w3.org/TR/speech-synthesis11/synthesis.xsd"\n' + \
' version="1.1">\n' + \
' <metadata>\n' + \
' <dc:title xml:lang="' + systemLanguage + '">' + \
instanceTitle + ' inbox</dc:title>\n' + \
' </metadata>\n'
2021-03-03 12:34:46 +00:00
def _speakerEndpointSSML(displayName: str, summary: str,
content: str, imageDescription: str,
links: [], language: str,
instanceTitle: str,
gender: str) -> str:
"""Returns an SSML endpoint for the TTS speaker
https://en.wikipedia.org/wiki/Speech_Synthesis_Markup_Language
https://www.w3.org/TR/speech-synthesis/
"""
langShort = 'en'
if language:
langShort = language[:2]
if not gender:
gender = 'neutral'
else:
if langShort == 'en':
gender = gender.lower()
2021-03-03 13:02:47 +00:00
if 'he/him' in gender:
2021-03-03 12:34:46 +00:00
gender = 'male'
2021-03-03 13:02:47 +00:00
elif 'she/her' in gender:
2021-03-03 12:34:46 +00:00
gender = 'female'
else:
gender = 'neutral'
content = _addSSMLemphasis(content)
voiceParams = 'name="' + displayName + '" gender="' + gender + '"'
2021-03-04 10:25:36 +00:00
return _SSMLheader(langShort, instanceTitle) + \
2021-03-03 12:34:46 +00:00
' <p>\n' + \
' <s xml:lang="' + language + '">\n' + \
' <voice ' + voiceParams + '>\n' + \
' ' + content + '\n' + \
' </voice>\n' + \
' </s>\n' + \
' </p>\n' + \
'</speak>\n'
def getSSMLbox(baseDir: str, path: str,
domain: str,
systemLanguage: str,
instanceTitle: str,
boxName: str) -> str:
"""Returns SSML for the given timeline
"""
nickname = path.split('/users/')[1]
if '/' in nickname:
nickname = nickname.split('/')[0]
speakerFilename = \
baseDir + '/accounts/' + nickname + '@' + domain + '/speaker.json'
if not os.path.isfile(speakerFilename):
return None
speakerJson = loadJson(speakerFilename)
if not speakerJson:
return None
gender = None
if speakerJson.get('gender'):
gender = speakerJson['gender']
return _speakerEndpointSSML(speakerJson['name'],
speakerJson['summary'],
speakerJson['say'],
speakerJson['imageDescription'],
speakerJson['detectedLinks'],
systemLanguage,
instanceTitle, gender)
2021-03-03 19:06:18 +00:00
def _postToSpeakerJson(baseDir: str, httpPrefix: str,
nickname: str, domain: str, domainFull: str,
2021-03-04 10:11:30 +00:00
postJsonObject: {}, personCache: {},
2021-03-09 19:52:10 +00:00
translate: {}, announcingActor: str,
themeName: str) -> {}:
2021-03-04 10:11:30 +00:00
"""Converts an ActivityPub post into some Json containing
speech synthesis parameters.
NOTE: There currently appears to be no standardized json
format for speech synthesis
2021-03-03 19:06:18 +00:00
"""
if not postJsonObject.get('object'):
return
if not isinstance(postJsonObject['object'], dict):
return
if not postJsonObject['object'].get('content'):
return
if not isinstance(postJsonObject['object']['content'], str):
return
detectedLinks = []
content = urllib.parse.unquote_plus(postJsonObject['object']['content'])
content = html.unescape(content)
content = content.replace('<p>', '').replace('</p>', ' ')
2021-03-12 12:04:34 +00:00
if not isPGPEncrypted(content):
2021-03-11 17:15:32 +00:00
# replace some emoji before removing html
if ' <3' in content:
content = content.replace(' <3', ' ' + translate['heart'])
content = removeHtml(htmlReplaceQuoteMarks(content))
content = speakerReplaceLinks(content, translate, detectedLinks)
# replace all double spaces
while ' ' in content:
content = content.replace(' ', ' ')
content = content.replace(' . ', '. ').strip()
sayContent = content
sayContent = _speakerPronounce(baseDir, content, translate)
# replace all double spaces
while ' ' in sayContent:
sayContent = sayContent.replace(' ', ' ')
sayContent = sayContent.replace(' . ', '. ').strip()
else:
sayContent = content
2021-03-03 19:06:18 +00:00
imageDescription = ''
if postJsonObject['object'].get('attachment'):
attachList = postJsonObject['object']['attachment']
if isinstance(attachList, list):
for img in attachList:
if not isinstance(img, dict):
continue
if img.get('name'):
if isinstance(img['name'], str):
imageDescription += \
img['name'] + '. '
isDirect = isDM(postJsonObject)
published = ''
if postJsonObject['object'].get('published'):
published = postJsonObject['object']['published']
2021-03-03 19:06:18 +00:00
summary = ''
if postJsonObject['object'].get('summary'):
if isinstance(postJsonObject['object']['summary'], str):
summary = \
urllib.parse.unquote_plus(postJsonObject['object']['summary'])
summary = html.unescape(summary)
speakerName = \
getDisplayName(baseDir, postJsonObject['actor'], personCache)
if not speakerName:
return
speakerName = _removeEmojiFromText(speakerName)
2021-03-03 20:22:18 +00:00
speakerName = speakerName.replace('_', ' ')
speakerName = camelCaseSplit(speakerName)
2021-03-03 19:06:18 +00:00
gender = getGenderFromBio(baseDir, postJsonObject['actor'],
personCache, translate)
if announcingActor:
announcedNickname = getNicknameFromActor(announcingActor)
2021-03-03 19:36:13 +00:00
announcedDomain, announcedport = getDomainFromActor(announcingActor)
2021-03-03 19:31:23 +00:00
if announcedNickname and announcedDomain:
announcedHandle = announcedNickname + '@' + announcedDomain
2021-03-11 10:10:56 +00:00
sayContent = \
translate['announces'] + ' ' + \
announcedHandle + '. ' + sayContent
content = \
translate['announces'] + ' ' + \
announcedHandle + '. ' + content
postId = None
if postJsonObject['object'].get('id'):
postId = postJsonObject['object']['id']
2021-03-09 15:01:35 +00:00
followRequestsExist = False
accountsDir = baseDir + '/accounts/' + nickname + '@' + domainFull
approveFollowsFilename = accountsDir + '/followrequests.txt'
if os.path.isfile(approveFollowsFilename):
with open(approveFollowsFilename, 'r') as fp:
follows = fp.readlines()
if len(follows) > 0:
followRequestsExist = True
2021-03-09 22:25:32 +00:00
postDM = False
dmFilename = accountsDir + '/.newDM'
if os.path.isfile(dmFilename):
postDM = True
postReply = False
replyFilename = accountsDir + '/.newReply'
if os.path.isfile(replyFilename):
postReply = True
2021-03-09 15:01:35 +00:00
likedBy = ''
likeFilename = accountsDir + '/.newLike'
if os.path.isfile(likeFilename):
with open(likeFilename, 'r') as fp:
likedBy = fp.read()
calendarFilename = accountsDir + '/.newCalendar'
postCal = os.path.isfile(calendarFilename)
shareFilename = accountsDir + '/.newShare'
postShare = os.path.isfile(shareFilename)
2021-03-09 15:01:35 +00:00
2021-03-04 10:11:30 +00:00
return _speakerEndpointJson(speakerName, summary,
2021-03-11 10:10:56 +00:00
content, sayContent, imageDescription,
detectedLinks, gender, postId,
2021-03-09 15:01:35 +00:00
postDM, postReply,
followRequestsExist,
likedBy, published,
postCal, postShare, themeName,
isDirect)
2021-03-04 10:11:30 +00:00
def updateSpeaker(baseDir: str, httpPrefix: str,
nickname: str, domain: str, domainFull: str,
2021-03-04 10:11:30 +00:00
postJsonObject: {}, personCache: {},
2021-03-09 19:52:10 +00:00
translate: {}, announcingActor: str,
themeName: str) -> None:
2021-03-04 10:11:30 +00:00
""" Generates a json file which can be used for TTS announcement
of incoming inbox posts
"""
speakerJson = \
_postToSpeakerJson(baseDir, httpPrefix,
nickname, domain, domainFull,
2021-03-04 10:11:30 +00:00
postJsonObject, personCache,
2021-03-09 19:52:10 +00:00
translate, announcingActor,
themeName)
2021-03-04 10:11:30 +00:00
speakerFilename = \
baseDir + '/accounts/' + nickname + '@' + domain + '/speaker.json'
2021-03-03 19:06:18 +00:00
saveJson(speakerJson, speakerFilename)