forked from indymedia/epicyon
Add local blog posts to the newswire
parent ec5e7bc59f
commit 9b75c034a0

newswire.py (83 changed lines)
@@ -13,6 +13,8 @@ from socket import error as SocketError
import errno
from datetime import datetime
from collections import OrderedDict
from utils import locatePost
from utils import loadJson


def rss2Header(httpPrefix: str,
@@ -162,6 +164,81 @@ def getRSSfromDict(baseDir: str, newswire: {},
    return rssStr


def addAccountBlogsToNewswire(baseDir: str, nickname: str, domain: str,
                              newswire: {},
                              maxBlogsPerAccount: int,
                              indexFilename: str) -> None:
    """Adds blogs for the given account to the newswire
    """
    if not os.path.isfile(indexFilename):
        return
    with open(indexFilename, 'r') as indexFile:
        postFilename = 'start'
        ctr = 0
        while postFilename:
            postFilename = indexFile.readline()
            if postFilename:
                # if this is a full path then remove the directories
                if '/' in postFilename:
                    postFilename = postFilename.split('/')[-1]

                # filename of the post without any extension or path
                # This should also correspond to any index entry in
                # the posts cache
                postUrl = \
                    postFilename.replace('\n', '').replace('\r', '')
                postUrl = postUrl.replace('.json', '').strip()

                # read the post from file
                fullPostFilename = \
                    locatePost(baseDir, nickname,
                               domain, postUrl, False)
                isAPost = False
                postJsonObject = None
                if fullPostFilename:
                    postJsonObject = loadJson(fullPostFilename)
                if postJsonObject:
                    if postJsonObject.get('object'):
                        if isinstance(postJsonObject['object'], dict):
                            isAPost = True
                if isAPost:
                    if postJsonObject['object'].get('summary') and \
                       postJsonObject['object'].get('url') and \
                       postJsonObject['object'].get('published'):
                        published = postJsonObject['object']['published']
                        published = published.replace('T', ' ')
                        published = published.replace('Z', '+00:00')
                        newswire[published] = \
                            [postJsonObject['object']['summary'],
                             postJsonObject['object']['url']]

            ctr += 1
            if ctr >= maxBlogsPerAccount:
                break


def addLocalBlogsToNewswire(baseDir: str, newswire: {},
                            maxBlogsPerAccount: int) -> None:
    """Adds blogs from this instance into the newswire
    """
    # go through each account
    for subdir, dirs, files in os.walk(baseDir + '/accounts'):
        for handle in dirs:
            if '@' not in handle:
                continue
            if 'inbox@' in handle:
                continue
            accountDir = os.path.join(baseDir + '/accounts', handle)
            # is there a blogs timeline for this account?
            blogsIndex = accountDir + '/tlblogs.index'
            if os.path.isfile(blogsIndex):
                nickname = handle.split('@')[0]
                domain = handle.split('@')[1]
                addAccountBlogsToNewswire(baseDir, nickname, domain,
                                          newswire, maxBlogsPerAccount,
                                          blogsIndex)


def getDictFromNewswire(session, baseDir: str) -> {}:
    """Gets rss feeds as a dictionary from newswire file
    """
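For context, the newswire dictionary that addAccountBlogsToNewswire fills is keyed by the post's published timestamp (with the 'T' and 'Z' of the ISO form rewritten), and each value is a [summary, url] pair. A minimal sketch of that keying logic, using a made-up post object; the field values below are hypothetical and not taken from the commit:

# Hypothetical example of how one local blog post ends up in the newswire
# dict. The post shape follows an ActivityPub activity wrapping an 'object',
# which is what the diff's summary/url/published checks assume.
postJsonObject = {
    'object': {
        'summary': 'My first blog post',
        'url': 'https://example.net/users/alice/statuses/123456',
        'published': '2020-10-04T10:15:00Z'
    }
}

newswire = {}
published = postJsonObject['object']['published']
published = published.replace('T', ' ').replace('Z', '+00:00')
newswire[published] = [postJsonObject['object']['summary'],
                       postJsonObject['object']['url']]

# newswire == {'2020-10-04 10:15:00+00:00':
#              ['My first blog post',
#               'https://example.net/users/alice/statuses/123456']}
print(newswire)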
@@ -169,6 +246,7 @@ def getDictFromNewswire(session, baseDir: str) -> {}:
    if not os.path.isfile(subscriptionsFilename):
        return {}

    # add rss feeds
    rssFeed = []
    with open(subscriptionsFilename, 'r') as fp:
        rssFeed = fp.readlines()
@@ -182,6 +260,11 @@ def getDictFromNewswire(session, baseDir: str) -> {}:
        itemsList = getRSS(session, url)
        for dateStr, item in itemsList.items():
            result[dateStr] = item

    # add local content
    addLocalBlogsToNewswire(baseDir, result, 5)

    # sort into chronological order, latest first
    sortedResult = OrderedDict(sorted(result.items(), reverse=True))
    return sortedResult
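With this change, getDictFromNewswire merges the subscribed RSS feeds with up to 5 local blog posts per account and returns an OrderedDict sorted newest-first. A rough usage sketch; the baseDir path is a made-up example, and the session placeholder stands in for whatever HTTP session object the caller already passes to getRSS elsewhere, neither being part of this diff:

# Sketch: build the combined newswire and print it newest-first.
from newswire import getDictFromNewswire

baseDir = '/var/www/epicyon'   # hypothetical instance data directory
session = None                 # replace with a real HTTP session for RSS fetches

newswire = getDictFromNewswire(session, baseDir)
for published, (summary, url) in newswire.items():
    print(published, summary, url)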