From e95f6b8261d30b35c7c9b7dd8b49f343e4ab2d11 Mon Sep 17 00:00:00 2001
From: Bob Mottram <bob@libreserver.org>
Date: Thu, 18 Jul 2024 20:32:03 +0100
Subject: [PATCH] Add exception for file read

---
 webapp_hashtagswarm.py | 86 ++++++++++++++++++++++--------------------
 1 file changed, 45 insertions(+), 41 deletions(-)

diff --git a/webapp_hashtagswarm.py b/webapp_hashtagswarm.py
index 03efa711e..96061c4cb 100644
--- a/webapp_hashtagswarm.py
+++ b/webapp_hashtagswarm.py
@@ -138,48 +138,52 @@ def html_hash_tag_swarm(base_dir: str, actor: str, translate: {}) -> str:
                       tags_filename)
                 continue
 
-            with open(tags_filename, 'r', encoding='utf-8') as fp_tags:
-                while True:
-                    line = fp_tags.readline()
-                    if not line:
-                        break
-                    if '  ' not in line:
-                        break
-                    sections = line.split('  ')
-                    if len(sections) != 3:
-                        break
-                    post_days_since_epoch_str = sections[0]
-                    if not post_days_since_epoch_str.isdigit():
-                        break
-                    post_days_since_epoch = int(post_days_since_epoch_str)
-                    if post_days_since_epoch < recently:
-                        break
-                    post_url = sections[2]
-                    if '##' not in post_url:
-                        break
-                    post_domain = post_url.split('##')[1]
-                    if '#' in post_domain:
-                        post_domain = post_domain.split('#')[0]
+            try:
+                with open(tags_filename, 'r', encoding='utf-8') as fp_tags:
+                    while True:
+                        line = fp_tags.readline()
+                        if not line:
+                            break
+                        if '  ' not in line:
+                            break
+                        sections = line.split('  ')
+                        if len(sections) != 3:
+                            break
+                        post_days_since_epoch_str = sections[0]
+                        if not post_days_since_epoch_str.isdigit():
+                            break
+                        post_days_since_epoch = int(post_days_since_epoch_str)
+                        if post_days_since_epoch < recently:
+                            break
+                        post_url = sections[2]
+                        if '##' not in post_url:
+                            break
+                        post_domain = post_url.split('##')[1]
+                        if '#' in post_domain:
+                            post_domain = post_domain.split('#')[0]
 
-                    if domain_histogram.get(post_domain):
-                        domain_histogram[post_domain] = \
-                            domain_histogram[post_domain] + 1
-                    else:
-                        domain_histogram[post_domain] = 1
-                    tag_swarm.append(hash_tag_name)
-                    category_filename = \
-                        tags_filename.replace('.txt', '.category')
-                    if os.path.isfile(category_filename):
-                        category_str = \
-                            get_hashtag_category(base_dir, hash_tag_name)
-                        if len(category_str) < max_tag_length:
-                            if '#' not in category_str and \
-                               '&' not in category_str and \
-                               '"' not in category_str and \
-                               "'" not in category_str:
-                                if category_str not in category_swarm:
-                                    category_swarm.append(category_str)
-                    break
+                        if domain_histogram.get(post_domain):
+                            domain_histogram[post_domain] = \
+                                domain_histogram[post_domain] + 1
+                        else:
+                            domain_histogram[post_domain] = 1
+                        tag_swarm.append(hash_tag_name)
+                        category_filename = \
+                            tags_filename.replace('.txt', '.category')
+                        if os.path.isfile(category_filename):
+                            category_str = \
+                                get_hashtag_category(base_dir, hash_tag_name)
+                            if len(category_str) < max_tag_length:
+                                if '#' not in category_str and \
+                                   '&' not in category_str and \
+                                   '"' not in category_str and \
+                                   "'" not in category_str:
+                                    if category_str not in category_swarm:
+                                        category_swarm.append(category_str)
+                        break
+            except OSError as exc:
+                print('EX: html_hash_tag_swarm unable to read ' +
+                      tags_filename + ' ' + str(exc))
         break
 
     if not tag_swarm: