Implement fetching website metadata

2025-09-24 18:09:31 +02:00 · 2019-06-29 02:01:26 +02:00
parent ba3d4eb663
commit 451a049d46
4 changed files with 34 additions and 9 deletions
--- a/bookmarks/services/bookmarks.py
+++ b/bookmarks/services/bookmarks.py
@@ -1,3 +1,5 @@
+import requests
+from bs4 import BeautifulSoup
 from django.contrib.auth.models import User
 from django.utils import timezone

@@ -24,7 +26,22 @@ def update_bookmark(bookmark: Bookmark):


 def _update_website_metadata(bookmark: Bookmark):
-    # TODO: Load website metadata
-    bookmark.website_title = 'Title from website'
-    bookmark.website_description = 'Description from website'
-    pass
+    # noinspection PyBroadException
+    try:
+        page_text = load_page(bookmark.url)
+        soup = BeautifulSoup(page_text, 'html.parser')
+
+        title = soup.title.string if soup.title is not None else None
+        description_tag = soup.find('meta', attrs={'name': 'description'})
+        description = description_tag['content'] if description_tag is not None else None
+
+        bookmark.website_title = title
+        bookmark.website_description = description
+    except Exception:
+        bookmark.website_title = None
+        bookmark.website_description = None
+
+
+def load_page(url: str):
+    r = requests.get(url)
+    return r.text