Fix datetime from boards.ie not being parsed properly

This commit is contained in:
2026-01-22 14:49:01 +00:00
parent a34252deda
commit 096a415f3b
2 changed files with 10 additions and 0 deletions

View File

@@ -1,3 +1,4 @@
import datetime
import requests
import logging
import re
@@ -78,6 +79,8 @@ class BoardsAPI:
if timestamp_tag:
match = re.search(r"\d{2}-\d{2}-\d{4}\s+\d{2}:\d{2}[AP]M", timestamp_tag.get_text())
timestamp = match.group(0) if match else None
# convert to unix epoch
timestamp = datetime.datetime.strptime(timestamp, "%d-%m-%Y %I:%M%p").timestamp() if timestamp else None
# Post ID
post_num = re.search(r"discussion/(\d+)", post_url)
@@ -142,6 +145,7 @@ class BoardsAPI:
# Timestamp
date_elem = tag.find('span', class_='DateCreated')
timestamp = date_elem.get_text(strip=True) if date_elem else None
timestamp = datetime.datetime.strptime(timestamp, "%d-%m-%Y %I:%M%p").timestamp() if timestamp else None
# Content
message_div = tag.find('div', class_='Message userContent')

View File

@@ -14,6 +14,8 @@ idna==3.11
itsdangerous==2.2.0
Jinja2==3.1.6
MarkupSafe==3.0.3
numpy==2.4.1
pandas==2.3.3
proto-plus==1.27.0
protobuf==6.33.4
psycopg2==2.9.11
@@ -21,11 +23,15 @@ psycopg2-binary==2.9.11
pyasn1==0.6.2
pyasn1_modules==0.4.2
pyparsing==3.3.1
python-dateutil==2.9.0.post0
python-dotenv==1.2.1
pytz==2025.2
requests==2.32.5
rsa==4.9.1
six==1.17.0
soupsieve==2.8.1
typing_extensions==4.15.0
tzdata==2025.3
uritemplate==4.2.0
urllib3==2.6.3
vaderSentiment==3.3.2