From 73a19f3ce3b55c1b1130592b8f74aa6edf41ec84 Mon Sep 17 00:00:00 2001
From: Dylan De Faoite
Date: Tue, 13 Jan 2026 18:59:42 +0000
Subject: [PATCH] Add script to orchestrate dataset creation

---
Reviewer note: the payload was revised after this patch was generated, so the
blob id on the "index" line below is not that of the revised file.

 fetch_data.py | 29 +++++++++++++++++++++++++++++
 1 file changed, 29 insertions(+)
 create mode 100644 fetch_data.py

diff --git a/fetch_data.py b/fetch_data.py
new file mode 100644
index 0000000..46b8f5e
--- /dev/null
+++ b/fetch_data.py
@@ -0,0 +1,29 @@
+"""Fetch new posts from r/cork and save them to a JSON file."""
+
+import json
+
+from connectors.reddit_connector import RedditConnector
+
+# Output path; relative, so it resolves against the current working directory.
+data_file = 'reddit_posts.json'
+# Shared connector instance, created when this module is loaded.
+reddit_connector = RedditConnector()
+
+
+def main():
+    """Request new r/cork posts (limit=1000) and dump them to ``data_file``.
+
+    Each post is serialised from its instance attributes via ``vars()``, so
+    ``json.dump`` raises ``TypeError`` if any attribute value is not
+    JSON-serialisable.
+    """
+    posts = reddit_connector.get_new_subreddit_posts('cork', limit=1000)
+    print(f"Fetched {len(posts)} posts from r/cork")
+
+    # Explicit encoding keeps the output independent of the platform locale.
+    with open(data_file, 'w', encoding='utf-8') as f:
+        json.dump([vars(post) for post in posts], f, indent=4)
+
+
+if __name__ == "__main__":
+    main()