Abstracted data loading so that data can be loaded simply through the config file. Moved Mike's LLM data generation code and my own dummy data generating code to the database folder.

2025-08-14 05:10:20 +00:00 · 2025-02-21 00:39:25 -08:00
parent 5c25a2b099
commit dd5fc9f83c
7 changed files with 284 additions and 9 deletions
--- a/app/database/create_basic_dummy_data.py
+++ b/app/database/create_basic_dummy_data.py
@ -0,0 +1,44 @@
+# Quick script to create basic dummy data for the caching system
+# Current theme/usage is in a social media microservice setting such as Twitter
+# Current database schema:
+### user_id (primary key), str
+### username, string
+### num_followers, int
+### posts, str (for now, can be list later on)
+### friends, list[user_id]
+
+import json
+import random
+
+# Parameters to change the distribution/random ranges
+TOTAL_USERS = 20
+MIN_FOLLOWERS, MAX_FOLLOWERS = 0, 5
+MIN_POSTS, MAX_POSTS = 5, 10
+MIN_FRIENDS, MAX_FRIENDS = 1, 5
+
+# Create the user data
+# TODO if we want to vary the user data more, we can inflate the posts into a list of strings and make the strings very long :3"
+data = {}
+for user_id in range( TOTAL_USERS ):
+    user = {}
+    user["user_id"] = str( user_id )
+    user["username"] = "user" + str( user_id )
+    user["num_followers"] = random.randint( MIN_FOLLOWERS, MAX_FOLLOWERS )
+    
+    # Just make a single post for now, can consider mutliple posts later
+    user["posts"] = f"This is user {user_id}'s post!"
+
+    # posts = []
+    # for post_num in range( random.randint( MIN_FOLLOWERS, MAX_FOLLOWERS ) ):
+    #     posts.append( f"This is user {user_id}'s post {str( post_num + 1 )}!" )
+    # user["posts"] = posts
+    
+    friends = []
+    user["friends"] = random.sample( [u_id for u_id in range( TOTAL_USERS ) if u_id != user_id], random.randint( MIN_FOLLOWERS, MAX_FOLLOWERS ) )
+
+    data[user_id] = user
+
+# Load the data into a json object and write it into the datastore folder
+json_object = json.dumps( {"_default": data}, indent=4 )
+with open( "datastore/basicDummy_sns.json", "w" ) as f:
+    f.write( json_object )