saayam-for-all · Prasadkurapati · Mar 25, 2026 · Mar 25, 2026 · Mar 25, 2026 · Mar 26, 2026
diff --git a/database/README.MD b/database/README.MD
@@ -1 +1,14 @@
+This script generates synthetic data for the users and request tables.
 
+How to run:
+
+1. Install dependencies:
+   pip install faker pandas
+
+2. Run script:
+   python generate_mock_data.py
+
+Output:
+
+- users.csv
+- request.csv
-2. Run script:
-   python generate_mock_data.py
-
-Output:
-
- users.csv
- request.csv
+2. Run script from the repo root:
+   python database/mock-data-generation/generate_mock_data.py
+
+Output (written to database/mock_db/):
+
+- database/mock_db/users.csv
+- database/mock_db/request.csv
-2. Run script:
-   python generate_mock_data.py
-
-Output:
-
- users.csv
- request.csv
+2. Run script from the repo root:
+   python database/mock-data-generation/generate_mock_data.py
+
+Output (written to database/mock_db/):
+
+- database/mock_db/users.csv
+- database/mock_db/request.csv
diff --git a/database/mock-data-generation/fix_foreign_keys.py b/database/mock-data-generation/fix_foreign_keys.py
@@ -0,0 +1,47 @@
+"""Repair foreign-key columns in the generated mock CSVs.
+
+Each foreign-key column is overwritten with IDs drawn at random from the
+table it references, and every CSV is rewritten in place under
+database/mock_db/.
+"""
+import random
+from pathlib import Path
+
+import pandas as pd
+
+# Locate mock_db relative to this file so the script can be run from any
+# working directory, including the repo root.
+MOCK_DB = Path(__file__).resolve().parent.parent / "mock_db"
+
+# Load generated CSVs
+users_df = pd.read_csv(MOCK_DB / "users.csv")
+request_df = pd.read_csv(MOCK_DB / "request.csv")
+comments_df = pd.read_csv(MOCK_DB / "request_comments.csv")
+volunteers_df = pd.read_csv(MOCK_DB / "volunteer_details.csv")
+assigned_df = pd.read_csv(MOCK_DB / "volunteers_assigned.csv")
+
+# Sample from plain lists: random.choice picks by integer position, whereas
+# indexing a pandas Series with an integer looks the value up by index label.
+user_ids = users_df['user_id'].tolist()
+request_ids = request_df['req_id'].tolist()
+
+# Fix request table
+request_df['req_user_id'] = request_df['req_user_id'].apply(lambda _: random.choice(user_ids))
+request_df.to_csv(MOCK_DB / "request.csv", index=False)
+
+# Fix comments table
+comments_df['request_id'] = comments_df['request_id'].apply(lambda _: random.choice(request_ids))
+comments_df['user_id'] = comments_df['user_id'].apply(lambda _: random.choice(user_ids))
+comments_df.to_csv(MOCK_DB / "request_comments.csv", index=False)
+
+# Fix volunteer details table
+volunteers_df['user_id'] = volunteers_df['user_id'].apply(lambda _: random.choice(user_ids))
+volunteers_df.to_csv(MOCK_DB / "volunteer_details.csv", index=False)
+
+# Fix volunteer assignments (volunteer IDs come from the column rewritten above)
+volunteer_ids = volunteers_df['user_id'].tolist()
+assigned_df['request_id'] = assigned_df['request_id'].apply(lambda _: random.choice(request_ids))
+assigned_df['volunteer_id'] = assigned_df['volunteer_id'].apply(lambda _: random.choice(volunteer_ids))
+assigned_df.to_csv(MOCK_DB / "volunteers_assigned.csv", index=False)
+
+print("All foreign keys fixed successfully!")