Skip to content

Commit

Permalink
Added tests
Browse files Browse the repository at this point in the history
  • Loading branch information
abraryaser02 committed May 10, 2024
1 parent 5f2d4bb commit 2a2a443
Show file tree
Hide file tree
Showing 21 changed files with 371,009 additions and 77 deletions.
56 changes: 56 additions & 0 deletions .github/workflows/tests.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,56 @@
# CI workflow: runs the backend pytest suite against a throwaway PostgreSQL
# service container on every push and pull request.
name: Backend Test

on: [push, pull_request]

jobs:
  test:

    runs-on: ubuntu-latest

    services:
      postgres:
        image: postgres:13
        env:
          POSTGRES_USER: postgres
          POSTGRES_PASSWORD: postgres
          POSTGRES_DB: backend_test
        ports:
          - 5432:5432
        # Wait until postgres is ready before running the tests.
        # Service containers take their health check through docker `options`;
        # a compose-style `healthcheck:` key is not part of the services schema.
        options: >-
          --health-cmd "pg_isready -U postgres"
          --health-interval 10s
          --health-timeout 5s
          --health-retries 5

    steps:
      - uses: actions/checkout@v2

      - name: Set up Python
        uses: actions/setup-python@v2
        with:
          python-version: '3.12'

      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          pip install -r services/backend/requirements.txt

      - name: Create test database
        env:
          # psql reads the password from PGPASSWORD; there is no TTY to prompt on.
          PGPASSWORD: postgres
        run: |
          # The service is reached over TCP on the mapped port, hence -h localhost.
          # POSTGRES_DB normally creates backend_test already, so only create it
          # when it is missing instead of failing with "already exists".
          psql -h localhost -U postgres -tAc "SELECT 1 FROM pg_database WHERE datname = 'backend_test'" | grep -q 1 \
            || psql -h localhost -U postgres -c "CREATE DATABASE backend_test;"

      - name: Run tests
        env:
          # NOTE(review): backend_dev is never created by this workflow — confirm
          # the test suite does not connect through DATABASE_URL.
          DATABASE_URL: postgres://postgres:postgres@localhost:5432/backend_dev
          DATABASE_TEST_URL: postgres://postgres:postgres@localhost:5432/backend_test
          APP_SETTINGS: project.config.TestingConfig
          PYTHONPATH: services/backend
        run: |
          cd services/backend
          pytest
168 changes: 168 additions & 0 deletions load_data.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,168 @@
#!/usr/bin/python3

import argparse
import sqlalchemy
from sqlalchemy.dialects.postgresql import insert
from faker import Faker
import random
from tqdm import tqdm
import time
from datetime import datetime, timedelta

# Module-wide Faker instance; the generator functions below draw all synthetic
# names, addresses, e-mails, etc. from it.
fake = Faker()

def parse_args():
    """Parse the loader's command-line options.

    Returns:
        argparse.Namespace: ``db`` (required string) plus ``event_rows`` and
        ``user_rows`` (ints, each defaulting to 1000000).
    """
    cli = argparse.ArgumentParser()
    cli.add_argument('--db', required=True)
    # The two row-count options share the same type and default.
    for option in ('--event_rows', '--user_rows'):
        cli.add_argument(option, default=1000000, type=int)
    return cli.parse_args()

def connect_database(db_url):
    """Return a SQLAlchemy engine for ``db_url`` with statement echoing disabled."""
    return sqlalchemy.create_engine(db_url, echo=False)

def load_dictionary(file_path='./services/postgres/words_alpha.txt'):
    """Load words from the English dictionary file.

    Args:
        file_path: Path to a text file containing one word per line.

    Returns:
        list[str]: The file's lines in order, without line terminators.

    Raises:
        OSError: If the file cannot be opened.
    """
    # An explicit encoding keeps decoding independent of the host's locale.
    with open(file_path, 'r', encoding='utf-8') as file:
        return file.read().splitlines()

# Word list read once at import time from load_dictionary's default path, which
# is relative to the current working directory; importing fails if it is missing.
dictionary_words = load_dictionary()

def generate_event_name(event_type):
    """Build a display name for a synthetic event.

    The result is a title-cased ``fake.bs()`` phrase followed by a noun chosen
    at random from the candidates for ``event_type``. Event types without their
    own candidate list fall back to the generic noun "Event".
    """
    nouns_by_type = {
        "Talk": ["Lecture", "Discussion", "Seminar", "Panel"],
        "Festival": ["Gala", "Fest", "Celebration"],
        "Awards Ceremony": ["Awards Night", "Recognition Gala", "Honors Evening"],
    }
    candidates = nouns_by_type.get(event_type, ["Event"])
    suffix = random.choice(candidates)
    phrase = fake.bs().title()
    return f"{phrase} {suffix}"

def generate_event_description(event_name):
    """Return a promotional blurb for ``event_name``.

    One of three fixed sentence templates is chosen at random and followed by
    20 words drawn (with replacement) from ``dictionary_words`` so that the
    description is longer.
    """
    # Draw the filler first, then pick the template.
    filler = ' '.join(random.choices(dictionary_words, k=20))
    blurbs = (
        f"Join us for the {event_name}, an opportunity to engage with leading experts and enthusiasts from the industry. {filler}",
        f"This year's {event_name} features a series of immersive experiences designed to inspire and educate attendees. {filler}",
        f"Don't miss out on the {event_name}! It will be a gathering of minds and ideas that promises to be unforgettable. {filler}",
    )
    return random.choice(blurbs)

def generate_future_datetime():
    """Return a Faker-generated future datetime within a random horizon.

    The horizon (7, 14, 30, 90 or 180 days) is picked uniformly and passed to
    ``fake.future_datetime`` as its ``end_date`` offset.
    """
    # (label, days) pairs; the label only documents the horizon.
    horizons = [
        ('next week', 7),
        ('next two weeks', 14),
        ('next month', 30),
        ('within the next three months', 90),
        ('within the next six months', 180),
    ]
    days = random.choice(horizons)[1]
    return fake.future_datetime(end_date=f"+{days}d")

def insert_events(connection, num_events):
    """Insert ``num_events`` synthetic rows into the ``events`` table.

    Args:
        connection: Open SQLAlchemy connection to execute the inserts on.
        num_events: Number of events to generate and attempt to insert.

    Returns:
        list: The ``id_events`` value returned for every row that was inserted.
        Rows rejected with an ``IntegrityError`` are reported on stdout and
        skipped.
    """
    event_types = [
        "Talk", "Awards Ceremony", "Info Session", "Gala", "Screening",
        "Colloquium", "Radio Play", "Class", "Lecture", "Festival"
    ]
    keywords = [
        "academics and graduate school", "networking and career development", "workshops and seminars",
        "volunteering and fundraising", "affinity groups and cultural events", "activism and social justice", "athletics",
        "wellness", "recreation and nightlife", "clubs and organizations", "science and technology", "arts and theater",
        "food and snacks", "pre-professional events", "sustainability"
    ]
    sql = sqlalchemy.sql.text("""
        INSERT INTO events (name, description, location, start_time, end_time, organization, contact_information, registration_link, keywords, tsv)
        VALUES (:name, :description, :location, :start_time, :end_time, :organization, :contact_information, :registration_link, :keywords, to_tsvector('english', :name || ' ' || :description))
        RETURNING id_events;
    """)
    event_ids = []
    for _ in tqdm(range(num_events), desc="Inserting events"):
        event_type = random.choice(event_types)
        event_name = generate_event_name(event_type)
        description = generate_event_description(event_name)
        start_time = generate_future_datetime()
        end_time = start_time + timedelta(hours=random.choice([1, 2, 3, 4, 5, 6]))
        event_keywords = random.sample(keywords, k=random.randint(1, 5))  # Select 1-5 random keywords
        event = {
            'name': event_name,
            'description': description,
            'location': fake.address(),
            'start_time': start_time,
            'end_time': end_time,
            'organization': fake.company(),
            'contact_information': fake.phone_number(),
            'registration_link': fake.url(),
            'keywords': event_keywords
        }
        try:
            # Run each insert inside a SAVEPOINT. Without it, a constraint
            # violation aborts the enclosing PostgreSQL transaction and every
            # later statement fails, so "skip the bad row" would not work.
            with connection.begin_nested():
                result = connection.execute(sql, event)
                event_id = result.fetchone()[0]
        except sqlalchemy.exc.IntegrityError as e:
            print(f"Failed to insert event: {e}")
        else:
            event_ids.append(event_id)
    return event_ids

def generate_users(connection, num_users):
    """Insert ``num_users`` synthetic rows into the ``users`` table.

    Args:
        connection: Open SQLAlchemy connection to execute the inserts on.
        num_users: Number of users to generate and attempt to insert.

    Returns:
        list: The ``id_users`` value returned for every row that was inserted.
        Rows rejected with an ``IntegrityError`` (for example a repeated Faker
        e-mail, if the schema enforces uniqueness) are reported on stdout and
        skipped.
    """
    sql = sqlalchemy.sql.text("""
        INSERT INTO users (email, password)
        VALUES (:email, :password)
        RETURNING id_users;
    """)
    user_ids = []
    for _ in tqdm(range(num_users), desc="Inserting users"):
        user = {
            'email': fake.email(),
            'password': fake.password()
        }
        try:
            # Run each insert inside a SAVEPOINT. Without it, a constraint
            # violation aborts the enclosing PostgreSQL transaction and every
            # later statement fails, so "skip the bad row" would not work.
            with connection.begin_nested():
                result = connection.execute(sql, user)
                user_id = result.fetchone()[0]
        except sqlalchemy.exc.IntegrityError as e:
            print(f"Failed to insert user: {e}")
        else:
            user_ids.append(user_id)
    return user_ids

def insert_user_to_events(connection, user_ids, event_ids):
    """Link every user to a handful of favorite events in ``user_to_events``.

    Each user gets up to 5 events sampled from all events plus up to 5 sampled
    from a "popular" pool (10% of the events), so the popular ones end up
    favorited far more often. Duplicate picks for the same user are collapsed.

    Args:
        connection: Open SQLAlchemy connection to execute the inserts on.
        user_ids: Ids of the users to create favorites for.
        event_ids: Ids of the events that may be favorited.

    Returns:
        None. Rows rejected with an ``IntegrityError`` are reported on stdout
        and skipped.
    """
    sql = sqlalchemy.sql.text("""
        INSERT INTO user_to_events (user_id, event_id)
        VALUES (:user_id, :event_id);
    """)
    num_events = len(event_ids)
    # 10% of events are way more favorited. Sample without replacement so the
    # pool really holds that many distinct events.
    popular_event_ids = random.sample(event_ids, k=int(num_events * 0.1))
    # Clamp the sample sizes: random.sample raises ValueError when asked for
    # more items than the population holds (e.g. a small --event_rows run).
    regular_k = min(5, num_events)
    popular_k = min(5, len(popular_event_ids))
    for user_id in tqdm(user_ids, desc="Inserting user_to_events"):
        picks = random.sample(event_ids, k=regular_k) + random.sample(popular_event_ids, k=popular_k)
        # An event can be drawn from both pools; keep the first occurrence only
        # so the same (user, event) pair is never inserted twice.
        favorite_event_ids = list(dict.fromkeys(picks))
        for event_id in favorite_event_ids:
            try:
                # SAVEPOINT per row: a constraint violation would otherwise
                # abort the enclosing PostgreSQL transaction for all later rows.
                with connection.begin_nested():
                    connection.execute(sql, {'user_id': user_id, 'event_id': event_id})
            except sqlalchemy.exc.IntegrityError as e:
                print(f"Failed to insert user_to_event: {e}")

def insert_data(engine, num_events, num_users):
    """Load events, users and their favorites in a single transaction.

    Any exception raised while loading or committing is printed and the
    transaction is rolled back; the exception is not re-raised. The connection
    is closed in every case.

    Args:
        engine: SQLAlchemy engine to open the connection from.
        num_events: Number of events to generate.
        num_users: Number of users to generate.
    """
    connection = engine.connect()
    try:
        transaction = connection.begin()
        try:
            created_event_ids = insert_events(connection, num_events)
            created_user_ids = generate_users(connection, num_users)
            insert_user_to_events(connection, created_user_ids, created_event_ids)
            transaction.commit()
        except Exception as e:
            print(f"An error occurred: {e}")
            transaction.rollback()
    finally:
        connection.close()

def main():
    """Script entry point: parse options, load the data, print the runtime."""
    options = parse_args()
    db_engine = connect_database(options.db)

    # Time only the load itself, not argument parsing or engine creation.
    started_at = time.time()
    insert_data(db_engine, options.event_rows, options.user_rows)
    finished_at = time.time()

    print('Runtime =', finished_at - started_at)


if __name__ == "__main__":
    main()
7 changes: 7 additions & 0 deletions load_data.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
#!/bin/sh
# Populate the development database with synthetic events and users.
#
# Optional environment overrides (defaults are the values this script has
# always used):
#   DB_URL      database URL passed to load_data.py --db
#   USER_ROWS   number of users to generate
#   EVENT_ROWS  number of events to generate

# Abort on the first failing command or unset variable, so 'finished loading'
# is only printed when the loader exited successfully.
set -eu

DB_URL="${DB_URL:-postgresql://postgres:postgres@localhost:5435/backend_dev}"
USER_ROWS="${USER_ROWS:-1000000}"
EVENT_ROWS="${EVENT_ROWS:-1000000}"

echo 'loading data'

time python3 load_data.py --db="$DB_URL" --user_rows="$USER_ROWS" --event_rows="$EVENT_ROWS"

echo 'finished loading'
Loading

0 comments on commit 2a2a443

Please sign in to comment.