-
Notifications
You must be signed in to change notification settings - Fork 108
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
feat(api): weekly stamp data dump (#324)
* feat(api): create scheduled task definition * chore(api): model updates for data dump * feat(api): data dump export script * fix(infra): fix staging deployment of scheduled task * fix(infra): fix review deployment of scheduled task * chore(api): update pipfile lock after resolving pipfile merge conflict * chore(infra): add aws key values * chore(api): further environment configuration for weekly data dumps * chore(infra): comment out scheduled task until script is merged * refactor(api): paginate stamp query and save count and last_export --------- Co-authored-by: Gerald Iakobinyi-Pich <[email protected]>
- Loading branch information
1 parent
e23adaf
commit bc82b3a
Showing
12 changed files
with
619 additions
and
396 deletions.
There are no files selected for viewing
Large diffs are not rendered by default.
Oops, something went wrong.
Empty file.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,59 @@ | ||
import datetime | ||
import json | ||
import os | ||
|
||
import boto3 | ||
from ceramic_cache.models import CeramicCache, StampExports | ||
from django.conf import settings | ||
from django.core.management.base import BaseCommand | ||
from django.core.paginator import Paginator | ||
from django.utils import timezone | ||
|
||
# Module-level S3 client used by the command below to upload the dump file.
# It is constructed at import time from the S3_DATA_* Django settings.
# NOTE(review): the setting named S3_DATA_AWS_SECRET_KEY_ID is what gets
# passed as the AWS *access key id* here.
s3 = boto3.client( | ||
"s3", | ||
aws_access_key_id=settings.S3_DATA_AWS_SECRET_KEY_ID, | ||
aws_secret_access_key=settings.S3_DATA_AWS_SECRET_ACCESS_KEY, | ||
) | ||
|
||
|
||
class Command(BaseCommand):
    """Export newly created stamps to a JSONL file and upload it to S3.

    Each run exports the ``stamp`` value of every ``CeramicCache`` row whose
    ``created_at`` lies in the half-open window
    ``(previous export timestamp, start of this run]`` and then records the
    end of that window in ``StampExports`` so the next run continues from it.
    When no previous export exists, the window starts 7 days before the run.
    """

    help = "Weekly data dump of new Stamp data since the last dump."

    def handle(self, *args, **options):
        """Run the export.

        Writes one JSON object per line (``{"stamp": ...}``) to a local file,
        uploads that file to ``settings.S3_WEEKLY_BACKUP_BUCKET_NAME`` under
        the same name, removes the local file, and stores a ``StampExports``
        row holding the export timestamp and the number of exported stamps.

        Any exception raised while writing or uploading propagates to the
        caller; in that case no ``StampExports`` row is written, so the next
        run retries the same window.
        """
        self.stdout.write("Starting dump_stamp_data.py")

        # Fix the upper bound of the export window once, up front. Rows
        # created while the export is running fall into the next window
        # instead of being silently skipped.
        export_ts = timezone.now()

        latest_export = StampExports.objects.order_by("-last_export_ts").first()
        if latest_export:
            since_ts = latest_export.last_export_ts
        else:
            # Do not persist a placeholder row for the first run:
            # `last_export_ts` is declared with auto_now_add=True, so a value
            # passed to create() would be replaced by the current time and
            # the resulting window would be empty.
            self.stdout.write(
                "No previous exports found. Exporting data from the last 7 days."
            )
            since_ts = export_ts - datetime.timedelta(days=7)

        # An explicit ordering keeps the pages stable; paginating an
        # unordered queryset may repeat or skip rows between pages.
        stamps = (
            CeramicCache.objects.filter(
                created_at__gt=since_ts, created_at__lte=export_ts
            )
            .order_by("created_at", "pk")
            .values_list("stamp", flat=True)
        )
        paginator = Paginator(stamps, 1000)

        # Generate the dump file name from the bounds of the export window
        file_name = (
            f'stamps_{since_ts.strftime("%Y%m%d_%H%M%S")}'
            f'_{export_ts.strftime("%Y%m%d_%H%M%S")}.jsonl'
        )

        try:
            # Write serialized data to the file, one page at a time
            with open(file_name, "w", encoding="utf-8") as f:
                for page_number in paginator.page_range:
                    for stamp in paginator.page(page_number).object_list:
                        f.write(json.dumps({"stamp": stamp}) + "\n")

            # Upload to S3 bucket
            s3.upload_file(file_name, settings.S3_WEEKLY_BACKUP_BUCKET_NAME, file_name)
        finally:
            # Delete the local file whether or not the upload succeeded
            try:
                os.remove(file_name)
            except FileNotFoundError:
                # The file was never created (open() itself failed).
                pass

        export_record = StampExports.objects.create(
            last_export_ts=export_ts, stamp_total=paginator.count
        )
        # auto_now_add overrides the timestamp given to create(); a queryset
        # update() bypasses that and stores the real end of the window.
        StampExports.objects.filter(pk=export_record.pk).update(
            last_export_ts=export_ts
        )

        self.stdout.write(f"Data dump completed and uploaded to S3 as {file_name}")
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,29 @@ | ||
# Generated by Django 4.2.3 on 2023-07-21 22:00 | ||
|
||
from django.db import migrations, models | ||
|
||
|
||
# Creates the StampExports table, which stores one row per stamp data dump.
class Migration(migrations.Migration): | ||
|
||
# Must be applied after migration 0008 of the ceramic_cache app.
dependencies = [ | ||
("ceramic_cache", "0008_remove_ceramiccache_deleted_at"), | ||
] | ||
|
||
operations = [ | ||
migrations.CreateModel( | ||
name="StampExports", | ||
fields=[ | ||
( | ||
"id", | ||
models.BigAutoField( | ||
auto_created=True, | ||
primary_key=True, | ||
serialize=False, | ||
verbose_name="ID", | ||
), | ||
), | ||
# auto_now_add=True: Django sets this field to the current time when the
# row is first created, replacing any value passed in explicitly.
("last_export_ts", models.DateTimeField(auto_now_add=True)), | ||
# Integer column that defaults to 0.
("stamp_total", models.IntegerField(default=0)), | ||
], | ||
), | ||
] |
18 changes: 18 additions & 0 deletions
18
api/ceramic_cache/migrations/0010_ceramiccache_created_at.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,18 @@ | ||
# Generated by Django 4.2.3 on 2023-07-21 22:30 | ||
|
||
from django.db import migrations, models | ||
|
||
|
||
# Adds an optional `created_at` timestamp column to the ceramiccache model.
class Migration(migrations.Migration): | ||
|
||
# Must be applied after the StampExports table is created (0009).
dependencies = [ | ||
("ceramic_cache", "0009_stampexports"), | ||
] | ||
|
||
operations = [ | ||
migrations.AddField( | ||
model_name="ceramiccache", | ||
name="created_at", | ||
# Nullable with no default, so rows that already exist presumably keep
# NULL here -- verify before relying on created_at for older stamps.
field=models.DateTimeField(blank=True, null=True), | ||
), | ||
] |
18 changes: 18 additions & 0 deletions
18
api/ceramic_cache/migrations/0011_alter_ceramiccache_created_at.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,18 @@ | ||
# Generated by Django 4.2.3 on 2023-07-21 22:31 | ||
|
||
from django.db import migrations, models | ||
|
||
|
||
# Changes ceramiccache.created_at so that it is filled in automatically
# when a row is created, while still allowing NULL.
class Migration(migrations.Migration): | ||
|
||
# Must be applied after the column itself is added (0010).
dependencies = [ | ||
("ceramic_cache", "0010_ceramiccache_created_at"), | ||
] | ||
|
||
operations = [ | ||
migrations.AlterField( | ||
model_name="ceramiccache", | ||
name="created_at", | ||
# auto_now_add=True stamps new rows with the creation time; null=True is kept.
field=models.DateTimeField(auto_now_add=True, null=True), | ||
), | ||
] |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,8 @@ | ||
from .env import env | ||
|
||
# These configuration settings will be used when accessing data | ||
# on S3 URIs. This should typically be the case when importing or exporting | ||
# data. See the `import_allo_votes` command for an example. | ||
# Each setting is read from the environment variable of the same name and
# is declared with default=None.
# NOTE(review): despite its name, S3_DATA_AWS_SECRET_KEY_ID is the value the
# weekly stamp dump command passes to boto3 as `aws_access_key_id`.
S3_DATA_AWS_SECRET_KEY_ID = env("S3_DATA_AWS_SECRET_KEY_ID", default=None) | ||
S3_DATA_AWS_SECRET_ACCESS_KEY = env("S3_DATA_AWS_SECRET_ACCESS_KEY", default=None) | ||
# Name of the S3 bucket that receives the weekly stamp dump files.
S3_WEEKLY_BACKUP_BUCKET_NAME = env("S3_WEEKLY_BACKUP_BUCKET_NAME", default=None) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
bc82b3a
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Nice
bc82b3a
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
👌👌