This commit is contained in:
2025-05-08 14:42:39 +03:00
parent 3a6927c180
commit 84c339d556
9 changed files with 434 additions and 68 deletions

View File

@@ -1,12 +1,20 @@
# axc_ul/management/commands/load_survey.py
import numpy as np
from astropy.io import fits
from django.core.management.base import BaseCommand
from django.db import transaction
from axc_ul.models import Pixel
from axc_ul.models import Pixel, Survey
from django.db.models import Max
from itertools import islice
from datetime import datetime
# DEFINE BATCH SIZE AND BATCH
# **************************************************************
BATCH_SIZE = 1000000
def batch(iterable, size):
@@ -21,9 +29,14 @@ def batch(iterable, size):
yield chunk
class Command(BaseCommand):
help = "Process FITS files and store the data in the database"
# COMMAND LINE ARGUMENTS
# **************************************************************
def add_arguments(self, parser):
parser.add_argument(
'--counts',
@@ -37,21 +50,29 @@ class Command(BaseCommand):
required=True,
help='Path of the exposure file'
)
# parser.add_argument(
# '--survey_number',
# type=int,
# required=True,
# help='Integer ID of the survey being read'
# )
parser.add_argument(
'--survey_number',
type=int,
required=True,
help='Integer ID of the survey being read'
)
def handle(self, *args, **options):
# GET FILENAMES FROM ARGUMENTS
# **************************************************************
counts_file = options['counts']
exposure_file = options['exposure']
# survey_number = options['survey_number']
survey_number = options['survey_number']
self.stdout.write(f"Counts file: {counts_file}")
self.stdout.write(f"Exposure file: {exposure_file}")
self.stdout.write(f"\nCounts file:\t{counts_file}")
self.stdout.write(f"Exposure file:\t{exposure_file}")
# OPEN BOTH FILES, RAVEL EACH
# **************************************************************
with fits.open(counts_file) as hdul:
@@ -68,43 +89,62 @@ class Command(BaseCommand):
exposure_data = exposure_map.ravel()
# COMPARE DATA SHAPES, ENSURE THEY'RE THE SAME
# **************************************************************
self.stdout.write(f"Counts Data Shape: {counts_data.shape}")
self.stdout.write(f"Exposure Data Shape: {exposure_data.shape}")
self.stdout.write(f"\nCounts Data Shape:\t{counts_data.shape}")
self.stdout.write(f"Exposure Data Shape:\t{exposure_data.shape}")
total_pixels = counts_data.shape[0]
self.stdout.write(f"\nTotal pixels to insert:\t{total_pixels}")
assert counts_data.shape == exposure_data.shape, "Counts and exposure maps must have the same shape"
#rate_data = np.divide(counts_data, exposure_data)
# CREATE THE SURVEY IF IT DOES NOT EXIST
# **************************************************************
# with transaction.atomic():
with transaction.atomic():
# survey,created = Survey.objects.get_or_create(number=survey_number)
survey,created = Survey.objects.get_or_create(number=survey_number)
# if created:
# self.stdout.write(f"Created a new survey instance with number: {survey.number}")
# else:
# self.stdout.write(f"Using existing survey instance with the number: {survey.number}")
if created:
self.stdout.write(f"Created a new survey instance with number: {survey.number}")
else:
self.stdout.write(f"Using existing survey instance with the number: {survey.number}")
# FETCH THE LAST PROCESSED HPID AND CONTINUE FROM IT
# **************************************************************
last_hpid = (
Pixel.objects
.filter(survey=survey)
.aggregate(max_hpid=Max('hpid'))['max_hpid']
or -1
)
start_index = last_hpid + 1
# Create a generator that yields Pixel objects one by one.
pixel_generator = (
Pixel(
hpid=i,
counts=int(count),
exposure=float(exposure),
#rate=float(rate),
#survey=survey
survey=survey
)
for i, (count, exposure) in enumerate(zip(counts_data, exposure_data))
if i >= start_index
)
total_inserted = 0
# Process the generator in batches.
total_inserted = start_index
# Process in batches
for pixel_batch in batch(pixel_generator, BATCH_SIZE):
with transaction.atomic():
Pixel.objects.bulk_create(pixel_batch)
total_inserted += len(pixel_batch)
self.stdout.write(f"Inserted {total_inserted} pixels")
percentage = total_inserted / total_pixels * 100
timestamp = datetime.now().strftime("%H:%M:%S")
self.stdout.write(
f"[{timestamp}] {percentage:.2f}% inserted"
)
self.stdout.write(f"Inserted a total of {total_inserted} pixels.")