Skip to content

Commit

Permalink
add converter class for parquet (#414)
Browse files Browse the repository at this point in the history
* add converter class for parquet

* fix migration

* generate geoparquet using duckdb

* refactor converter
  • Loading branch information
danangmassandy authored Jan 31, 2025
1 parent 8adbec9 commit 4ac2551
Show file tree
Hide file tree
Showing 3 changed files with 446 additions and 15 deletions.
17 changes: 2 additions & 15 deletions django_project/gap/tasks/collector.py
Original file line number Diff line number Diff line change
Expand Up @@ -15,8 +15,6 @@
from core.celery import app
from core.models import BackgroundTask, TaskStatus
from gap.models import (
Preferences,
Provider,
Dataset,
DatasetStore,
DataSourceFile,
Expand All @@ -28,6 +26,7 @@
from gap.tasks.ingestor import (
run_ingestor_session
)
from gap.utils.ingestor_config import get_ingestor_config_from_preferences

logger = get_task_logger(__name__)

Expand Down Expand Up @@ -61,18 +60,6 @@ def run_cbam_collector_session():
)


def _get_ingestor_config_from_preferences(provider: Provider) -> dict:
    """Look up the ingestor settings stored for a provider.

    The settings are read from ``Preferences.load().ingestor_config``
    and keyed by the provider's name.

    :param provider: provider whose name is used as the lookup key
    :type provider: Provider
    :return: config entry for the provider, or an empty dict when the
        provider name has no entry
    :rtype: dict
    """
    preferences = Preferences.load()
    # Fall back to an empty dict so callers can chain ``.get`` safely.
    return preferences.ingestor_config.get(provider.name, {})


def _do_run_zarr_collector(
dataset: Dataset, collector_session: CollectorSession,
ingestor_type):
Expand All @@ -93,7 +80,7 @@ def _do_run_zarr_collector(
total_file = collector_session.dataset_files.count()
if total_file > 0:
additional_conf = {}
config = _get_ingestor_config_from_preferences(dataset.provider)
config = get_ingestor_config_from_preferences(dataset.provider)

use_latest_datasource = config.get('use_latest_datasource', True)
if use_latest_datasource:
Expand Down
21 changes: 21 additions & 0 deletions django_project/gap/utils/ingestor_config.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,21 @@
# coding=utf-8
"""
Tomorrow Now GAP.
.. note:: Helper for reading ingestor config
"""


from gap.models import Provider, Preferences


def get_ingestor_config_from_preferences(provider: Provider) -> dict:
    """Return the ingestor configuration registered for a provider.

    Reads the ``ingestor_config`` mapping from ``Preferences.load()``
    and picks the entry stored under the provider's name.

    :param provider: provider whose name keys the ingestor config
    :type provider: Provider
    :return: additional Ingestor config for the provider; an empty dict
        if no entry exists for the provider name
    :rtype: dict
    """
    all_provider_configs = Preferences.load().ingestor_config
    provider_key = provider.name
    # A missing provider entry yields an empty dict rather than an error.
    return all_provider_configs.get(provider_key, {})
Loading

0 comments on commit 4ac2551

Please sign in to comment.