Skip to content

Commit

Permalink
Permito que las series puedan cambiar distribuciones dentro de su cat…
Browse files Browse the repository at this point in the history
…álogo

    refs:#215
  • Loading branch information
lucaslavandeira committed Mar 9, 2018
1 parent fb4a3f8 commit 97c4027
Show file tree
Hide file tree
Showing 3 changed files with 193 additions and 8 deletions.
28 changes: 22 additions & 6 deletions series_tiempo_ar_api/libs/indexing/database_loader.py
Original file line number Diff line number Diff line change
Expand Up @@ -211,13 +211,25 @@ def _save_fields(self, distribution_model, fields):
for field in fields:

series_id = field.get(constants.FIELD_ID)
title = field.get(constants.FIELD_TITLE)
field_model, created = Field.objects.get_or_create(
series_id=series_id,
title=title,
distribution=distribution_model
)

# No vale get_or_create, distribution_model puede haber diferido desde la última ejecución
field_model = Field.objects.filter(series_id=series_id)
if not field_model:
field_model = Field(series_id=series_id)
created = True
else:
field_model = field_model[0]
created = False

old_catalog_id = field_model.distribution.dataset.catalog.identifier
if old_catalog_id != self.catalog_id:
raise FieldRepetitionError(u"Serie {} repetida en catálogos {} y {}".format(
series_id, old_catalog_id, self.catalog_id
))

title = field.get(constants.FIELD_TITLE)
field_model.title = title
field_model.distribution = distribution_model
field = self._remove_blacklisted_fields(
field,
settings.FIELD_BLACKLIST
Expand Down Expand Up @@ -268,3 +280,7 @@ def set_as_updated(model):
def read_updated(model):
    """Return the ``updated`` value of *model* as stored in the database.

    The row is fetched again by ``id`` through ``select_for_update()``
    inside ``transaction.atomic()``, so the value comes from the database
    query rather than from the in-memory instance passed in.
    """
    model_class = model.__class__
    with transaction.atomic():
        stored_row = model_class.objects.select_for_update().get(id=model.id)
        return stored_row.updated


class FieldRepetitionError(Exception):
    """Raised when a series id already stored under one catalog is loaded
    again under a different catalog identifier."""
38 changes: 36 additions & 2 deletions series_tiempo_ar_api/libs/indexing/tests/loader_tests.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,11 +5,12 @@
from django.conf import settings
from django.test import TestCase
from pydatajson import DataJson
from nose.tools import raises
from series_tiempo_ar.search import get_time_series_distributions

from series_tiempo_ar_api.apps.api.models import Catalog, Dataset, Distribution
from series_tiempo_ar_api.apps.api.models import Catalog, Dataset, Distribution, Field
from series_tiempo_ar_api.apps.management.models import ReadDataJsonTask, Node
from series_tiempo_ar_api.libs.indexing.database_loader import DatabaseLoader
from series_tiempo_ar_api.libs.indexing.database_loader import DatabaseLoader, FieldRepetitionError
from series_tiempo_ar_api.libs.indexing.tests.reader_tests import SAMPLES_DIR, CATALOG_ID

dir_path = os.path.join(os.path.dirname(os.path.realpath(__file__)), 'samples')
Expand Down Expand Up @@ -83,3 +84,36 @@ def test_datasets_loaded_are_not_indexable(self):

self.assertEqual(dataset.count(), 1)
self.assertFalse(dataset.first().indexable)

def test_change_series_distribution(self):
    """A loaded series ends up attached to its new distribution when the
    same catalog id is loaded again from the changed sample file."""
    first_catalog = DataJson(os.path.join(SAMPLES_DIR, 'full_ts_data.json'))
    first_distribution = get_time_series_distributions(first_catalog)[0]
    self.loader.run(first_distribution, first_catalog, self.catalog_id)

    changed_path = os.path.join(SAMPLES_DIR, 'full_ts_data_changed_distribution.json')
    changed_catalog = DataJson(changed_path)
    changed_distribution = get_time_series_distributions(changed_catalog)[0]
    second_loader = DatabaseLoader(self.task, read_local=True, default_whitelist=False)
    second_loader.run(changed_distribution, changed_catalog, self.catalog_id)

    # Identifiers taken from the source .json sample
    actual_distribution = Field.objects.get(series_id="212.1_PSCIOS_IOS_0_0_25").distribution
    expected_distribution = Distribution.objects.get(identifier="300.1")
    self.assertEqual(actual_distribution, expected_distribution)

def test_change_series_distributions_different_catalog(self):
    """Loading an already stored series under another catalog id must fail.

    The first load (under ``self.catalog_id``) is setup and has to succeed;
    only the second load, under a different catalog id, is expected to
    raise ``FieldRepetitionError``.
    """
    catalog = DataJson(os.path.join(SAMPLES_DIR, 'full_ts_data.json'))
    distributions = get_time_series_distributions(catalog)

    self.loader.run(distributions[0], catalog, self.catalog_id)

    other_catalog_id = 'other_catalog_id'
    changed_catalog_path = os.path.join(SAMPLES_DIR, 'full_ts_data_changed_distribution.json')
    node = Node(catalog_id=other_catalog_id,
                catalog_url=changed_catalog_path,
                indexable=True)
    node.save()
    loader = DatabaseLoader(self.task, read_local=True, default_whitelist=False)

    catalog = DataJson(changed_catalog_path)
    distributions = get_time_series_distributions(catalog)

    # Scope the expectation to the second load: an error raised by the
    # setup steps above must fail the test instead of satisfying it.
    with self.assertRaises(FieldRepetitionError):
        loader.run(distributions[0], catalog, other_catalog_id)
Original file line number Diff line number Diff line change
@@ -0,0 +1,135 @@
{
"title": "Datos Argentina",
"description": "Portal de Datos Abiertos del Gobierno de la República Argentina",
"publisher": {
"name": "Ministerio de Modernización",
"mbox": "[email protected]"
},
"issued": "2016-04-14T19:48:05.433640-03:00",
"modified": "2016-04-19T19:48:05.433640-03:00",
"language": [
"spa"
],
"superThemeTaxonomy": "http://datos.gob.ar/superThemeTaxonomy.json",
"themeTaxonomy": [
{
"id": "convocatorias",
"label": "Convocatorias",
"description": "Datasets sobre licitaciones en estado de convocatoria."
},
{
"id": "compras",
"label": "Compras",
"description": "Datasets sobre compras realizadas."
},
{
"id": "contrataciones",
"label": "Contrataciones",
"description": "Datasets sobre contrataciones."
},
{
"id": "adjudicaciones",
"label": "Adjudicaciones",
"description": "Datasets sobre licitaciones adjudicadas."
},
{
"id": "normativa",
"label": "Normativa",
"description": "Datasets sobre normativa para compras y contrataciones."
},
{
"id": "proveedores",
"label": "Proveedores",
"description": "Datasets sobre proveedores del Estado."
}
],
"license": "Open Data Commons Open Database License 1.0",
"homepage": "http://datos.gob.ar",
"rights": "Derechos especificados en la licencia.",
"spatial": "ARG",
"dataset": [
{
"title": "Sistema de contrataciones electrónicas",
"description": "Datos correspondientes al Sistema de Contrataciones Electrónicas (Argentina Compra)",
"publisher": {
"name": "Ministerio de Modernización. Secretaría de Modernización Administrativa. Oficina Nacional de Contrataciones",
"mbox": "[email protected]"
},
"contactPoint": {
"fn": "Ministerio de Modernización. Secretaría de Modernización Administrativa. Oficina Nacional de Contrataciones. Dirección de Compras Electrónicas.",
"hasEmail": "[email protected]"
},
"superTheme": [
"econ"
],
"theme": [
"contrataciones",
"compras",
"convocatorias"
],
"keyword": [
"bienes",
"compras",
"contrataciones"
],
"accrualPeriodicity": "R/P1Y",
"issued": "2016-04-14T19:48:05.433640-03:00",
"modified": "2016-04-19T19:48:05.433640-03:00",
"identifier": "300",
"language": [
"spa"
],
"spatial": "ARG",
"temporal": "1970-01-01/1980-10-01",
"landingPage": "http://datos.gob.ar/dataset/sistema-de-contrataciones-electronicas-argentina-compra",
"license": "Open Data Commons Open Database License 1.0",
"distribution": [
{
"accessURL": "https://www.minhacienda.gob.ar/secretarias/politica-economica/programacion-macroeconomica/",
"description": "PIB Servicios Comunales, Sociales y Personales en millones de pesos de 1960. 1970-1980",
"format": "CSV",
"dataset_identifier": "300",
"issued": "2017-09-28T00:00:00",
"title": "Producto Interno Bruto Servicios Comunales, Sociales y Personales Millones de pesos constantes. Base 1960. Valores trimestrales",
"modified": "2017-09-28T00:00:00",
"fileName": "pib-servicios-comunales-sociales-personales-millones-pesos-1960-trimestral.csv",
"downloadURL": "series_tiempo_ar_api/libs/indexing/tests/samples/one_distribution_data.csv",
"field": [
{
"title": "indice_tiempo",
"specialTypeDetail": "R/P3M",
"units": "Millones de pesos",
"specialType": "time_index",
"type": "date",
"id": "212.1_ICE_TIEMPO_0_0_13"
},
{
"units": "Millones de pesos",
"id": "212.1_PSCIOS_ERS_0_0_22",
"description": "PIB Servicios Comunales, Sociales y Personales en millones de pesos de 1960. Total",
"title": "pib_scios_com_soc_pers",
"scrapingIdentifierCell": "AC9"
},
{
"units": "Millones de pesos",
"id": "212.1_PSCIOS_ERN_0_0_25",
"description": "PIB Servicios Comunales, Sociales y Personales en millones de pesos de 1960. Servicios Gubernamentales",
"title": "pib_scios_com_serv_gubern"
},
{
"units": "Millones de pesos",
"id": "212.1_PSCIOS_IOS_0_0_25",
"description": "PIB Servicios Comunales, Sociales y Personales en millones de pesos de 1960. Otros Servicios",
"title": "pib_scios_com_otros_scios",
"scrapingDataStartCell": "AD10"
}
],
"draft": false,
"units": "Millones de pesos",
"identifier": "300.1",
"scrapingFileSheet": "32. Ingreso IED Pais"
}
]
}
]
}

0 comments on commit 97c4027

Please sign in to comment.