diff --git a/analytics/config/artifacts.yaml b/analytics/config/artifacts.yaml index bc201af731bce41bf60d037b52cd5933c5acbfb9..d23b441a6f33c7cc9859af355f92a32b5b619380 100644 --- a/analytics/config/artifacts.yaml +++ b/analytics/config/artifacts.yaml @@ -51,14 +51,14 @@ artifacts: id: org.wikimedia.analytics.refinery.job:refinery-job:jar:shaded:0.2.8 source: wmf_archiva_releases - datahub-cli-0.8.38.tgz: - id: datahub:cli:tgz:0.8.38 - source: wmf_archiva_python - hdfs-tools-0.0.6-shaded.jar: id: org.wikimedia.analytics:hdfs-tools:jar:shaded:0.0.6 source: wmf_archiva_releases + datahub-cli-0.9.0.tgz: + id: datahub:cli:tgz:0.9.0 + source: wmf_archiva_python + # HACK # This jar has been manually loaded to archiva, it contains a patch to a bug # preventing cassandra quoted-columns to be accessible in spark-sql. diff --git a/analytics/dags/datahub/ingestion/ingest_daily_dag.py b/analytics/dags/datahub/ingestion/ingest_daily_dag.py index be0593f404b24a5c59631b6864e55707393c750d..9d2744265d07fcb311b04f65a80d9cf6c2e40185 100644 --- a/analytics/dags/datahub/ingestion/ingest_daily_dag.py +++ b/analytics/dags/datahub/ingestion/ingest_daily_dag.py @@ -44,7 +44,7 @@ with DAG( task_id=f'run_{job}_ingestion', script='REQUESTS_CA_BUNDLE=/etc/ssl/certs/ca-certificates.crt ./environment/bin/python environment/bin/datahub ingest -c config.yaml', files={ - 'environment': artifact('datahub-cli-0.8.38.tgz'), + 'environment': artifact('datahub-cli-0.9.0.tgz'), 'config.yaml': config_template.format(job), }, )